Gather data
This commit is contained in:
5
pom.xml
5
pom.xml
@@ -12,6 +12,11 @@
|
||||
</properties>
|
||||
|
||||
<dependencies>
|
||||
<dependency>
|
||||
<groupId>com.google.code.gson</groupId>
|
||||
<artifactId>gson</artifactId>
|
||||
<version>2.13.2</version>
|
||||
</dependency>
|
||||
<dependency>
|
||||
<groupId>org.postgresql</groupId>
|
||||
<artifactId>postgresql</artifactId>
|
||||
|
||||
@@ -137,7 +137,6 @@ public class Main {
|
||||
System.out.printf(Locale.ROOT, " %-14s: %s%n", "wordsPath", o.wordsPath);
|
||||
System.out.printf(Locale.ROOT, " %-14s: %.2f%n", "minSimplicity", o.minSimplicity);
|
||||
System.out.printf(Locale.ROOT, " %-14s: %d%n", "threads", o.threads);
|
||||
System.out.printf(Locale.ROOT, " %-14s: %d%n", "maxTries", o.tries);
|
||||
}
|
||||
|
||||
/**
 * Formats a pair of integers as {@code (r,c)} with no spaces.
 *
 * <p>The output is locale-independent: plain ASCII digits, a leading {@code -}
 * for negative values and no grouping separators.
 *
 * @param r first coordinate (presumably a grid row; confirm against callers)
 * @param c second coordinate (presumably a grid column; confirm against callers)
 * @return the text {@code "(" + r + "," + c + ")"}
 */
private static String fmtPoint(int r, int c) {
    // Int-to-string concatenation produces the same characters as %d under Locale.ROOT.
    var text = new StringBuilder();
    text.append('(').append(r).append(',').append(c).append(')');
    return text.toString();
}
|
||||
@@ -181,8 +180,7 @@ public class Main {
|
||||
|
||||
Defaults:
|
||||
--pop 18
|
||||
--gens 600
|
||||
--tries = threads
|
||||
--gens 500
|
||||
--words nl_score_hints.csv
|
||||
--min-simplicity 0 (no limit)
|
||||
--threads %d
|
||||
@@ -245,33 +243,62 @@ public class Main {
|
||||
|
||||
section("Search");
|
||||
|
||||
var deadline = System.currentTimeMillis() + 40_000;
|
||||
var fillTimeout = 20_000;
|
||||
|
||||
if (opts.threads > 1) {
|
||||
info("mode : multi-threaded (" + opts.threads + ")");
|
||||
var executor = Executors.newFixedThreadPool(opts.threads);
|
||||
var executor = Executors.newFixedThreadPool(opts.threads);
|
||||
var completionService = new ExecutorCompletionService<PuzzleResult>(executor);
|
||||
int submitted = 0;
|
||||
|
||||
try {
|
||||
var tasks = new ArrayList<Callable<PuzzleResult>>();
|
||||
for (var i = 1; i <= opts.tries; i++) {
|
||||
final var attempt = i;
|
||||
tasks.add(() -> {
|
||||
// Keep at least some tasks in flight
|
||||
for (int i = 0; i < opts.threads; i++) {
|
||||
final int attempt = ++submitted;
|
||||
completionService.submit(() -> {
|
||||
var threadRng = new Rng(opts.seed + attempt);
|
||||
var mask = generateMask(threadRng, dict.lenCounts(), opts.pop, opts.gens, false);
|
||||
var filled = fillMask(threadRng, mask, dict.index(), dict.words(), 200, 30000, false);
|
||||
var filled = fillMask(threadRng, mask, dict.index(), dict.words(), 200, fillTimeout, false);
|
||||
|
||||
if (filled.ok && (opts.minSimplicity <= 0 || filled.simplicity >= opts.minSimplicity)) {
|
||||
info("status : SOLVED");
|
||||
info("foundAtTry : " + attempt);
|
||||
return new PuzzleResult(dict, mask, filled);
|
||||
}
|
||||
throw new RuntimeException("No solution in try " + attempt);
|
||||
return null;
|
||||
});
|
||||
}
|
||||
return executor.invokeAny(tasks);
|
||||
|
||||
while (System.currentTimeMillis() < deadline) {
|
||||
var future = completionService.poll(deadline - System.currentTimeMillis(), TimeUnit.MILLISECONDS);
|
||||
if (future == null) break;
|
||||
|
||||
var result = future.get();
|
||||
if (result != null) {
|
||||
info("status : SOLVED");
|
||||
return result;
|
||||
}
|
||||
|
||||
// Submit another task if we still have time
|
||||
if (System.currentTimeMillis() < deadline) {
|
||||
final int attempt = ++submitted;
|
||||
completionService.submit(() -> {
|
||||
var threadRng = new Rng(opts.seed + attempt);
|
||||
var mask = generateMask(threadRng, dict.lenCounts(), opts.pop, opts.gens, false);
|
||||
var filled = fillMask(threadRng, mask, dict.index(), dict.words(), 200, fillTimeout, false);
|
||||
|
||||
if (filled.ok && (opts.minSimplicity <= 0 || filled.simplicity >= opts.minSimplicity)) {
|
||||
return new PuzzleResult(dict, mask, filled);
|
||||
}
|
||||
return null;
|
||||
});
|
||||
}
|
||||
}
|
||||
warn("status : UNSOLVED (timeout)");
|
||||
} catch (InterruptedException e) {
|
||||
Thread.currentThread().interrupt();
|
||||
warn("status : INTERRUPTED");
|
||||
} catch (ExecutionException e) {
|
||||
// all failed
|
||||
warn("status : UNSOLVED");
|
||||
warn("status : ERROR (" + e.getMessage() + ")");
|
||||
} finally {
|
||||
executor.shutdownNow();
|
||||
}
|
||||
@@ -279,13 +306,15 @@ public class Main {
|
||||
|
||||
} else {
|
||||
info("mode : single-threaded");
|
||||
var rng = new Rng(opts.seed);
|
||||
var rng = new Rng(opts.seed);
|
||||
int attempt = 0;
|
||||
|
||||
for (var attempt = 1; attempt <= opts.tries; attempt++) {
|
||||
info("try : " + attempt + "/" + opts.tries);
|
||||
while (System.currentTimeMillis() < deadline) {
|
||||
attempt++;
|
||||
info("try : " + attempt + " (remaining: " + (deadline - System.currentTimeMillis()) / 1000 + "s)");
|
||||
|
||||
var mask = generateMask(rng, dict.lenCounts(), opts.pop, opts.gens, true);
|
||||
var filled = fillMask(rng, mask, dict.index(), dict.words(), 200, 30000, true);
|
||||
var filled = fillMask(rng, mask, dict.index(), dict.words(), 200, fillTimeout, true);
|
||||
|
||||
if (filled.ok && (opts.minSimplicity <= 0 || filled.simplicity >= opts.minSimplicity)) {
|
||||
info("status : SOLVED");
|
||||
@@ -301,7 +330,7 @@ public class Main {
|
||||
}
|
||||
}
|
||||
|
||||
info("status : UNSOLVED");
|
||||
info("status : UNSOLVED (timeout)");
|
||||
return null;
|
||||
}
|
||||
}
|
||||
@@ -397,7 +426,7 @@ public class Main {
|
||||
|
||||
info("Rebuilding index from: " + PUZZLE_DIR);
|
||||
|
||||
List<String> records = new ArrayList<>();
|
||||
var records = new ArrayList<String>();
|
||||
try (var stream = Files.list(PUZZLE_DIR)) {
|
||||
stream.filter(p -> p.toString().endsWith(".json") && !p.getFileName().toString().equals("index.json"))
|
||||
.sorted(Comparator.comparing(Path::getFileName).reversed())
|
||||
|
||||
@@ -5,7 +5,7 @@ import java.nio.charset.StandardCharsets;
|
||||
import java.nio.file.Files;
|
||||
import java.nio.file.Path;
|
||||
import java.util.*;
|
||||
import java.util.concurrent.*;
|
||||
import java.util.function.Predicate;
|
||||
import java.util.stream.Collectors;
|
||||
|
||||
/**
|
||||
@@ -132,7 +132,7 @@ public class SwedishGenerator {
|
||||
/**
 * Exposes the internal {@code int[]} held in field {@code a}.
 *
 * <p>The array is returned as-is (no copy is made here), and it may have
 * extra capacity, so its {@code length} is not necessarily the number of
 * stored elements.
 *
 * @return the field {@code a} itself
 */
int[] data() {
    return this.a; // note: may have extra capacity
}
|
||||
}
|
||||
|
||||
static record DictEntry(ArrayList<String> words, IntList[][] pos) {
|
||||
static record DictEntry(ArrayList<Lemma> words, IntList[][] pos) {
|
||||
|
||||
public DictEntry(int L) {
|
||||
this(new ArrayList<>(), new IntList[L][26]);
|
||||
@@ -142,14 +142,14 @@ public class SwedishGenerator {
|
||||
}
|
||||
}
|
||||
|
||||
static record WordDifficulty(String word, int difficulty, int simpel, int score, int cross, ArrayList<String> clue) {
|
||||
static record Lemma(String word, int difficulty, int simpel, int score, int cross, ArrayList<String> clue) {
|
||||
|
||||
public WordDifficulty(String word, int simpel, int score, String clue) {
|
||||
var difficulty1 = 0 + ((8 - word.length()) * 30) + ((10 - score) * 15);
|
||||
var crossScore = ThemePoolBuilderLength.crossabilityScore(word);
|
||||
var list = new ArrayList<String>(10);
|
||||
public Lemma(String word, int simpel, int score, String clue) {
|
||||
var complex = 0 + ((8 - word.length()) * 30) + ((10 - score) * 15);
|
||||
var crossScore = ThemePoolBuilderLength.crossabilityScore(word);
|
||||
var list = new ArrayList<String>(10);
|
||||
list.add(clue);
|
||||
this(word, difficulty1, simpel, score, (crossScore * 7) + ((score) * 30) + ((word.length()) * 15), list);
|
||||
this(word, complex, simpel, score, (crossScore * 7) + ((score) * 30) + ((word.length()) * 15), list);
|
||||
|
||||
// Prioritize simple words (high lScore) and long words.
|
||||
// lScore (1-10) adds up to 1000 points (weight 100).
|
||||
@@ -161,9 +161,10 @@ public class SwedishGenerator {
|
||||
// Length impact: up to 8 * 10 = 80
|
||||
// Score impact: up to 10 * 15 = 150
|
||||
}
|
||||
/**
 * Returns the character of {@code word} at the given position.
 *
 * @param idx zero-based index into {@code word}
 * @return {@code word.charAt(idx)}
 * @throws StringIndexOutOfBoundsException if {@code idx} is outside {@code word}
 */
char charAt(int idx) {
    final char letter = this.word.charAt(idx);
    return letter;
}
|
||||
}
|
||||
|
||||
public static record Dict(Map<String, WordDifficulty> words,
|
||||
public static record Dict(Map<String, Lemma> words,
|
||||
HashMap<Integer, DictEntry> index,
|
||||
HashMap<Integer, Integer> lenCounts) { }
|
||||
static Dict loadWords(String wordsPath) {
|
||||
@@ -171,10 +172,11 @@ public class SwedishGenerator {
|
||||
try {
|
||||
raw = Files.readString(Path.of(wordsPath), StandardCharsets.UTF_8);
|
||||
} catch (IOException e) {
|
||||
e.printStackTrace();
|
||||
raw = "WOORD,level_1_to_10,hint\nEU,2,hint\nUUR,2,hint\nAUTO,2,hint\nBOOM,2,hint\nHUIS,2,hint\nKAT,2,hint\nZEE,2,hint\nRODE,2,hint\nDRAAD,2,hint\nKENNIS,2,hint\nNETWERK,2,hint\nPAKTE,2,hint\n";
|
||||
}
|
||||
|
||||
var map = new HashMap<String, WordDifficulty>();
|
||||
var map = new HashMap<String, Lemma>();
|
||||
boolean first = true;
|
||||
for (var line : raw.split("\\R")) {
|
||||
if (line.isBlank()) continue;
|
||||
@@ -200,7 +202,7 @@ public class SwedishGenerator {
|
||||
if (map.containsKey(s)) {
|
||||
map.get(s).clue.add(rawClue);
|
||||
} else {
|
||||
map.put(s, new WordDifficulty(s, simpel, score, rawClue));
|
||||
map.put(s, new Lemma(s, simpel, score, rawClue));
|
||||
}
|
||||
}
|
||||
}
|
||||
@@ -223,7 +225,7 @@ public class SwedishGenerator {
|
||||
}
|
||||
|
||||
var idx = entry.words.size();
|
||||
entry.words.add(w.word);
|
||||
entry.words.add(w);
|
||||
|
||||
for (var i = 0; i < L; i++) {
|
||||
var letter = w.word.charAt(i) - 'A';
|
||||
@@ -618,7 +620,7 @@ public class SwedishGenerator {
|
||||
return cross * 10 + s.len;
|
||||
}
|
||||
|
||||
static Undo placeWord(char[][] grid, Slot s, String w) {
|
||||
static Undo placeWord(char[][] grid, Slot s, Lemma w) {
|
||||
var urs = new int[s.len];
|
||||
var ucs = new int[s.len];
|
||||
var up = new char[s.len];
|
||||
@@ -648,7 +650,7 @@ public class SwedishGenerator {
|
||||
}
|
||||
|
||||
static FillResult fillMask(Rng rng, char[][] mask, HashMap<Integer, DictEntry> dictIndex,
|
||||
Map<String, WordDifficulty> llmScores,
|
||||
Map<String, Lemma> llmScores,
|
||||
int logEveryMs, int timeLimitMs, boolean verbose) {
|
||||
|
||||
var grid = deepCopyGrid(mask);
|
||||
@@ -757,9 +759,9 @@ public class SwedishGenerator {
|
||||
var entry = dictIndex.get(s.len);
|
||||
var pat = patternForSlot(grid, s);
|
||||
|
||||
java.util.function.Function<String, Boolean> tryWord = (String w) -> {
|
||||
Predicate<Lemma> tryWord = (Lemma w) -> {
|
||||
if (w == null) return false;
|
||||
if (used.contains(w)) return false;
|
||||
if (used.contains(w.word())) return false;
|
||||
|
||||
for (var i = 0; i < pat.length; i++) {
|
||||
if (pat[i] != 0 && pat[i] != w.charAt(i)) return false;
|
||||
@@ -768,8 +770,8 @@ public class SwedishGenerator {
|
||||
var undo = placeWord(grid, s, w);
|
||||
if (undo == null) return false;
|
||||
|
||||
used.add(w);
|
||||
assigned.put(k, w);
|
||||
used.add(w.word());
|
||||
assigned.put(k, w.word());
|
||||
|
||||
if (backtrack()) return true;
|
||||
|
||||
@@ -792,7 +794,7 @@ public class SwedishGenerator {
|
||||
int idxInArray = (int) (r * r * r * L);
|
||||
var idx = idxs[idxInArray];
|
||||
var w = entry.words.get(idx);
|
||||
if (tryWord.apply(w)) return true;
|
||||
if (tryWord.test(w)) return true;
|
||||
}
|
||||
stats.backtracks++;
|
||||
return false;
|
||||
@@ -809,7 +811,7 @@ public class SwedishGenerator {
|
||||
double r = rng.nextFloat();
|
||||
int idxInArray = (int) (r * r * r * N);
|
||||
var w = entry.words.get(idxInArray);
|
||||
if (tryWord.apply(w)) return true;
|
||||
if (tryWord.test(w)) return true;
|
||||
}
|
||||
|
||||
stats.backtracks++;
|
||||
|
||||
Reference in New Issue
Block a user