Increase temperature and min-p a bit [new-templates]
author: Svjatoslav Agejenko <svjatoslav@svjatoslav.eu>
Sun, 20 Jul 2025 14:03:47 +0000 (17:03 +0300)
committer: Svjatoslav Agejenko <svjatoslav@svjatoslav.eu>
Sun, 20 Jul 2025 14:03:47 +0000 (17:03 +0300)
src/main/java/eu/svjatoslav/alyverkko_cli/AiTask.java

index 2ebc22b..896f69b 100644 (file)
@@ -176,14 +176,13 @@ public class AiTask {
                 "--threads " + configuration.getThreadCount(),
                 "--threads-batch " + configuration.getBatchThreadCount(),
 
-                "--top-k 20", // Restricts token selection to the K tokens with the highest probabilities.
-                             // 1 mean true greedy decoding.
+                "--top-k 20",   // Restricts token selection to the K tokens with the highest probabilities.
 
-                "--top-p 0.95",   // Restricts token selection to the smallest possible set
-                               // of tokens whose cumulative probability exceeds the specified
-                               // threshold P.
+                "--top-p 0.95", // Restricts token selection to the smallest possible set
+                                // of tokens whose cumulative probability exceeds the specified
+                                // threshold P.
 
-                "--min-p 0",    // Filters the vocabulary to include only tokens whose
+                "--min-p 0.1",  // Filters the vocabulary to include only tokens whose
                                 // probability is at least a certain fraction (Min P) of the
                                 // probability of the most likely token.
 
@@ -205,7 +204,7 @@ public class AiTask {
                 "--no-display-prompt",
                 "--no-warmup",
                 "--flash-attn",
-                "--temp 0", // Coding tasks need precision, not randomness
+                "--temp 0.6",
                 "--ctx-size " + mailQuery.model.contextSizeTokens,
                 "--batch-size 512",
                 "--single-turn", // run conversation for a single turn only, then exit when done