Increase temperature (0 -> 0.6) and min-p (0 -> 0.1)

author Svjatoslav Agejenko <svjatoslav@svjatoslav.eu>

Sun, 20 Jul 2025 14:03:47 +0000 (17:03 +0300)

committer Svjatoslav Agejenko <svjatoslav@svjatoslav.eu>

Sun, 20 Jul 2025 14:03:47 +0000 (17:03 +0300)
author Svjatoslav Agejenko <svjatoslav@svjatoslav.eu>
Sun, 20 Jul 2025 14:03:47 +0000 (17:03 +0300)
committer Svjatoslav Agejenko <svjatoslav@svjatoslav.eu>
Sun, 20 Jul 2025 14:03:47 +0000 (17:03 +0300)
diff --git a/src/main/java/eu/svjatoslav/alyverkko_cli/AiTask.java b/src/main/java/eu/svjatoslav/alyverkko_cli/AiTask.java

index 2ebc22b..896f69b 100644 (file)
--- a/src/main/java/eu/svjatoslav/alyverkko_cli/AiTask.java
+++ b/src/main/java/eu/svjatoslav/alyverkko_cli/AiTask.java
@@ -176,14 +176,13 @@ public class AiTask {
                  "--threads " + configuration.getThreadCount(),
                  "--threads-batch " + configuration.getBatchThreadCount(),
  
-                "--top-k 20", // Restricts token selection to the K tokens with the highest probabilities.
-                             // 1 mean true greedy decoding.
+                "--top-k 20",   // Restricts token selection to the K tokens with the highest probabilities.
  
-                "--top-p 0.95",   // Restricts token selection to the smallest possible set
-                               // of tokens whose cumulative probability exceeds the specified
-                               // threshold P.
+                "--top-p 0.95", // Restricts token selection to the smallest possible set
+                                // of tokens whose cumulative probability exceeds the specified
+                                // threshold P.
  
-                "--min-p 0",    // Filters the vocabulary to include only tokens whose
+                "--min-p 0.1",  // Filters the vocabulary to include only tokens whose
                                  // probability is at least a certain fraction (Min P) of the
                                  // probability of the most likely token.
  
@@ -205,7 +204,7 @@ public class AiTask {
                  "--no-display-prompt",
                  "--no-warmup",
                  "--flash-attn",
-                "--temp 0", // Coding tasks need precision, not randomness
+                "--temp 0.6",
                  "--ctx-size " + mailQuery.model.contextSizeTokens,
                  "--batch-size 512",
                  "--single-turn", // run conversation for a single turn only, then exit when done
author	Svjatoslav Agejenko <svjatoslav@svjatoslav.eu>
	Sun, 20 Jul 2025 14:03:47 +0000 (17:03 +0300)
committer	Svjatoslav Agejenko <svjatoslav@svjatoslav.eu>
	Sun, 20 Jul 2025 14:03:47 +0000 (17:03 +0300)