mirror of
https://github.com/ggerganov/llama.cpp.git
synced 2024-12-28 12:24:35 +00:00
common : change defaults [no ci]
This commit is contained in:
parent
7f9cc2058c
commit
4eb126fff0
@@ -157,8 +157,8 @@ struct common_params_sampling {

 struct common_params_speculative {
     int32_t n_ctx        = 4096; // draft context size
-    int32_t n_max        =    5; // maximum number of tokens to draft during speculative decoding
-    int32_t n_min        =    0; // minimum number of draft tokens to use for speculative decoding
+    int32_t n_max        =   16; // maximum number of tokens to draft during speculative decoding
+    int32_t n_min        =    5; // minimum number of draft tokens to use for speculative decoding
     int32_t n_gpu_layers =   -1; // number of layers to store in VRAM for the draft model (-1 - use default)
     float   p_split      = 0.1f; // speculative decoding split probability
     float   p_min        = 0.9f; // minimum speculative decoding probability (greedy)
|
Loading…
Reference in New Issue
Block a user