mirror of https://github.com/ggerganov/llama.cpp.git (synced 2024-12-25 05:48:47 +01:00)
commit 05816027d6
parent 3fdbe6b66b
@@ -61,9 +61,9 @@ struct gpt_params {
     int32_t n_beams = 0; // if non-zero then use beam search of given width.
     float rope_freq_base = 0.0f; // RoPE base frequency
     float rope_freq_scale = 0.0f; // RoPE frequency scaling factor
-    float yarn_ext_factor = NAN; // YaRN extrapolation mix factor
+    float yarn_ext_factor = -1.0f; // YaRN extrapolation mix factor
     float yarn_attn_factor = 1.0f; // YaRN magnitude scaling factor
-    float yarn_beta_fast = 32.0f;// YaRN low correction dim
+    float yarn_beta_fast = 32.0f; // YaRN low correction dim
     float yarn_beta_slow = 1.0f; // YaRN high correction dim
     int32_t yarn_orig_ctx = 0; // YaRN original context length
     int8_t rope_scaling_type = LLAMA_ROPE_SCALING_UNSPECIFIED;
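The diff swaps NAN for -1.0f as the "not specified" sentinel for yarn_ext_factor. A minimal sketch of how a negative sentinel like this can be resolved before use, assuming a hypothetical helper and model default that are not part of this commit:

    #include <cmath>

    // Illustrative only: resolve the YaRN extrapolation mix factor.
    // A negative value (the new -1.0f default) is treated as "unset",
    // so we fall back to a caller-supplied default instead of using it.
    static float resolve_yarn_ext_factor(float requested, float model_default) {
        if (requested < 0.0f || std::isnan(requested)) {
            return model_default; // no explicit override from the user
        }
        return requested;         // explicit setting wins
    }

One likely advantage of a negative sentinel over NAN is that it can be detected with a plain `< 0.0f` comparison, whereas NaN checks require std::isnan and are fragile under fast-math optimizations.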