llama : do not quantize expert gating tensors
commit d1259b7b35 (parent 6cfb31f9ea)
@@ -8443,6 +8443,9 @@ static void llama_model_quantize_internal(const std::string & fname_inp, const s
         quantize &= params->quantize_output_tensor || name != "output.weight";
         quantize &= !params->only_copy;
 
+        // do not quantize expert gating tensors
+        quantize &= name.find("ffn_gate_inp.weight") == std::string::npos;
+
         enum ggml_type new_type;
         void * new_data;
         size_t new_size;
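For context, below is a minimal, self-contained sketch of the name-based filter pattern this hunk extends. The `should_quantize` helper is hypothetical, introduced only for illustration; in the actual source these checks run inline inside llama_model_quantize_internal. The comment about router precision is an assumption about the motivation (the expert gating tensor is the mixture-of-experts router weight, small but sensitive), not text from the commit itself.

#include <string>

// Hypothetical helper illustrating the filter pattern from the diff above:
// a tensor is quantized only if none of the exclusion rules match its name.
static bool should_quantize(const std::string & name,
                            bool quantize_output_tensor,
                            bool only_copy) {
    bool quantize = true;

    // optionally keep the output projection in full precision
    quantize &= quantize_output_tensor || name != "output.weight";

    // copy-only mode never quantizes anything
    quantize &= !only_copy;

    // assumption: expert gating (MoE router) tensors are tiny but
    // precision-sensitive, so they are always left unquantized
    quantize &= name.find("ffn_gate_inp.weight") == std::string::npos;

    return quantize;
}

Note the substring match via find() rather than an exact comparison: per-layer tensor names carry a block prefix (e.g. "blk.0.ffn_gate_inp.weight"), so a substring test covers the gating tensor in every layer with a single rule.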