From b2440f1943f88243938e438acef18ad072b9004e Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?M=2E=20Yusuf=20Sar=C4=B1g=C3=B6z?= Date: Fri, 11 Aug 2023 11:29:50 +0300 Subject: [PATCH] gguf : start implementing gguf_file_saver (WIP) --- gguf-llama.cpp | 15 ++++++++++++--- 1 file changed, 12 insertions(+), 3 deletions(-) diff --git a/gguf-llama.cpp b/gguf-llama.cpp index e88dc6a08..08b700435 100644 --- a/gguf-llama.cpp +++ b/gguf-llama.cpp @@ -647,9 +647,14 @@ struct gguf_file_saver { } void write_hparams(enum llama_ftype new_ftype) { - const llama_hparams & hparams = any_file_loader->hparams; - GGML_UNUSED(hparams); - GGML_UNUSED(new_ftype); + const int32_t n_kv = gguf_get_n_kv(any_file_loader->gguf_ctx); + for (int i = 0; i < n_kv; ++i) { + const char * key = gguf_get_key(any_file_loader->gguf_ctx, i); + if (strcmp(key, "general.quantization_version") == 0) { + file.write_val("general.quantization_version", GGUF_TYPE_UINT32, new_ftype); + } + } + } void write_vocab() { @@ -658,6 +663,10 @@ struct gguf_file_saver { } void write_tensor(llama_load_tensor & tensor, enum ggml_type new_type, const void * new_data, size_t new_size) { + GGML_UNUSED(tensor); + GGML_UNUSED(new_data); + GGML_UNUSED(new_size); + switch (new_type) { case GGML_TYPE_F32: case GGML_TYPE_F16: