mirror of
https://github.com/ggerganov/llama.cpp.git
synced 2025-01-07 11:23:56 +01:00
gguf : write sample tensors to read
This commit is contained in:
parent
08dc8fd884
commit
06f423a8e1
10
gguf.py
10
gguf.py
@ -179,14 +179,12 @@ class GGUFWriter:
|
|||||||
def write_tensors(self):
|
def write_tensors(self):
|
||||||
offset_data = GGUFWriter.ggml_pad(self.fout.tell(), constants.GGUF_DEFAULT_ALIGNMENT)
|
offset_data = GGUFWriter.ggml_pad(self.fout.tell(), constants.GGUF_DEFAULT_ALIGNMENT)
|
||||||
pad = offset_data - self.fout.tell()
|
pad = offset_data - self.fout.tell()
|
||||||
print(f"pad: {pad}")
|
|
||||||
if pad != 0:
|
if pad != 0:
|
||||||
self.fout.write(bytes([0] * pad))
|
self.fout.write(bytes([0] * pad))
|
||||||
|
|
||||||
for tensor in self.tensors:
|
for tensor in self.tensors:
|
||||||
tensor.tofile(self.fout)
|
tensor.tofile(self.fout)
|
||||||
pad = GGUFWriter.ggml_pad(tensor.nbytes, constants.GGUF_DEFAULT_ALIGNMENT) - tensor.nbytes
|
pad = GGUFWriter.ggml_pad(tensor.nbytes, constants.GGUF_DEFAULT_ALIGNMENT) - tensor.nbytes
|
||||||
print(f"pad: {pad}")
|
|
||||||
if pad != 0:
|
if pad != 0:
|
||||||
self.fout.write(bytes([0] * pad))
|
self.fout.write(bytes([0] * pad))
|
||||||
|
|
||||||
@ -282,10 +280,10 @@ if __name__ == "__main__":
|
|||||||
gguf_writer.write_architecture("llama")
|
gguf_writer.write_architecture("llama")
|
||||||
gguf_writer.write_uint32("answer", 42) # Write a 32-bit integer
|
gguf_writer.write_uint32("answer", 42) # Write a 32-bit integer
|
||||||
gguf_writer.write_float32("answer_in_float", 42.0) # Write a 32-bit float
|
gguf_writer.write_float32("answer_in_float", 42.0) # Write a 32-bit float
|
||||||
tensor1 = np.ones((7, 8, 3), dtype=np.float32)
|
tensor1 = np.ones((32,), dtype=np.float32) * 100.0
|
||||||
tensor2 = np.ones((7, 8, 3), dtype=np.float32)
|
tensor2 = np.ones((32,), dtype=np.float32) * 101.0
|
||||||
gguf_writer.write_tensor_info("tensor1", tensor1)
|
gguf_writer.write_tensor_info("tensor0", tensor1)
|
||||||
gguf_writer.write_tensor_info("tensor2", tensor2)
|
gguf_writer.write_tensor_info("tensor1", tensor2)
|
||||||
gguf_writer.write_tensors()
|
gguf_writer.write_tensors()
|
||||||
|
|
||||||
gguf_writer.close()
|
gguf_writer.close()
|
||||||
|
Loading…
Reference in New Issue
Block a user