mirror of
https://github.com/ggml-org/llama.cpp.git
synced 2025-11-01 09:01:57 +00:00
gguf : start implementing quantization (WIP)
This commit is contained in:
@@ -778,8 +778,7 @@ struct gguf_file_saver {
|
||||
}
|
||||
|
||||
write_tensor_info(tensor);
|
||||
// file.write_raw(new_data);
|
||||
GGML_UNUSED(new_data);
|
||||
file.write_raw(new_data, new_size);
|
||||
size_t padded_size = GGML_PAD(new_size, GGUF_DEFAULT_ALIGNMENT); // TODO: handle custom alignment
|
||||
size_t pad = padded_size - new_size;
|
||||
file.write_zeros(pad);
|
||||
|
||||
Reference in New Issue
Block a user