mirror of
https://github.com/ggml-org/llama.cpp.git
synced 2025-10-27 08:21:30 +00:00
gguf-py : allow previewing reflinked size on non-Linux platforms
This commit is contained in:
@@ -738,7 +738,6 @@ class TextModel(ModelBase):
|
||||
super().prepare_metadata(vocab_only=vocab_only)
|
||||
|
||||
total_params = self.gguf_writer.get_total_parameter_count()[0]
|
||||
|
||||
# Extract the encoding scheme from the file type name. e.g. 'gguf.LlamaFileType.MOSTLY_Q8_0' --> 'Q8_0'
|
||||
output_type: str = self.ftype.name.partition("_")[2]
|
||||
|
||||
|
||||
@@ -624,7 +624,7 @@ struct gguf_context * gguf_init_from_file_impl(FILE * file, struct gguf_init_par
|
||||
ctx->size = 0;
|
||||
for (size_t i = 0; i < ctx->info.size(); ++i) {
|
||||
const gguf_tensor_info & ti = ctx->info[i];
|
||||
- // alignment offset is only necessary for GGUF converted with reflinks
|
||||
+ // alignment offset only exists for GGUF converted with reflinks
|
||||
const size_t align_offset = ti.offset % ctx->alignment;
|
||||
if (ti.offset - align_offset != ctx->size) {
|
||||
GGML_LOG_ERROR("%s: tensor '%s' has offset %" PRIu64 ", expected %zu\n",
|
||||
|
||||
@@ -93,7 +93,7 @@ class GGUFWriter:
|
||||
self.arch = arch
|
||||
self.endianess = endianess
|
||||
self.data_alignment = GGUF_DEFAULT_ALIGNMENT
|
||||
- self.use_reflinks = use_reflinks and hasattr(os, "copy_file_range")
|
||||
+ self.use_reflinks = use_reflinks
|
||||
self.use_temp_file = False if self.use_reflinks else use_temp_file
|
||||
self.temp_file = None
|
||||
self.tensors = [{}]
|
||||
|
||||
Reference in New Issue
Block a user