mirror of
				https://github.com/ggml-org/llama.cpp.git
				synced 2025-10-31 08:51:55 +00:00 
			
		
		
		
	gguf-py : allow previewing reflinked size on non-Linux platforms
This commit is contained in:
		| @@ -738,7 +738,6 @@ class TextModel(ModelBase): | |||||||
|         super().prepare_metadata(vocab_only=vocab_only) |         super().prepare_metadata(vocab_only=vocab_only) | ||||||
|  |  | ||||||
|         total_params = self.gguf_writer.get_total_parameter_count()[0] |         total_params = self.gguf_writer.get_total_parameter_count()[0] | ||||||
|  |  | ||||||
|         # Extract the encoding scheme from the file type name. e.g. 'gguf.LlamaFileType.MOSTLY_Q8_0' --> 'Q8_0' |         # Extract the encoding scheme from the file type name. e.g. 'gguf.LlamaFileType.MOSTLY_Q8_0' --> 'Q8_0' | ||||||
|         output_type: str = self.ftype.name.partition("_")[2] |         output_type: str = self.ftype.name.partition("_")[2] | ||||||
|  |  | ||||||
|   | |||||||
@@ -624,7 +624,7 @@ struct gguf_context * gguf_init_from_file_impl(FILE * file, struct gguf_init_par
         ctx->size = 0;
         for (size_t i = 0; i < ctx->info.size(); ++i) {
             const gguf_tensor_info & ti = ctx->info[i];
-            // alignment offset is only necessary for GGUF converted with reflinks
+            // alignment offset only exists for GGUF converted with reflinks
             const size_t align_offset = ti.offset % ctx->alignment;
             if (ti.offset - align_offset != ctx->size) {
                 GGML_LOG_ERROR("%s: tensor '%s' has offset %" PRIu64 ", expected %zu\n",
|   | |||||||
@@ -93,7 +93,7 @@ class GGUFWriter:
         self.arch = arch
         self.endianess = endianess
         self.data_alignment = GGUF_DEFAULT_ALIGNMENT
-        self.use_reflinks = use_reflinks and hasattr(os, "copy_file_range")
+        self.use_reflinks = use_reflinks
         self.use_temp_file = False if self.use_reflinks else use_temp_file
         self.temp_file = None
         self.tensors = [{}]
|   | |||||||
		Reference in New Issue
	
	Block a user
	 Francis Couture-Harpin
					Francis Couture-Harpin