mirror of
https://github.com/ggml-org/llama.cpp.git
synced 2025-10-31 08:51:55 +00:00
imatrix : use GGUF regardless of the output filename
The legacy format can only be produced with `--output-format dat`.
This commit is contained in:
@@ -233,12 +233,6 @@ enum common_reasoning_format {
|
||||
COMMON_REASONING_FORMAT_DEEPSEEK, // Extract thinking tag contents and return as `message.reasoning_content`, including in streaming deltas.
|
||||
};
|
||||
|
||||
// Output format of the importance matrix produced by the imatrix tool.
enum common_imatrix_format_type {
    COMMON_IMATRIX_FORMAT_AUTO,
    COMMON_IMATRIX_FORMAT_GGUF,
    COMMON_IMATRIX_FORMAT_DAT,  // legacy format, opt-in only (e.g. --output-format dat)
};
|
||||
|
||||
struct common_params {
|
||||
int32_t n_predict = -1; // new tokens to predict
|
||||
int32_t n_ctx = 4096; // context size
|
||||
@@ -437,7 +431,7 @@ struct common_params {
|
||||
int32_t n_out_freq = 10; // output the imatrix every n_out_freq iterations
|
||||
int32_t n_save_freq = 0; // save the imatrix every n_save_freq iterations
|
||||
int32_t i_chunk = 0; // start processing from this chunk
|
||||
common_imatrix_format_type imat_out_type = COMMON_IMATRIX_FORMAT_AUTO; // format of the output imatrix
|
||||
bool imat_dat = false; // whether the legacy imatrix.dat format should be output
|
||||
|
||||
bool process_output = false; // collect data for the output tensor
|
||||
bool compute_ppl = true; // whether to compute perplexity
|
||||
|
||||
Reference in New Issue
Block a user