ggml-zdnn: tighten memory usage, change string allocation

Signed-off-by: Aaron Teo <aaron.teo1@ibm.com>
This commit is contained in:
Aaron Teo
2025-07-28 15:55:42 +08:00
parent aef93b3908
commit bee7dd3020
2 changed files with 3 additions and 5 deletions

View File

@@ -59,13 +59,13 @@ typedef unsigned long long ulong64x2_t __attribute__((vector_size(16)));
// Per-buffer record used by the zDNN backend: a raw data pointer and its
// size, an optional link to a companion buffer, the zDNN descriptors and
// ztensor associated with the buffer, and a fixed-size name.
struct ggml_backend_zdnn_buffer {
    void * data;                       // raw buffer pointer
    size_t size;                       // size associated with `data` (presumably bytes -- confirm against the allocator)
    ggml_backend_zdnn_buffer * extra;  // for bias etc.; nullptr when there is no companion buffer

    zdnn_tensor_desc pre_tfm_desc;     // NOTE(review): presumably the pre-transformed descriptor -- confirm against zDNN docs
    zdnn_tensor_desc tfm_desc;         // NOTE(review): presumably the transformed descriptor -- confirm against zDNN docs
    zdnn_ztensor     ztensor;

    char name[GGML_MAX_NAME];          // fixed-size storage, GGML_MAX_NAME bytes

    // `extra` is declared exactly once (a second declaration of the same
    // member is ill-formed). The pointer and size members are given defined
    // values so a freshly constructed record never carries indeterminate
    // values; initializers are listed in declaration order.
    ggml_backend_zdnn_buffer() : data(nullptr), size(0), extra(nullptr) {}
};