mirror of
https://github.com/ggml-org/llama.cpp.git
synced 2025-11-10 10:27:03 +00:00
sycl: refactor quantization to q8_1 (#14815)
* sycl: quantization to q8_1 refactor
* Refactored src1 copy logic in op_mul_mat
This commit is contained in:
committed by
GitHub
parent
a5771c9eea
commit
afc0e89698
@@ -28,6 +28,7 @@
|
||||
#include "mmvq.hpp"
|
||||
#include "norm.hpp"
|
||||
#include "outprod.hpp"
|
||||
#include "quantize.hpp"
|
||||
#include "quants.hpp"
|
||||
#include "rope.hpp"
|
||||
#include "set_rows.hpp"
|
||||
|
||||
Reference in New Issue
Block a user