mirror of
https://github.com/ggml-org/llama.cpp.git
synced 2025-11-06 09:46:50 +00:00
feat: Add s_off as a parameter in the args struct
This may not be necessary, but it more closely mirrors the CUDA kernel.

Branch: GraniteFourPerf
Signed-off-by: Gabe Goodhart <ghart@us.ibm.com>
This commit is contained in:
@@ -519,6 +519,7 @@ typedef struct {
|
|||||||
int64_t n_group;
|
int64_t n_group;
|
||||||
int64_t n_seq_tokens;
|
int64_t n_seq_tokens;
|
||||||
int64_t n_seqs;
|
int64_t n_seqs;
|
||||||
|
int64_t s_off;
|
||||||
uint64_t nb01;
|
uint64_t nb01;
|
||||||
uint64_t nb02;
|
uint64_t nb02;
|
||||||
uint64_t nb03;
|
uint64_t nb03;
|
||||||
|
|||||||
Reference in New Issue
Block a user