mirror of
https://github.com/ggml-org/llama.cpp.git
synced 2025-10-28 08:31:25 +00:00
ggml : sync ggml (add GPT-NeoX RoPE implementation)
This commit is contained in:
3
ggml.h
3
ggml.h
@@ -630,7 +630,8 @@ struct ggml_tensor * ggml_soft_max(
|
||||
|
||||
// rotary position embedding
|
||||
// in-place, returns view(a)
|
||||
// if mode == 1, skip n_past elements
|
||||
// if (mode & 1) != 0, skip n_past elements
|
||||
// if (mode & 2) != 0, GPT-NeoX style
|
||||
// TODO: avoid creating a new tensor every time
|
||||
struct ggml_tensor * ggml_rope(
|
||||
struct ggml_context * ctx,
|
||||
|
||||
Reference in New Issue
Block a user