mirror of
https://github.com/ggerganov/llama.cpp
synced 2026-05-01 03:42:01 +02:00
ggml : remove KQ mask padding
This commit is contained in:
parent
f914544b16
commit
3ad533689c
@@ -2220,7 +2220,7 @@ extern "C" {
|
||||
struct ggml_tensor * a,
|
||||
int k);
|
||||
|
||||
-#define GGML_KQ_MASK_PAD 64
|
||||
+#define GGML_KQ_MASK_PAD 1
|
||||
|
||||
// q: [n_embd_k, n_batch, n_head, ne3 ]
|
||||
// k: [n_embd_k, n_kv, n_head_kv, ne3 ]
|
||||
|
||||
Loading…
Reference in New Issue
Block a user