We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 3c36213, commit 9dede37 (Copy full SHA for 9dede37)
llama.cpp
@@ -4997,7 +4997,6 @@ struct llm_build_context {
4997
struct ggml_cgraph * gf = ggml_new_graph_custom(ctx0, LLAMA_MAX_NODES, false);
4998
4999
const int64_t n_embd_head = hparams.n_embd_head_v;
5000
- const int64_t n_embd_gqa = hparams.n_embd_v_gqa();
5001
GGML_ASSERT(n_embd_head == hparams.n_embd_head_k);
5002
5003
const int64_t n_rot = n_embd_head_k / 2;
@@ -5210,7 +5209,6 @@ struct llm_build_context {
5210
5209
5211
5212
5213
5214
5215
5216
struct ggml_tensor * cur;
0 commit comments