@@ -4776,7 +4776,6 @@ struct llm_build_context {
4776
4776
const int64_t n_embd_head = hparams.n_embd_head_v;
4777
4777
const int64_t n_embd_gqa = hparams.n_embd_v_gqa();
4778
4778
GGML_ASSERT(n_embd_head == hparams.n_embd_head_k);
4779
- GGML_ASSERT(n_embd_gqa == n_embd);
4780
4779
4781
4780
struct ggml_tensor * cur;
4782
4781
struct ggml_tensor * inpL;
@@ -4900,7 +4899,6 @@ struct llm_build_context {
4900
4899
const int64_t n_embd_head = hparams.n_embd_head_v;
4901
4900
const int64_t n_embd_gqa = hparams.n_embd_v_gqa();
4902
4901
GGML_ASSERT(n_embd_head == hparams.n_embd_head_k);
4903
- GGML_ASSERT(n_embd_gqa == n_embd);
4904
4902
4905
4903
struct ggml_tensor * cur;
4906
4904
struct ggml_tensor * pos;
@@ -5001,7 +4999,6 @@ struct llm_build_context {
5001
4999
const int64_t n_embd_head = hparams.n_embd_head_v;
5002
5000
const int64_t n_embd_gqa = hparams.n_embd_v_gqa();
5003
5001
GGML_ASSERT(n_embd_head == hparams.n_embd_head_k);
5004
- GGML_ASSERT(n_embd_gqa == n_embd);
5005
5002
5006
5003
const int64_t n_rot = n_embd_head_k / 2;
5007
5004
@@ -5215,7 +5212,6 @@ struct llm_build_context {
5215
5212
const int64_t n_embd_head = hparams.n_embd_head_v;
5216
5213
const int64_t n_embd_gqa = hparams.n_embd_v_gqa();
5217
5214
GGML_ASSERT(n_embd_head == hparams.n_embd_head_k);
5218
- GGML_ASSERT(n_embd_gqa == n_embd);
5219
5215
5220
5216
struct ggml_tensor * cur;
5221
5217
struct ggml_tensor * inpL;
@@ -5308,7 +5304,6 @@ struct llm_build_context {
5308
5304
const int64_t n_embd_head = hparams.n_embd_head_v;
5309
5305
const int64_t n_embd_gqa = hparams.n_embd_v_gqa();
5310
5306
GGML_ASSERT(n_embd_head == hparams.n_embd_head_k);
5311
- GGML_ASSERT(n_embd_gqa == n_embd);
5312
5307
5313
5308
struct ggml_tensor * cur;
5314
5309
struct ggml_tensor * inpL;
@@ -5404,7 +5399,6 @@ struct llm_build_context {
5404
5399
const int64_t n_embd_head = hparams.n_embd_head_v;
5405
5400
const int64_t n_embd_gqa = hparams.n_embd_v_gqa();
5406
5401
GGML_ASSERT(n_embd_head == hparams.n_embd_head_k);
5407
- GGML_ASSERT(n_embd_gqa == n_embd);
5408
5402
5409
5403
struct ggml_tensor * cur;
5410
5404
struct ggml_tensor * inpL;
@@ -5731,7 +5725,6 @@ struct llm_build_context {
5731
5725
const int64_t n_embd_head = hparams.n_embd_head_v;
5732
5726
const int64_t n_embd_gqa = hparams.n_embd_v_gqa();
5733
5727
GGML_ASSERT(n_embd_head == hparams.n_embd_head_k);
5734
- GGML_ASSERT(n_embd_gqa == n_embd);
5735
5728
5736
5729
struct ggml_tensor * cur;
5737
5730
struct ggml_tensor * attn_norm_output;
@@ -5955,7 +5948,6 @@ struct llm_build_context {
5955
5948
const int64_t n_embd_head = hparams.n_embd_head_v;
5956
5949
const int64_t n_embd_gqa = hparams.n_embd_v_gqa();
5957
5950
GGML_ASSERT(n_embd_head == hparams.n_embd_head_k);
5958
- GGML_ASSERT(n_embd_gqa == n_embd);
5959
5951
5960
5952
struct ggml_tensor * cur;
5961
5953
struct ggml_tensor * pos;
0 commit comments