Skip to content

Commit 06a0719

Browse files
committed
Apply rebase edits and remove ggml_cont call that is now unnecessary
1 parent a959a1f commit 06a0719

File tree

2 files changed

+11
-17
lines changed

2 files changed

+11
-17
lines changed

src/llama-model.cpp

Lines changed: 4 additions & 6 deletions
Original file line number | Diff line number | Diff line change
@@ -18620,7 +18620,7 @@ struct llm_build_cogvlm : public llm_graph_context {
18620 18620

18621 18621
ggml_tensor * inp_pos = build_inp_pos();
18622 18622

18623-
auto * inp_attn = build_attn_inp_kv_unified();
18623+
auto * inp_attn = build_attn_inp_kv();
18624 18624

18625 18625
// check ubatch to see if we have input tokens (text)
18626 18626
// or an input embedding vector (image)
@@ -18662,15 +18662,13 @@ struct llm_build_cogvlm : public llm_graph_context {
18662 18662
qkv->nb[1], 0);
18663 18663
ggml_tensor * Kcur = ggml_view_3d(ctx0, qkv, n_embd_head, n_head_kv, n_tokens, n_embd_head * sizeof(float),
18664 18664
qkv->nb[1], n_embd * ggml_element_size(qkv));
18665-
ggml_tensor * Vcur = ggml_cont(ctx0, ggml_view_2d(ctx0, qkv, n_embd, n_tokens,
18666-
qkv->nb[1], 2 * n_embd * ggml_element_size(qkv)));
18667-
18668-
Vcur = ggml_reshape_3d(ctx0, Vcur, n_embd_head, n_head_kv, n_tokens);
18665+
ggml_tensor * Vcur = ggml_view_3d(ctx0, qkv, n_embd_head, n_head_kv, n_tokens, n_embd_head * sizeof(float),
18666+
qkv->nb[1], 2 * n_embd * ggml_element_size(qkv));
18669 18667

18670 18668
Qcur = ggml_rope(ctx0, Qcur, inp_pos, n_embd_head, rope_type);
18671 18669
Kcur = ggml_rope(ctx0, Kcur, inp_pos, n_embd_head, rope_type);
18672 18670

18673-
cur = build_attn(inp_attn, wo, nullptr, Qcur, Kcur, Vcur, nullptr, nullptr, kq_scale, il);
18671+
cur = build_attn(inp_attn, wo, nullptr, Qcur, Kcur, Vcur, nullptr, nullptr, nullptr, kq_scale, il);
18674 18672
cb(cur, "attn_out", il);
18675 18673
}
18676 18674

tools/mtmd/clip.cpp

Lines changed: 7 additions & 11 deletions
Original file line number | Diff line number | Diff line change
@@ -1645,16 +1645,12 @@ struct clip_graph {
1645 1645

1646 1646
cur = ggml_add(ctx0, cur, layer.qkv_b);
1647 1647

1648-
ggml_tensor * Qcur = ggml_cont(ctx0, ggml_view_2d(ctx0, cur, n_embd, n_pos,
1649-
cur->nb[1], 0));
1650-
ggml_tensor * Kcur = ggml_cont(ctx0, ggml_view_2d(ctx0, cur, n_embd, n_pos,
1651-
cur->nb[1], n_embd * sizeof(float)));
1652-
ggml_tensor * Vcur = ggml_cont(ctx0, ggml_view_2d(ctx0, cur, n_embd, n_pos,
1653-
cur->nb[1], 2 * n_embd * sizeof(float)));
1654-
1655-
Qcur = ggml_reshape_3d(ctx0, Qcur, d_head, n_head, n_pos);
1656-
Kcur = ggml_reshape_3d(ctx0, Kcur, d_head, n_head, n_pos);
1657-
Vcur = ggml_reshape_3d(ctx0, Vcur, d_head, n_head, n_pos);
1648+
ggml_tensor * Qcur = ggml_view_3d(ctx0, cur, d_head, n_head, n_pos, d_head*sizeof(float),
1649+
cur->nb[1], 0);
1650+
ggml_tensor * Kcur = ggml_view_3d(ctx0, cur, d_head, n_head, n_pos, d_head*sizeof(float),
1651+
cur->nb[1], n_embd * sizeof(float));
1652+
ggml_tensor * Vcur = ggml_view_3d(ctx0, cur, d_head, n_head, n_pos, d_head*sizeof(float),
1653+
cur->nb[1], 2 * n_embd * sizeof(float));
1658 1654

1659 1655
cb(Qcur, "Qcur", il);
1660 1656
cb(Kcur, "Kcur", il);
@@ -3968,7 +3964,7 @@ int clip_n_output_tokens(const struct clip_ctx * ctx, struct clip_image_f32 * im
3968 3964
} break;
3969 3965
case PROJECTOR_TYPE_COGVLM:
3970 3966
{
3971-
n_patches_sq += 2;
3967+
n_patches += 2;
3972 3968
} break;
3973 3969
default:
3974 3970
GGML_ABORT("unsupported projector type");

0 commit comments

Comments
 (0)