Skip to content

Commit 3dba017

Browse files
committed
fix
1 parent 5001dee commit 3dba017

File tree

1 file changed

+1
-1
lines changed

1 file changed

+1
-1
lines changed

src/llama.cpp

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -603,7 +603,7 @@ static struct ggml_tensor * llm_build_kqv(
603 603           ggml_flash_attn_ext_set_prec(cur, GGML_PREC_F32);
604 604
605 605           if (n_embd_head_v < n_embd_head_k) {
606     -             cur = ggml_reshape_3d(ctx, cur, n_embd_head_v, n_head, n_tokens);
    606 +             cur = ggml_reshape_3d(ctx, cur, n_embd_head_v_out, n_head, n_tokens);
607 607               cur = ggml_cont(ctx, ggml_view_3d(ctx, cur, n_embd_head_v, n_head, n_tokens,
608 608                           ggml_row_size(cur->type, n_embd_head_v_out),
609 609                           ggml_row_size(cur->type, n_embd_head_v_out * n_head),

0 commit comments

Comments
 (0)