Skip to content

Commit 3f96065

Browse files
committed
fix
1 parent 3dba017 commit 3f96065

File tree

1 file changed

+1
-0
lines changed

1 file changed

+1
-0
lines changed

src/llama.cpp

Lines changed: 1 addition & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -595,6 +595,7 @@ static struct ggml_tensor * llm_build_kqv(
595 595   padded_v = ggml_pad(ctx, v, 0, k->ne[0] - v->ne[1], 0, 0);
596 596   cb(padded_v, "padded_v", il);
597 597   n_embd_head_v_out = n_embd_head_k;
    598 + padded_v = ggml_cont(ctx, padded_v);
598 599   }
599 600
600 601   cur = ggml_flash_attn_ext(ctx, q, k, padded_v, kq_mask, kq_scale, hparams.f_max_alibi_bias,

0 commit comments

Comments
 (0)