Skip to content

Commit 2bc7545

Browse files
committed
kv-cache : ggml_rope_ext_inplace -> ggml_rope_ext
ggml-ci
1 parent: 903e46f · commit: 2bc7545

File tree

1 file changed

+2
-2
lines changed

1 file changed

+2
-2
lines changed

src/llama-kv-cache.cpp

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -613,14 +613,14 @@ ggml_tensor * llama_kv_cache_unified::build_rope_shift(
613613
// dequantize to f32 -> RoPE -> quantize back
614614
tmp = ggml_cast(ctx, cur, GGML_TYPE_F32);
615615

616-
tmp = ggml_rope_ext_inplace(ctx, tmp,
616+
tmp = ggml_rope_ext(ctx, tmp,
617617
shift, factors, n_rot, rope_type, n_ctx_orig, freq_base, freq_scale,
618618
yarn_ext_factor, yarn_attn_factor, yarn_beta_fast, yarn_beta_slow);
619619

620620
tmp = ggml_cpy(ctx, tmp, cur);
621621
} else {
622622
// we rotate only the first n_rot dimensions
623-
tmp = ggml_rope_ext_inplace(ctx, cur,
623+
tmp = ggml_rope_ext(ctx, cur,
624624
shift, factors, n_rot, rope_type, n_ctx_orig, freq_base, freq_scale,
625625
yarn_ext_factor, yarn_attn_factor, yarn_beta_fast, yarn_beta_slow);
626626
}

0 commit comments

Comments
 (0)