Switched to NTK-aware scaling

2025-09-11 01:24:36 +00:00 · 2023-07-02 17:25:08 +08:00 · 2023-07-02 17:25:08 +08:00 · e17c8497cf
commit e17c8497cf
parent e19483ca0f
4 changed files with 26 additions and 25 deletions
--- a/ggml-cuda.cu
+++ b/ggml-cuda.cu
@@ -2223,10 +2223,10 @@ inline void ggml_cuda_op_rope(
    const int n_ctx  = ((int32_t *) src1->data)[3];
    GGML_ASSERT(mode == 0);

-    const float theta_scale = powf(10000.0, -2.0f/n_dims);
+    const float theta_scale = get_theta_scale(n_dims,n_past,n_ctx);
    const float p0 = ((mode & 1) == 0 ? n_past + i02 : i02);

-    const float p = n_ctx <= GGML_TRAINING_CTX ? p0 : p0 * GGML_TRAINING_CTX / n_ctx;
+    const float p = p0;

    // compute
    rope_f32_cuda(src0_ddf_i, dst_ddf_i, ne00, i01_diff, p, theta_scale, cudaStream_main);