remove unnecessary scale

2026-06-25 15:46:40 +00:00 · 2026-01-16 23:36:55 +08:00 · 2026-01-16 23:36:55 +08:00 · 93686089a0
commit 93686089a0
parent 130ca90b2f
1 changed file with 2 additions and 2 deletions
--- a/ggml_extend.hpp
+++ b/ggml_extend.hpp
@@ -1228,7 +1228,7 @@ __STATIC_INLINE__ struct ggml_tensor* ggml_ext_attention_ext(struct ggml_context
                                                             bool diag_mask_inf       = false,
                                                             bool skip_reshape        = false,
                                                             bool flash_attn          = false,
-                                                             float kv_scale           = 1.0f / 128.f) {  // avoid overflow
+                                                             float kv_scale           = 1.0f) {  // avoid overflow
    int64_t L_q;
    int64_t L_k;
    int64_t C;
@@ -2184,7 +2184,7 @@ public:
           bool bias           = true,
           bool force_f32      = false,
           bool force_prec_f32 = false,
-           float scale         = 1.f / 128.f)
+           float scale         = 1.f)
        : in_features(in_features),
          out_features(out_features),
          bias(bias),