From f1257a7de4efbaa785fd97c466862ec44438bdb7 Mon Sep 17 00:00:00 2001
From: Michael Yang
Date: Thu, 1 May 2025 12:37:21 -0700
Subject: [PATCH] update vision rope theta default

---
 convert/convert_qwen25vl.go | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/convert/convert_qwen25vl.go b/convert/convert_qwen25vl.go
index c71a096aa..bc21f629b 100644
--- a/convert/convert_qwen25vl.go
+++ b/convert/convert_qwen25vl.go
@@ -48,7 +48,7 @@ func (q *qwen25VLModel) KV(t *Tokenizer) ggml.KV {
 	kv["qwen25vl.vision.spatial_patch_size"] = q.VisionModel.SpatialPatchSize
 	kv["qwen25vl.vision.window_size"] = q.VisionModel.WindowSize
 	kv["qwen25vl.vision.attention.layer_norm_epsilon"] = cmp.Or(q.VisionModel.RMSNormEps, 1e-6)
-	kv["qwen25vl.vision.rope.freq_base"] = cmp.Or(q.VisionModel.RopeTheta, 1e5)
+	kv["qwen25vl.vision.rope.freq_base"] = cmp.Or(q.VisionModel.RopeTheta, 1e4)
 	kv["qwen25vl.vision.fullatt_block_indexes"] = q.VisionModel.FullAttentionBlocks
 	kv["qwen25vl.vision.temporal_patch_size"] = q.VisionModel.TemporalPatchSize