full attn block indexes should be []int32

This commit is contained in:
Bruce MacDonald 2025-05-01 11:21:56 -07:00
parent b3da8a319e
commit ca981c8a49
2 changed files with 12 additions and 13 deletions

View File

@@ -22,7 +22,7 @@ type qwen25VLModel struct {
WindowSize uint32 `json:"window_size"`
RMSNormEps float32 `json:"layer_norm_epsilon"`
RopeTheta float32 `json:"rope_theta"`
-FullAttentionBlocks []uint32 `json:"fullatt_block_indexes"`
+FullAttentionBlocks []int32 `json:"fullatt_block_indexes"`
TemporalPatchSize uint32 `json:"temporal_patch_size"`
} `json:"vision_config"`
}

View File

@@ -69,7 +69,6 @@ func (m *Model) EncodeMultimodal(ctx ml.Context, multimodalData []byte) (any, er
func (m *Model) PostTokenize(inputs []input.Input) ([]input.Input, error) {
var result []input.Input
// Get image token IDs from config
var (
imageToken int32 = 151655
visionStartToken int32 = 151652