Full attention block indexes should be []int32
This commit is contained in:
parent
b3da8a319e
commit
ca981c8a49
@ -22,7 +22,7 @@ type qwen25VLModel struct {
|
|||||||
WindowSize uint32 `json:"window_size"`
|
WindowSize uint32 `json:"window_size"`
|
||||||
RMSNormEps float32 `json:"layer_norm_epsilon"`
|
RMSNormEps float32 `json:"layer_norm_epsilon"`
|
||||||
RopeTheta float32 `json:"rope_theta"`
|
RopeTheta float32 `json:"rope_theta"`
|
||||||
FullAttentionBlocks []uint32 `json:"fullatt_block_indexes"`
|
FullAttentionBlocks []int32 `json:"fullatt_block_indexes"`
|
||||||
TemporalPatchSize uint32 `json:"temporal_patch_size"`
|
TemporalPatchSize uint32 `json:"temporal_patch_size"`
|
||||||
} `json:"vision_config"`
|
} `json:"vision_config"`
|
||||||
}
|
}
|
||||||
|
@ -69,7 +69,6 @@ func (m *Model) EncodeMultimodal(ctx ml.Context, multimodalData []byte) (any, er
|
|||||||
func (m *Model) PostTokenize(inputs []input.Input) ([]input.Input, error) {
|
func (m *Model) PostTokenize(inputs []input.Input) ([]input.Input, error) {
|
||||||
var result []input.Input
|
var result []input.Input
|
||||||
|
|
||||||
// Get image token IDs from config
|
|
||||||
var (
|
var (
|
||||||
imageToken int32 = 151655
|
imageToken int32 = 151655
|
||||||
visionStartToken int32 = 151652
|
visionStartToken int32 = 151652
|
||||||
|
Loading…
x
Reference in New Issue
Block a user