From 1a2c413225781b08a08f67e94b3e900f1a95e1d6 Mon Sep 17 00:00:00 2001 From: Bruce MacDonald Date: Fri, 9 May 2025 14:35:10 -0700 Subject: [PATCH] qwen25vl: build the block-diagonal mask once before the encoder layer loop --- model/models/qwen25vl/model_vision.go | 3 ++- 1 file changed, 2 insertions(+), 1 deletion(-) diff --git a/model/models/qwen25vl/model_vision.go b/model/models/qwen25vl/model_vision.go index 485644963..be227e055 100644 --- a/model/models/qwen25vl/model_vision.go +++ b/model/models/qwen25vl/model_vision.go @@ -232,6 +232,7 @@ func (m *VisionModel) Forward(ctx ml.Context, pixelValues ml.Tensor, grid *Grid) cos = cos.Reshape(ctx, cos.Dim(0), 1, cos.Dim(1)) sin = sin.Reshape(ctx, sin.Dim(0), 1, sin.Dim(1)) + mask := blockDiagonalMask(ctx, hiddenStates.Dim(1), bounds, m.VisionModelOptions.numHeads) // Apply encoder layers for i, layer := range m.Layers { if slices.Contains(m.fullAttnBlocks, i) { @@ -242,7 +243,7 @@ func (m *VisionModel) Forward(ctx ml.Context, pixelValues ml.Tensor, grid *Grid) hiddenStates, cos, sin, - blockDiagonalMask(ctx, hiddenStates.Dim(1), bounds, m.VisionModelOptions.numHeads), + mask, m.VisionModelOptions, ) }