diff --git a/model/models/qwen25vl/model_text.go b/model/models/qwen25vl/model_text.go index 18ba79e84..25c140ed4 100644 --- a/model/models/qwen25vl/model_text.go +++ b/model/models/qwen25vl/model_text.go @@ -146,7 +146,7 @@ func (l *Layer) Forward(ctx ml.Context, hiddenState, positionIDs, outputs ml.Ten func (m *TextModel) Forward(ctx ml.Context, inputs, positions, outputs ml.Tensor, batch input.Batch, cache kvcache.Cache) (ml.Tensor, error) { // Initial token embedding - hiddenState := m.TokenEmbedding.Forward(ctx, inputs) + hiddenState := m.TokenEmbedding.Forward(ctx, inputs).Duplicate(ctx) for _, image := range batch.Multimodal { visionOutputs := image.Multimodal.(ml.Tensor)