mirror of
https://github.com/dogkeeper886/ollama37.git
synced 2025-12-10 15:57:04 +00:00
use non-causal mask for inputs with images
This commit is contained in:
@@ -181,6 +181,11 @@ func (m *TextModel) Forward(ctx ml.Context, inputs, positions, outputs ml.Tensor
|
|||||||
visionOutputs := multimodal[0].Multimodal.(ml.Tensor)
|
visionOutputs := multimodal[0].Multimodal.(ml.Tensor)
|
||||||
offset := multimodal[0].Index - 1 - visionOutputs.Dim(1)
|
offset := multimodal[0].Index - 1 - visionOutputs.Dim(1)
|
||||||
hiddenState = hiddenState.Set(ctx, visionOutputs, offset*hiddenState.Stride(1))
|
hiddenState = hiddenState.Set(ctx, visionOutputs, offset*hiddenState.Stride(1))
|
||||||
|
|
||||||
|
if causal, ok := cache.(*kvcache.WrapperCache).UnderlyingCache().(*kvcache.Causal); ok {
|
||||||
|
causal.SetCausal(ctx, false)
|
||||||
|
defer causal.SetCausal(ctx, true)
|
||||||
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
for i, layer := range m.Layers {
|
for i, layer := range m.Layers {
|
||||||
|
|||||||
Reference in New Issue
Block a user