remove support for multiple ggufs in a single file (#10722)

* remove support for multiple ggufs in a single file

This was an attempt to make it easier to import multimodal models into
ollama. It was rarely used and error-prone, so remove it.

* fix: create fused model from blob
This commit is contained in:
Michael Yang 2025-05-21 13:55:31 -07:00 committed by GitHub
parent 7359b02707
commit 61aeaf7e81
No known key found for this signature in database
GPG Key ID: B5690EEEBB952194

View File

@@ -501,48 +501,27 @@ func ggufLayers(digest string, fn func(resp api.ProgressResponse)) ([]*layerGGML
return nil, errOnlyGGUFSupported return nil, errOnlyGGUFSupported
} }
stat, err := blob.Stat() f, err := ggml.Decode(blob, -1)
if err != nil { if err != nil {
return nil, err return nil, err
} }
var offset int64 mediatype := "application/vnd.ollama.image.model"
for offset < stat.Size() { if f.KV().Kind() == "adapter" {
f, err := ggml.Decode(blob, -1) mediatype = "application/vnd.ollama.image.adapter"
if errors.Is(err, io.EOF) { } else if (f.KV().Uint("block_count") == 0 && f.KV().Uint("vision.block_count") > 0) || f.KV().Kind() == "projector" {
break // if a model has vision.block_count but not block_count, it is a standalone vision model
} else if err != nil { mediatype = "application/vnd.ollama.image.projector"
return nil, err
}
mediatype := "application/vnd.ollama.image.model"
if f.KV().Kind() == "adapter" {
mediatype = "application/vnd.ollama.image.adapter"
} else if _, ok := f.KV()[fmt.Sprintf("%s.vision.block_count", f.KV().Architecture())]; ok || f.KV().Kind() == "projector" {
mediatype = "application/vnd.ollama.image.projector"
}
var layer Layer
if digest != "" && f.Length == stat.Size() && offset == 0 {
layer, err = NewLayerFromLayer(digest, mediatype, blob.Name())
if err != nil {
slog.Debug("could not create new layer from layer", "error", err)
return nil, err
}
}
// Fallback to creating layer from file copy (either NewLayerFromLayer failed, or digest empty/n != stat.Size())
if layer.Digest == "" {
layer, err = NewLayer(io.NewSectionReader(blob, offset, f.Length), mediatype)
if err != nil {
return nil, err
}
}
layers = append(layers, &layerGGML{layer, f})
offset = f.Length
} }
layer, err := NewLayerFromLayer(digest, mediatype, blob.Name())
if err != nil {
slog.Debug("could not create new layer from layer", "error", err)
return nil, err
}
layers = append(layers, &layerGGML{layer, f})
return detectChatTemplate(layers) return detectChatTemplate(layers)
} }