2023-07-16 17:02:22 -07:00
|
|
|
package server
|
|
|
|
|
|
|
|
import (
|
2023-08-04 18:56:40 -04:00
|
|
|
"bufio"
|
2023-07-16 17:02:22 -07:00
|
|
|
"bytes"
|
2023-07-25 17:08:51 -04:00
|
|
|
"context"
|
2023-07-16 17:02:22 -07:00
|
|
|
"crypto/sha256"
|
|
|
|
"encoding/json"
|
|
|
|
"errors"
|
|
|
|
"fmt"
|
2023-08-08 00:55:34 -04:00
|
|
|
"html/template"
|
2023-07-16 17:02:22 -07:00
|
|
|
"io"
|
|
|
|
"log"
|
|
|
|
"net/http"
|
|
|
|
"os"
|
|
|
|
"path/filepath"
|
2023-07-17 12:08:10 -07:00
|
|
|
"reflect"
|
2023-07-16 17:02:22 -07:00
|
|
|
"strconv"
|
|
|
|
"strings"
|
|
|
|
|
|
|
|
"github.com/jmorganca/ollama/api"
|
2023-08-04 18:56:40 -04:00
|
|
|
"github.com/jmorganca/ollama/llama"
|
2023-07-16 17:02:22 -07:00
|
|
|
"github.com/jmorganca/ollama/parser"
|
2023-08-04 18:56:40 -04:00
|
|
|
"github.com/jmorganca/ollama/vector"
|
2023-07-16 17:02:22 -07:00
|
|
|
)
|
|
|
|
|
2023-07-21 15:42:19 -07:00
|
|
|
// RegistryOptions carries the settings handed to registry operations such as
// PullModel and PushModel.
type RegistryOptions struct {
	// Insecure presumably relaxes transport security when talking to the
	// registry — confirm against the request helpers.
	Insecure bool

	// Username and Password are credentials for the registry.
	Username string
	Password string

	// Token is presumably a pre-obtained auth token — confirm against the
	// request helpers.
	Token string
}
|
|
|
|
|
2023-07-16 17:02:22 -07:00
|
|
|
type Model struct {
|
2023-08-04 18:56:40 -04:00
|
|
|
Name string `json:"name"`
|
|
|
|
ModelPath string
|
|
|
|
Template string
|
|
|
|
System string
|
|
|
|
Digest string
|
|
|
|
Options map[string]interface{}
|
|
|
|
Embeddings []vector.Embedding
|
2023-07-16 17:02:22 -07:00
|
|
|
}
|
|
|
|
|
2023-08-08 13:49:37 -04:00
|
|
|
func (m *Model) Prompt(request api.GenerateRequest, embedding string) (string, error) {
|
2023-08-08 00:55:34 -04:00
|
|
|
t := m.Template
|
|
|
|
if request.Template != "" {
|
|
|
|
t = request.Template
|
|
|
|
}
|
|
|
|
|
|
|
|
tmpl, err := template.New("").Parse(t)
|
2023-07-17 14:21:27 -07:00
|
|
|
if err != nil {
|
|
|
|
return "", err
|
|
|
|
}
|
|
|
|
|
|
|
|
var vars struct {
|
2023-07-19 23:22:19 -07:00
|
|
|
First bool
|
2023-07-17 14:21:27 -07:00
|
|
|
System string
|
|
|
|
Prompt string
|
2023-08-04 18:56:40 -04:00
|
|
|
Embed string
|
2023-07-19 19:43:00 -07:00
|
|
|
|
|
|
|
// deprecated: versions <= 0.0.7 used this to omit the system prompt
|
|
|
|
Context []int
|
2023-07-17 14:21:27 -07:00
|
|
|
}
|
|
|
|
|
2023-07-21 20:45:32 -07:00
|
|
|
vars.First = len(request.Context) == 0
|
2023-07-17 14:21:27 -07:00
|
|
|
vars.System = m.System
|
|
|
|
vars.Prompt = request.Prompt
|
2023-07-19 23:22:19 -07:00
|
|
|
vars.Context = request.Context
|
2023-08-08 13:49:37 -04:00
|
|
|
vars.Embed = embedding
|
2023-07-17 14:21:27 -07:00
|
|
|
|
2023-08-08 00:55:34 -04:00
|
|
|
if request.System != "" {
|
|
|
|
vars.System = request.System
|
|
|
|
}
|
|
|
|
|
2023-07-17 14:21:27 -07:00
|
|
|
var sb strings.Builder
|
|
|
|
if err := tmpl.Execute(&sb, vars); err != nil {
|
|
|
|
return "", err
|
|
|
|
}
|
|
|
|
|
|
|
|
return sb.String(), nil
|
|
|
|
}
|
|
|
|
|
2023-07-16 17:02:22 -07:00
|
|
|
type ManifestV2 struct {
|
|
|
|
SchemaVersion int `json:"schemaVersion"`
|
|
|
|
MediaType string `json:"mediaType"`
|
|
|
|
Config Layer `json:"config"`
|
|
|
|
Layers []*Layer `json:"layers"`
|
|
|
|
}
|
|
|
|
|
|
|
|
// Layer is the metadata describing a single blob referenced by a manifest.
type Layer struct {
	// MediaType identifies what the blob contains (model, template, ...).
	MediaType string `json:"mediaType"`
	// Digest is the content digest used to locate the blob.
	Digest string `json:"digest"`
	// Size is the recorded size of the blob.
	Size int `json:"size"`
}
|
|
|
|
|
2023-07-18 17:14:12 -07:00
|
|
|
type LayerReader struct {
|
2023-07-16 17:02:22 -07:00
|
|
|
Layer
|
2023-07-18 17:14:12 -07:00
|
|
|
io.Reader
|
2023-07-16 17:02:22 -07:00
|
|
|
}
|
|
|
|
|
|
|
|
type ConfigV2 struct {
|
|
|
|
Architecture string `json:"architecture"`
|
|
|
|
OS string `json:"os"`
|
|
|
|
RootFS RootFS `json:"rootfs"`
|
|
|
|
}
|
|
|
|
|
|
|
|
// RootFS is the "rootfs" section of a ConfigV2 document.
type RootFS struct {
	// Type is serialized as "type".
	Type string `json:"type"`
	// DiffIDs is serialized as "diff_ids"; presumably the layer digests of
	// the model — confirm against createConfigLayer.
	DiffIDs []string `json:"diff_ids"`
}
|
|
|
|
|
2023-07-18 09:09:45 -07:00
|
|
|
func (m *ManifestV2) GetTotalSize() int {
|
|
|
|
var total int
|
|
|
|
for _, layer := range m.Layers {
|
|
|
|
total += layer.Size
|
|
|
|
}
|
|
|
|
total += m.Config.Size
|
|
|
|
return total
|
|
|
|
}
|
|
|
|
|
2023-07-17 22:44:21 -07:00
|
|
|
func GetManifest(mp ModelPath) (*ManifestV2, error) {
|
|
|
|
fp, err := mp.GetManifestPath(false)
|
2023-07-17 11:03:55 -07:00
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
2023-07-17 14:21:27 -07:00
|
|
|
|
2023-07-21 23:02:12 -07:00
|
|
|
if _, err = os.Stat(fp); err != nil {
|
|
|
|
return nil, err
|
2023-07-16 17:02:22 -07:00
|
|
|
}
|
|
|
|
|
|
|
|
var manifest *ManifestV2
|
|
|
|
|
2023-07-17 14:21:27 -07:00
|
|
|
bts, err := os.ReadFile(fp)
|
2023-07-16 17:02:22 -07:00
|
|
|
if err != nil {
|
|
|
|
return nil, fmt.Errorf("couldn't open file '%s'", fp)
|
|
|
|
}
|
|
|
|
|
2023-07-17 14:21:27 -07:00
|
|
|
if err := json.Unmarshal(bts, &manifest); err != nil {
|
2023-07-16 17:02:22 -07:00
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
|
|
|
|
return manifest, nil
|
|
|
|
}
|
|
|
|
|
|
|
|
func GetModel(name string) (*Model, error) {
|
2023-07-17 22:44:21 -07:00
|
|
|
mp := ParseModelPath(name)
|
|
|
|
|
|
|
|
manifest, err := GetManifest(mp)
|
2023-07-16 17:02:22 -07:00
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
|
|
|
|
model := &Model{
|
2023-07-31 15:07:04 -04:00
|
|
|
Name: mp.GetFullTagname(),
|
2023-07-31 21:35:18 -04:00
|
|
|
Digest: manifest.Config.Digest,
|
2023-07-16 17:02:22 -07:00
|
|
|
}
|
|
|
|
|
|
|
|
for _, layer := range manifest.Layers {
|
2023-07-17 22:44:21 -07:00
|
|
|
filename, err := GetBlobsPath(layer.Digest)
|
2023-07-17 11:03:55 -07:00
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
|
2023-07-16 17:02:22 -07:00
|
|
|
switch layer.MediaType {
|
|
|
|
case "application/vnd.ollama.image.model":
|
|
|
|
model.ModelPath = filename
|
2023-08-04 18:56:40 -04:00
|
|
|
case "application/vnd.ollama.image.embed":
|
|
|
|
file, err := os.Open(filename)
|
|
|
|
if err != nil {
|
|
|
|
return nil, fmt.Errorf("failed to open file: %s", filename)
|
|
|
|
}
|
|
|
|
defer file.Close()
|
|
|
|
|
|
|
|
if err = json.NewDecoder(file).Decode(&model.Embeddings); err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
2023-07-17 14:21:27 -07:00
|
|
|
case "application/vnd.ollama.image.template":
|
|
|
|
bts, err := os.ReadFile(filename)
|
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
|
|
|
|
model.Template = string(bts)
|
|
|
|
case "application/vnd.ollama.image.system":
|
|
|
|
bts, err := os.ReadFile(filename)
|
2023-07-16 17:02:22 -07:00
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
2023-07-17 14:21:27 -07:00
|
|
|
|
|
|
|
model.System = string(bts)
|
2023-07-19 19:43:00 -07:00
|
|
|
case "application/vnd.ollama.image.prompt":
|
|
|
|
bts, err := os.ReadFile(filename)
|
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
|
|
|
|
model.Template = string(bts)
|
2023-07-16 17:02:22 -07:00
|
|
|
case "application/vnd.ollama.image.params":
|
2023-07-17 12:08:10 -07:00
|
|
|
params, err := os.Open(filename)
|
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
defer params.Close()
|
2023-07-16 17:02:22 -07:00
|
|
|
|
2023-07-31 15:07:04 -04:00
|
|
|
// parse model options parameters into a map so that we can see which fields have been specified explicitly
|
2023-08-01 13:36:31 -04:00
|
|
|
if err = json.NewDecoder(params).Decode(&model.Options); err != nil {
|
2023-07-31 15:07:04 -04:00
|
|
|
return nil, err
|
|
|
|
}
|
2023-07-16 17:02:22 -07:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
return model, nil
|
|
|
|
}
|
|
|
|
|
2023-08-04 18:56:40 -04:00
|
|
|
// filenameWithPath resolves f, a file reference found in the modelfile at
// path, to a usable file path.
//
// A leading "~/" is replaced with the current user's home directory. If the
// result is still not absolute it is interpreted relative to the directory
// that contains the modelfile. An error is returned only when the home
// directory cannot be determined.
func filenameWithPath(path, f string) (string, error) {
	if strings.HasPrefix(f, "~/") {
		home, err := os.UserHomeDir()
		if err != nil {
			return "", fmt.Errorf("failed to open file: %v", err)
		}
		f = filepath.Join(home, strings.TrimPrefix(f, "~/"))
	}

	if filepath.IsAbs(f) {
		return f, nil
	}

	// relative references are anchored at the modelfile's directory
	return filepath.Join(filepath.Dir(path), f), nil
}
|
|
|
|
|
2023-07-25 17:08:51 -04:00
|
|
|
func CreateModel(ctx context.Context, name string, path string, fn func(resp api.ProgressResponse)) error {
|
2023-07-19 21:55:15 -07:00
|
|
|
mf, err := os.Open(path)
|
|
|
|
if err != nil {
|
2023-07-25 14:25:13 -04:00
|
|
|
fn(api.ProgressResponse{Status: fmt.Sprintf("couldn't open modelfile '%s'", path)})
|
2023-07-19 21:55:15 -07:00
|
|
|
return fmt.Errorf("failed to open file: %w", err)
|
2023-07-16 17:02:22 -07:00
|
|
|
}
|
2023-07-19 21:55:15 -07:00
|
|
|
defer mf.Close()
|
2023-07-16 17:02:22 -07:00
|
|
|
|
2023-07-25 14:25:13 -04:00
|
|
|
fn(api.ProgressResponse{Status: "parsing modelfile"})
|
2023-07-16 17:02:22 -07:00
|
|
|
commands, err := parser.Parse(mf)
|
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
|
2023-07-18 17:14:12 -07:00
|
|
|
var layers []*LayerReader
|
2023-07-28 11:29:00 -04:00
|
|
|
params := make(map[string][]string)
|
2023-08-04 18:56:40 -04:00
|
|
|
embed := EmbeddingParams{fn: fn, opts: api.DefaultOptions()}
|
2023-07-16 17:02:22 -07:00
|
|
|
for _, c := range commands {
|
2023-07-17 14:21:27 -07:00
|
|
|
log.Printf("[%s] - %s\n", c.Name, c.Args)
|
2023-07-16 17:02:22 -07:00
|
|
|
switch c.Name {
|
|
|
|
case "model":
|
2023-07-25 14:25:13 -04:00
|
|
|
fn(api.ProgressResponse{Status: "looking for model"})
|
2023-08-04 18:56:40 -04:00
|
|
|
embed.model = c.Args
|
2023-07-17 14:21:27 -07:00
|
|
|
mf, err := GetManifest(ParseModelPath(c.Args))
|
2023-07-16 17:02:22 -07:00
|
|
|
if err != nil {
|
2023-08-04 18:56:40 -04:00
|
|
|
modelFile, err := filenameWithPath(path, c.Args)
|
|
|
|
if err != nil {
|
|
|
|
return err
|
2023-07-16 17:02:22 -07:00
|
|
|
}
|
2023-08-04 18:56:40 -04:00
|
|
|
if _, err := os.Stat(modelFile); err != nil {
|
2023-07-25 14:25:13 -04:00
|
|
|
// the model file does not exist, try pulling it
|
|
|
|
if errors.Is(err, os.ErrNotExist) {
|
|
|
|
fn(api.ProgressResponse{Status: "pulling model file"})
|
2023-07-25 17:08:51 -04:00
|
|
|
if err := PullModel(ctx, c.Args, &RegistryOptions{}, fn); err != nil {
|
2023-07-25 14:25:13 -04:00
|
|
|
return err
|
|
|
|
}
|
2023-08-08 14:38:57 -04:00
|
|
|
mf, err = GetManifest(ParseModelPath(c.Args))
|
2023-07-25 14:25:13 -04:00
|
|
|
if err != nil {
|
|
|
|
return fmt.Errorf("failed to open file after pull: %v", err)
|
|
|
|
}
|
|
|
|
} else {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
} else {
|
|
|
|
// create a model from this specified file
|
|
|
|
fn(api.ProgressResponse{Status: "creating model layer"})
|
2023-08-04 18:56:40 -04:00
|
|
|
file, err := os.Open(modelFile)
|
2023-07-25 14:25:13 -04:00
|
|
|
if err != nil {
|
|
|
|
return fmt.Errorf("failed to open file: %v", err)
|
|
|
|
}
|
|
|
|
defer file.Close()
|
|
|
|
|
|
|
|
l, err := CreateLayer(file)
|
|
|
|
if err != nil {
|
|
|
|
return fmt.Errorf("failed to create layer: %v", err)
|
|
|
|
}
|
|
|
|
l.MediaType = "application/vnd.ollama.image.model"
|
|
|
|
layers = append(layers, l)
|
2023-07-16 17:02:22 -07:00
|
|
|
}
|
2023-07-25 14:25:13 -04:00
|
|
|
}
|
|
|
|
if mf != nil {
|
2023-07-16 17:02:22 -07:00
|
|
|
log.Printf("manifest = %#v", mf)
|
|
|
|
for _, l := range mf.Layers {
|
|
|
|
newLayer, err := GetLayerWithBufferFromLayer(l)
|
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
layers = append(layers, newLayer)
|
|
|
|
}
|
|
|
|
}
|
2023-08-04 18:56:40 -04:00
|
|
|
case "embed":
|
|
|
|
embedFilePath, err := filenameWithPath(path, c.Args)
|
2023-07-31 21:34:52 -07:00
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
2023-08-04 18:56:40 -04:00
|
|
|
embed.files = append(embed.files, embedFilePath)
|
2023-08-08 16:56:48 -04:00
|
|
|
case "license":
|
|
|
|
fn(api.ProgressResponse{Status: fmt.Sprintf("creating model %s layer", c.Name)})
|
|
|
|
mediaType := fmt.Sprintf("application/vnd.ollama.image.%s", c.Name)
|
|
|
|
|
|
|
|
layer, err := CreateLayer(strings.NewReader(c.Args))
|
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
|
|
|
|
layer.MediaType = mediaType
|
|
|
|
layers = append(layers, layer)
|
|
|
|
case "template", "system", "prompt":
|
2023-07-25 14:25:13 -04:00
|
|
|
fn(api.ProgressResponse{Status: fmt.Sprintf("creating model %s layer", c.Name)})
|
2023-07-16 17:02:22 -07:00
|
|
|
// remove the prompt layer if one exists
|
2023-07-17 14:21:27 -07:00
|
|
|
mediaType := fmt.Sprintf("application/vnd.ollama.image.%s", c.Name)
|
|
|
|
layers = removeLayerFromLayers(layers, mediaType)
|
2023-07-16 17:02:22 -07:00
|
|
|
|
2023-07-17 14:21:27 -07:00
|
|
|
layer, err := CreateLayer(strings.NewReader(c.Args))
|
2023-07-16 17:02:22 -07:00
|
|
|
if err != nil {
|
2023-07-17 14:21:27 -07:00
|
|
|
return err
|
2023-07-16 17:02:22 -07:00
|
|
|
}
|
2023-07-17 14:21:27 -07:00
|
|
|
|
|
|
|
layer.MediaType = mediaType
|
|
|
|
layers = append(layers, layer)
|
2023-07-16 17:02:22 -07:00
|
|
|
default:
|
2023-07-28 11:29:00 -04:00
|
|
|
// runtime parameters, build a list of args for each parameter to allow multiple values to be specified (ex: multiple stop tokens)
|
|
|
|
params[c.Name] = append(params[c.Name], c.Args)
|
2023-07-16 17:02:22 -07:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
// Create a single layer for the parameters
|
2023-07-17 12:08:10 -07:00
|
|
|
if len(params) > 0 {
|
2023-07-25 14:25:13 -04:00
|
|
|
fn(api.ProgressResponse{Status: "creating parameter layer"})
|
2023-07-16 17:02:22 -07:00
|
|
|
layers = removeLayerFromLayers(layers, "application/vnd.ollama.image.params")
|
2023-08-04 18:56:40 -04:00
|
|
|
formattedParams, err := formatParams(params)
|
2023-07-16 17:02:22 -07:00
|
|
|
if err != nil {
|
|
|
|
return fmt.Errorf("couldn't create params json: %v", err)
|
|
|
|
}
|
2023-08-04 18:56:40 -04:00
|
|
|
|
|
|
|
bts, err := json.Marshal(formattedParams)
|
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
|
|
|
|
l, err := CreateLayer(bytes.NewReader(bts))
|
2023-07-16 17:02:22 -07:00
|
|
|
if err != nil {
|
|
|
|
return fmt.Errorf("failed to create layer: %v", err)
|
|
|
|
}
|
|
|
|
l.MediaType = "application/vnd.ollama.image.params"
|
|
|
|
layers = append(layers, l)
|
2023-08-04 18:56:40 -04:00
|
|
|
|
|
|
|
// apply these parameters to the embedding options, in case embeddings need to be generated using this model
|
|
|
|
embed.opts = api.DefaultOptions()
|
|
|
|
embed.opts.FromMap(formattedParams)
|
2023-07-16 17:02:22 -07:00
|
|
|
}
|
|
|
|
|
2023-08-04 18:56:40 -04:00
|
|
|
// generate the embedding layers
|
|
|
|
embeddingLayers, err := embeddingLayers(embed)
|
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
layers = append(layers, embeddingLayers...)
|
|
|
|
|
2023-07-16 17:02:22 -07:00
|
|
|
digests, err := getLayerDigests(layers)
|
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
|
|
|
|
var manifestLayers []*Layer
|
|
|
|
for _, l := range layers {
|
|
|
|
manifestLayers = append(manifestLayers, &l.Layer)
|
|
|
|
}
|
|
|
|
|
|
|
|
// Create a layer for the config object
|
2023-07-25 14:25:13 -04:00
|
|
|
fn(api.ProgressResponse{Status: "creating config layer"})
|
2023-07-16 17:02:22 -07:00
|
|
|
cfg, err := createConfigLayer(digests)
|
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
layers = append(layers, cfg)
|
|
|
|
|
|
|
|
err = SaveLayers(layers, fn, false)
|
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
|
|
|
|
// Create the manifest
|
2023-07-25 14:25:13 -04:00
|
|
|
fn(api.ProgressResponse{Status: "writing manifest"})
|
2023-07-16 17:02:22 -07:00
|
|
|
err = CreateManifest(name, cfg, manifestLayers)
|
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
|
2023-07-25 14:25:13 -04:00
|
|
|
fn(api.ProgressResponse{Status: "success"})
|
2023-07-16 17:02:22 -07:00
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
2023-08-04 18:56:40 -04:00
|
|
|
type EmbeddingParams struct {
|
|
|
|
model string
|
|
|
|
opts api.Options
|
|
|
|
files []string // paths to files to embed
|
|
|
|
fn func(resp api.ProgressResponse)
|
|
|
|
}
|
|
|
|
|
|
|
|
// embeddingLayers loads the associated LLM and generates the embeddings to be stored from an input file
|
|
|
|
func embeddingLayers(e EmbeddingParams) ([]*LayerReader, error) {
|
|
|
|
layers := []*LayerReader{}
|
|
|
|
if len(e.files) > 0 {
|
2023-08-08 14:38:57 -04:00
|
|
|
if _, err := os.Stat(e.model); err != nil {
|
|
|
|
if os.IsNotExist(err) {
|
|
|
|
// this is a model name rather than the file
|
|
|
|
model, err := GetModel(e.model)
|
|
|
|
if err != nil {
|
|
|
|
return nil, fmt.Errorf("failed to get model to generate embeddings: %v", err)
|
|
|
|
}
|
|
|
|
e.model = model.ModelPath
|
|
|
|
} else {
|
|
|
|
return nil, fmt.Errorf("failed to get model file to generate embeddings: %v", err)
|
|
|
|
}
|
2023-08-04 18:56:40 -04:00
|
|
|
}
|
|
|
|
|
|
|
|
e.opts.EmbeddingOnly = true
|
2023-08-08 14:38:57 -04:00
|
|
|
llm, err := llama.New(e.model, e.opts)
|
2023-08-04 18:56:40 -04:00
|
|
|
if err != nil {
|
|
|
|
return nil, fmt.Errorf("load model to generate embeddings: %v", err)
|
|
|
|
}
|
2023-08-08 16:56:48 -04:00
|
|
|
defer func() {
|
|
|
|
if llm != nil {
|
|
|
|
llm.Close()
|
|
|
|
}
|
|
|
|
}()
|
2023-08-04 18:56:40 -04:00
|
|
|
|
2023-08-08 13:49:37 -04:00
|
|
|
addedFiles := make(map[string]bool) // keep track of files that have already been added
|
|
|
|
for _, filePattern := range e.files {
|
|
|
|
matchingFiles, err := filepath.Glob(filePattern)
|
2023-08-04 18:56:40 -04:00
|
|
|
if err != nil {
|
2023-08-08 13:49:37 -04:00
|
|
|
return nil, fmt.Errorf("could not find files with pattern %s: %w", filePattern, err)
|
2023-08-04 18:56:40 -04:00
|
|
|
}
|
|
|
|
|
2023-08-08 13:49:37 -04:00
|
|
|
for _, filePath := range matchingFiles {
|
|
|
|
if addedFiles[filePath] {
|
2023-08-04 18:56:40 -04:00
|
|
|
continue
|
|
|
|
}
|
2023-08-08 13:49:37 -04:00
|
|
|
addedFiles[filePath] = true
|
|
|
|
// TODO: check file type
|
|
|
|
f, err := os.Open(filePath)
|
2023-08-04 18:56:40 -04:00
|
|
|
if err != nil {
|
2023-08-08 13:49:37 -04:00
|
|
|
return nil, fmt.Errorf("could not open embed file: %w", err)
|
2023-08-04 18:56:40 -04:00
|
|
|
}
|
2023-08-08 13:49:37 -04:00
|
|
|
scanner := bufio.NewScanner(f)
|
|
|
|
scanner.Split(bufio.ScanLines)
|
|
|
|
|
|
|
|
data := []string{}
|
|
|
|
for scanner.Scan() {
|
|
|
|
data = append(data, scanner.Text())
|
|
|
|
}
|
|
|
|
f.Close()
|
|
|
|
|
|
|
|
// the digest of the file is set here so that the client knows a new operation is in progress
|
|
|
|
fileDigest, _ := GetSHA256Digest(bytes.NewReader([]byte(filePath)))
|
|
|
|
|
|
|
|
embeddings := []vector.Embedding{}
|
|
|
|
for i, d := range data {
|
|
|
|
if strings.TrimSpace(d) == "" {
|
|
|
|
continue
|
|
|
|
}
|
|
|
|
e.fn(api.ProgressResponse{
|
|
|
|
Status: fmt.Sprintf("creating embeddings for file %s", filePath),
|
|
|
|
Digest: fileDigest,
|
|
|
|
Total: len(data) - 1,
|
|
|
|
Completed: i,
|
|
|
|
})
|
|
|
|
embed, err := llm.Embedding(d)
|
|
|
|
if err != nil {
|
2023-08-09 16:13:24 -04:00
|
|
|
log.Printf("failed to generate embedding for '%s' line %d: %v", filePath, i+1, err)
|
|
|
|
continue
|
2023-08-08 13:49:37 -04:00
|
|
|
}
|
|
|
|
embeddings = append(embeddings, vector.Embedding{Data: d, Vector: embed})
|
2023-08-04 18:56:40 -04:00
|
|
|
}
|
|
|
|
|
2023-08-08 13:49:37 -04:00
|
|
|
b, err := json.Marshal(embeddings)
|
|
|
|
if err != nil {
|
|
|
|
return nil, fmt.Errorf("failed to encode embeddings: %w", err)
|
|
|
|
}
|
|
|
|
r := bytes.NewReader(b)
|
2023-08-04 18:56:40 -04:00
|
|
|
|
2023-08-08 13:49:37 -04:00
|
|
|
digest, size := GetSHA256Digest(r)
|
|
|
|
// Reset the position of the reader after calculating the digest
|
|
|
|
if _, err := r.Seek(0, io.SeekStart); err != nil {
|
|
|
|
return nil, fmt.Errorf("could not reset embed reader: %w", err)
|
|
|
|
}
|
2023-08-04 18:56:40 -04:00
|
|
|
|
2023-08-08 13:49:37 -04:00
|
|
|
layer := &LayerReader{
|
|
|
|
Layer: Layer{
|
|
|
|
MediaType: "application/vnd.ollama.image.embed",
|
|
|
|
Digest: digest,
|
|
|
|
Size: size,
|
|
|
|
},
|
|
|
|
Reader: r,
|
|
|
|
}
|
2023-08-04 18:56:40 -04:00
|
|
|
|
2023-08-08 13:49:37 -04:00
|
|
|
layers = append(layers, layer)
|
|
|
|
}
|
2023-08-04 18:56:40 -04:00
|
|
|
}
|
|
|
|
}
|
|
|
|
return layers, nil
|
|
|
|
}
|
|
|
|
|
2023-07-18 17:14:12 -07:00
|
|
|
func removeLayerFromLayers(layers []*LayerReader, mediaType string) []*LayerReader {
|
2023-07-16 17:02:22 -07:00
|
|
|
j := 0
|
|
|
|
for _, l := range layers {
|
|
|
|
if l.MediaType != mediaType {
|
|
|
|
layers[j] = l
|
|
|
|
j++
|
|
|
|
}
|
|
|
|
}
|
|
|
|
return layers[:j]
|
|
|
|
}
|
|
|
|
|
2023-07-25 14:25:13 -04:00
|
|
|
func SaveLayers(layers []*LayerReader, fn func(resp api.ProgressResponse), force bool) error {
|
2023-07-16 17:02:22 -07:00
|
|
|
// Write each of the layers to disk
|
|
|
|
for _, layer := range layers {
|
2023-07-17 22:44:21 -07:00
|
|
|
fp, err := GetBlobsPath(layer.Digest)
|
2023-07-17 11:03:55 -07:00
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
2023-07-16 17:02:22 -07:00
|
|
|
|
|
|
|
_, err = os.Stat(fp)
|
|
|
|
if os.IsNotExist(err) || force {
|
2023-07-25 14:25:13 -04:00
|
|
|
fn(api.ProgressResponse{Status: fmt.Sprintf("writing layer %s", layer.Digest)})
|
|
|
|
|
2023-07-16 17:02:22 -07:00
|
|
|
out, err := os.Create(fp)
|
|
|
|
if err != nil {
|
|
|
|
log.Printf("couldn't create %s", fp)
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
defer out.Close()
|
|
|
|
|
2023-07-18 17:14:12 -07:00
|
|
|
if _, err = io.Copy(out, layer.Reader); err != nil {
|
2023-07-16 17:02:22 -07:00
|
|
|
return err
|
|
|
|
}
|
2023-07-18 17:14:12 -07:00
|
|
|
|
2023-07-16 17:02:22 -07:00
|
|
|
} else {
|
2023-07-25 14:25:13 -04:00
|
|
|
fn(api.ProgressResponse{Status: fmt.Sprintf("using already created layer %s", layer.Digest)})
|
2023-07-16 17:02:22 -07:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
2023-07-18 17:14:12 -07:00
|
|
|
func CreateManifest(name string, cfg *LayerReader, layers []*Layer) error {
|
2023-07-17 22:44:21 -07:00
|
|
|
mp := ParseModelPath(name)
|
|
|
|
|
2023-07-16 17:02:22 -07:00
|
|
|
manifest := ManifestV2{
|
|
|
|
SchemaVersion: 2,
|
|
|
|
MediaType: "application/vnd.docker.distribution.manifest.v2+json",
|
|
|
|
Config: Layer{
|
|
|
|
MediaType: cfg.MediaType,
|
|
|
|
Size: cfg.Size,
|
|
|
|
Digest: cfg.Digest,
|
|
|
|
},
|
|
|
|
Layers: layers,
|
|
|
|
}
|
|
|
|
|
|
|
|
manifestJSON, err := json.Marshal(manifest)
|
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
|
2023-07-17 22:44:21 -07:00
|
|
|
fp, err := mp.GetManifestPath(true)
|
2023-07-16 17:02:22 -07:00
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
2023-07-17 11:03:55 -07:00
|
|
|
return os.WriteFile(fp, manifestJSON, 0o644)
|
2023-07-16 17:02:22 -07:00
|
|
|
}
|
|
|
|
|
2023-07-18 17:14:12 -07:00
|
|
|
func GetLayerWithBufferFromLayer(layer *Layer) (*LayerReader, error) {
|
2023-07-17 22:44:21 -07:00
|
|
|
fp, err := GetBlobsPath(layer.Digest)
|
2023-07-16 17:02:22 -07:00
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
|
|
|
|
file, err := os.Open(fp)
|
|
|
|
if err != nil {
|
|
|
|
return nil, fmt.Errorf("could not open blob: %w", err)
|
|
|
|
}
|
|
|
|
defer file.Close()
|
|
|
|
|
|
|
|
newLayer, err := CreateLayer(file)
|
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
newLayer.MediaType = layer.MediaType
|
|
|
|
return newLayer, nil
|
|
|
|
}
|
|
|
|
|
2023-08-04 18:56:40 -04:00
|
|
|
// formatParams converts specified parameter options to their correct types
|
|
|
|
func formatParams(params map[string][]string) (map[string]interface{}, error) {
|
2023-08-01 13:36:31 -04:00
|
|
|
opts := api.Options{}
|
|
|
|
valueOpts := reflect.ValueOf(&opts).Elem() // names of the fields in the options struct
|
|
|
|
typeOpts := reflect.TypeOf(opts) // types of the fields in the options struct
|
2023-07-17 12:08:10 -07:00
|
|
|
|
2023-08-01 13:36:31 -04:00
|
|
|
// build map of json struct tags to their types
|
2023-07-17 12:08:10 -07:00
|
|
|
jsonOpts := make(map[string]reflect.StructField)
|
|
|
|
for _, field := range reflect.VisibleFields(typeOpts) {
|
|
|
|
jsonTag := strings.Split(field.Tag.Get("json"), ",")[0]
|
|
|
|
if jsonTag != "" {
|
|
|
|
jsonOpts[jsonTag] = field
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2023-08-01 13:36:31 -04:00
|
|
|
out := make(map[string]interface{})
|
2023-07-17 12:08:10 -07:00
|
|
|
// iterate params and set values based on json struct tags
|
2023-07-28 11:29:00 -04:00
|
|
|
for key, vals := range params {
|
2023-07-17 12:08:10 -07:00
|
|
|
if opt, ok := jsonOpts[key]; ok {
|
|
|
|
field := valueOpts.FieldByName(opt.Name)
|
|
|
|
if field.IsValid() && field.CanSet() {
|
|
|
|
switch field.Kind() {
|
|
|
|
case reflect.Float32:
|
2023-07-28 11:29:00 -04:00
|
|
|
floatVal, err := strconv.ParseFloat(vals[0], 32)
|
2023-07-17 12:08:10 -07:00
|
|
|
if err != nil {
|
2023-07-28 11:29:00 -04:00
|
|
|
return nil, fmt.Errorf("invalid float value %s", vals)
|
2023-07-17 12:08:10 -07:00
|
|
|
}
|
|
|
|
|
2023-08-01 13:36:31 -04:00
|
|
|
out[key] = floatVal
|
2023-07-17 12:08:10 -07:00
|
|
|
case reflect.Int:
|
2023-07-28 11:29:00 -04:00
|
|
|
intVal, err := strconv.ParseInt(vals[0], 10, 0)
|
2023-07-17 12:08:10 -07:00
|
|
|
if err != nil {
|
2023-07-28 11:29:00 -04:00
|
|
|
return nil, fmt.Errorf("invalid int value %s", vals)
|
2023-07-17 12:08:10 -07:00
|
|
|
}
|
|
|
|
|
2023-08-01 13:36:31 -04:00
|
|
|
out[key] = intVal
|
2023-07-17 12:08:10 -07:00
|
|
|
case reflect.Bool:
|
2023-07-28 11:29:00 -04:00
|
|
|
boolVal, err := strconv.ParseBool(vals[0])
|
2023-07-17 12:08:10 -07:00
|
|
|
if err != nil {
|
2023-07-28 11:29:00 -04:00
|
|
|
return nil, fmt.Errorf("invalid bool value %s", vals)
|
2023-07-17 12:08:10 -07:00
|
|
|
}
|
|
|
|
|
2023-08-01 13:36:31 -04:00
|
|
|
out[key] = boolVal
|
2023-07-17 12:08:10 -07:00
|
|
|
case reflect.String:
|
2023-08-01 13:36:31 -04:00
|
|
|
out[key] = vals[0]
|
2023-07-27 17:02:14 -04:00
|
|
|
case reflect.Slice:
|
2023-08-01 13:36:31 -04:00
|
|
|
// TODO: only string slices are supported right now
|
|
|
|
out[key] = vals
|
2023-07-17 12:08:10 -07:00
|
|
|
default:
|
|
|
|
return nil, fmt.Errorf("unknown type %s for %s", field.Kind(), key)
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2023-08-04 18:56:40 -04:00
|
|
|
return out, nil
|
2023-07-16 17:02:22 -07:00
|
|
|
}
|
|
|
|
|
2023-07-18 17:14:12 -07:00
|
|
|
func getLayerDigests(layers []*LayerReader) ([]string, error) {
|
2023-07-16 17:02:22 -07:00
|
|
|
var digests []string
|
|
|
|
for _, l := range layers {
|
|
|
|
if l.Digest == "" {
|
|
|
|
return nil, fmt.Errorf("layer is missing a digest")
|
|
|
|
}
|
|
|
|
digests = append(digests, l.Digest)
|
|
|
|
}
|
|
|
|
return digests, nil
|
|
|
|
}
|
|
|
|
|
|
|
|
// CreateLayer creates a Layer object from a given file
|
2023-07-18 17:14:12 -07:00
|
|
|
func CreateLayer(f io.ReadSeeker) (*LayerReader, error) {
|
|
|
|
digest, size := GetSHA256Digest(f)
|
|
|
|
f.Seek(0, 0)
|
2023-07-16 17:02:22 -07:00
|
|
|
|
2023-07-18 17:14:12 -07:00
|
|
|
layer := &LayerReader{
|
2023-07-16 17:02:22 -07:00
|
|
|
Layer: Layer{
|
|
|
|
MediaType: "application/vnd.docker.image.rootfs.diff.tar",
|
|
|
|
Digest: digest,
|
|
|
|
Size: size,
|
|
|
|
},
|
2023-07-18 17:14:12 -07:00
|
|
|
Reader: f,
|
2023-07-16 17:02:22 -07:00
|
|
|
}
|
|
|
|
|
|
|
|
return layer, nil
|
|
|
|
}
|
|
|
|
|
2023-07-24 11:27:28 -04:00
|
|
|
func CopyModel(src, dest string) error {
|
|
|
|
srcPath, err := ParseModelPath(src).GetManifestPath(false)
|
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
destPath, err := ParseModelPath(dest).GetManifestPath(true)
|
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
|
|
|
|
// copy the file
|
2023-07-28 10:38:15 -07:00
|
|
|
input, err := os.ReadFile(srcPath)
|
2023-07-24 11:27:28 -04:00
|
|
|
if err != nil {
|
|
|
|
fmt.Println("Error reading file:", err)
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
|
2023-07-28 10:38:15 -07:00
|
|
|
err = os.WriteFile(destPath, input, 0o644)
|
2023-07-24 11:27:28 -04:00
|
|
|
if err != nil {
|
|
|
|
fmt.Println("Error reading file:", err)
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
2023-07-21 23:02:12 -07:00
|
|
|
func DeleteModel(name string) error {
|
2023-07-20 16:09:23 -07:00
|
|
|
mp := ParseModelPath(name)
|
|
|
|
|
|
|
|
manifest, err := GetManifest(mp)
|
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
deleteMap := make(map[string]bool)
|
|
|
|
for _, layer := range manifest.Layers {
|
|
|
|
deleteMap[layer.Digest] = true
|
|
|
|
}
|
|
|
|
deleteMap[manifest.Config.Digest] = true
|
|
|
|
|
|
|
|
fp, err := GetManifestPath()
|
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
err = filepath.Walk(fp, func(path string, info os.FileInfo, err error) error {
|
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
if !info.IsDir() {
|
|
|
|
path := path[len(fp)+1:]
|
|
|
|
slashIndex := strings.LastIndex(path, "/")
|
|
|
|
if slashIndex == -1 {
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
tag := path[:slashIndex] + ":" + path[slashIndex+1:]
|
|
|
|
fmp := ParseModelPath(tag)
|
|
|
|
|
|
|
|
// skip the manifest we're trying to delete
|
|
|
|
if mp.GetFullTagname() == fmp.GetFullTagname() {
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
|
|
|
// save (i.e. delete from the deleteMap) any files used in other manifests
|
|
|
|
manifest, err := GetManifest(fmp)
|
|
|
|
if err != nil {
|
|
|
|
log.Printf("skipping file: %s", fp)
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
for _, layer := range manifest.Layers {
|
|
|
|
delete(deleteMap, layer.Digest)
|
|
|
|
}
|
|
|
|
delete(deleteMap, manifest.Config.Digest)
|
|
|
|
}
|
|
|
|
return nil
|
|
|
|
})
|
2023-07-31 15:26:18 -07:00
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
2023-07-20 16:09:23 -07:00
|
|
|
|
2023-07-28 12:15:23 -07:00
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
|
2023-07-20 16:09:23 -07:00
|
|
|
// only delete the files which are still in the deleteMap
|
|
|
|
for k, v := range deleteMap {
|
|
|
|
if v {
|
2023-07-21 17:30:40 -07:00
|
|
|
fp, err := GetBlobsPath(k)
|
2023-07-20 16:09:23 -07:00
|
|
|
if err != nil {
|
2023-07-21 17:30:40 -07:00
|
|
|
log.Printf("couldn't get file path for '%s': %v", k, err)
|
|
|
|
continue
|
|
|
|
}
|
|
|
|
if err := os.Remove(fp); err != nil {
|
|
|
|
log.Printf("couldn't remove file '%s': %v", fp, err)
|
2023-07-20 16:09:23 -07:00
|
|
|
continue
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
fp, err = mp.GetManifestPath(false)
|
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
err = os.Remove(fp)
|
|
|
|
if err != nil {
|
|
|
|
log.Printf("couldn't remove manifest file '%s': %v", fp, err)
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
2023-07-21 15:42:19 -07:00
|
|
|
func PushModel(name string, regOpts *RegistryOptions, fn func(api.ProgressResponse)) error {
|
2023-07-17 22:44:21 -07:00
|
|
|
mp := ParseModelPath(name)
|
|
|
|
|
2023-07-18 18:51:30 -07:00
|
|
|
fn(api.ProgressResponse{Status: "retrieving manifest"})
|
|
|
|
|
2023-07-17 22:44:21 -07:00
|
|
|
manifest, err := GetManifest(mp)
|
2023-07-16 17:02:22 -07:00
|
|
|
if err != nil {
|
2023-07-18 18:51:30 -07:00
|
|
|
fn(api.ProgressResponse{Status: "couldn't retrieve manifest"})
|
2023-07-16 17:02:22 -07:00
|
|
|
return err
|
|
|
|
}
|
|
|
|
|
|
|
|
var layers []*Layer
|
2023-07-31 21:37:40 -04:00
|
|
|
layers = append(layers, manifest.Layers...)
|
2023-07-16 17:02:22 -07:00
|
|
|
layers = append(layers, &manifest.Config)
|
|
|
|
|
|
|
|
for _, layer := range layers {
|
2023-07-21 15:42:19 -07:00
|
|
|
exists, err := checkBlobExistence(mp, layer.Digest, regOpts)
|
2023-07-16 17:02:22 -07:00
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
|
|
|
|
if exists {
|
2023-07-18 18:51:30 -07:00
|
|
|
fn(api.ProgressResponse{
|
|
|
|
Status: "using existing layer",
|
|
|
|
Digest: layer.Digest,
|
2023-07-22 17:31:26 -07:00
|
|
|
Total: layer.Size,
|
|
|
|
Completed: layer.Size,
|
2023-07-18 18:51:30 -07:00
|
|
|
})
|
2023-07-22 17:31:26 -07:00
|
|
|
log.Printf("Layer %s already exists", layer.Digest)
|
2023-07-16 17:02:22 -07:00
|
|
|
continue
|
|
|
|
}
|
|
|
|
|
2023-07-18 18:51:30 -07:00
|
|
|
fn(api.ProgressResponse{
|
2023-07-22 17:31:26 -07:00
|
|
|
Status: "starting upload",
|
|
|
|
Digest: layer.Digest,
|
|
|
|
Total: layer.Size,
|
2023-07-18 18:51:30 -07:00
|
|
|
})
|
2023-07-16 17:02:22 -07:00
|
|
|
|
2023-07-21 15:42:19 -07:00
|
|
|
location, err := startUpload(mp, regOpts)
|
2023-07-16 17:02:22 -07:00
|
|
|
if err != nil {
|
|
|
|
log.Printf("couldn't start upload: %v", err)
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
|
2023-07-22 17:31:26 -07:00
|
|
|
err = uploadBlobChunked(mp, location, layer, regOpts, fn)
|
2023-07-16 17:02:22 -07:00
|
|
|
if err != nil {
|
|
|
|
log.Printf("error uploading blob: %v", err)
|
|
|
|
return err
|
|
|
|
}
|
2023-07-18 18:51:30 -07:00
|
|
|
}
|
|
|
|
|
2023-07-22 17:31:26 -07:00
|
|
|
fn(api.ProgressResponse{Status: "pushing manifest"})
|
2023-07-21 15:42:19 -07:00
|
|
|
url := fmt.Sprintf("%s/v2/%s/manifests/%s", mp.Registry, mp.GetNamespaceRepository(), mp.Tag)
|
2023-07-16 17:02:22 -07:00
|
|
|
headers := map[string]string{
|
|
|
|
"Content-Type": "application/vnd.docker.distribution.manifest.v2+json",
|
|
|
|
}
|
|
|
|
|
|
|
|
manifestJSON, err := json.Marshal(manifest)
|
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
|
2023-07-21 15:42:19 -07:00
|
|
|
resp, err := makeRequest("PUT", url, headers, bytes.NewReader(manifestJSON), regOpts)
|
2023-07-16 17:02:22 -07:00
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
defer resp.Body.Close()
|
|
|
|
|
|
|
|
// Check for success: For a successful upload, the Docker registry will respond with a 201 Created
|
|
|
|
if resp.StatusCode != http.StatusCreated {
|
|
|
|
body, _ := io.ReadAll(resp.Body)
|
2023-07-24 15:04:21 -04:00
|
|
|
return fmt.Errorf("on push registry responded with code %d: %v", resp.StatusCode, string(body))
|
2023-07-16 17:02:22 -07:00
|
|
|
}
|
|
|
|
|
2023-07-22 17:31:26 -07:00
|
|
|
fn(api.ProgressResponse{Status: "success"})
|
2023-07-16 17:02:22 -07:00
|
|
|
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
2023-07-25 17:08:51 -04:00
|
|
|
func PullModel(ctx context.Context, name string, regOpts *RegistryOptions, fn func(api.ProgressResponse)) error {
|
2023-07-17 22:44:21 -07:00
|
|
|
mp := ParseModelPath(name)
|
2023-07-16 17:02:22 -07:00
|
|
|
|
2023-07-18 18:51:30 -07:00
|
|
|
fn(api.ProgressResponse{Status: "pulling manifest"})
|
2023-07-16 17:02:22 -07:00
|
|
|
|
2023-07-21 15:42:19 -07:00
|
|
|
manifest, err := pullModelManifest(mp, regOpts)
|
2023-07-16 17:02:22 -07:00
|
|
|
if err != nil {
|
2023-07-24 17:48:17 -04:00
|
|
|
return fmt.Errorf("pull model manifest: %s", err)
|
2023-07-16 17:02:22 -07:00
|
|
|
}
|
|
|
|
|
|
|
|
var layers []*Layer
|
2023-07-20 20:18:00 +02:00
|
|
|
layers = append(layers, manifest.Layers...)
|
2023-07-16 17:02:22 -07:00
|
|
|
layers = append(layers, &manifest.Config)
|
|
|
|
|
|
|
|
for _, layer := range layers {
|
2023-07-25 17:08:51 -04:00
|
|
|
if err := downloadBlob(ctx, mp, layer.Digest, regOpts, fn); err != nil {
|
2023-07-16 17:02:22 -07:00
|
|
|
return err
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2023-07-20 11:44:05 -07:00
|
|
|
fn(api.ProgressResponse{Status: "verifying sha256 digest"})
|
|
|
|
for _, layer := range layers {
|
|
|
|
if err := verifyBlob(layer.Digest); err != nil {
|
2023-07-24 14:53:01 -04:00
|
|
|
if errors.Is(err, errDigestMismatch) {
|
|
|
|
// something went wrong, delete the blob
|
|
|
|
fp, err := GetBlobsPath(layer.Digest)
|
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
if err := os.Remove(fp); err != nil {
|
|
|
|
// log this, but return the original error
|
|
|
|
log.Printf("couldn't remove file with digest mismatch '%s': %v", fp, err)
|
|
|
|
}
|
|
|
|
}
|
2023-07-20 11:44:05 -07:00
|
|
|
return err
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2023-07-18 18:51:30 -07:00
|
|
|
fn(api.ProgressResponse{Status: "writing manifest"})
|
2023-07-16 17:02:22 -07:00
|
|
|
|
2023-07-17 11:03:55 -07:00
|
|
|
manifestJSON, err := json.Marshal(manifest)
|
2023-07-16 17:02:22 -07:00
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
|
2023-07-17 22:44:21 -07:00
|
|
|
fp, err := mp.GetManifestPath(true)
|
2023-07-16 17:02:22 -07:00
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
|
2023-07-20 20:18:00 +02:00
|
|
|
err = os.WriteFile(fp, manifestJSON, 0o644)
|
2023-07-16 17:02:22 -07:00
|
|
|
if err != nil {
|
|
|
|
log.Printf("couldn't write to %s", fp)
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
|
2023-07-18 18:51:30 -07:00
|
|
|
fn(api.ProgressResponse{Status: "success"})
|
2023-07-16 17:02:22 -07:00
|
|
|
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
2023-07-21 15:42:19 -07:00
|
|
|
func pullModelManifest(mp ModelPath, regOpts *RegistryOptions) (*ManifestV2, error) {
|
|
|
|
url := fmt.Sprintf("%s/v2/%s/manifests/%s", mp.Registry, mp.GetNamespaceRepository(), mp.Tag)
|
2023-07-16 17:02:22 -07:00
|
|
|
headers := map[string]string{
|
|
|
|
"Accept": "application/vnd.docker.distribution.manifest.v2+json",
|
|
|
|
}
|
|
|
|
|
2023-07-21 15:42:19 -07:00
|
|
|
resp, err := makeRequest("GET", url, headers, nil, regOpts)
|
2023-07-16 17:02:22 -07:00
|
|
|
if err != nil {
|
|
|
|
log.Printf("couldn't get manifest: %v", err)
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
defer resp.Body.Close()
|
|
|
|
|
|
|
|
// Check for success: For a successful upload, the Docker registry will respond with a 201 Created
|
|
|
|
if resp.StatusCode != http.StatusOK {
|
2023-07-24 17:48:17 -04:00
|
|
|
if resp.StatusCode == http.StatusNotFound {
|
2023-07-25 10:30:14 -04:00
|
|
|
return nil, fmt.Errorf("model not found")
|
2023-07-24 17:48:17 -04:00
|
|
|
}
|
2023-07-16 17:02:22 -07:00
|
|
|
body, _ := io.ReadAll(resp.Body)
|
2023-07-24 15:04:21 -04:00
|
|
|
return nil, fmt.Errorf("on pull registry responded with code %d: %s", resp.StatusCode, body)
|
2023-07-16 17:02:22 -07:00
|
|
|
}
|
|
|
|
|
|
|
|
var m *ManifestV2
|
|
|
|
if err := json.NewDecoder(resp.Body).Decode(&m); err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
|
|
|
|
return m, err
|
|
|
|
}
|
|
|
|
|
2023-07-18 17:14:12 -07:00
|
|
|
func createConfigLayer(layers []string) (*LayerReader, error) {
|
2023-07-16 17:02:22 -07:00
|
|
|
// TODO change architecture and OS
|
|
|
|
config := ConfigV2{
|
|
|
|
Architecture: "arm64",
|
|
|
|
OS: "linux",
|
|
|
|
RootFS: RootFS{
|
|
|
|
Type: "layers",
|
|
|
|
DiffIDs: layers,
|
|
|
|
},
|
|
|
|
}
|
|
|
|
|
|
|
|
configJSON, err := json.Marshal(config)
|
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
|
2023-07-19 00:47:55 -07:00
|
|
|
digest, size := GetSHA256Digest(bytes.NewBuffer(configJSON))
|
2023-07-16 17:02:22 -07:00
|
|
|
|
2023-07-18 17:14:12 -07:00
|
|
|
layer := &LayerReader{
|
2023-07-16 17:02:22 -07:00
|
|
|
Layer: Layer{
|
|
|
|
MediaType: "application/vnd.docker.container.image.v1+json",
|
|
|
|
Digest: digest,
|
|
|
|
Size: size,
|
|
|
|
},
|
2023-07-19 00:47:55 -07:00
|
|
|
Reader: bytes.NewBuffer(configJSON),
|
2023-07-16 17:02:22 -07:00
|
|
|
}
|
|
|
|
return layer, nil
|
|
|
|
}
|
|
|
|
|
|
|
|
// GetSHA256Digest reads r to the end and returns its SHA256 digest formatted
// as "sha256:<hex>" together with the number of bytes read. A read error
// terminates the process via log.Fatal.
func GetSHA256Digest(r io.Reader) (string, int) {
	hasher := sha256.New()

	written, err := io.Copy(hasher, r)
	if err != nil {
		log.Fatal(err)
	}

	sum := hasher.Sum(nil)
	return fmt.Sprintf("sha256:%x", sum), int(written)
}
|
|
|
|
|
2023-07-21 15:42:19 -07:00
|
|
|
func startUpload(mp ModelPath, regOpts *RegistryOptions) (string, error) {
|
|
|
|
url := fmt.Sprintf("%s/v2/%s/blobs/uploads/", mp.Registry, mp.GetNamespaceRepository())
|
2023-07-16 17:02:22 -07:00
|
|
|
|
2023-07-21 15:42:19 -07:00
|
|
|
resp, err := makeRequest("POST", url, nil, nil, regOpts)
|
2023-07-16 17:02:22 -07:00
|
|
|
if err != nil {
|
|
|
|
log.Printf("couldn't start upload: %v", err)
|
|
|
|
return "", err
|
|
|
|
}
|
|
|
|
defer resp.Body.Close()
|
|
|
|
|
|
|
|
// Check for success
|
|
|
|
if resp.StatusCode != http.StatusAccepted {
|
|
|
|
body, _ := io.ReadAll(resp.Body)
|
2023-07-24 15:04:21 -04:00
|
|
|
return "", fmt.Errorf("on upload registry responded with code %d: %s", resp.StatusCode, body)
|
2023-07-16 17:02:22 -07:00
|
|
|
}
|
|
|
|
|
|
|
|
// Extract UUID location from header
|
|
|
|
location := resp.Header.Get("Location")
|
|
|
|
if location == "" {
|
|
|
|
return "", fmt.Errorf("location header is missing in response")
|
|
|
|
}
|
|
|
|
|
|
|
|
return location, nil
|
|
|
|
}
|
|
|
|
|
|
|
|
// Function to check if a blob already exists in the Docker registry
|
2023-07-21 15:42:19 -07:00
|
|
|
func checkBlobExistence(mp ModelPath, digest string, regOpts *RegistryOptions) (bool, error) {
|
|
|
|
url := fmt.Sprintf("%s/v2/%s/blobs/%s", mp.Registry, mp.GetNamespaceRepository(), digest)
|
2023-07-16 17:02:22 -07:00
|
|
|
|
2023-07-21 15:42:19 -07:00
|
|
|
resp, err := makeRequest("HEAD", url, nil, nil, regOpts)
|
2023-07-16 17:02:22 -07:00
|
|
|
if err != nil {
|
|
|
|
log.Printf("couldn't check for blob: %v", err)
|
|
|
|
return false, err
|
|
|
|
}
|
|
|
|
defer resp.Body.Close()
|
|
|
|
|
|
|
|
// Check for success: If the blob exists, the Docker registry will respond with a 200 OK
|
|
|
|
return resp.StatusCode == http.StatusOK, nil
|
|
|
|
}
|
|
|
|
|
2023-07-31 15:02:07 -07:00
|
|
|
func uploadBlobChunked(mp ModelPath, url string, layer *Layer, regOpts *RegistryOptions, fn func(api.ProgressResponse)) error {
|
2023-07-16 17:02:22 -07:00
|
|
|
// TODO allow resumability
|
|
|
|
// TODO allow canceling uploads via DELETE
|
|
|
|
// TODO allow cross repo blob mount
|
|
|
|
|
2023-07-17 22:44:21 -07:00
|
|
|
fp, err := GetBlobsPath(layer.Digest)
|
2023-07-17 11:03:55 -07:00
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
|
2023-07-16 17:02:22 -07:00
|
|
|
f, err := os.Open(fp)
|
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
|
2023-08-01 12:15:22 -07:00
|
|
|
totalUploaded := 0
|
|
|
|
|
|
|
|
r, w := io.Pipe()
|
|
|
|
defer r.Close()
|
|
|
|
|
|
|
|
go func() {
|
|
|
|
defer w.Close()
|
|
|
|
for {
|
|
|
|
n, err := io.CopyN(w, f, 1024*1024)
|
|
|
|
if err != nil && !errors.Is(err, io.EOF) {
|
|
|
|
fn(api.ProgressResponse{
|
|
|
|
Status: fmt.Sprintf("error copying pipe: %v", err),
|
|
|
|
Digest: layer.Digest,
|
|
|
|
Total: layer.Size,
|
|
|
|
Completed: totalUploaded,
|
|
|
|
})
|
|
|
|
return
|
|
|
|
}
|
2023-07-22 17:31:26 -07:00
|
|
|
|
2023-08-01 12:15:22 -07:00
|
|
|
totalUploaded += int(n)
|
2023-07-22 17:31:26 -07:00
|
|
|
|
|
|
|
fn(api.ProgressResponse{
|
2023-08-01 12:15:22 -07:00
|
|
|
Status: fmt.Sprintf("uploading %s", layer.Digest),
|
2023-07-22 17:31:26 -07:00
|
|
|
Digest: layer.Digest,
|
2023-08-01 12:15:22 -07:00
|
|
|
Total: layer.Size,
|
|
|
|
Completed: totalUploaded,
|
2023-07-22 17:31:26 -07:00
|
|
|
})
|
2023-08-01 12:15:22 -07:00
|
|
|
|
|
|
|
if totalUploaded >= layer.Size {
|
|
|
|
return
|
|
|
|
}
|
2023-07-22 17:31:26 -07:00
|
|
|
}
|
2023-08-01 12:15:22 -07:00
|
|
|
}()
|
2023-07-22 17:31:26 -07:00
|
|
|
|
2023-08-01 12:15:22 -07:00
|
|
|
url = fmt.Sprintf("%s&digest=%s", url, layer.Digest)
|
2023-07-22 17:31:26 -07:00
|
|
|
|
2023-08-01 12:15:22 -07:00
|
|
|
headers := make(map[string]string)
|
|
|
|
headers["Content-Type"] = "application/octet-stream"
|
|
|
|
headers["Content-Range"] = fmt.Sprintf("0-%d", layer.Size-1)
|
|
|
|
headers["Content-Length"] = strconv.Itoa(int(layer.Size))
|
2023-07-22 17:31:26 -07:00
|
|
|
|
2023-08-01 12:15:22 -07:00
|
|
|
// finish the upload
|
|
|
|
resp, err := makeRequest("PUT", url, headers, r, regOpts)
|
|
|
|
if err != nil {
|
|
|
|
log.Printf("couldn't finish upload: %v", err)
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
defer resp.Body.Close()
|
|
|
|
|
|
|
|
if resp.StatusCode != http.StatusCreated {
|
|
|
|
body, _ := io.ReadAll(resp.Body)
|
|
|
|
return fmt.Errorf("on finish upload registry responded with code %d: %v", resp.StatusCode, string(body))
|
2023-07-22 17:31:26 -07:00
|
|
|
}
|
2023-07-16 17:02:22 -07:00
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
2023-07-21 15:42:19 -07:00
|
|
|
func makeRequest(method, url string, headers map[string]string, body io.Reader, regOpts *RegistryOptions) (*http.Response, error) {
|
|
|
|
if !strings.HasPrefix(url, "http") {
|
|
|
|
if regOpts.Insecure {
|
|
|
|
url = "http://" + url
|
|
|
|
} else {
|
|
|
|
url = "https://" + url
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2023-08-10 11:34:25 -07:00
|
|
|
// make a copy of the body in case we need to try the call to makeRequest again
|
|
|
|
var buf bytes.Buffer
|
|
|
|
if body != nil {
|
|
|
|
_, err := io.Copy(&buf, body)
|
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
bodyCopy := bytes.NewReader(buf.Bytes())
|
|
|
|
|
|
|
|
req, err := http.NewRequest(method, url, bodyCopy)
|
2023-07-16 17:02:22 -07:00
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
|
2023-08-10 11:34:25 -07:00
|
|
|
if regOpts.Token != "" {
|
|
|
|
req.Header.Set("Authorization", "Bearer "+regOpts.Token)
|
|
|
|
} else if regOpts.Username != "" && regOpts.Password != "" {
|
|
|
|
req.SetBasicAuth(regOpts.Username, regOpts.Password)
|
2023-07-16 17:02:22 -07:00
|
|
|
}
|
|
|
|
|
2023-08-10 11:34:25 -07:00
|
|
|
for k, v := range headers {
|
|
|
|
req.Header.Set(k, v)
|
2023-07-16 17:02:22 -07:00
|
|
|
}
|
|
|
|
|
|
|
|
client := &http.Client{
|
|
|
|
CheckRedirect: func(req *http.Request, via []*http.Request) error {
|
|
|
|
if len(via) >= 10 {
|
|
|
|
return fmt.Errorf("too many redirects")
|
|
|
|
}
|
|
|
|
log.Printf("redirected to: %s\n", req.URL)
|
|
|
|
return nil
|
|
|
|
},
|
|
|
|
}
|
|
|
|
resp, err := client.Do(req)
|
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
|
2023-08-10 11:34:25 -07:00
|
|
|
// if the request is unauthenticated, try to authenticate and make the request again
|
|
|
|
if resp.StatusCode == http.StatusUnauthorized {
|
|
|
|
auth := resp.Header.Get("Www-Authenticate")
|
|
|
|
authRedir := ParseAuthRedirectString(string(auth))
|
|
|
|
token, err := getAuthToken(authRedir, regOpts)
|
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
regOpts.Token = token
|
|
|
|
bodyCopy = bytes.NewReader(buf.Bytes())
|
|
|
|
return makeRequest(method, url, headers, bodyCopy, regOpts)
|
|
|
|
}
|
|
|
|
|
2023-07-16 17:02:22 -07:00
|
|
|
return resp, nil
|
|
|
|
}
|
2023-07-20 11:44:05 -07:00
|
|
|
|
2023-08-10 11:34:25 -07:00
|
|
|
// getValue extracts the quoted value of key from a header of the form
// `key1="value1",key2="value2"`.
//
// The value starts after `key="` and ends at the first double quote that is
// either the last character of the header or directly followed by a comma, so
// quotes embedded in a value are kept. If no such quote exists the rest of the
// header is returned. An empty string is returned when key is not present or
// when the header ends right after `key=`.
func getValue(header, key string) string {
	startIdx := strings.Index(header, key+"=")
	if startIdx == -1 {
		return ""
	}

	// Skip the key, the '=' and the opening quote.
	startIdx += len(key) + 2
	if startIdx >= len(header) {
		// Nothing follows the opening quote (or the quote itself is missing);
		// slicing here would run past the end of the header.
		return ""
	}

	endIdx := startIdx
	for ; endIdx < len(header); endIdx++ {
		if header[endIdx] != '"' {
			continue
		}
		// A quote closes the value only at the end of the header or when the
		// next character is a comma.
		if endIdx+1 == len(header) || header[endIdx+1] == ',' {
			break
		}
	}

	return header[startIdx:endIdx]
}
|
|
|
|
|
|
|
|
func ParseAuthRedirectString(authStr string) AuthRedirect {
|
|
|
|
authStr = strings.TrimPrefix(authStr, "Bearer ")
|
|
|
|
|
|
|
|
return AuthRedirect{
|
|
|
|
Realm: getValue(authStr, "realm"),
|
|
|
|
Service: getValue(authStr, "service"),
|
|
|
|
Scope: getValue(authStr, "scope"),
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2023-07-24 14:53:01 -04:00
|
|
|
// errDigestMismatch is the sentinel wrapped by verifyBlob when the SHA256
// digest of a blob on disk differs from the expected digest. PullModel checks
// for it with errors.Is to decide whether the blob file should be removed.
var errDigestMismatch = fmt.Errorf("digest mismatch, file must be downloaded again")
|
|
|
|
|
2023-07-20 11:44:05 -07:00
|
|
|
func verifyBlob(digest string) error {
|
|
|
|
fp, err := GetBlobsPath(digest)
|
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
|
|
|
|
f, err := os.Open(fp)
|
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
defer f.Close()
|
|
|
|
|
|
|
|
fileDigest, _ := GetSHA256Digest(f)
|
|
|
|
if digest != fileDigest {
|
2023-07-24 14:53:01 -04:00
|
|
|
return fmt.Errorf("%w: want %s, got %s", errDigestMismatch, digest, fileDigest)
|
2023-07-20 11:44:05 -07:00
|
|
|
}
|
|
|
|
|
|
|
|
return nil
|
|
|
|
}
|