// Source snapshot a6d03dd510: "fix pull 0 bytes on completed layer" (344 lines, 6.8 KiB, Go).
package cmd
|
|
|
|
import (
|
|
"bufio"
|
|
"context"
|
|
"errors"
|
|
"fmt"
|
|
"log"
|
|
"net"
|
|
"net/http"
|
|
"os"
|
|
"path/filepath"
|
|
"strings"
|
|
"time"
|
|
|
|
"github.com/dustin/go-humanize"
|
|
"github.com/olekukonko/tablewriter"
|
|
"github.com/schollz/progressbar/v3"
|
|
"github.com/spf13/cobra"
|
|
"golang.org/x/term"
|
|
|
|
"github.com/jmorganca/ollama/api"
|
|
"github.com/jmorganca/ollama/format"
|
|
"github.com/jmorganca/ollama/server"
|
|
)
|
|
|
|
func create(cmd *cobra.Command, args []string) error {
|
|
filename, _ := cmd.Flags().GetString("file")
|
|
filename, err := filepath.Abs(filename)
|
|
if err != nil {
|
|
return err
|
|
}
|
|
|
|
client := api.NewClient()
|
|
|
|
var spinner *Spinner
|
|
|
|
request := api.CreateRequest{Name: args[0], Path: filename}
|
|
fn := func(resp api.CreateProgress) error {
|
|
if spinner != nil {
|
|
spinner.Stop()
|
|
}
|
|
|
|
spinner = NewSpinner(resp.Status)
|
|
go spinner.Spin(100 * time.Millisecond)
|
|
|
|
return nil
|
|
}
|
|
|
|
if err := client.Create(context.Background(), &request, fn); err != nil {
|
|
return err
|
|
}
|
|
|
|
if spinner != nil {
|
|
spinner.Stop()
|
|
}
|
|
|
|
return nil
|
|
}
|
|
|
|
func RunRun(cmd *cobra.Command, args []string) error {
|
|
mp := server.ParseModelPath(args[0])
|
|
fp, err := mp.GetManifestPath(false)
|
|
if err != nil {
|
|
return err
|
|
}
|
|
|
|
_, err = os.Stat(fp)
|
|
switch {
|
|
case errors.Is(err, os.ErrNotExist):
|
|
if err := pull(args[0]); err != nil {
|
|
var apiStatusError api.StatusError
|
|
if !errors.As(err, &apiStatusError) {
|
|
return err
|
|
}
|
|
|
|
if apiStatusError.StatusCode != http.StatusBadGateway {
|
|
return err
|
|
}
|
|
}
|
|
case err != nil:
|
|
return err
|
|
}
|
|
|
|
return RunGenerate(cmd, args)
|
|
}
|
|
|
|
func push(cmd *cobra.Command, args []string) error {
|
|
client := api.NewClient()
|
|
|
|
request := api.PushRequest{Name: args[0]}
|
|
fn := func(resp api.ProgressResponse) error {
|
|
fmt.Println(resp.Status)
|
|
return nil
|
|
}
|
|
|
|
if err := client.Push(context.Background(), &request, fn); err != nil {
|
|
return err
|
|
}
|
|
return nil
|
|
}
|
|
|
|
func list(cmd *cobra.Command, args []string) error {
|
|
client := api.NewClient()
|
|
|
|
models, err := client.List(context.Background())
|
|
if err != nil {
|
|
return err
|
|
}
|
|
|
|
var data [][]string
|
|
|
|
for _, m := range models.Models {
|
|
data = append(data, []string{m.Name, humanize.Bytes(uint64(m.Size)), format.HumanTime(m.ModifiedAt, "Never")})
|
|
}
|
|
|
|
table := tablewriter.NewWriter(os.Stdout)
|
|
table.SetHeader([]string{"NAME", "SIZE", "MODIFIED"})
|
|
table.SetHeaderAlignment(tablewriter.ALIGN_LEFT)
|
|
table.SetAlignment(tablewriter.ALIGN_LEFT)
|
|
table.SetHeaderLine(false)
|
|
table.SetBorder(false)
|
|
table.SetNoWhiteSpace(true)
|
|
table.SetTablePadding("\t")
|
|
table.AppendBulk(data)
|
|
table.Render()
|
|
|
|
return nil
|
|
}
|
|
|
|
func RunPull(cmd *cobra.Command, args []string) error {
|
|
return pull(args[0])
|
|
}
|
|
|
|
func pull(model string) error {
|
|
client := api.NewClient()
|
|
|
|
var currentDigest string
|
|
var bar *progressbar.ProgressBar
|
|
|
|
request := api.PullRequest{Name: model}
|
|
fn := func(resp api.ProgressResponse) error {
|
|
if resp.Digest != currentDigest && resp.Digest != "" {
|
|
currentDigest = resp.Digest
|
|
bar = progressbar.DefaultBytes(
|
|
int64(resp.Total),
|
|
fmt.Sprintf("pulling %s...", resp.Digest[7:19]),
|
|
)
|
|
|
|
bar.Set(resp.Completed)
|
|
} else if resp.Digest == currentDigest && resp.Digest != "" {
|
|
bar.Set(resp.Completed)
|
|
} else {
|
|
currentDigest = ""
|
|
fmt.Println(resp.Status)
|
|
}
|
|
return nil
|
|
}
|
|
|
|
if err := client.Pull(context.Background(), &request, fn); err != nil {
|
|
return err
|
|
}
|
|
return nil
|
|
}
|
|
|
|
func RunGenerate(cmd *cobra.Command, args []string) error {
|
|
if len(args) > 1 {
|
|
// join all args into a single prompt
|
|
return generate(cmd, args[0], strings.Join(args[1:], " "))
|
|
}
|
|
|
|
if term.IsTerminal(int(os.Stdin.Fd())) {
|
|
return generateInteractive(cmd, args[0])
|
|
}
|
|
|
|
return generateBatch(cmd, args[0])
|
|
}
|
|
|
|
// generateContextKeyType is the private type of generateContextKey. A named
// type keeps the key from comparing equal to any other struct{}{} value used
// as a context key.
type generateContextKeyType struct{}

// generateContextKey is the context.Context key under which generate stores
// the Context field of the responses it receives, and from which it reads the
// Context to send with the next request.
var generateContextKey generateContextKeyType
|
|
|
|
func generate(cmd *cobra.Command, model, prompt string) error {
|
|
if len(strings.TrimSpace(prompt)) > 0 {
|
|
client := api.NewClient()
|
|
|
|
spinner := NewSpinner("")
|
|
go spinner.Spin(60 * time.Millisecond)
|
|
|
|
var latest api.GenerateResponse
|
|
|
|
generateContext, ok := cmd.Context().Value(generateContextKey).([]int)
|
|
if !ok {
|
|
generateContext = []int{}
|
|
}
|
|
|
|
request := api.GenerateRequest{Model: model, Prompt: prompt, Context: generateContext}
|
|
fn := func(resp api.GenerateResponse) error {
|
|
if !spinner.IsFinished() {
|
|
spinner.Finish()
|
|
}
|
|
|
|
latest = resp
|
|
|
|
fmt.Print(resp.Response)
|
|
|
|
cmd.SetContext(context.WithValue(cmd.Context(), generateContextKey, resp.Context))
|
|
return nil
|
|
}
|
|
|
|
if err := client.Generate(context.Background(), &request, fn); err != nil {
|
|
return err
|
|
}
|
|
|
|
fmt.Println()
|
|
fmt.Println()
|
|
|
|
verbose, err := cmd.Flags().GetBool("verbose")
|
|
if err != nil {
|
|
return err
|
|
}
|
|
|
|
if verbose {
|
|
latest.Summary()
|
|
}
|
|
}
|
|
|
|
return nil
|
|
}
|
|
|
|
func generateInteractive(cmd *cobra.Command, model string) error {
|
|
fmt.Print(">>> ")
|
|
scanner := bufio.NewScanner(os.Stdin)
|
|
for scanner.Scan() {
|
|
if err := generate(cmd, model, scanner.Text()); err != nil {
|
|
return err
|
|
}
|
|
|
|
fmt.Print(">>> ")
|
|
}
|
|
|
|
return nil
|
|
}
|
|
|
|
func generateBatch(cmd *cobra.Command, model string) error {
|
|
scanner := bufio.NewScanner(os.Stdin)
|
|
for scanner.Scan() {
|
|
prompt := scanner.Text()
|
|
fmt.Printf(">>> %s\n", prompt)
|
|
if err := generate(cmd, model, prompt); err != nil {
|
|
return err
|
|
}
|
|
}
|
|
|
|
return nil
|
|
}
|
|
|
|
func RunServer(_ *cobra.Command, _ []string) error {
|
|
host := os.Getenv("OLLAMA_HOST")
|
|
if host == "" {
|
|
host = "127.0.0.1"
|
|
}
|
|
|
|
port := os.Getenv("OLLAMA_PORT")
|
|
if port == "" {
|
|
port = "11434"
|
|
}
|
|
|
|
ln, err := net.Listen("tcp", fmt.Sprintf("%s:%s", host, port))
|
|
if err != nil {
|
|
return err
|
|
}
|
|
|
|
return server.Serve(ln)
|
|
}
|
|
|
|
func NewCLI() *cobra.Command {
|
|
log.SetFlags(log.LstdFlags | log.Lshortfile)
|
|
|
|
rootCmd := &cobra.Command{
|
|
Use: "ollama",
|
|
Short: "Large language model runner",
|
|
SilenceUsage: true,
|
|
CompletionOptions: cobra.CompletionOptions{
|
|
DisableDefaultCmd: true,
|
|
},
|
|
}
|
|
|
|
cobra.EnableCommandSorting = false
|
|
|
|
createCmd := &cobra.Command{
|
|
Use: "create MODEL",
|
|
Short: "Create a model from a Modelfile",
|
|
Args: cobra.MinimumNArgs(1),
|
|
RunE: create,
|
|
}
|
|
|
|
createCmd.Flags().StringP("file", "f", "Modelfile", "Name of the Modelfile (default \"Modelfile\")")
|
|
|
|
runCmd := &cobra.Command{
|
|
Use: "run MODEL [PROMPT]",
|
|
Short: "Run a model",
|
|
Args: cobra.MinimumNArgs(1),
|
|
RunE: RunRun,
|
|
}
|
|
|
|
runCmd.Flags().Bool("verbose", false, "Show timings for response")
|
|
|
|
serveCmd := &cobra.Command{
|
|
Use: "serve",
|
|
Aliases: []string{"start"},
|
|
Short: "Start ollama",
|
|
RunE: RunServer,
|
|
}
|
|
|
|
pullCmd := &cobra.Command{
|
|
Use: "pull MODEL",
|
|
Short: "Pull a model from a registry",
|
|
Args: cobra.MinimumNArgs(1),
|
|
RunE: RunPull,
|
|
}
|
|
|
|
pushCmd := &cobra.Command{
|
|
Use: "push MODEL",
|
|
Short: "Push a model to a registry",
|
|
Args: cobra.MinimumNArgs(1),
|
|
RunE: push,
|
|
}
|
|
|
|
listCmd := &cobra.Command{
|
|
Use: "list",
|
|
Short: "List models",
|
|
RunE: list,
|
|
}
|
|
|
|
rootCmd.AddCommand(
|
|
serveCmd,
|
|
createCmd,
|
|
runCmd,
|
|
pullCmd,
|
|
pushCmd,
|
|
listCmd,
|
|
)
|
|
|
|
return rootCmd
|
|
}
|