ollama/cmd/cmd.go

706 lines
16 KiB
Go
Raw Normal View History

package cmd
import (
2023-07-06 20:49:31 +00:00
"bufio"
"context"
2023-07-06 22:43:04 +00:00
"errors"
2023-07-06 16:24:49 +00:00
"fmt"
2023-07-18 21:01:19 +00:00
"io"
"log"
"net"
2023-07-11 20:05:51 +00:00
"net/http"
"os"
"os/exec"
"path/filepath"
"runtime"
2023-07-07 17:12:58 +00:00
"strings"
2023-07-06 22:43:04 +00:00
"time"
2023-07-18 21:01:19 +00:00
"github.com/chzyer/readline"
2023-07-18 16:09:45 +00:00
"github.com/dustin/go-humanize"
"github.com/olekukonko/tablewriter"
2023-07-06 20:49:31 +00:00
"github.com/spf13/cobra"
2023-07-03 20:32:48 +00:00
"github.com/jmorganca/ollama/api"
2023-07-18 16:09:45 +00:00
"github.com/jmorganca/ollama/format"
"github.com/jmorganca/ollama/progressbar"
2023-07-03 20:32:48 +00:00
"github.com/jmorganca/ollama/server"
)
2023-07-20 23:09:23 +00:00
func CreateHandler(cmd *cobra.Command, args []string) error {
filename, _ := cmd.Flags().GetString("file")
filename, err := filepath.Abs(filename)
if err != nil {
return err
}
client := api.NewClient()
2023-07-17 21:14:41 +00:00
var spinner *Spinner
var currentDigest string
var bar *progressbar.ProgressBar
2023-07-17 21:14:41 +00:00
request := api.CreateRequest{Name: args[0], Path: filename}
fn := func(resp api.ProgressResponse) error {
if resp.Digest != currentDigest && resp.Digest != "" {
if spinner != nil {
spinner.Stop()
}
currentDigest = resp.Digest
bar = progressbar.DefaultBytes(
int64(resp.Total),
fmt.Sprintf("pulling %s...", resp.Digest[7:19]),
)
2023-07-17 21:14:41 +00:00
bar.Set(resp.Completed)
} else if resp.Digest == currentDigest && resp.Digest != "" {
bar.Set(resp.Completed)
} else {
currentDigest = ""
if spinner != nil {
spinner.Stop()
}
spinner = NewSpinner(resp.Status)
go spinner.Spin(100 * time.Millisecond)
}
return nil
}
if err := client.Create(context.Background(), &request, fn); err != nil {
return err
}
2023-07-17 21:14:41 +00:00
if spinner != nil {
spinner.Stop()
}
return nil
}
func RunHandler(cmd *cobra.Command, args []string) error {
mp := server.ParseModelPath(args[0])
2023-07-18 05:44:21 +00:00
fp, err := mp.GetManifestPath(false)
if err != nil {
return err
}
_, err = os.Stat(fp)
2023-07-06 22:43:04 +00:00
switch {
case errors.Is(err, os.ErrNotExist):
if err := pull(args[0], false); err != nil {
2023-07-11 20:05:51 +00:00
var apiStatusError api.StatusError
if !errors.As(err, &apiStatusError) {
return err
}
if apiStatusError.StatusCode != http.StatusBadGateway {
return err
}
2023-07-06 22:43:04 +00:00
}
case err != nil:
2023-07-06 21:05:55 +00:00
return err
}
return RunGenerate(cmd, args)
2023-07-06 18:18:40 +00:00
}
2023-07-20 23:09:23 +00:00
func PushHandler(cmd *cobra.Command, args []string) error {
client := api.NewClient()
insecure, err := cmd.Flags().GetBool("insecure")
if err != nil {
return err
}
var currentDigest string
var bar *progressbar.ProgressBar
request := api.PushRequest{Name: args[0], Insecure: insecure}
2023-07-19 01:51:30 +00:00
fn := func(resp api.ProgressResponse) error {
if resp.Digest != currentDigest && resp.Digest != "" {
currentDigest = resp.Digest
bar = progressbar.DefaultBytes(
int64(resp.Total),
fmt.Sprintf("pushing %s...", resp.Digest[7:19]),
)
bar.Set(resp.Completed)
} else if resp.Digest == currentDigest && resp.Digest != "" {
bar.Set(resp.Completed)
} else {
currentDigest = ""
fmt.Println(resp.Status)
}
return nil
}
if err := client.Push(context.Background(), &request, fn); err != nil {
return err
}
return nil
}
2023-07-20 23:09:23 +00:00
func ListHandler(cmd *cobra.Command, args []string) error {
2023-07-18 16:09:45 +00:00
client := api.NewClient()
models, err := client.List(context.Background())
if err != nil {
return err
}
var data [][]string
for _, m := range models.Models {
2023-07-18 21:01:19 +00:00
if len(args) == 0 || strings.HasPrefix(m.Name, args[0]) {
data = append(data, []string{m.Name, humanize.Bytes(uint64(m.Size)), format.HumanTime(m.ModifiedAt, "Never")})
}
2023-07-18 16:09:45 +00:00
}
table := tablewriter.NewWriter(os.Stdout)
table.SetHeader([]string{"NAME", "SIZE", "MODIFIED"})
table.SetHeaderAlignment(tablewriter.ALIGN_LEFT)
table.SetAlignment(tablewriter.ALIGN_LEFT)
table.SetHeaderLine(false)
table.SetBorder(false)
table.SetNoWhiteSpace(true)
table.SetTablePadding("\t")
table.AppendBulk(data)
table.Render()
return nil
}
2023-07-20 23:09:23 +00:00
func DeleteHandler(cmd *cobra.Command, args []string) error {
client := api.NewClient()
2023-07-24 15:27:28 +00:00
req := api.DeleteRequest{Name: args[0]}
if err := client.Delete(context.Background(), &req); err != nil {
2023-07-20 23:09:23 +00:00
return err
}
fmt.Printf("deleted '%s'\n", args[0])
2023-07-20 23:09:23 +00:00
return nil
}
2023-07-24 15:27:28 +00:00
// CopyHandler implements the "cp" command: it asks the server to copy the
// model args[0] to the name args[1] and prints a confirmation on success.
func CopyHandler(cmd *cobra.Command, args []string) error {
	source, destination := args[0], args[1]
	request := api.CopyRequest{Source: source, Destination: destination}

	err := api.NewClient().Copy(context.Background(), &request)
	if err != nil {
		return err
	}

	fmt.Printf("copied '%s' to '%s'\n", source, destination)
	return nil
}
2023-07-20 23:09:23 +00:00
// PullHandler implements the "pull" command: it reads the --insecure flag and
// delegates to pull for the model args[0].
func PullHandler(cmd *cobra.Command, args []string) error {
	allowInsecure, flagErr := cmd.Flags().GetBool("insecure")
	if flagErr != nil {
		return flagErr
	}

	model := args[0]
	return pull(model, allowInsecure)
}
func pull(model string, insecure bool) error {
2023-07-07 18:26:58 +00:00
client := api.NewClient()
2023-07-19 01:51:30 +00:00
var currentDigest string
2023-07-07 18:26:58 +00:00
var bar *progressbar.ProgressBar
2023-07-11 20:05:51 +00:00
request := api.PullRequest{Name: model, Insecure: insecure}
2023-07-19 01:51:30 +00:00
fn := func(resp api.ProgressResponse) error {
if resp.Digest != currentDigest && resp.Digest != "" {
currentDigest = resp.Digest
bar = progressbar.DefaultBytes(
int64(resp.Total),
2023-07-19 01:51:30 +00:00
fmt.Sprintf("pulling %s...", resp.Digest[7:19]),
)
2023-07-19 01:51:30 +00:00
bar.Set(resp.Completed)
} else if resp.Digest == currentDigest && resp.Digest != "" {
bar.Set(resp.Completed)
} else {
2023-07-19 01:51:30 +00:00
currentDigest = ""
fmt.Println(resp.Status)
}
return nil
}
2023-07-07 14:22:37 +00:00
if err := client.Pull(context.Background(), &request, fn); err != nil {
return err
}
return nil
2023-07-06 20:49:31 +00:00
}
2023-07-13 01:18:06 +00:00
func RunGenerate(cmd *cobra.Command, args []string) error {
2023-07-06 20:49:31 +00:00
if len(args) > 1 {
2023-07-12 16:55:07 +00:00
// join all args into a single prompt
2023-07-13 01:18:06 +00:00
return generate(cmd, args[0], strings.Join(args[1:], " "))
2023-07-06 20:49:31 +00:00
}
2023-07-18 21:01:19 +00:00
if readline.IsTerminal(int(os.Stdin.Fd())) {
2023-07-13 01:18:06 +00:00
return generateInteractive(cmd, args[0])
2023-07-06 20:49:31 +00:00
}
2023-07-13 01:18:06 +00:00
return generateBatch(cmd, args[0])
2023-07-06 20:49:31 +00:00
}
2023-07-18 18:59:42 +00:00
// generateContextKey is the key type generate uses to store and look up the
// latest response's Context on the command's context.Context, so it can be
// sent with the next request.
type generateContextKey string
2023-07-13 01:18:06 +00:00
func generate(cmd *cobra.Command, model, prompt string) error {
2023-07-07 17:12:58 +00:00
if len(strings.TrimSpace(prompt)) > 0 {
client := api.NewClient()
2023-07-17 21:14:41 +00:00
spinner := NewSpinner("")
go spinner.Spin(60 * time.Millisecond)
2023-07-06 22:43:04 +00:00
2023-07-13 01:18:06 +00:00
var latest api.GenerateResponse
2023-07-18 18:59:42 +00:00
generateContext, ok := cmd.Context().Value(generateContextKey("context")).([]int)
if !ok {
generateContext = []int{}
}
2023-08-01 01:35:18 +00:00
request := api.GenerateRequest{Model: model, Prompt: prompt, Context: generateContext}
2023-07-18 18:59:42 +00:00
fn := func(response api.GenerateResponse) error {
2023-07-07 17:12:58 +00:00
if !spinner.IsFinished() {
spinner.Finish()
}
2023-07-06 22:43:04 +00:00
2023-07-18 18:59:42 +00:00
latest = response
2023-07-13 01:18:06 +00:00
2023-07-18 18:59:42 +00:00
fmt.Print(response.Response)
2023-07-07 17:12:58 +00:00
return nil
2023-07-07 21:04:43 +00:00
}
if err := client.Generate(context.Background(), &request, fn); err != nil {
if strings.Contains(err.Error(), "failed to load model") {
// tell the user to check the server log, if it exists locally
home, nestedErr := os.UserHomeDir()
if nestedErr != nil {
// return the original error
return err
}
logPath := filepath.Join(home, ".ollama", "logs", "server.log")
if _, nestedErr := os.Stat(logPath); nestedErr == nil {
err = fmt.Errorf("%w\nFor more details, check the error logs at %s", err, logPath)
}
}
2023-07-07 21:04:43 +00:00
return err
}
2023-07-06 22:43:04 +00:00
2023-07-07 17:12:58 +00:00
fmt.Println()
fmt.Println()
2023-07-13 01:18:06 +00:00
verbose, err := cmd.Flags().GetBool("verbose")
if err != nil {
return err
}
if verbose {
latest.Summary()
}
2023-07-18 18:59:42 +00:00
ctx := cmd.Context()
ctx = context.WithValue(ctx, generateContextKey("context"), latest.Context)
cmd.SetContext(ctx)
2023-07-07 17:12:58 +00:00
}
2023-07-06 20:49:31 +00:00
return nil
}
// showLayer prints the contents of the blob backing layer l to stdout,
// followed by a newline. If the blob path cannot be resolved or the file
// cannot be read, a short message is printed instead.
func showLayer(l *server.Layer) {
	filename, err := server.GetBlobsPath(l.Digest)
	if err != nil {
		fmt.Println("Couldn't get layer's path")
		return
	}

	bts, err := os.ReadFile(filename)
	if err != nil {
		fmt.Println("Couldn't read layer")
		return
	}

	// Print the content verbatim; it must not be used as a format string
	// because it may contain '%' characters.
	fmt.Println(string(bts))
}
2023-07-13 01:18:06 +00:00
func generateInteractive(cmd *cobra.Command, model string) error {
2023-07-18 21:01:19 +00:00
home, err := os.UserHomeDir()
if err != nil {
return err
}
completer := readline.NewPrefixCompleter(
readline.PcItem("/help"),
readline.PcItem("/list"),
readline.PcItem("/set",
readline.PcItem("history"),
readline.PcItem("nohistory"),
2023-07-19 16:25:23 +00:00
readline.PcItem("verbose"),
readline.PcItem("quiet"),
2023-07-18 21:01:19 +00:00
readline.PcItem("mode",
readline.PcItem("vim"),
readline.PcItem("emacs"),
readline.PcItem("default"),
),
),
readline.PcItem("/show",
readline.PcItem("license"),
readline.PcItem("system"),
readline.PcItem("template"),
),
2023-07-18 21:01:19 +00:00
readline.PcItem("/exit"),
readline.PcItem("/bye"),
)
usage := func() {
fmt.Fprintln(os.Stderr, "commands:")
fmt.Fprintln(os.Stderr, completer.Tree(" "))
}
config := readline.Config{
Prompt: ">>> ",
HistoryFile: filepath.Join(home, ".ollama", "history"),
AutoComplete: completer,
}
scanner, err := readline.NewEx(&config)
if err != nil {
return err
}
defer scanner.Close()
var multiLineBuffer string
var isMultiLine bool
2023-07-18 21:01:19 +00:00
for {
line, err := scanner.Readline()
switch {
case errors.Is(err, io.EOF):
return nil
case errors.Is(err, readline.ErrInterrupt):
2023-07-20 07:53:08 +00:00
if line == "" {
return nil
}
2023-07-18 21:01:19 +00:00
continue
case err != nil:
2023-07-06 20:49:31 +00:00
return err
}
2023-07-18 21:01:19 +00:00
line = strings.TrimSpace(line)
2023-07-06 20:49:31 +00:00
2023-07-18 21:01:19 +00:00
switch {
case isMultiLine:
if strings.HasSuffix(line, `"""`) {
isMultiLine = false
multiLineBuffer += strings.TrimSuffix(line, `"""`)
line = multiLineBuffer
multiLineBuffer = ""
scanner.SetPrompt(">>> ")
} else {
multiLineBuffer += line + " "
continue
}
case strings.HasPrefix(line, `"""`):
isMultiLine = true
multiLineBuffer = strings.TrimPrefix(line, `"""`) + " "
scanner.SetPrompt("... ")
continue
2023-07-18 21:01:19 +00:00
case strings.HasPrefix(line, "/list"):
args := strings.Fields(line)
2023-07-20 23:09:23 +00:00
if err := ListHandler(cmd, args[1:]); err != nil {
2023-07-18 21:01:19 +00:00
return err
}
continue
case strings.HasPrefix(line, "/set"):
args := strings.Fields(line)
if len(args) > 1 {
switch args[1] {
case "history":
scanner.HistoryEnable()
continue
case "nohistory":
scanner.HistoryDisable()
continue
2023-07-19 16:25:23 +00:00
case "verbose":
cmd.Flags().Set("verbose", "true")
continue
case "quiet":
cmd.Flags().Set("verbose", "false")
continue
2023-07-18 21:01:19 +00:00
case "mode":
if len(args) > 2 {
switch args[2] {
case "vim":
scanner.SetVimMode(true)
continue
case "emacs", "default":
scanner.SetVimMode(false)
continue
default:
usage()
continue
}
} else {
usage()
continue
}
}
} else {
usage()
continue
}
case strings.HasPrefix(line, "/show"):
args := strings.Fields(line)
if len(args) > 1 {
mp := server.ParseModelPath(model)
manifest, err := server.GetManifest(mp)
if err != nil {
fmt.Printf("error: couldn't get a manifestfor this model")
continue
}
switch args[1] {
case "license":
for _, l := range manifest.Layers {
if l.MediaType == "application/vnd.ollama.image.license" {
showLayer(l)
}
}
continue
case "system":
for _, l := range manifest.Layers {
if l.MediaType == "application/vnd.ollama.image.system" {
showLayer(l)
}
}
continue
case "template":
for _, l := range manifest.Layers {
if l.MediaType == "application/vnd.ollama.image.template" {
showLayer(l)
2023-07-18 21:01:19 +00:00
}
}
continue
default:
usage()
continue
2023-07-18 21:01:19 +00:00
}
} else {
usage()
continue
2023-07-18 21:01:19 +00:00
}
case line == "/help", line == "/?":
usage()
continue
case line == "/exit", line == "/bye":
return nil
}
if err := generate(cmd, model, line); err != nil {
return err
}
}
2023-07-06 16:24:49 +00:00
}
2023-07-13 01:18:06 +00:00
func generateBatch(cmd *cobra.Command, model string) error {
2023-07-06 20:49:31 +00:00
scanner := bufio.NewScanner(os.Stdin)
for scanner.Scan() {
prompt := scanner.Text()
fmt.Printf(">>> %s\n", prompt)
2023-07-13 01:18:06 +00:00
if err := generate(cmd, model, prompt); err != nil {
2023-07-06 20:49:31 +00:00
return err
}
}
return nil
}
// getRunServerParams resolves the listen host, listen port and extra CORS
// origins for the server from cmd's flags and the process environment.
//
// For host and port the precedence is: a flag explicitly set on the command
// line (highest), then the OLLAMA_HOST / OLLAMA_PORT environment variable when
// non-empty, then the flag's default value (lowest). Extra origins come from
// the "allowed-origins" flag only. An error is returned when the "host" or
// "port" flag is not defined on cmd, or when "allowed-origins" cannot be read.
func getRunServerParams(cmd *cobra.Command) (host, port string, extraOrigins []string, err error) {
	flags := cmd.Flags()

	hostFlag := flags.Lookup("host")
	if hostFlag == nil {
		return "", "", nil, errors.New("host unset")
	}
	host = hostFlag.Value.String()
	if envHost := os.Getenv("OLLAMA_HOST"); envHost != "" && !hostFlag.Changed {
		host = envHost
	}

	portFlag := flags.Lookup("port")
	if portFlag == nil {
		return "", "", nil, errors.New("port unset")
	}
	port = portFlag.Value.String()
	if envPort := os.Getenv("OLLAMA_PORT"); envPort != "" && !portFlag.Changed {
		port = envPort
	}

	origins, originsErr := flags.GetStringSlice("allowed-origins")
	if originsErr != nil {
		return "", "", nil, originsErr
	}

	return host, port, origins, nil
}
func RunServer(cmd *cobra.Command, _ []string) error {
host, port, extraOrigins, err := getRunServerParams(cmd)
2023-07-04 04:47:00 +00:00
if err != nil {
return err
}
ln, err := net.Listen("tcp", fmt.Sprintf("%s:%s", host, port))
if err != nil {
return err
}
2023-07-04 04:47:00 +00:00
return server.Serve(ln, extraOrigins)
2023-07-04 04:47:00 +00:00
}
2023-07-31 21:38:10 +00:00
func startMacApp(client *api.Client) error {
2023-08-01 20:01:55 +00:00
exe, err := os.Executable()
if err != nil {
return err
}
link, err := os.Readlink(exe)
2023-07-31 21:38:10 +00:00
if err != nil {
return err
}
2023-08-01 17:48:48 +00:00
if !strings.Contains(link, "Ollama.app") {
return fmt.Errorf("could not find ollama app")
}
2023-07-31 21:38:10 +00:00
path := strings.Split(link, "Ollama.app")
if err := exec.Command("/usr/bin/open", "-a", path[0]+"Ollama.app").Run(); err != nil {
return err
}
// wait for the server to start
timeout := time.After(5 * time.Second)
tick := time.Tick(500 * time.Millisecond)
for {
select {
case <-timeout:
return errors.New("timed out waiting for server to start")
case <-tick:
if err := client.Heartbeat(context.Background()); err == nil {
return nil // server has started
}
}
}
}
func checkServerHeartbeat(_ *cobra.Command, _ []string) error {
client := api.NewClient()
if err := client.Heartbeat(context.Background()); err != nil {
2023-07-31 21:38:10 +00:00
if !strings.Contains(err.Error(), "connection refused") {
return err
}
if runtime.GOOS == "darwin" {
if err := startMacApp(client); err != nil {
2023-08-01 17:48:48 +00:00
return fmt.Errorf("could not connect to ollama app, is it running?")
}
2023-07-31 21:38:10 +00:00
} else {
return fmt.Errorf("could not connect to ollama server, run 'ollama serve' to start it")
}
}
return nil
}
func NewCLI() *cobra.Command {
log.SetFlags(log.LstdFlags | log.Lshortfile)
rootCmd := &cobra.Command{
2023-07-06 20:49:31 +00:00
Use: "ollama",
Short: "Large language model runner",
SilenceUsage: true,
CompletionOptions: cobra.CompletionOptions{
DisableDefaultCmd: true,
},
}
cobra.EnableCommandSorting = false
createCmd := &cobra.Command{
Use: "create MODEL",
Short: "Create a model from a Modelfile",
Args: cobra.MinimumNArgs(1),
PreRunE: checkServerHeartbeat,
RunE: CreateHandler,
}
createCmd.Flags().StringP("file", "f", "Modelfile", "Name of the Modelfile (default \"Modelfile\")")
runCmd := &cobra.Command{
Use: "run MODEL [PROMPT]",
Short: "Run a model",
Args: cobra.MinimumNArgs(1),
PreRunE: checkServerHeartbeat,
RunE: RunHandler,
}
2023-07-13 01:18:06 +00:00
runCmd.Flags().Bool("verbose", false, "Show timings for response")
serveCmd := &cobra.Command{
Use: "serve",
Aliases: []string{"start"},
Short: "Start ollama",
2023-07-06 20:49:31 +00:00
RunE: RunServer,
}
serveCmd.Flags().String("port", "11434", "Port to listen on, may also use OLLAMA_PORT environment variable")
serveCmd.Flags().String("host", "127.0.0.1", "Host listen address, may also use OLLAMA_HOST environment variable")
serveCmd.Flags().StringSlice("allowed-origins", []string{}, "Additional allowed CORS origins (outside of localhost), specify as comma-separated list")
pullCmd := &cobra.Command{
Use: "pull MODEL",
Short: "Pull a model from a registry",
Args: cobra.MinimumNArgs(1),
PreRunE: checkServerHeartbeat,
RunE: PullHandler,
}
pullCmd.Flags().Bool("insecure", false, "Use an insecure registry")
pushCmd := &cobra.Command{
Use: "push MODEL",
Short: "Push a model to a registry",
Args: cobra.MinimumNArgs(1),
PreRunE: checkServerHeartbeat,
RunE: PushHandler,
}
pushCmd.Flags().Bool("insecure", false, "Use an insecure registry")
2023-07-18 16:09:45 +00:00
listCmd := &cobra.Command{
Use: "list",
2023-07-20 22:28:27 +00:00
Aliases: []string{"ls"},
Short: "List models",
PreRunE: checkServerHeartbeat,
RunE: ListHandler,
2023-07-20 23:09:23 +00:00
}
2023-07-24 15:27:28 +00:00
copyCmd := &cobra.Command{
Use: "cp",
Short: "Copy a model",
Args: cobra.MinimumNArgs(2),
PreRunE: checkServerHeartbeat,
RunE: CopyHandler,
2023-07-24 15:27:28 +00:00
}
2023-07-20 23:09:23 +00:00
deleteCmd := &cobra.Command{
Use: "rm",
Short: "Remove a model",
Args: cobra.MinimumNArgs(1),
PreRunE: checkServerHeartbeat,
RunE: DeleteHandler,
2023-07-18 16:09:45 +00:00
}
rootCmd.AddCommand(
serveCmd,
createCmd,
runCmd,
pullCmd,
pushCmd,
2023-07-18 16:09:45 +00:00
listCmd,
2023-07-24 15:27:28 +00:00
copyCmd,
2023-07-20 23:09:23 +00:00
deleteCmd,
)
return rootCmd
}