package cmd import ( "bufio" "context" "errors" "fmt" "log" "net" "net/http" "os" "path" "strings" "time" "github.com/schollz/progressbar/v3" "github.com/spf13/cobra" "golang.org/x/term" "github.com/jmorganca/ollama/api" "github.com/jmorganca/ollama/server" ) func cacheDir() string { home, err := os.UserHomeDir() if err != nil { panic(err) } return path.Join(home, ".ollama") } func RunRun(cmd *cobra.Command, args []string) error { _, err := os.Stat(args[0]) switch { case errors.Is(err, os.ErrNotExist): if err := pull(args[0]); err != nil { var apiStatusError api.StatusError if !errors.As(err, &apiStatusError) { return err } if apiStatusError.StatusCode != http.StatusBadGateway { return err } } case err != nil: return err } return RunGenerate(cmd, args) } func pull(model string) error { client := api.NewClient() var bar *progressbar.ProgressBar return client.Pull( context.Background(), &api.PullRequest{Model: model}, func(progress api.PullProgress) error { if bar == nil { if progress.Percent >= 100 { // already downloaded return nil } bar = progressbar.DefaultBytes(progress.Total) } return bar.Set64(progress.Completed) }, ) } func RunGenerate(cmd *cobra.Command, args []string) error { if len(args) > 1 { // join all args into a single prompt return generate(cmd, args[0], strings.Join(args[1:], " ")) } if term.IsTerminal(int(os.Stdin.Fd())) { return generateInteractive(cmd, args[0]) } return generateBatch(cmd, args[0]) } var generateContextKey struct{} func generate(cmd *cobra.Command, model, prompt string) error { if len(strings.TrimSpace(prompt)) > 0 { client := api.NewClient() spinner := progressbar.NewOptions(-1, progressbar.OptionSetWriter(os.Stderr), progressbar.OptionThrottle(60*time.Millisecond), progressbar.OptionSpinnerType(14), progressbar.OptionSetRenderBlankState(true), progressbar.OptionSetElapsedTime(false), progressbar.OptionClearOnFinish(), ) go func() { for range time.Tick(60 * time.Millisecond) { if spinner.IsFinished() { break } spinner.Add(1) } }() var latest api.GenerateResponse generateContext, ok := cmd.Context().Value(generateContextKey).([]int) if !ok { generateContext = []int{} } request := api.GenerateRequest{Model: model, Prompt: prompt, Context: generateContext} fn := func(resp api.GenerateResponse) error { if !spinner.IsFinished() { spinner.Finish() } latest = resp fmt.Print(resp.Response) cmd.SetContext(context.WithValue(cmd.Context(), generateContextKey, resp.Context)) return nil } if err := client.Generate(context.Background(), &request, fn); err != nil { return err } fmt.Println() fmt.Println() verbose, err := cmd.Flags().GetBool("verbose") if err != nil { return err } if verbose { latest.Summary() } } return nil } func generateInteractive(cmd *cobra.Command, model string) error { fmt.Print(">>> ") scanner := bufio.NewScanner(os.Stdin) for scanner.Scan() { if err := generate(cmd, model, scanner.Text()); err != nil { return err } fmt.Print(">>> ") } return nil } func generateBatch(cmd *cobra.Command, model string) error { scanner := bufio.NewScanner(os.Stdin) for scanner.Scan() { prompt := scanner.Text() fmt.Printf(">>> %s\n", prompt) if err := generate(cmd, model, prompt); err != nil { return err } } return nil } func RunServer(_ *cobra.Command, _ []string) error { host := os.Getenv("OLLAMA_HOST") if host == "" { host = "127.0.0.1" } port := os.Getenv("OLLAMA_PORT") if port == "" { port = "11434" } ln, err := net.Listen("tcp", fmt.Sprintf("%s:%s", host, port)) if err != nil { return err } return server.Serve(ln) } func NewCLI() *cobra.Command { log.SetFlags(log.LstdFlags | log.Lshortfile) rootCmd := &cobra.Command{ Use: "ollama", Short: "Large language model runner", SilenceUsage: true, CompletionOptions: cobra.CompletionOptions{ DisableDefaultCmd: true, }, PersistentPreRunE: func(_ *cobra.Command, args []string) error { // create the models directory and it's parent return os.MkdirAll(path.Join(cacheDir(), "models"), 0o700) }, } cobra.EnableCommandSorting = false runCmd := &cobra.Command{ Use: "run MODEL [PROMPT]", Short: "Run a model", Args: cobra.MinimumNArgs(1), RunE: RunRun, } runCmd.Flags().Bool("verbose", false, "Show timings for response") serveCmd := &cobra.Command{ Use: "serve", Aliases: []string{"start"}, Short: "Start ollama", RunE: RunServer, } rootCmd.AddCommand( serveCmd, runCmd, ) return rootCmd }