2024-01-04 15:20:26 -08:00
|
|
|
package cmd
|
|
|
|
|
|
|
|
import (
|
|
|
|
"errors"
|
|
|
|
"fmt"
|
|
|
|
"io"
|
|
|
|
"net/http"
|
|
|
|
"os"
|
2024-02-01 17:09:51 -08:00
|
|
|
"path/filepath"
|
2024-01-04 15:20:26 -08:00
|
|
|
"regexp"
|
2024-05-21 21:30:52 -07:00
|
|
|
"slices"
|
2024-01-25 12:12:36 -08:00
|
|
|
"sort"
|
2024-01-04 15:20:26 -08:00
|
|
|
"strings"
|
|
|
|
|
|
|
|
"github.com/spf13/cobra"
|
|
|
|
|
2024-03-26 13:04:17 -07:00
|
|
|
"github.com/ollama/ollama/api"
|
2024-05-24 14:57:15 -07:00
|
|
|
"github.com/ollama/ollama/envconfig"
|
2024-03-26 13:04:17 -07:00
|
|
|
"github.com/ollama/ollama/progress"
|
|
|
|
"github.com/ollama/ollama/readline"
|
2024-05-13 18:48:28 -07:00
|
|
|
"github.com/ollama/ollama/types/errtypes"
|
2024-01-04 15:20:26 -08:00
|
|
|
)
|
|
|
|
|
|
|
|
type MultilineState int
|
|
|
|
|
|
|
|
const (
|
|
|
|
MultilineNone MultilineState = iota
|
|
|
|
MultilinePrompt
|
|
|
|
MultilineSystem
|
|
|
|
MultilineTemplate
|
|
|
|
)
|
|
|
|
|
2024-01-25 12:12:36 -08:00
|
|
|
func loadModel(cmd *cobra.Command, opts *runOptions) error {
|
|
|
|
p := progress.NewProgress(os.Stderr)
|
|
|
|
defer p.StopAndClear()
|
|
|
|
|
|
|
|
spinner := progress.NewSpinner("")
|
|
|
|
p.Add("", spinner)
|
|
|
|
|
cmd: defer stating model info until necessary (#5248)
This commit changes the 'ollama run' command to defer fetching model
information until it really needs it. That is, when in interactive mode.
It also removes one such case where the model information is fetch in
duplicate, just before calling generateInteractive and then again, first
thing, in generateInteractive.
This positively impacts the performance of the command:
; time ./before run llama3 'hi'
Hi! It's nice to meet you. Is there something I can help you with, or would you like to chat?
./before run llama3 'hi' 0.02s user 0.01s system 2% cpu 1.168 total
; time ./before run llama3 'hi'
Hi! It's nice to meet you. Is there something I can help you with, or would you like to chat?
./before run llama3 'hi' 0.02s user 0.01s system 2% cpu 1.220 total
; time ./before run llama3 'hi'
Hi! It's nice to meet you. Is there something I can help you with, or would you like to chat?
./before run llama3 'hi' 0.02s user 0.01s system 2% cpu 1.217 total
; time ./after run llama3 'hi'
Hi! It's nice to meet you. Is there something I can help you with, or would you like to chat?
./after run llama3 'hi' 0.02s user 0.01s system 4% cpu 0.652 total
; time ./after run llama3 'hi'
Hi! It's nice to meet you. Is there something I can help you with, or would you like to chat?
./after run llama3 'hi' 0.01s user 0.01s system 5% cpu 0.498 total
; time ./after run llama3 'hi'
Hi! It's nice to meet you. Is there something I can help you with or would you like to chat?
./after run llama3 'hi' 0.01s user 0.01s system 3% cpu 0.479 total
; time ./after run llama3 'hi'
Hi! It's nice to meet you. Is there something I can help you with, or would you like to chat?
./after run llama3 'hi' 0.02s user 0.01s system 5% cpu 0.507 total
; time ./after run llama3 'hi'
Hi! It's nice to meet you. Is there something I can help you with, or would you like to chat?
./after run llama3 'hi' 0.02s user 0.01s system 5% cpu 0.507 total
2024-06-24 20:14:03 -07:00
|
|
|
client, err := api.ClientFromEnvironment()
|
2024-01-04 15:20:26 -08:00
|
|
|
if err != nil {
|
2024-01-25 12:12:36 -08:00
|
|
|
return err
|
2024-01-04 15:20:26 -08:00
|
|
|
}
|
|
|
|
|
2024-01-25 12:12:36 -08:00
|
|
|
chatReq := &api.ChatRequest{
|
cmd: defer stating model info until necessary (#5248)
This commit changes the 'ollama run' command to defer fetching model
information until it really needs it. That is, when in interactive mode.
It also removes one such case where the model information is fetch in
duplicate, just before calling generateInteractive and then again, first
thing, in generateInteractive.
This positively impacts the performance of the command:
; time ./before run llama3 'hi'
Hi! It's nice to meet you. Is there something I can help you with, or would you like to chat?
./before run llama3 'hi' 0.02s user 0.01s system 2% cpu 1.168 total
; time ./before run llama3 'hi'
Hi! It's nice to meet you. Is there something I can help you with, or would you like to chat?
./before run llama3 'hi' 0.02s user 0.01s system 2% cpu 1.220 total
; time ./before run llama3 'hi'
Hi! It's nice to meet you. Is there something I can help you with, or would you like to chat?
./before run llama3 'hi' 0.02s user 0.01s system 2% cpu 1.217 total
; time ./after run llama3 'hi'
Hi! It's nice to meet you. Is there something I can help you with, or would you like to chat?
./after run llama3 'hi' 0.02s user 0.01s system 4% cpu 0.652 total
; time ./after run llama3 'hi'
Hi! It's nice to meet you. Is there something I can help you with, or would you like to chat?
./after run llama3 'hi' 0.01s user 0.01s system 5% cpu 0.498 total
; time ./after run llama3 'hi'
Hi! It's nice to meet you. Is there something I can help you with or would you like to chat?
./after run llama3 'hi' 0.01s user 0.01s system 3% cpu 0.479 total
; time ./after run llama3 'hi'
Hi! It's nice to meet you. Is there something I can help you with, or would you like to chat?
./after run llama3 'hi' 0.02s user 0.01s system 5% cpu 0.507 total
; time ./after run llama3 'hi'
Hi! It's nice to meet you. Is there something I can help you with, or would you like to chat?
./after run llama3 'hi' 0.02s user 0.01s system 5% cpu 0.507 total
2024-06-24 20:14:03 -07:00
|
|
|
Model: opts.Model,
|
|
|
|
KeepAlive: opts.KeepAlive,
|
2024-01-04 15:20:26 -08:00
|
|
|
}
|
2024-05-13 17:17:36 -07:00
|
|
|
|
cmd: defer stating model info until necessary (#5248)
This commit changes the 'ollama run' command to defer fetching model
information until it really needs it. That is, when in interactive mode.
It also removes one such case where the model information is fetch in
duplicate, just before calling generateInteractive and then again, first
thing, in generateInteractive.
This positively impacts the performance of the command:
; time ./before run llama3 'hi'
Hi! It's nice to meet you. Is there something I can help you with, or would you like to chat?
./before run llama3 'hi' 0.02s user 0.01s system 2% cpu 1.168 total
; time ./before run llama3 'hi'
Hi! It's nice to meet you. Is there something I can help you with, or would you like to chat?
./before run llama3 'hi' 0.02s user 0.01s system 2% cpu 1.220 total
; time ./before run llama3 'hi'
Hi! It's nice to meet you. Is there something I can help you with, or would you like to chat?
./before run llama3 'hi' 0.02s user 0.01s system 2% cpu 1.217 total
; time ./after run llama3 'hi'
Hi! It's nice to meet you. Is there something I can help you with, or would you like to chat?
./after run llama3 'hi' 0.02s user 0.01s system 4% cpu 0.652 total
; time ./after run llama3 'hi'
Hi! It's nice to meet you. Is there something I can help you with, or would you like to chat?
./after run llama3 'hi' 0.01s user 0.01s system 5% cpu 0.498 total
; time ./after run llama3 'hi'
Hi! It's nice to meet you. Is there something I can help you with or would you like to chat?
./after run llama3 'hi' 0.01s user 0.01s system 3% cpu 0.479 total
; time ./after run llama3 'hi'
Hi! It's nice to meet you. Is there something I can help you with, or would you like to chat?
./after run llama3 'hi' 0.02s user 0.01s system 5% cpu 0.507 total
; time ./after run llama3 'hi'
Hi! It's nice to meet you. Is there something I can help you with, or would you like to chat?
./after run llama3 'hi' 0.02s user 0.01s system 5% cpu 0.507 total
2024-06-24 20:14:03 -07:00
|
|
|
return client.Chat(cmd.Context(), chatReq, func(resp api.ChatResponse) error {
|
2024-01-25 12:12:36 -08:00
|
|
|
p.StopAndClear()
|
cmd: defer stating model info until necessary (#5248)
This commit changes the 'ollama run' command to defer fetching model
information until it really needs it. That is, when in interactive mode.
It also removes one such case where the model information is fetch in
duplicate, just before calling generateInteractive and then again, first
thing, in generateInteractive.
This positively impacts the performance of the command:
; time ./before run llama3 'hi'
Hi! It's nice to meet you. Is there something I can help you with, or would you like to chat?
./before run llama3 'hi' 0.02s user 0.01s system 2% cpu 1.168 total
; time ./before run llama3 'hi'
Hi! It's nice to meet you. Is there something I can help you with, or would you like to chat?
./before run llama3 'hi' 0.02s user 0.01s system 2% cpu 1.220 total
; time ./before run llama3 'hi'
Hi! It's nice to meet you. Is there something I can help you with, or would you like to chat?
./before run llama3 'hi' 0.02s user 0.01s system 2% cpu 1.217 total
; time ./after run llama3 'hi'
Hi! It's nice to meet you. Is there something I can help you with, or would you like to chat?
./after run llama3 'hi' 0.02s user 0.01s system 4% cpu 0.652 total
; time ./after run llama3 'hi'
Hi! It's nice to meet you. Is there something I can help you with, or would you like to chat?
./after run llama3 'hi' 0.01s user 0.01s system 5% cpu 0.498 total
; time ./after run llama3 'hi'
Hi! It's nice to meet you. Is there something I can help you with or would you like to chat?
./after run llama3 'hi' 0.01s user 0.01s system 3% cpu 0.479 total
; time ./after run llama3 'hi'
Hi! It's nice to meet you. Is there something I can help you with, or would you like to chat?
./after run llama3 'hi' 0.02s user 0.01s system 5% cpu 0.507 total
; time ./after run llama3 'hi'
Hi! It's nice to meet you. Is there something I can help you with, or would you like to chat?
./after run llama3 'hi' 0.02s user 0.01s system 5% cpu 0.507 total
2024-06-24 20:14:03 -07:00
|
|
|
for _, msg := range opts.Messages {
|
|
|
|
switch msg.Role {
|
|
|
|
case "user":
|
|
|
|
fmt.Printf(">>> %s\n", msg.Content)
|
|
|
|
case "assistant":
|
|
|
|
state := &displayResponseState{}
|
|
|
|
displayResponse(msg.Content, opts.WordWrap, state)
|
|
|
|
fmt.Println()
|
|
|
|
fmt.Println()
|
2024-01-25 12:12:36 -08:00
|
|
|
}
|
|
|
|
}
|
|
|
|
return nil
|
|
|
|
})
|
|
|
|
}
|
|
|
|
|
|
|
|
func generateInteractive(cmd *cobra.Command, opts runOptions) error {
|
|
|
|
err := loadModel(cmd, &opts)
|
|
|
|
if err != nil {
|
2024-01-04 15:20:26 -08:00
|
|
|
return err
|
|
|
|
}
|
|
|
|
|
|
|
|
usage := func() {
|
|
|
|
fmt.Fprintln(os.Stderr, "Available Commands:")
|
2024-01-25 12:12:36 -08:00
|
|
|
fmt.Fprintln(os.Stderr, " /set Set session variables")
|
|
|
|
fmt.Fprintln(os.Stderr, " /show Show model information")
|
|
|
|
fmt.Fprintln(os.Stderr, " /load <model> Load a session or model")
|
|
|
|
fmt.Fprintln(os.Stderr, " /save <model> Save your current session")
|
2024-05-01 15:44:36 -06:00
|
|
|
fmt.Fprintln(os.Stderr, " /clear Clear session context")
|
2024-01-25 12:12:36 -08:00
|
|
|
fmt.Fprintln(os.Stderr, " /bye Exit")
|
|
|
|
fmt.Fprintln(os.Stderr, " /?, /help Help for a command")
|
|
|
|
fmt.Fprintln(os.Stderr, " /? shortcuts Help for keyboard shortcuts")
|
2024-01-04 15:20:26 -08:00
|
|
|
fmt.Fprintln(os.Stderr, "")
|
|
|
|
fmt.Fprintln(os.Stderr, "Use \"\"\" to begin a multi-line message.")
|
2024-02-01 17:09:51 -08:00
|
|
|
|
|
|
|
if opts.MultiModal {
|
|
|
|
fmt.Fprintf(os.Stderr, "Use %s to include .jpg or .png images.\n", filepath.FromSlash("/path/to/file"))
|
|
|
|
}
|
|
|
|
|
2024-01-04 15:20:26 -08:00
|
|
|
fmt.Fprintln(os.Stderr, "")
|
|
|
|
}
|
|
|
|
|
|
|
|
usageSet := func() {
|
|
|
|
fmt.Fprintln(os.Stderr, "Available Commands:")
|
|
|
|
fmt.Fprintln(os.Stderr, " /set parameter ... Set a parameter")
|
|
|
|
fmt.Fprintln(os.Stderr, " /set system <string> Set system message")
|
|
|
|
fmt.Fprintln(os.Stderr, " /set template <string> Set prompt template")
|
|
|
|
fmt.Fprintln(os.Stderr, " /set history Enable history")
|
|
|
|
fmt.Fprintln(os.Stderr, " /set nohistory Disable history")
|
|
|
|
fmt.Fprintln(os.Stderr, " /set wordwrap Enable wordwrap")
|
|
|
|
fmt.Fprintln(os.Stderr, " /set nowordwrap Disable wordwrap")
|
|
|
|
fmt.Fprintln(os.Stderr, " /set format json Enable JSON mode")
|
|
|
|
fmt.Fprintln(os.Stderr, " /set noformat Disable formatting")
|
|
|
|
fmt.Fprintln(os.Stderr, " /set verbose Show LLM stats")
|
|
|
|
fmt.Fprintln(os.Stderr, " /set quiet Disable LLM stats")
|
|
|
|
fmt.Fprintln(os.Stderr, "")
|
|
|
|
}
|
|
|
|
|
|
|
|
usageShortcuts := func() {
|
|
|
|
fmt.Fprintln(os.Stderr, "Available keyboard shortcuts:")
|
|
|
|
fmt.Fprintln(os.Stderr, " Ctrl + a Move to the beginning of the line (Home)")
|
|
|
|
fmt.Fprintln(os.Stderr, " Ctrl + e Move to the end of the line (End)")
|
|
|
|
fmt.Fprintln(os.Stderr, " Alt + b Move back (left) one word")
|
|
|
|
fmt.Fprintln(os.Stderr, " Alt + f Move forward (right) one word")
|
|
|
|
fmt.Fprintln(os.Stderr, " Ctrl + k Delete the sentence after the cursor")
|
|
|
|
fmt.Fprintln(os.Stderr, " Ctrl + u Delete the sentence before the cursor")
|
2024-05-21 16:55:09 -07:00
|
|
|
fmt.Fprintln(os.Stderr, " Ctrl + w Delete the word before the cursor")
|
2024-01-04 15:20:26 -08:00
|
|
|
fmt.Fprintln(os.Stderr, "")
|
|
|
|
fmt.Fprintln(os.Stderr, " Ctrl + l Clear the screen")
|
|
|
|
fmt.Fprintln(os.Stderr, " Ctrl + c Stop the model from responding")
|
|
|
|
fmt.Fprintln(os.Stderr, " Ctrl + d Exit ollama (/bye)")
|
|
|
|
fmt.Fprintln(os.Stderr, "")
|
|
|
|
}
|
|
|
|
|
|
|
|
usageShow := func() {
|
|
|
|
fmt.Fprintln(os.Stderr, "Available Commands:")
|
2024-01-04 17:23:11 -08:00
|
|
|
fmt.Fprintln(os.Stderr, " /show info Show details for this model")
|
2024-01-04 15:20:26 -08:00
|
|
|
fmt.Fprintln(os.Stderr, " /show license Show model license")
|
|
|
|
fmt.Fprintln(os.Stderr, " /show modelfile Show Modelfile for this model")
|
|
|
|
fmt.Fprintln(os.Stderr, " /show parameters Show parameters for this model")
|
|
|
|
fmt.Fprintln(os.Stderr, " /show system Show system message")
|
|
|
|
fmt.Fprintln(os.Stderr, " /show template Show prompt template")
|
|
|
|
fmt.Fprintln(os.Stderr, "")
|
|
|
|
}
|
|
|
|
|
|
|
|
// only list out the most common parameters
|
|
|
|
usageParameters := func() {
|
|
|
|
fmt.Fprintln(os.Stderr, "Available Parameters:")
|
|
|
|
fmt.Fprintln(os.Stderr, " /set parameter seed <int> Random number seed")
|
|
|
|
fmt.Fprintln(os.Stderr, " /set parameter num_predict <int> Max number of tokens to predict")
|
|
|
|
fmt.Fprintln(os.Stderr, " /set parameter top_k <int> Pick from top k num of tokens")
|
|
|
|
fmt.Fprintln(os.Stderr, " /set parameter top_p <float> Pick token based on sum of probabilities")
|
|
|
|
fmt.Fprintln(os.Stderr, " /set parameter num_ctx <int> Set the context size")
|
|
|
|
fmt.Fprintln(os.Stderr, " /set parameter temperature <float> Set creativity level")
|
|
|
|
fmt.Fprintln(os.Stderr, " /set parameter repeat_penalty <float> How strongly to penalize repetitions")
|
|
|
|
fmt.Fprintln(os.Stderr, " /set parameter repeat_last_n <int> Set how far back to look for repetitions")
|
|
|
|
fmt.Fprintln(os.Stderr, " /set parameter num_gpu <int> The number of layers to send to the GPU")
|
2024-05-08 01:48:35 +02:00
|
|
|
fmt.Fprintln(os.Stderr, " /set parameter stop <string> <string> ... Set the stop parameters")
|
2024-01-04 15:20:26 -08:00
|
|
|
fmt.Fprintln(os.Stderr, "")
|
|
|
|
}
|
|
|
|
|
|
|
|
scanner, err := readline.New(readline.Prompt{
|
|
|
|
Prompt: ">>> ",
|
|
|
|
AltPrompt: "... ",
|
|
|
|
Placeholder: "Send a message (/? for help)",
|
|
|
|
AltPlaceholder: `Use """ to end multi-line input`,
|
|
|
|
})
|
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
|
2024-05-24 14:57:15 -07:00
|
|
|
if envconfig.NoHistory {
|
2024-05-18 11:51:57 -07:00
|
|
|
scanner.HistoryDisable()
|
|
|
|
}
|
|
|
|
|
2024-01-04 15:20:26 -08:00
|
|
|
fmt.Print(readline.StartBracketedPaste)
|
|
|
|
defer fmt.Printf(readline.EndBracketedPaste)
|
|
|
|
|
2024-01-05 15:51:33 -08:00
|
|
|
var sb strings.Builder
|
2024-01-04 15:20:26 -08:00
|
|
|
var multiline MultilineState
|
|
|
|
|
|
|
|
for {
|
|
|
|
line, err := scanner.Readline()
|
|
|
|
switch {
|
|
|
|
case errors.Is(err, io.EOF):
|
|
|
|
fmt.Println()
|
|
|
|
return nil
|
|
|
|
case errors.Is(err, readline.ErrInterrupt):
|
|
|
|
if line == "" {
|
|
|
|
fmt.Println("\nUse Ctrl + d or /bye to exit.")
|
|
|
|
}
|
|
|
|
|
|
|
|
scanner.Prompt.UseAlt = false
|
2024-01-05 15:51:33 -08:00
|
|
|
sb.Reset()
|
2024-01-04 15:20:26 -08:00
|
|
|
|
|
|
|
continue
|
|
|
|
case err != nil:
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
|
|
|
|
switch {
|
2024-01-05 15:51:33 -08:00
|
|
|
case multiline != MultilineNone:
|
|
|
|
// check if there's a multiline terminating string
|
|
|
|
before, ok := strings.CutSuffix(line, `"""`)
|
|
|
|
sb.WriteString(before)
|
|
|
|
if !ok {
|
|
|
|
fmt.Fprintln(&sb)
|
2024-01-04 15:20:26 -08:00
|
|
|
continue
|
|
|
|
}
|
|
|
|
|
|
|
|
switch multiline {
|
|
|
|
case MultilineSystem:
|
2024-01-05 15:51:33 -08:00
|
|
|
opts.System = sb.String()
|
2024-02-01 17:09:51 -08:00
|
|
|
opts.Messages = append(opts.Messages, api.Message{Role: "system", Content: opts.System})
|
2024-01-04 15:20:26 -08:00
|
|
|
fmt.Println("Set system message.")
|
2024-01-05 15:51:33 -08:00
|
|
|
sb.Reset()
|
2024-01-04 15:20:26 -08:00
|
|
|
case MultilineTemplate:
|
2024-01-05 15:51:33 -08:00
|
|
|
opts.Template = sb.String()
|
2024-01-04 15:20:26 -08:00
|
|
|
fmt.Println("Set prompt template.")
|
2024-01-05 15:51:33 -08:00
|
|
|
sb.Reset()
|
2024-01-04 15:20:26 -08:00
|
|
|
}
|
2024-01-05 15:51:33 -08:00
|
|
|
|
2024-01-04 15:20:26 -08:00
|
|
|
multiline = MultilineNone
|
2024-01-05 15:51:33 -08:00
|
|
|
scanner.Prompt.UseAlt = false
|
|
|
|
case strings.HasPrefix(line, `"""`):
|
|
|
|
line := strings.TrimPrefix(line, `"""`)
|
|
|
|
line, ok := strings.CutSuffix(line, `"""`)
|
|
|
|
sb.WriteString(line)
|
|
|
|
if !ok {
|
|
|
|
// no multiline terminating string; need more input
|
|
|
|
fmt.Fprintln(&sb)
|
|
|
|
multiline = MultilinePrompt
|
|
|
|
scanner.Prompt.UseAlt = true
|
|
|
|
}
|
2024-01-04 15:20:26 -08:00
|
|
|
case scanner.Pasting:
|
2024-01-05 15:51:33 -08:00
|
|
|
fmt.Fprintln(&sb, line)
|
2024-01-04 15:20:26 -08:00
|
|
|
continue
|
|
|
|
case strings.HasPrefix(line, "/list"):
|
|
|
|
args := strings.Fields(line)
|
|
|
|
if err := ListHandler(cmd, args[1:]); err != nil {
|
|
|
|
return err
|
|
|
|
}
|
2024-01-25 12:12:36 -08:00
|
|
|
case strings.HasPrefix(line, "/load"):
|
|
|
|
args := strings.Fields(line)
|
|
|
|
if len(args) != 2 {
|
|
|
|
fmt.Println("Usage:\n /load <modelname>")
|
|
|
|
continue
|
|
|
|
}
|
|
|
|
opts.Model = args[1]
|
|
|
|
opts.Messages = []api.Message{}
|
|
|
|
fmt.Printf("Loading model '%s'\n", opts.Model)
|
|
|
|
if err := loadModel(cmd, &opts); err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
continue
|
|
|
|
case strings.HasPrefix(line, "/save"):
|
|
|
|
args := strings.Fields(line)
|
|
|
|
if len(args) != 2 {
|
|
|
|
fmt.Println("Usage:\n /save <modelname>")
|
|
|
|
continue
|
|
|
|
}
|
|
|
|
|
|
|
|
client, err := api.ClientFromEnvironment()
|
|
|
|
if err != nil {
|
|
|
|
fmt.Println("error: couldn't connect to ollama server")
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
|
|
|
|
req := &api.CreateRequest{
|
|
|
|
Name: args[1],
|
|
|
|
Modelfile: buildModelfile(opts),
|
|
|
|
}
|
|
|
|
fn := func(resp api.ProgressResponse) error { return nil }
|
|
|
|
err = client.Create(cmd.Context(), req, fn)
|
|
|
|
if err != nil {
|
2024-05-13 18:48:28 -07:00
|
|
|
if strings.Contains(err.Error(), errtypes.InvalidModelNameErrMsg) {
|
|
|
|
fmt.Printf("error: The model name '%s' is invalid\n", args[1])
|
|
|
|
continue
|
|
|
|
}
|
2024-01-25 12:12:36 -08:00
|
|
|
return err
|
|
|
|
}
|
|
|
|
fmt.Printf("Created new model '%s'\n", args[1])
|
|
|
|
continue
|
2024-05-01 15:44:36 -06:00
|
|
|
case strings.HasPrefix(line, "/clear"):
|
|
|
|
opts.Messages = []api.Message{}
|
2024-05-14 11:38:20 -07:00
|
|
|
if opts.System != "" {
|
|
|
|
newMessage := api.Message{Role: "system", Content: opts.System}
|
|
|
|
opts.Messages = append(opts.Messages, newMessage)
|
|
|
|
}
|
2024-05-01 15:44:36 -06:00
|
|
|
fmt.Println("Cleared session context")
|
|
|
|
continue
|
2024-01-04 15:20:26 -08:00
|
|
|
case strings.HasPrefix(line, "/set"):
|
|
|
|
args := strings.Fields(line)
|
|
|
|
if len(args) > 1 {
|
|
|
|
switch args[1] {
|
|
|
|
case "history":
|
|
|
|
scanner.HistoryEnable()
|
|
|
|
case "nohistory":
|
|
|
|
scanner.HistoryDisable()
|
|
|
|
case "wordwrap":
|
|
|
|
opts.WordWrap = true
|
|
|
|
fmt.Println("Set 'wordwrap' mode.")
|
|
|
|
case "nowordwrap":
|
|
|
|
opts.WordWrap = false
|
|
|
|
fmt.Println("Set 'nowordwrap' mode.")
|
|
|
|
case "verbose":
|
2024-03-28 18:54:01 -07:00
|
|
|
if err := cmd.Flags().Set("verbose", "true"); err != nil {
|
|
|
|
return err
|
|
|
|
}
|
2024-01-04 15:20:26 -08:00
|
|
|
fmt.Println("Set 'verbose' mode.")
|
|
|
|
case "quiet":
|
2024-03-28 18:54:01 -07:00
|
|
|
if err := cmd.Flags().Set("verbose", "false"); err != nil {
|
|
|
|
return err
|
|
|
|
}
|
2024-01-04 15:20:26 -08:00
|
|
|
fmt.Println("Set 'quiet' mode.")
|
|
|
|
case "format":
|
|
|
|
if len(args) < 3 || args[2] != "json" {
|
|
|
|
fmt.Println("Invalid or missing format. For 'json' mode use '/set format json'")
|
|
|
|
} else {
|
|
|
|
opts.Format = args[2]
|
|
|
|
fmt.Printf("Set format to '%s' mode.\n", args[2])
|
|
|
|
}
|
|
|
|
case "noformat":
|
|
|
|
opts.Format = ""
|
|
|
|
fmt.Println("Disabled format.")
|
|
|
|
case "parameter":
|
|
|
|
if len(args) < 4 {
|
|
|
|
usageParameters()
|
|
|
|
continue
|
|
|
|
}
|
2023-12-15 14:07:34 -08:00
|
|
|
params := args[3:]
|
2024-01-04 15:20:26 -08:00
|
|
|
fp, err := api.FormatParams(map[string][]string{args[2]: params})
|
|
|
|
if err != nil {
|
2024-01-12 11:21:08 -08:00
|
|
|
fmt.Printf("Couldn't set parameter: %q\n", err)
|
2024-01-04 15:20:26 -08:00
|
|
|
continue
|
|
|
|
}
|
2024-01-12 11:21:08 -08:00
|
|
|
fmt.Printf("Set parameter '%s' to '%s'\n", args[2], strings.Join(params, ", "))
|
2024-01-04 15:20:26 -08:00
|
|
|
opts.Options[args[2]] = fp[args[2]]
|
|
|
|
case "system", "template":
|
|
|
|
if len(args) < 3 {
|
|
|
|
usageSet()
|
|
|
|
continue
|
|
|
|
}
|
2024-01-05 15:51:33 -08:00
|
|
|
|
|
|
|
if args[1] == "system" {
|
|
|
|
multiline = MultilineSystem
|
|
|
|
} else if args[1] == "template" {
|
|
|
|
multiline = MultilineTemplate
|
|
|
|
}
|
|
|
|
|
2024-01-04 15:20:26 -08:00
|
|
|
line := strings.Join(args[2:], " ")
|
2024-01-05 15:51:33 -08:00
|
|
|
line, ok := strings.CutPrefix(line, `"""`)
|
|
|
|
if !ok {
|
|
|
|
multiline = MultilineNone
|
2024-01-04 15:20:26 -08:00
|
|
|
} else {
|
2024-01-05 15:51:33 -08:00
|
|
|
// only cut suffix if the line is multiline
|
|
|
|
line, ok = strings.CutSuffix(line, `"""`)
|
|
|
|
if ok {
|
|
|
|
multiline = MultilineNone
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
sb.WriteString(line)
|
|
|
|
if multiline != MultilineNone {
|
|
|
|
scanner.Prompt.UseAlt = true
|
|
|
|
continue
|
|
|
|
}
|
|
|
|
|
|
|
|
if args[1] == "system" {
|
2024-02-16 14:42:43 -05:00
|
|
|
opts.System = sb.String() // for display in modelfile
|
|
|
|
newMessage := api.Message{Role: "system", Content: sb.String()}
|
|
|
|
// Check if the slice is not empty and the last message is from 'system'
|
|
|
|
if len(opts.Messages) > 0 && opts.Messages[len(opts.Messages)-1].Role == "system" {
|
|
|
|
// Replace the last message
|
|
|
|
opts.Messages[len(opts.Messages)-1] = newMessage
|
|
|
|
} else {
|
|
|
|
opts.Messages = append(opts.Messages, newMessage)
|
|
|
|
}
|
2024-01-04 15:20:26 -08:00
|
|
|
fmt.Println("Set system message.")
|
2024-02-01 17:09:51 -08:00
|
|
|
sb.Reset()
|
2024-01-05 15:51:33 -08:00
|
|
|
} else if args[1] == "template" {
|
|
|
|
opts.Template = sb.String()
|
|
|
|
fmt.Println("Set prompt template.")
|
2024-02-01 17:09:51 -08:00
|
|
|
sb.Reset()
|
2024-01-04 15:20:26 -08:00
|
|
|
}
|
2024-01-05 15:51:33 -08:00
|
|
|
|
|
|
|
sb.Reset()
|
|
|
|
continue
|
2024-01-04 15:20:26 -08:00
|
|
|
default:
|
|
|
|
fmt.Printf("Unknown command '/set %s'. Type /? for help\n", args[1])
|
|
|
|
}
|
|
|
|
} else {
|
|
|
|
usageSet()
|
|
|
|
}
|
|
|
|
case strings.HasPrefix(line, "/show"):
|
|
|
|
args := strings.Fields(line)
|
|
|
|
if len(args) > 1 {
|
|
|
|
client, err := api.ClientFromEnvironment()
|
|
|
|
if err != nil {
|
|
|
|
fmt.Println("error: couldn't connect to ollama server")
|
|
|
|
return err
|
|
|
|
}
|
2024-01-04 17:23:11 -08:00
|
|
|
req := &api.ShowRequest{
|
2024-01-05 15:06:43 -08:00
|
|
|
Name: opts.Model,
|
2024-01-04 17:23:11 -08:00
|
|
|
System: opts.System,
|
|
|
|
Template: opts.Template,
|
|
|
|
Options: opts.Options,
|
|
|
|
}
|
|
|
|
resp, err := client.Show(cmd.Context(), req)
|
2024-01-04 15:20:26 -08:00
|
|
|
if err != nil {
|
|
|
|
fmt.Println("error: couldn't get model")
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
|
|
|
|
switch args[1] {
|
2024-01-04 17:23:11 -08:00
|
|
|
case "info":
|
|
|
|
fmt.Println("Model details:")
|
|
|
|
if len(resp.Details.Families) > 0 {
|
|
|
|
fmt.Printf("Family %s\n", strings.Join(resp.Details.Families, ", "))
|
|
|
|
} else if resp.Details.Family != "" {
|
|
|
|
fmt.Printf("Family %s\n", resp.Details.Family)
|
|
|
|
}
|
|
|
|
fmt.Printf("Parameter Size %s\n", resp.Details.ParameterSize)
|
|
|
|
fmt.Printf("Quantization Level %s\n", resp.Details.QuantizationLevel)
|
|
|
|
fmt.Println("")
|
2024-01-04 15:20:26 -08:00
|
|
|
case "license":
|
|
|
|
if resp.License == "" {
|
2024-01-12 11:21:08 -08:00
|
|
|
fmt.Println("No license was specified for this model.")
|
2024-01-04 15:20:26 -08:00
|
|
|
} else {
|
|
|
|
fmt.Println(resp.License)
|
|
|
|
}
|
|
|
|
case "modelfile":
|
|
|
|
fmt.Println(resp.Modelfile)
|
|
|
|
case "parameters":
|
|
|
|
if resp.Parameters == "" {
|
2024-01-12 11:21:08 -08:00
|
|
|
fmt.Println("No parameters were specified for this model.")
|
2024-01-04 15:20:26 -08:00
|
|
|
} else {
|
|
|
|
if len(opts.Options) > 0 {
|
|
|
|
fmt.Println("User defined parameters:")
|
|
|
|
for k, v := range opts.Options {
|
|
|
|
fmt.Printf("%-*s %v\n", 30, k, v)
|
|
|
|
}
|
|
|
|
fmt.Println()
|
|
|
|
}
|
|
|
|
fmt.Println("Model defined parameters:")
|
|
|
|
fmt.Println(resp.Parameters)
|
|
|
|
}
|
|
|
|
case "system":
|
|
|
|
switch {
|
|
|
|
case opts.System != "":
|
|
|
|
fmt.Println(opts.System + "\n")
|
|
|
|
case resp.System != "":
|
|
|
|
fmt.Println(resp.System + "\n")
|
|
|
|
default:
|
2024-01-12 11:21:08 -08:00
|
|
|
fmt.Println("No system message was specified for this model.")
|
2024-01-04 15:20:26 -08:00
|
|
|
}
|
|
|
|
case "template":
|
|
|
|
switch {
|
|
|
|
case opts.Template != "":
|
|
|
|
fmt.Println(opts.Template + "\n")
|
|
|
|
case resp.Template != "":
|
|
|
|
fmt.Println(resp.Template)
|
|
|
|
default:
|
2024-01-12 11:21:08 -08:00
|
|
|
fmt.Println("No prompt template was specified for this model.")
|
2024-01-04 15:20:26 -08:00
|
|
|
}
|
|
|
|
default:
|
|
|
|
fmt.Printf("Unknown command '/show %s'. Type /? for help\n", args[1])
|
|
|
|
}
|
|
|
|
} else {
|
|
|
|
usageShow()
|
|
|
|
}
|
|
|
|
case strings.HasPrefix(line, "/help"), strings.HasPrefix(line, "/?"):
|
|
|
|
args := strings.Fields(line)
|
|
|
|
if len(args) > 1 {
|
|
|
|
switch args[1] {
|
|
|
|
case "set", "/set":
|
|
|
|
usageSet()
|
|
|
|
case "show", "/show":
|
|
|
|
usageShow()
|
|
|
|
case "shortcut", "shortcuts":
|
|
|
|
usageShortcuts()
|
|
|
|
}
|
|
|
|
} else {
|
|
|
|
usage()
|
|
|
|
}
|
2024-02-20 05:56:49 +03:00
|
|
|
case strings.HasPrefix(line, "/exit"), strings.HasPrefix(line, "/bye"):
|
2024-01-04 15:20:26 -08:00
|
|
|
return nil
|
|
|
|
case strings.HasPrefix(line, "/"):
|
|
|
|
args := strings.Fields(line)
|
|
|
|
isFile := false
|
|
|
|
|
2024-01-25 12:12:36 -08:00
|
|
|
if opts.MultiModal {
|
2024-01-04 15:20:26 -08:00
|
|
|
for _, f := range extractFileNames(line) {
|
|
|
|
if strings.HasPrefix(f, args[0]) {
|
|
|
|
isFile = true
|
|
|
|
break
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2024-01-05 15:51:33 -08:00
|
|
|
if !isFile {
|
2024-01-04 15:20:26 -08:00
|
|
|
fmt.Printf("Unknown command '%s'. Type /? for help\n", args[0])
|
|
|
|
continue
|
|
|
|
}
|
2024-01-05 15:51:33 -08:00
|
|
|
|
|
|
|
sb.WriteString(line)
|
2024-01-04 15:20:26 -08:00
|
|
|
default:
|
2024-01-05 15:51:33 -08:00
|
|
|
sb.WriteString(line)
|
2024-01-04 15:20:26 -08:00
|
|
|
}
|
|
|
|
|
2024-01-05 15:51:33 -08:00
|
|
|
if sb.Len() > 0 && multiline == MultilineNone {
|
2024-01-12 12:05:52 -08:00
|
|
|
newMessage := api.Message{Role: "user", Content: sb.String()}
|
|
|
|
|
2024-01-25 12:12:36 -08:00
|
|
|
if opts.MultiModal {
|
2024-01-12 12:05:52 -08:00
|
|
|
msg, images, err := extractFileData(sb.String())
|
2024-01-04 15:20:26 -08:00
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
2024-02-01 21:30:26 -08:00
|
|
|
|
|
|
|
// clear all previous images for better responses
|
|
|
|
if len(images) > 0 {
|
|
|
|
for i := range opts.Messages {
|
|
|
|
opts.Messages[i].Images = nil
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2024-01-12 12:05:52 -08:00
|
|
|
newMessage.Content = msg
|
2024-02-01 17:09:51 -08:00
|
|
|
newMessage.Images = images
|
2024-01-04 15:20:26 -08:00
|
|
|
}
|
2024-01-05 15:51:33 -08:00
|
|
|
|
2024-01-12 12:05:52 -08:00
|
|
|
opts.Messages = append(opts.Messages, newMessage)
|
|
|
|
|
|
|
|
assistant, err := chat(cmd, opts)
|
|
|
|
if err != nil {
|
2024-01-04 15:20:26 -08:00
|
|
|
return err
|
|
|
|
}
|
2024-01-12 12:05:52 -08:00
|
|
|
if assistant != nil {
|
|
|
|
opts.Messages = append(opts.Messages, *assistant)
|
|
|
|
}
|
2024-01-04 15:20:26 -08:00
|
|
|
|
2024-01-05 15:51:33 -08:00
|
|
|
sb.Reset()
|
2024-01-04 15:20:26 -08:00
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2024-01-25 12:12:36 -08:00
|
|
|
func buildModelfile(opts runOptions) string {
|
|
|
|
var mf strings.Builder
|
|
|
|
model := opts.ParentModel
|
|
|
|
if model == "" {
|
|
|
|
model = opts.Model
|
|
|
|
}
|
|
|
|
fmt.Fprintf(&mf, "FROM %s\n", model)
|
|
|
|
if opts.System != "" {
|
|
|
|
fmt.Fprintf(&mf, "SYSTEM \"\"\"%s\"\"\"\n", opts.System)
|
|
|
|
}
|
|
|
|
|
|
|
|
if opts.Template != "" {
|
|
|
|
fmt.Fprintf(&mf, "TEMPLATE \"\"\"%s\"\"\"\n", opts.Template)
|
|
|
|
}
|
|
|
|
|
|
|
|
keys := make([]string, 0)
|
|
|
|
for k := range opts.Options {
|
|
|
|
keys = append(keys, k)
|
|
|
|
}
|
|
|
|
sort.Strings(keys)
|
|
|
|
for _, k := range keys {
|
|
|
|
fmt.Fprintf(&mf, "PARAMETER %s %v\n", k, opts.Options[k])
|
|
|
|
}
|
|
|
|
fmt.Fprintln(&mf)
|
|
|
|
|
|
|
|
for _, msg := range opts.Messages {
|
|
|
|
fmt.Fprintf(&mf, "MESSAGE %s \"\"\"%s\"\"\"\n", msg.Role, msg.Content)
|
|
|
|
}
|
|
|
|
|
|
|
|
return mf.String()
|
|
|
|
}
|
|
|
|
|
2024-01-04 15:20:26 -08:00
|
|
|
func normalizeFilePath(fp string) string {
|
|
|
|
// Define a map of escaped characters and their replacements
|
|
|
|
replacements := map[string]string{
|
|
|
|
"\\ ": " ", // Escaped space
|
|
|
|
"\\(": "(", // Escaped left parenthesis
|
|
|
|
"\\)": ")", // Escaped right parenthesis
|
|
|
|
"\\[": "[", // Escaped left square bracket
|
|
|
|
"\\]": "]", // Escaped right square bracket
|
|
|
|
"\\{": "{", // Escaped left curly brace
|
|
|
|
"\\}": "}", // Escaped right curly brace
|
|
|
|
"\\$": "$", // Escaped dollar sign
|
|
|
|
"\\&": "&", // Escaped ampersand
|
|
|
|
"\\;": ";", // Escaped semicolon
|
|
|
|
"\\'": "'", // Escaped single quote
|
|
|
|
"\\\\": "\\", // Escaped backslash
|
|
|
|
"\\*": "*", // Escaped asterisk
|
|
|
|
"\\?": "?", // Escaped question mark
|
|
|
|
}
|
|
|
|
|
|
|
|
for escaped, actual := range replacements {
|
|
|
|
fp = strings.ReplaceAll(fp, escaped, actual)
|
|
|
|
}
|
|
|
|
return fp
|
|
|
|
}
|
|
|
|
|
|
|
|
func extractFileNames(input string) []string {
|
2024-01-06 10:50:27 -08:00
|
|
|
// Regex to match file paths starting with optional drive letter, / ./ \ or .\ and include escaped or unescaped spaces (\ or %20)
|
2024-01-04 15:20:26 -08:00
|
|
|
// and followed by more characters and a file extension
|
2024-01-06 10:50:27 -08:00
|
|
|
// This will capture non filename strings, but we'll check for file existence to remove mismatches
|
|
|
|
regexPattern := `(?:[a-zA-Z]:)?(?:\./|/|\\)[\S\\ ]+?\.(?i:jpg|jpeg|png|svg)\b`
|
2024-01-04 15:20:26 -08:00
|
|
|
re := regexp.MustCompile(regexPattern)
|
|
|
|
|
|
|
|
return re.FindAllString(input, -1)
|
|
|
|
}
|
|
|
|
|
2024-01-12 12:05:52 -08:00
|
|
|
func extractFileData(input string) (string, []api.ImageData, error) {
|
2024-01-04 15:20:26 -08:00
|
|
|
filePaths := extractFileNames(input)
|
2024-01-12 12:05:52 -08:00
|
|
|
var imgs []api.ImageData
|
2024-01-04 15:20:26 -08:00
|
|
|
|
|
|
|
for _, fp := range filePaths {
|
|
|
|
nfp := normalizeFilePath(fp)
|
|
|
|
data, err := getImageData(nfp)
|
|
|
|
if err != nil {
|
|
|
|
if os.IsNotExist(err) {
|
|
|
|
continue
|
|
|
|
}
|
2024-02-01 21:33:06 -08:00
|
|
|
fmt.Fprintf(os.Stderr, "Couldn't process image: %q\n", err)
|
2024-01-04 15:20:26 -08:00
|
|
|
return "", imgs, err
|
|
|
|
}
|
2024-02-01 21:33:06 -08:00
|
|
|
fmt.Fprintf(os.Stderr, "Added image '%s'\n", nfp)
|
2024-01-04 15:20:26 -08:00
|
|
|
input = strings.ReplaceAll(input, fp, "")
|
|
|
|
imgs = append(imgs, data)
|
|
|
|
}
|
|
|
|
return input, imgs, nil
|
|
|
|
}
|
|
|
|
|
|
|
|
func getImageData(filePath string) ([]byte, error) {
|
|
|
|
file, err := os.Open(filePath)
|
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
defer file.Close()
|
|
|
|
|
|
|
|
buf := make([]byte, 512)
|
|
|
|
_, err = file.Read(buf)
|
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
|
|
|
|
contentType := http.DetectContentType(buf)
|
2024-02-12 11:16:20 -08:00
|
|
|
allowedTypes := []string{"image/jpeg", "image/jpg", "image/png"}
|
2024-01-04 15:20:26 -08:00
|
|
|
if !slices.Contains(allowedTypes, contentType) {
|
|
|
|
return nil, fmt.Errorf("invalid image type: %s", contentType)
|
|
|
|
}
|
|
|
|
|
|
|
|
info, err := file.Stat()
|
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
|
|
|
|
// Check if the file size exceeds 100MB
|
|
|
|
var maxSize int64 = 100 * 1024 * 1024 // 100MB in bytes
|
|
|
|
if info.Size() > maxSize {
|
|
|
|
return nil, fmt.Errorf("file size exceeds maximum limit (100MB)")
|
|
|
|
}
|
|
|
|
|
|
|
|
buf = make([]byte, info.Size())
|
|
|
|
_, err = file.Seek(0, 0)
|
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
|
|
|
|
_, err = io.ReadFull(file, buf)
|
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
|
|
|
|
return buf, nil
|
|
|
|
}
|