ollama/server/prompt.go

package server

import (
	"bytes"
	"context"
	"log/slog"
	"slices"

	"github.com/ollama/ollama/api"
	"github.com/ollama/ollama/llm"
	"github.com/ollama/ollama/template"
)

// tokenizeFunc turns a string into a slice of ints, or returns an error.
// chatPrompt calls it on each rendered prompt and uses the length of the
// returned slice as that prompt's token count.
type tokenizeFunc func(context.Context, string) ([]int, error)

// chatPrompt accepts a list of messages and returns the prompt and images that should be used for the next chat turn.
//
// System messages are pulled out of msgs and placed ahead of the remaining messages when the template is executed;
// if msgs contains none and the model defines one, m.System is used instead. The latest message is always included.
// Older messages are then added back, newest first, for as long as the tokenized prompt (plus a fixed per-image
// cost when m.ProjectorPaths is non-nil) does not exceed opts.NumCtx.
//
// The caller's msgs slice is not modified. When no non-system messages remain, the prompt is rendered from the
// system messages alone and no images are returned. Errors from template execution and from tokenize are returned
// as-is.
func chatPrompt(ctx context.Context, m *Model, tokenize tokenizeFunc, opts *api.Options, msgs []api.Message) (prompt string, images []llm.ImageData, _ error) {
	// pull out any system messages which should always be included in the prompt.
	// slices.DeleteFunc compacts its argument in place, so filter a copy to leave
	// the caller's slice untouched
	var system []api.Message
	msgs = slices.DeleteFunc(slices.Clone(msgs), func(msg api.Message) bool {
		if msg.Role == "system" {
			system = append(system, msg)
			return true
		}

		return false
	})

	if len(system) == 0 && m.System != "" {
		// add model system prompt since it wasn't provided
		system = append(system, api.Message{Role: "system", Content: m.System})
	}

	// always include the last message; clamp to 0 so that an empty message list
	// yields the empty slice msgs[0:] below instead of an out-of-range msgs[-1:]
	n := max(len(msgs)-1, 0)
	// in reverse, find all messages that fit into context window
	for i := n - 1; i >= 0; i-- {
		var b bytes.Buffer
		if err := m.Template.Execute(&b, template.Values{Messages: append(system, msgs[i:]...)}); err != nil {
			return "", nil, err
		}

		s, err := tokenize(ctx, b.String())
		if err != nil {
			return "", nil, err
		}

		c := len(s)
		if m.ProjectorPaths != nil {
			for _, msg := range msgs[i:] {
				// images are represented as 768 sized embeddings
				// TODO: get embedding length from project metadata
				c += 768 * len(msg.Images)
			}
		}

		if c > opts.NumCtx {
			// the logged value is the size of the window that did not fit
			slog.Debug("truncating input messages which exceed context length", "truncated", len(msgs[i:]))
			break
		}

		// msgs[i:] fits, so extend the window back to i
		n = i
	}

	// truncate any messages that do not fit into the context window
	var b bytes.Buffer
	if err := m.Template.Execute(&b, template.Values{Messages: append(system, msgs[n:]...)}); err != nil {
		return "", nil, err
	}

	// collect the images of the kept messages, numbering them in order of appearance
	for _, msg := range msgs[n:] {
		for _, data := range msg.Images {
			images = append(images, llm.ImageData{
				ID:   len(images),
				Data: data,
			})
		}
	}

	return b.String(), images, nil
}
Fix issues with templating prompt in chat mode (#2460) 2024-02-12 23:06:57 +00:00			`package server`

			`import (`
update message processing 2024-06-17 17:38:55 +00:00			`"bytes"`
			`"context"`
Fix issues with templating prompt in chat mode (#2460) 2024-02-12 23:06:57 +00:00			`"log/slog"`
update message processing 2024-06-17 17:38:55 +00:00			`"slices"`
Fix issues with templating prompt in chat mode (#2460) 2024-02-12 23:06:57 +00:00
change `github.com/jmorganca/ollama` to `github.com/ollama/ollama` (#3347) 2024-03-26 20:04:17 +00:00			`"github.com/ollama/ollama/api"`
update message processing 2024-06-17 17:38:55 +00:00			`"github.com/ollama/ollama/llm"`
rename templates to template 2024-06-10 21:54:42 +00:00			`"github.com/ollama/ollama/template"`
Fix issues with templating prompt in chat mode (#2460) 2024-02-12 23:06:57 +00:00			`)`

comments 2024-06-20 18:00:08 +00:00			`type tokenizeFunc func(context.Context, string) ([]int, error)`

			`// chatPrompt accepts a list of messages and returns the prompt and images that should be used for the next chat turn.`
			`// chatPrompt truncates any messages that exceed the context window of the model, making sure to always include 1) the`
			`// latest message and 2) system messages`
			`func chatPrompt(ctx context.Context, m Model, tokenize tokenizeFunc, opts api.Options, msgs []api.Message) (prompt string, images []llm.ImageData, _ error) {`
			`// pull out any system messages which should always be included in the prompt`
update message processing 2024-06-17 17:38:55 +00:00			`var system []api.Message`
			`msgs = slices.DeleteFunc(msgs, func(m api.Message) bool {`
			`if m.Role == "system" {`
			`system = append(system, m)`
			`return true`
Fix issues with templating prompt in chat mode (#2460) 2024-02-12 23:06:57 +00:00			`}`

update message processing 2024-06-17 17:38:55 +00:00			`return false`
			`})`
Fix issues with templating prompt in chat mode (#2460) 2024-02-12 23:06:57 +00:00
comments 2024-06-20 18:00:08 +00:00			`if len(system) == 0 && m.System != "" {`
update message processing 2024-06-17 17:38:55 +00:00			`// add model system prompt since it wasn't provided`
comments 2024-06-20 18:00:08 +00:00			`system = append(system, api.Message{Role: "system", Content: m.System})`
Fix issues with templating prompt in chat mode (#2460) 2024-02-12 23:06:57 +00:00			`}`

comments 2024-06-20 18:00:08 +00:00			`// always include the last message`
update message processing 2024-06-17 17:38:55 +00:00			`n := len(msgs) - 1`
comments 2024-06-20 18:00:08 +00:00			`// in reverse, find all messages that fit into context window`
update message processing 2024-06-17 17:38:55 +00:00			`for i := n - 1; i >= 0; i-- {`
			`var b bytes.Buffer`
comments 2024-06-20 18:00:08 +00:00			`if err := m.Template.Execute(&b, template.Values{Messages: append(system, msgs[i:]...)}); err != nil {`
update message processing 2024-06-17 17:38:55 +00:00			`return "", nil, err`
Fix issues with templating prompt in chat mode (#2460) 2024-02-12 23:06:57 +00:00			`}`

comments 2024-06-20 18:00:08 +00:00			`s, err := tokenize(ctx, b.String())`
Fix issues with templating prompt in chat mode (#2460) 2024-02-12 23:06:57 +00:00			`if err != nil {`
update message processing 2024-06-17 17:38:55 +00:00			`return "", nil, err`
Fix issues with templating prompt in chat mode (#2460) 2024-02-12 23:06:57 +00:00			`}`

update message processing 2024-06-17 17:38:55 +00:00			`c := len(s)`
comments 2024-06-20 18:00:08 +00:00			`if m.ProjectorPaths != nil {`
update message processing 2024-06-17 17:38:55 +00:00			`for _, m := range msgs[i:] {`
comments 2024-06-20 18:00:08 +00:00			`// images are represented as 768 sized embeddings`
			`// TODO: get embedding length from project metadata`
update message processing 2024-06-17 17:38:55 +00:00			`c += 768 * len(m.Images)`
			`}`
Fix issues with templating prompt in chat mode (#2460) 2024-02-12 23:06:57 +00:00			`}`

comments 2024-06-20 18:00:08 +00:00			`if c > opts.NumCtx {`
update message processing 2024-06-17 17:38:55 +00:00			`slog.Debug("truncating input messages which exceed context length", "truncated", len(msgs[i:]))`
Fix issues with templating prompt in chat mode (#2460) 2024-02-12 23:06:57 +00:00			`break`
update message processing 2024-06-17 17:38:55 +00:00			`} else {`
			`n = i`
Fix issues with templating prompt in chat mode (#2460) 2024-02-12 23:06:57 +00:00			`}`
update message processing 2024-06-17 17:38:55 +00:00			`}`
Fix issues with templating prompt in chat mode (#2460) 2024-02-12 23:06:57 +00:00
comments 2024-06-20 18:00:08 +00:00			`// truncate any messages that do not fit into the context window`
update message processing 2024-06-17 17:38:55 +00:00			`var b bytes.Buffer`
comments 2024-06-20 18:00:08 +00:00			`if err := m.Template.Execute(&b, template.Values{Messages: append(system, msgs[n:]...)}); err != nil {`
update message processing 2024-06-17 17:38:55 +00:00			`return "", nil, err`
Fix issues with templating prompt in chat mode (#2460) 2024-02-12 23:06:57 +00:00			`}`

update message processing 2024-06-17 17:38:55 +00:00			`for _, m := range msgs[n:] {`
			`for _, i := range m.Images {`
			`images = append(images, llm.ImageData{`
			`ID: len(images),`
			`Data: i,`
			`})`
Fix issues with templating prompt in chat mode (#2460) 2024-02-12 23:06:57 +00:00			`}`
			`}`

update message processing 2024-06-17 17:38:55 +00:00			`return b.String(), images, nil`
Fix issues with templating prompt in chat mode (#2460) 2024-02-12 23:06:57 +00:00			`}`