ollama/template/template_test.go

344 lines
9.2 KiB
Go
Raw Normal View History

2024-06-10 21:54:42 +00:00
package template
import (
"bufio"
"bytes"
"encoding/json"
"io"
"os"
"path/filepath"
"slices"
2024-06-27 21:15:17 +00:00
"strings"
2024-06-10 21:54:42 +00:00
"testing"
2024-06-27 21:15:17 +00:00
"github.com/google/go-cmp/cmp"
2024-06-17 17:38:55 +00:00
"github.com/ollama/ollama/api"
2024-06-10 21:54:42 +00:00
"github.com/ollama/ollama/llm"
)
func TestNamed(t *testing.T) {
f, err := os.Open(filepath.Join("testdata", "templates.jsonl"))
if err != nil {
t.Fatal(err)
}
defer f.Close()
scanner := bufio.NewScanner(f)
for scanner.Scan() {
var ss map[string]string
if err := json.Unmarshal(scanner.Bytes(), &ss); err != nil {
t.Fatal(err)
}
for k, v := range ss {
t.Run(k, func(t *testing.T) {
kv := llm.KV{"tokenizer.chat_template": v}
s := kv.ChatTemplate()
r, err := Named(s)
if err != nil {
t.Fatal(err)
}
if r.Name != k {
t.Errorf("expected %q, got %q", k, r.Name)
}
var b bytes.Buffer
if _, err := io.Copy(&b, r.Reader()); err != nil {
t.Fatal(err)
}
2024-06-27 21:15:17 +00:00
tmpl, err := Parse(b.String())
2024-06-10 21:54:42 +00:00
if err != nil {
t.Fatal(err)
}
if tmpl.Tree.Root.String() == "" {
t.Errorf("empty %s template", k)
}
})
}
}
}
2024-06-27 21:15:17 +00:00
func TestTemplate(t *testing.T) {
cases := make(map[string][]api.Message)
for _, mm := range [][]api.Message{
{
{Role: "user", Content: "Hello, how are you?"},
},
{
{Role: "user", Content: "Hello, how are you?"},
{Role: "assistant", Content: "I'm doing great. How can I help you today?"},
{Role: "user", Content: "I'd like to show off how chat templating works!"},
},
{
{Role: "system", Content: "You are a helpful assistant."},
{Role: "user", Content: "Hello, how are you?"},
{Role: "assistant", Content: "I'm doing great. How can I help you today?"},
{Role: "user", Content: "I'd like to show off how chat templating works!"},
},
} {
var roles []string
for _, m := range mm {
roles = append(roles, m.Role)
}
cases[strings.Join(roles, "-")] = mm
}
matches, err := filepath.Glob("*.gotmpl")
if err != nil {
t.Fatal(err)
}
for _, match := range matches {
t.Run(match, func(t *testing.T) {
bts, err := os.ReadFile(match)
if err != nil {
t.Fatal(err)
}
tmpl, err := Parse(string(bts))
if err != nil {
t.Fatal(err)
}
for n, tt := range cases {
var actual bytes.Buffer
2024-06-27 21:15:17 +00:00
t.Run(n, func(t *testing.T) {
if err := tmpl.Execute(&actual, Values{Messages: tt}); err != nil {
t.Fatal(err)
}
expect, err := os.ReadFile(filepath.Join("testdata", match, n))
if err != nil {
t.Fatal(err)
}
if diff := cmp.Diff(actual.Bytes(), expect); diff != "" {
t.Errorf("mismatch (-got +want):\n%s", diff)
}
})
t.Run("legacy", func(t *testing.T) {
var legacy bytes.Buffer
if err := tmpl.Execute(&legacy, Values{Messages: tt, forceLegacy: true}); err != nil {
t.Fatal(err)
}
legacyBytes := legacy.Bytes()
if slices.Contains([]string{"chatqa.gotmpl", "openchat.gotmpl", "vicuna.gotmpl"}, match) && legacyBytes[len(legacyBytes)-1] == ' ' {
t.Log("removing trailing space from legacy output")
legacyBytes = legacyBytes[:len(legacyBytes)-1]
} else if slices.Contains([]string{"codellama-70b-instruct.gotmpl", "llama2-chat.gotmpl", "mistral-instruct.gotmpl"}, match) {
t.Skip("legacy outputs cannot be compared to messages outputs")
}
if diff := cmp.Diff(legacyBytes, actual.Bytes()); diff != "" {
t.Errorf("mismatch (-got +want):\n%s", diff)
}
})
2024-06-27 21:15:17 +00:00
}
})
}
}
2024-06-10 21:54:42 +00:00
func TestParse(t *testing.T) {
cases := []struct {
2024-06-11 21:03:42 +00:00
template string
vars []string
2024-06-10 21:54:42 +00:00
}{
2024-06-17 17:38:55 +00:00
{"{{ .Prompt }}", []string{"prompt", "response"}},
{"{{ .System }} {{ .Prompt }}", []string{"prompt", "response", "system"}},
2024-06-10 21:54:42 +00:00
{"{{ .System }} {{ .Prompt }} {{ .Response }}", []string{"prompt", "response", "system"}},
2024-06-17 17:38:55 +00:00
{"{{ with .Tools }}{{ . }}{{ end }} {{ .System }} {{ .Prompt }}", []string{"prompt", "response", "system", "tools"}},
2024-06-10 21:54:42 +00:00
{"{{ range .Messages }}{{ .Role }} {{ .Content }}{{ end }}", []string{"content", "messages", "role"}},
{"{{ range .Messages }}{{ if eq .Role \"system\" }}SYSTEM: {{ .Content }}{{ else if eq .Role \"user\" }}USER: {{ .Content }}{{ else if eq .Role \"assistant\" }}ASSISTANT: {{ .Content }}{{ end }}{{ end }}", []string{"content", "messages", "role"}},
{`{{- if .Messages }}
{{- if .System }}<|im_start|>system
{{ .System }}<|im_end|>
{{ end }}
{{- range .Messages }}<|im_start|>{{ .Role }}
{{ .Content }}<|im_end|>
{{ end }}<|im_start|>assistant
{{ else -}}
{{ if .System }}<|im_start|>system
{{ .System }}<|im_end|>
{{ end }}{{ if .Prompt }}<|im_start|>user
{{ .Prompt }}<|im_end|>
{{ end }}<|im_start|>assistant
{{ .Response }}<|im_end|>
{{- end -}}`, []string{"content", "messages", "prompt", "response", "role", "system"}},
2024-06-10 21:54:42 +00:00
}
for _, tt := range cases {
t.Run("", func(t *testing.T) {
tmpl, err := Parse(tt.template)
if err != nil {
t.Fatal(err)
}
if diff := cmp.Diff(tmpl.Vars(), tt.vars); diff != "" {
t.Errorf("mismatch (-got +want):\n%s", diff)
2024-06-10 21:54:42 +00:00
}
})
}
}
2024-06-17 17:38:55 +00:00
// TestExecuteWithMessages is a table-driven test. Each case ("mistral",
// "mistral system", "chatml", "moondream") carries several template variants
// ("no response", "response", "messages"), one shared Values and one expected
// string. Every variant is parsed, executed with the case's Values, and its
// output must equal the case's expected string exactly.
//
// NOTE(review): the template and expected literals are whitespace-sensitive.
// Several templates emit "\n\n" (for example after the system prompt), so
// confirm the matching blank lines are present in the expected strings.
func TestExecuteWithMessages(t *testing.T) {
2024-06-20 18:00:08 +00:00
// template pairs a subtest name with the template source to parse and render.
type template struct {
name string
template string
}
2024-06-17 17:38:55 +00:00
// cases: name of the subtest group, template variants to render, the input
// values shared by all variants, and the output every variant must produce.
cases := []struct {
2024-06-20 18:00:08 +00:00
name string
templates []template
2024-06-17 17:38:55 +00:00
values Values
expected string
}{
{
2024-06-20 18:00:08 +00:00
"mistral",
[]template{
{"no response", `[INST] {{ if .System }}{{ .System }}{{ "\n\n" }}{{ end }}{{ .Prompt }}[/INST] `},
{"response", `[INST] {{ if .System }}{{ .System }}{{ "\n\n" }}{{ end }}{{ .Prompt }}[/INST] {{ .Response }}`},
2024-07-03 20:49:14 +00:00
{"messages", `{{- range $index, $_ := .Messages }}
{{- if eq .Role "user" }}[INST] {{ if and (eq $index 0) $.System }}{{ $.System }}{{ "\n\n" }}
2024-06-17 17:38:55 +00:00
{{- end }}{{ .Content }}[/INST] {{ else if eq .Role "assistant" }}{{ .Content }}
{{- end }}
2024-06-20 18:00:08 +00:00
{{- end }}`},
2024-06-17 17:38:55 +00:00
},
Values{
Messages: []api.Message{
{Role: "user", Content: "Hello friend!"},
{Role: "assistant", Content: "Hello human!"},
2024-06-20 18:00:08 +00:00
{Role: "user", Content: "What is your name?"},
2024-06-17 17:38:55 +00:00
},
},
2024-06-20 18:00:08 +00:00
`[INST] Hello friend![/INST] Hello human![INST] What is your name?[/INST] `,
2024-06-17 17:38:55 +00:00
},
{
2024-06-20 18:00:08 +00:00
"mistral system",
[]template{
{"no response", `[INST] {{ if .System }}{{ .System }}{{ "\n\n" }}{{ end }}{{ .Prompt }}[/INST] `},
{"response", `[INST] {{ if .System }}{{ .System }}{{ "\n\n" }}{{ end }}{{ .Prompt }}[/INST] {{ .Response }}`},
{"messages", `
2024-07-03 20:49:14 +00:00
{{- range $index, $_ := .Messages }}
{{- if eq .Role "user" }}[INST] {{ if and (eq $index 0) $.System }}{{ $.System }}{{ "\n\n" }}
2024-06-17 17:38:55 +00:00
{{- end }}{{ .Content }}[/INST] {{ else if eq .Role "assistant" }}{{ .Content }}
{{- end }}
2024-06-20 18:00:08 +00:00
{{- end }}`},
2024-06-17 17:38:55 +00:00
},
Values{
Messages: []api.Message{
{Role: "system", Content: "You are a helpful assistant!"},
{Role: "user", Content: "Hello friend!"},
{Role: "assistant", Content: "Hello human!"},
2024-06-20 18:00:08 +00:00
{Role: "user", Content: "What is your name?"},
2024-06-17 17:38:55 +00:00
},
},
`[INST] You are a helpful assistant!
2024-06-17 17:38:55 +00:00
Hello friend![/INST] Hello human![INST] What is your name?[/INST] `,
2024-06-17 17:38:55 +00:00
},
{
2024-06-20 18:00:08 +00:00
"chatml",
[]template{
// this does not have a "no response" test because it's impossible to render the same output
{"response", `{{ if .System }}<|im_start|>system
2024-06-17 17:38:55 +00:00
{{ .System }}<|im_end|>
{{ end }}{{ if .Prompt }}<|im_start|>user
{{ .Prompt }}<|im_end|>
{{ end }}<|im_start|>assistant
{{ .Response }}<|im_end|>
2024-06-20 18:00:08 +00:00
`},
{"messages", `
2024-07-03 20:49:14 +00:00
{{- range $index, $_ := .Messages }}
{{- if and (eq .Role "user") (eq $index 0) $.System }}<|im_start|>system
2024-06-20 18:00:08 +00:00
{{ $.System }}<|im_end|>{{ "\n" }}
2024-06-17 17:38:55 +00:00
{{- end }}<|im_start|>{{ .Role }}
2024-06-20 18:00:08 +00:00
{{ .Content }}<|im_end|>{{ "\n" }}
2024-06-17 17:38:55 +00:00
{{- end }}<|im_start|>assistant
2024-06-20 18:00:08 +00:00
`},
2024-06-17 17:38:55 +00:00
},
Values{
Messages: []api.Message{
{Role: "system", Content: "You are a helpful assistant!"},
{Role: "user", Content: "Hello friend!"},
{Role: "assistant", Content: "Hello human!"},
2024-06-20 18:00:08 +00:00
{Role: "user", Content: "What is your name?"},
2024-06-17 17:38:55 +00:00
},
},
`<|im_start|>system
You are a helpful assistant!<|im_end|>
<|im_start|>user
2024-06-17 17:38:55 +00:00
Hello friend!<|im_end|>
<|im_start|>assistant
Hello human!<|im_end|>
<|im_start|>user
2024-06-20 18:00:08 +00:00
What is your name?<|im_end|>
2024-06-17 17:38:55 +00:00
<|im_start|>assistant
`,
},
{
2024-06-20 18:00:08 +00:00
"moondream",
[]template{
// this does not have a "no response" test because it's impossible to render the same output
{"response", `{{ if .Prompt }}Question: {{ .Prompt }}
2024-06-17 17:38:55 +00:00
{{ end }}Answer: {{ .Response }}
2024-06-20 18:00:08 +00:00
`},
{"messages", `
2024-06-17 17:38:55 +00:00
{{- range .Messages }}
2024-06-20 18:00:08 +00:00
{{- if eq .Role "user" }}Question: {{ .Content }}{{ "\n\n" }}
{{- else if eq .Role "assistant" }}Answer: {{ .Content }}{{ "\n\n" }}
2024-06-17 17:38:55 +00:00
{{- end }}
2024-06-20 18:00:08 +00:00
{{- end }}Answer: `},
2024-06-17 17:38:55 +00:00
},
Values{
Messages: []api.Message{
{Role: "user", Content: "What's in this image?", Images: []api.ImageData{[]byte("")}},
{Role: "assistant", Content: "It's a hot dog."},
{Role: "user", Content: "What's in _this_ image?"},
{Role: "user", Images: []api.ImageData{[]byte("")}},
{Role: "user", Content: "Is it a hot dog?"},
},
},
`Question: [img-0] What's in this image?
Answer: It's a hot dog.
Question: What's in _this_ image?
[img-1]
Is it a hot dog?
Answer: `,
},
}
// One subtest per case, with a nested subtest per template variant.
for _, tt := range cases {
2024-06-20 18:00:08 +00:00
t.Run(tt.name, func(t *testing.T) {
for _, ttt := range tt.templates {
t.Run(ttt.name, func(t *testing.T) {
tmpl, err := Parse(ttt.template)
2024-06-17 17:38:55 +00:00
if err != nil {
t.Fatal(err)
}
// Every variant is executed with the same values and compared against the
// same expected string, so all variants of a case must render identically.
var b bytes.Buffer
if err := tmpl.Execute(&b, tt.values); err != nil {
t.Fatal(err)
}
if diff := cmp.Diff(b.String(), tt.expected); diff != "" {
t.Errorf("mismatch (-got +want):\n%s", diff)
2024-06-17 17:38:55 +00:00
}
})
}
})
}
}