package parser import ( "bytes" "fmt" "io" "strings" "testing" "github.com/stretchr/testify/assert" ) func TestParser(t *testing.T) { input := ` FROM model1 ADAPTER adapter1 LICENSE MIT PARAMETER param1 value1 PARAMETER param2 value2 TEMPLATE template1 ` reader := strings.NewReader(input) commands, err := Parse(reader) assert.Nil(t, err) expectedCommands := []Command{ {Name: "model", Args: "model1"}, {Name: "adapter", Args: "adapter1"}, {Name: "license", Args: "MIT"}, {Name: "param1", Args: "value1"}, {Name: "param2", Args: "value2"}, {Name: "template", Args: "template1"}, } assert.Equal(t, expectedCommands, commands) } func TestParserFrom(t *testing.T) { var cases = []struct { input string expected []Command err error }{ { "FROM foo", []Command{{Name: "model", Args: "foo"}}, nil, }, { "FROM /path/to/model", []Command{{Name: "model", Args: "/path/to/model"}}, nil, }, { "FROM /path/to/model/fp16.bin", []Command{{Name: "model", Args: "/path/to/model/fp16.bin"}}, nil, }, { "FROM llama3:latest", []Command{{Name: "model", Args: "llama3:latest"}}, nil, }, { "FROM llama3:7b-instruct-q4_K_M", []Command{{Name: "model", Args: "llama3:7b-instruct-q4_K_M"}}, nil, }, { "", nil, errMissingFrom, }, { "PARAMETER param1 value1", nil, errMissingFrom, }, { "PARAMETER param1 value1\nFROM foo", []Command{{Name: "param1", Args: "value1"}, {Name: "model", Args: "foo"}}, nil, }, } for _, c := range cases { t.Run("", func(t *testing.T) { commands, err := Parse(strings.NewReader(c.input)) assert.ErrorIs(t, err, c.err) assert.Equal(t, c.expected, commands) }) } } func TestParserParametersMissingValue(t *testing.T) { input := ` FROM foo PARAMETER param1 ` reader := strings.NewReader(input) _, err := Parse(reader) assert.ErrorIs(t, err, io.ErrUnexpectedEOF) } func TestParserBadCommand(t *testing.T) { input := ` FROM foo BADCOMMAND param1 value1 ` _, err := Parse(strings.NewReader(input)) assert.ErrorIs(t, err, errInvalidCommand) } func TestParserMessages(t *testing.T) { var cases = []struct { input string expected []Command err error }{ { ` FROM foo MESSAGE system You are a Parser. Always Parse things. `, []Command{ {Name: "model", Args: "foo"}, {Name: "message", Args: "system: You are a Parser. Always Parse things."}, }, nil, }, { ` FROM foo MESSAGE system You are a Parser. Always Parse things.`, []Command{ {Name: "model", Args: "foo"}, {Name: "message", Args: "system: You are a Parser. Always Parse things."}, }, nil, }, { ` FROM foo MESSAGE system You are a Parser. Always Parse things. MESSAGE user Hey there! MESSAGE assistant Hello, I want to parse all the things! `, []Command{ {Name: "model", Args: "foo"}, {Name: "message", Args: "system: You are a Parser. Always Parse things."}, {Name: "message", Args: "user: Hey there!"}, {Name: "message", Args: "assistant: Hello, I want to parse all the things!"}, }, nil, }, { ` FROM foo MESSAGE system """ You are a multiline Parser. Always Parse things. """ `, []Command{ {Name: "model", Args: "foo"}, {Name: "message", Args: "system: \nYou are a multiline Parser. Always Parse things.\n"}, }, nil, }, { ` FROM foo MESSAGE badguy I'm a bad guy! `, nil, errInvalidMessageRole, }, { ` FROM foo MESSAGE system `, nil, io.ErrUnexpectedEOF, }, { ` FROM foo MESSAGE system`, nil, io.ErrUnexpectedEOF, }, } for _, c := range cases { t.Run("", func(t *testing.T) { commands, err := Parse(strings.NewReader(c.input)) assert.ErrorIs(t, err, c.err) assert.Equal(t, c.expected, commands) }) } } func TestParserQuoted(t *testing.T) { var cases = []struct { multiline string expected []Command err error }{ { ` FROM foo SYSTEM """ This is a multiline system. """ `, []Command{ {Name: "model", Args: "foo"}, {Name: "system", Args: "\nThis is a\nmultiline system.\n"}, }, nil, }, { ` FROM foo SYSTEM """ This is a multiline system.""" `, []Command{ {Name: "model", Args: "foo"}, {Name: "system", Args: "\nThis is a\nmultiline system."}, }, nil, }, { ` FROM foo SYSTEM """This is a multiline system.""" `, []Command{ {Name: "model", Args: "foo"}, {Name: "system", Args: "This is a\nmultiline system."}, }, nil, }, { ` FROM foo SYSTEM """This is a multiline system.""" `, []Command{ {Name: "model", Args: "foo"}, {Name: "system", Args: "This is a multiline system."}, }, nil, }, { ` FROM foo SYSTEM """This is a multiline system."" `, nil, io.ErrUnexpectedEOF, }, { ` FROM foo SYSTEM " `, nil, io.ErrUnexpectedEOF, }, { ` FROM foo SYSTEM """ This is a multiline system with "quotes". """ `, []Command{ {Name: "model", Args: "foo"}, {Name: "system", Args: "\nThis is a multiline system with \"quotes\".\n"}, }, nil, }, { ` FROM foo SYSTEM """""" `, []Command{ {Name: "model", Args: "foo"}, {Name: "system", Args: ""}, }, nil, }, { ` FROM foo SYSTEM "" `, []Command{ {Name: "model", Args: "foo"}, {Name: "system", Args: ""}, }, nil, }, { ` FROM foo SYSTEM "'" `, []Command{ {Name: "model", Args: "foo"}, {Name: "system", Args: "'"}, }, nil, }, { ` FROM foo SYSTEM """''"'""'""'"'''''""'""'""" `, []Command{ {Name: "model", Args: "foo"}, {Name: "system", Args: `''"'""'""'"'''''""'""'`}, }, nil, }, { ` FROM foo TEMPLATE """ {{ .Prompt }} """`, []Command{ {Name: "model", Args: "foo"}, {Name: "template", Args: "\n{{ .Prompt }}\n"}, }, nil, }, } for _, c := range cases { t.Run("", func(t *testing.T) { commands, err := Parse(strings.NewReader(c.multiline)) assert.ErrorIs(t, err, c.err) assert.Equal(t, c.expected, commands) }) } } func TestParserParameters(t *testing.T) { var cases = map[string]struct { name, value string }{ "numa true": {"numa", "true"}, "num_ctx 1": {"num_ctx", "1"}, "num_batch 1": {"num_batch", "1"}, "num_gqa 1": {"num_gqa", "1"}, "num_gpu 1": {"num_gpu", "1"}, "main_gpu 1": {"main_gpu", "1"}, "low_vram true": {"low_vram", "true"}, "f16_kv true": {"f16_kv", "true"}, "logits_all true": {"logits_all", "true"}, "vocab_only true": {"vocab_only", "true"}, "use_mmap true": {"use_mmap", "true"}, "use_mlock true": {"use_mlock", "true"}, "num_thread 1": {"num_thread", "1"}, "num_keep 1": {"num_keep", "1"}, "seed 1": {"seed", "1"}, "num_predict 1": {"num_predict", "1"}, "top_k 1": {"top_k", "1"}, "top_p 1.0": {"top_p", "1.0"}, "tfs_z 1.0": {"tfs_z", "1.0"}, "typical_p 1.0": {"typical_p", "1.0"}, "repeat_last_n 1": {"repeat_last_n", "1"}, "temperature 1.0": {"temperature", "1.0"}, "repeat_penalty 1.0": {"repeat_penalty", "1.0"}, "presence_penalty 1.0": {"presence_penalty", "1.0"}, "frequency_penalty 1.0": {"frequency_penalty", "1.0"}, "mirostat 1": {"mirostat", "1"}, "mirostat_tau 1.0": {"mirostat_tau", "1.0"}, "mirostat_eta 1.0": {"mirostat_eta", "1.0"}, "penalize_newline true": {"penalize_newline", "true"}, "stop ### User:": {"stop", "### User:"}, "stop ### User: ": {"stop", "### User: "}, "stop \"### User:\"": {"stop", "### User:"}, "stop \"### User: \"": {"stop", "### User: "}, "stop \"\"\"### User:\"\"\"": {"stop", "### User:"}, "stop \"\"\"### User:\n\"\"\"": {"stop", "### User:\n"}, "stop <|endoftext|>": {"stop", "<|endoftext|>"}, "stop <|eot_id|>": {"stop", "<|eot_id|>"}, "stop ": {"stop", ""}, } for k, v := range cases { t.Run(k, func(t *testing.T) { var b bytes.Buffer fmt.Fprintln(&b, "FROM foo") fmt.Fprintln(&b, "PARAMETER", k) commands, err := Parse(&b) assert.Nil(t, err) assert.Equal(t, []Command{ {Name: "model", Args: "foo"}, {Name: v.name, Args: v.value}, }, commands) }) } } func TestParserComments(t *testing.T) { var cases = []struct { input string expected []Command }{ { ` # comment FROM foo `, []Command{ {Name: "model", Args: "foo"}, }, }, } for _, c := range cases { t.Run("", func(t *testing.T) { commands, err := Parse(strings.NewReader(c.input)) assert.Nil(t, err) assert.Equal(t, c.expected, commands) }) } } func TestParseFormatParse(t *testing.T) { var cases = []string{ ` FROM foo ADAPTER adapter1 LICENSE MIT PARAMETER param1 value1 PARAMETER param2 value2 TEMPLATE template1 MESSAGE system You are a Parser. Always Parse things. MESSAGE user Hey there! MESSAGE assistant Hello, I want to parse all the things! `, ` FROM foo ADAPTER adapter1 LICENSE MIT PARAMETER param1 value1 PARAMETER param2 value2 TEMPLATE template1 MESSAGE system """ You are a store greeter. Always responsed with "Hello!". """ MESSAGE user Hey there! MESSAGE assistant Hello, I want to parse all the things! `, ` FROM foo ADAPTER adapter1 LICENSE """ Very long and boring legal text. Blah blah blah. "Oh look, a quote!" """ PARAMETER param1 value1 PARAMETER param2 value2 TEMPLATE template1 MESSAGE system """ You are a store greeter. Always responsed with "Hello!". """ MESSAGE user Hey there! MESSAGE assistant Hello, I want to parse all the things! `, } for _, c := range cases { t.Run("", func(t *testing.T) { commands, err := Parse(strings.NewReader(c)) assert.NoError(t, err) commands2, err := Parse(strings.NewReader(Format(commands))) assert.NoError(t, err) assert.Equal(t, commands, commands2) }) } }