ollama/api/client.go

419 lines
12 KiB
Go
Raw Normal View History

// Package api implements the client-side API for code wishing to interact
// with the ollama service. The methods of the [Client] type correspond to
// the ollama REST API as described in [the API documentation].
// The ollama command-line client itself uses this package to interact with
// the backend service.
//
// # Examples
//
// Several examples of using this package are available [in the GitHub
// repository].
//
// [the API documentation]: https://github.com/ollama/ollama/blob/main/docs/api.md
// [in the GitHub repository]: https://github.com/ollama/ollama/tree/main/examples
package api
import (
2023-07-04 00:47:00 -04:00
"bufio"
"bytes"
"context"
"encoding/json"
2023-07-07 14:04:43 -07:00
"fmt"
2023-07-18 09:09:45 -07:00
"io"
2023-10-09 12:18:26 -07:00
"net"
"net/http"
2023-07-06 15:02:10 -07:00
"net/url"
"os"
2023-08-21 18:24:42 -07:00
"runtime"
"strconv"
2023-08-17 18:20:38 -04:00
"strings"
2023-08-21 18:24:42 -07:00
"github.com/ollama/ollama/format"
"github.com/ollama/ollama/version"
)
// Client encapsulates client state for interacting with the ollama
// service. Use [ClientFromEnvironment] to create new Clients.
type Client struct {
	// base is the root URL that every request path is joined onto.
	base *url.URL
	// http is the underlying HTTP client used to send requests.
	http *http.Client
}
2023-07-18 09:09:45 -07:00
func checkError(resp *http.Response, body []byte) error {
2023-08-26 21:55:21 -07:00
if resp.StatusCode < http.StatusBadRequest {
2023-07-18 09:09:45 -07:00
return nil
2023-07-11 13:05:51 -07:00
}
2023-07-18 09:09:45 -07:00
apiError := StatusError{StatusCode: resp.StatusCode}
2023-07-11 13:05:51 -07:00
2023-07-18 09:09:45 -07:00
err := json.Unmarshal(body, &apiError)
if err != nil {
// Use the full body as the message if we fail to decode a response.
2023-07-20 20:45:12 +02:00
apiError.ErrorMessage = string(body)
2023-07-18 09:09:45 -07:00
}
return apiError
2023-07-06 15:02:10 -07:00
}
// ClientFromEnvironment creates a new [Client] using configuration from the
// environment variable OLLAMA_HOST, which points to the network host and
// port on which the ollama service is listenting. The format of this variable
// is:
//
// <scheme>://<host>:<port>
//
// If the variable is not specified, a default ollama host and port will be
// used.
2023-10-09 12:18:26 -07:00
func ClientFromEnvironment() (*Client, error) {
ollamaHost, err := GetOllamaHost()
if err != nil {
return nil, err
}
return &Client{
base: &url.URL{
Scheme: ollamaHost.Scheme,
Host: net.JoinHostPort(ollamaHost.Host, ollamaHost.Port),
},
http: http.DefaultClient,
}, nil
}
// OllamaHost holds the individual components of an ollama service address
// as produced by GetOllamaHost.
type OllamaHost struct {
	// Scheme is the URL scheme, for example "http" or "https".
	Scheme string
	// Host is the host name or IP address, without a port.
	Host string
	// Port is the port number in decimal string form.
	Port string
}
func GetOllamaHost() (OllamaHost, error) {
2023-10-26 10:47:41 -07:00
defaultPort := "11434"
hostVar := os.Getenv("OLLAMA_HOST")
hostVar = strings.TrimSpace(strings.Trim(strings.TrimSpace(hostVar), "\"'"))
scheme, hostport, ok := strings.Cut(hostVar, "://")
2023-10-26 10:47:41 -07:00
switch {
case !ok:
scheme, hostport = "http", hostVar
2023-10-26 10:47:41 -07:00
case scheme == "http":
defaultPort = "80"
case scheme == "https":
defaultPort = "443"
2023-10-09 12:18:26 -07:00
}
2023-10-26 10:47:41 -07:00
// trim trailing slashes
hostport = strings.TrimRight(hostport, "/")
2023-10-09 12:18:26 -07:00
host, port, err := net.SplitHostPort(hostport)
if err != nil {
2023-10-26 10:47:41 -07:00
host, port = "127.0.0.1", defaultPort
2023-10-20 11:32:28 -07:00
if ip := net.ParseIP(strings.Trim(hostport, "[]")); ip != nil {
2023-10-09 12:18:26 -07:00
host = ip.String()
2023-10-20 11:32:28 -07:00
} else if hostport != "" {
host = hostport
2023-10-09 12:18:26 -07:00
}
}
if portNum, err := strconv.ParseInt(port, 10, 32); err != nil || portNum > 65535 || portNum < 0 {
return OllamaHost{}, ErrInvalidHostPort
}
return OllamaHost{
Scheme: scheme,
Host: host,
Port: port,
}, nil
2023-07-18 09:09:45 -07:00
}
// NewClient returns a Client that joins request paths onto base and sends
// them using the supplied HTTP client.
func NewClient(base *url.URL, http *http.Client) *Client {
	client := new(Client)
	client.base = base
	client.http = http
	return client
}
2023-07-18 09:09:45 -07:00
func (c *Client) do(ctx context.Context, method, path string, reqData, respData any) error {
var reqBody io.Reader
var data []byte
var err error
2023-11-14 14:07:40 -08:00
switch reqData := reqData.(type) {
case io.Reader:
// reqData is already an io.Reader
reqBody = reqData
case nil:
// noop
default:
2023-07-18 09:09:45 -07:00
data, err = json.Marshal(reqData)
if err != nil {
return err
}
2023-11-14 14:07:40 -08:00
2023-07-18 09:09:45 -07:00
reqBody = bytes.NewReader(data)
}
2023-10-09 12:18:26 -07:00
requestURL := c.base.JoinPath(path)
2023-08-21 18:24:42 -07:00
request, err := http.NewRequestWithContext(ctx, method, requestURL.String(), reqBody)
2023-07-18 09:09:45 -07:00
if err != nil {
return err
}
2023-08-21 18:24:42 -07:00
request.Header.Set("Content-Type", "application/json")
request.Header.Set("Accept", "application/json")
request.Header.Set("User-Agent", fmt.Sprintf("ollama/%s (%s %s) Go/%s", version.Version, runtime.GOARCH, runtime.GOOS, runtime.Version()))
2023-07-18 09:09:45 -07:00
2023-10-09 12:18:26 -07:00
respObj, err := c.http.Do(request)
2023-07-18 09:09:45 -07:00
if err != nil {
return err
}
defer respObj.Body.Close()
respBody, err := io.ReadAll(respObj.Body)
if err != nil {
return err
}
if err := checkError(respObj, respBody); err != nil {
return err
}
if len(respBody) > 0 && respData != nil {
if err := json.Unmarshal(respBody, respData); err != nil {
return err
}
}
return nil
}
2023-10-12 09:34:16 -07:00
// maxBufferSize is both the initial capacity and the maximum size of the
// line buffer used when scanning streamed responses.
const maxBufferSize = 512 * format.KiloByte
2023-10-04 14:09:00 -04:00
2023-07-11 13:05:51 -07:00
func (c *Client) stream(ctx context.Context, method, path string, data any, fn func([]byte) error) error {
var buf *bytes.Buffer
if data != nil {
bts, err := json.Marshal(data)
if err != nil {
return err
}
2023-07-06 16:53:14 -07:00
buf = bytes.NewBuffer(bts)
}
2023-10-09 12:18:26 -07:00
requestURL := c.base.JoinPath(path)
2023-08-21 18:24:42 -07:00
request, err := http.NewRequestWithContext(ctx, method, requestURL.String(), buf)
if err != nil {
return err
}
2023-07-06 15:02:10 -07:00
request.Header.Set("Content-Type", "application/json")
request.Header.Set("Accept", "application/x-ndjson")
2023-08-21 18:24:42 -07:00
request.Header.Set("User-Agent", fmt.Sprintf("ollama/%s (%s %s) Go/%s", version.Version, runtime.GOARCH, runtime.GOOS, runtime.Version()))
2023-07-04 00:47:00 -04:00
2023-10-09 12:18:26 -07:00
response, err := c.http.Do(request)
2023-07-04 00:47:00 -04:00
if err != nil {
return err
}
2023-07-06 15:02:10 -07:00
defer response.Body.Close()
2023-07-04 00:47:00 -04:00
scanner := bufio.NewScanner(response.Body)
2023-10-04 14:09:00 -04:00
// increase the buffer size to avoid running out of space
scanBuf := make([]byte, 0, maxBufferSize)
scanner.Buffer(scanBuf, maxBufferSize)
for scanner.Scan() {
var errorResponse struct {
2023-07-11 13:05:51 -07:00
Error string `json:"error,omitempty"`
}
bts := scanner.Bytes()
if err := json.Unmarshal(bts, &errorResponse); err != nil {
return fmt.Errorf("unmarshal: %w", err)
}
2023-07-20 12:12:08 -07:00
if errorResponse.Error != "" {
return fmt.Errorf(errorResponse.Error)
2023-07-20 12:12:08 -07:00
}
2023-08-26 21:55:21 -07:00
if response.StatusCode >= http.StatusBadRequest {
2023-07-11 13:05:51 -07:00
return StatusError{
2023-07-20 20:45:12 +02:00
StatusCode: response.StatusCode,
Status: response.Status,
ErrorMessage: errorResponse.Error,
2023-07-11 13:05:51 -07:00
}
}
2023-07-11 13:05:51 -07:00
if err := fn(bts); err != nil {
return err
}
}
2023-07-06 14:05:55 -07:00
return nil
}
// GenerateResponseFunc is a function that [Client.Generate] invokes every time
// a response is received from the service. If this function returns an error,
// [Client.Generate] will stop generating and return this error.
2023-07-06 14:05:55 -07:00
type GenerateResponseFunc func(GenerateResponse) error
// Generate generates a response for a given prompt. The req parameter should
// be populated with prompt details. fn is called for each response (there may
// be multiple responses, e.g. in case streaming is enabled).
2023-07-06 14:05:55 -07:00
func (c *Client) Generate(ctx context.Context, req *GenerateRequest, fn GenerateResponseFunc) error {
return c.stream(ctx, http.MethodPost, "/api/generate", req, func(bts []byte) error {
var resp GenerateResponse
if err := json.Unmarshal(bts, &resp); err != nil {
return err
}
return fn(resp)
})
2023-07-04 00:47:00 -04:00
}
2023-07-06 12:24:49 -04:00
// ChatResponseFunc is a function that [Client.Chat] invokes every time
// a response is received from the service. If this function returns an error,
// [Client.Chat] will stop generating and return this error.
2023-12-05 14:57:33 -05:00
type ChatResponseFunc func(ChatResponse) error
// Chat generates the next message in a chat. [ChatRequest] may contain a
// sequence of messages which can be used to maintain chat history with a model.
// fn is called for each response (there may be multiple responses, e.g. if case
// streaming is enabled).
2023-12-05 14:57:33 -05:00
func (c *Client) Chat(ctx context.Context, req *ChatRequest, fn ChatResponseFunc) error {
return c.stream(ctx, http.MethodPost, "/api/chat", req, func(bts []byte) error {
var resp ChatResponse
if err := json.Unmarshal(bts, &resp); err != nil {
return err
}
return fn(resp)
})
}
// PullProgressFunc is a function that [Client.Pull] invokes every time there
// is progress with a "pull" request sent to the service. If this function
// returns an error, [Client.Pull] will stop the process and return this error.
2023-07-18 18:51:30 -07:00
type PullProgressFunc func(ProgressResponse) error
2023-07-06 14:05:55 -07:00
// Pull downloads a model from the ollama library. fn is called each time
// progress is made on the request and can be used to display a progress bar,
// etc.
2023-07-06 14:05:55 -07:00
func (c *Client) Pull(ctx context.Context, req *PullRequest, fn PullProgressFunc) error {
return c.stream(ctx, http.MethodPost, "/api/pull", req, func(bts []byte) error {
2023-07-18 18:51:30 -07:00
var resp ProgressResponse
if err := json.Unmarshal(bts, &resp); err != nil {
return err
}
return fn(resp)
})
2023-07-06 12:24:49 -04:00
}
// PushProgressFunc is a function that [Client.Push] invokes when progress is
// made.
// It's similar to other progress function types like [PullProgressFunc].
2023-07-18 18:51:30 -07:00
type PushProgressFunc func(ProgressResponse) error
// Push uploads a model to the model library; requires registering for ollama.ai
// and adding a public key first. fn is called each time progress is made on
// the request and can be used to display a progress bar, etc.
func (c *Client) Push(ctx context.Context, req *PushRequest, fn PushProgressFunc) error {
return c.stream(ctx, http.MethodPost, "/api/push", req, func(bts []byte) error {
2023-07-18 18:51:30 -07:00
var resp ProgressResponse
if err := json.Unmarshal(bts, &resp); err != nil {
return err
}
return fn(resp)
})
}
// CreateProgressFunc is the callback type that [Client.Create] invokes with
// each progress update it receives. It plays the same role as the other
// progress function types, such as [PullProgressFunc].
type CreateProgressFunc func(ProgressResponse) error
// Create builds a model from a [Modelfile]. fn receives every progress update
// and behaves like the progress callbacks of the other methods (see
// [Client.Pull]): an error it returns stops processing and is returned.
//
// The request is sent as a POST to /api/create.
//
// [Modelfile]: https://github.com/ollama/ollama/blob/main/docs/modelfile.md
func (c *Client) Create(ctx context.Context, req *CreateRequest, fn CreateProgressFunc) error {
	onLine := func(line []byte) error {
		var progress ProgressResponse
		err := json.Unmarshal(line, &progress)
		if err != nil {
			return err
		}

		return fn(progress)
	}

	return c.stream(ctx, http.MethodPost, "/api/create", req, onLine)
}
2023-07-18 09:09:45 -07:00
// List lists models that are available locally.
2023-07-18 09:09:45 -07:00
func (c *Client) List(ctx context.Context) (*ListResponse, error) {
var lr ListResponse
if err := c.do(ctx, http.MethodGet, "/api/tags", nil, &lr); err != nil {
return nil, err
}
return &lr, nil
}
2023-07-20 16:09:23 -07:00
// Copy copies a model - creating a model with another name from an existing
// model.
2023-07-24 11:27:28 -04:00
func (c *Client) Copy(ctx context.Context, req *CopyRequest) error {
if err := c.do(ctx, http.MethodPost, "/api/copy", req, nil); err != nil {
return err
}
return nil
}
// Delete deletes a model and its data.
func (c *Client) Delete(ctx context.Context, req *DeleteRequest) error {
if err := c.do(ctx, http.MethodDelete, "/api/delete", req, nil); err != nil {
return err
}
return nil
2023-07-20 16:09:23 -07:00
}
// Show obtains model information, including details, modelfile, license etc.
2023-09-06 11:04:17 -07:00
func (c *Client) Show(ctx context.Context, req *ShowRequest) (*ShowResponse, error) {
var resp ShowResponse
if err := c.do(ctx, http.MethodPost, "/api/show", req, &resp); err != nil {
return nil, err
}
return &resp, nil
}
// Hearbeat checks if the server has started and is responsive; if yes, it
// returns nil, otherwise an error.
func (c *Client) Heartbeat(ctx context.Context) error {
2023-08-01 14:50:38 -04:00
if err := c.do(ctx, http.MethodHead, "/", nil, nil); err != nil {
return err
}
return nil
}
// Embeddings generates embeddings from a model.
2024-01-04 13:00:52 -07:00
func (c *Client) Embeddings(ctx context.Context, req *EmbeddingRequest) (*EmbeddingResponse, error) {
var resp EmbeddingResponse
if err := c.do(ctx, http.MethodPost, "/api/embeddings", req, &resp); err != nil {
return nil, err
}
return &resp, nil
}
2023-11-14 14:07:40 -08:00
// CreateBlob creates a blob from a file on the server. digest is the
// expected SHA256 digest of the file, and r represents the file.
2023-11-15 10:59:38 -08:00
func (c *Client) CreateBlob(ctx context.Context, digest string, r io.Reader) error {
2024-04-05 09:30:09 -07:00
return c.do(ctx, http.MethodPost, fmt.Sprintf("/api/blobs/%s", digest), r, nil)
2023-11-14 14:07:40 -08:00
}
2023-11-22 09:41:44 -08:00
// Version returns the Ollama server version as a string.
2023-11-22 09:41:44 -08:00
func (c *Client) Version(ctx context.Context) (string, error) {
var version struct {
Version string `json:"version"`
}
if err := c.do(ctx, http.MethodGet, "/api/version", nil, &version); err != nil {
return "", err
}
return version.Version, nil
}