mirror of https://github.com/ollama/ollama.git
				
				
				
			
		
			
				
	
	
		
			431 lines
		
	
	
		
			12 KiB
		
	
	
	
		
			Go
		
	
	
	
			
		
		
	
	
			431 lines
		
	
	
		
			12 KiB
		
	
	
	
		
			Go
		
	
	
	
| // Package api implements the client-side API for code wishing to interact
 | |
| // with the ollama service. The methods of the [Client] type correspond to
 | |
| // the ollama REST API as described in [the API documentation].
 | |
| // The ollama command-line client itself uses this package to interact with
 | |
| // the backend service.
 | |
| //
 | |
| // # Examples
 | |
| //
 | |
| // Several examples of using this package are available [in the GitHub
 | |
| // repository].
 | |
| //
 | |
| // [the API documentation]: https://github.com/ollama/ollama/blob/main/docs/api.md
 | |
| // [in the GitHub repository]: https://github.com/ollama/ollama/tree/main/api/examples
 | |
| package api
 | |
| 
 | |
| import (
 | |
| 	"bufio"
 | |
| 	"bytes"
 | |
| 	"context"
 | |
| 	"encoding/json"
 | |
| 	"errors"
 | |
| 	"fmt"
 | |
| 	"io"
 | |
| 	"net/http"
 | |
| 	"net/url"
 | |
| 	"runtime"
 | |
| 	"strconv"
 | |
| 	"time"
 | |
| 
 | |
| 	"github.com/ollama/ollama/auth"
 | |
| 	"github.com/ollama/ollama/envconfig"
 | |
| 	"github.com/ollama/ollama/format"
 | |
| 	"github.com/ollama/ollama/version"
 | |
| )
 | |
| 
 | |
| // Client encapsulates client state for interacting with the ollama
 | |
| // service. Use [ClientFromEnvironment] to create new Clients.
 | |
| type Client struct {
 | |
| 	base *url.URL
 | |
| 	http *http.Client
 | |
| }
 | |
| 
 | |
| func checkError(resp *http.Response, body []byte) error {
 | |
| 	if resp.StatusCode < http.StatusBadRequest {
 | |
| 		return nil
 | |
| 	}
 | |
| 
 | |
| 	apiError := StatusError{StatusCode: resp.StatusCode}
 | |
| 
 | |
| 	err := json.Unmarshal(body, &apiError)
 | |
| 	if err != nil {
 | |
| 		// Use the full body as the message if we fail to decode a response.
 | |
| 		apiError.ErrorMessage = string(body)
 | |
| 	}
 | |
| 
 | |
| 	return apiError
 | |
| }
 | |
| 
 | |
| // ClientFromEnvironment creates a new [Client] using configuration from the
 | |
| // environment variable OLLAMA_HOST, which points to the network host and
 | |
| // port on which the ollama service is listening. The format of this variable
 | |
| // is:
 | |
| //
 | |
| //	<scheme>://<host>:<port>
 | |
| //
 | |
| // If the variable is not specified, a default ollama host and port will be
 | |
| // used.
 | |
| func ClientFromEnvironment() (*Client, error) {
 | |
| 	return &Client{
 | |
| 		base: envconfig.Host(),
 | |
| 		http: http.DefaultClient,
 | |
| 	}, nil
 | |
| }
 | |
| 
 | |
| func NewClient(base *url.URL, http *http.Client) *Client {
 | |
| 	return &Client{
 | |
| 		base: base,
 | |
| 		http: http,
 | |
| 	}
 | |
| }
 | |
| 
 | |
| func getAuthorizationToken(ctx context.Context, challenge string) (string, error) {
 | |
| 	token, err := auth.Sign(ctx, []byte(challenge))
 | |
| 	if err != nil {
 | |
| 		return "", err
 | |
| 	}
 | |
| 	return token, nil
 | |
| }
 | |
| 
 | |
| func (c *Client) do(ctx context.Context, method, path string, reqData, respData any) error {
 | |
| 	var reqBody io.Reader
 | |
| 	var data []byte
 | |
| 	var err error
 | |
| 
 | |
| 	switch reqData := reqData.(type) {
 | |
| 	case io.Reader:
 | |
| 		// reqData is already an io.Reader
 | |
| 		reqBody = reqData
 | |
| 	case nil:
 | |
| 		// noop
 | |
| 	default:
 | |
| 		data, err = json.Marshal(reqData)
 | |
| 		if err != nil {
 | |
| 			return err
 | |
| 		}
 | |
| 
 | |
| 		reqBody = bytes.NewReader(data)
 | |
| 	}
 | |
| 
 | |
| 	requestURL := c.base.JoinPath(path)
 | |
| 
 | |
| 	var token string
 | |
| 	if envconfig.UseAuth() || c.base.Hostname() == "ollama.com" {
 | |
| 		now := strconv.FormatInt(time.Now().Unix(), 10)
 | |
| 		chal := fmt.Sprintf("%s,%s?ts=%s", method, path, now)
 | |
| 		token, err = getAuthorizationToken(ctx, chal)
 | |
| 		if err != nil {
 | |
| 			return err
 | |
| 		}
 | |
| 
 | |
| 		q := requestURL.Query()
 | |
| 		q.Set("ts", now)
 | |
| 		requestURL.RawQuery = q.Encode()
 | |
| 	}
 | |
| 
 | |
| 	request, err := http.NewRequestWithContext(ctx, method, requestURL.String(), reqBody)
 | |
| 	if err != nil {
 | |
| 		return err
 | |
| 	}
 | |
| 
 | |
| 	request.Header.Set("Content-Type", "application/json")
 | |
| 	request.Header.Set("Accept", "application/json")
 | |
| 	request.Header.Set("User-Agent", fmt.Sprintf("ollama/%s (%s %s) Go/%s", version.Version, runtime.GOARCH, runtime.GOOS, runtime.Version()))
 | |
| 
 | |
| 	if token != "" {
 | |
| 		request.Header.Set("Authorization", token)
 | |
| 	}
 | |
| 
 | |
| 	respObj, err := c.http.Do(request)
 | |
| 	if err != nil {
 | |
| 		return err
 | |
| 	}
 | |
| 	defer respObj.Body.Close()
 | |
| 
 | |
| 	respBody, err := io.ReadAll(respObj.Body)
 | |
| 	if err != nil {
 | |
| 		return err
 | |
| 	}
 | |
| 
 | |
| 	if err := checkError(respObj, respBody); err != nil {
 | |
| 		return err
 | |
| 	}
 | |
| 
 | |
| 	if len(respBody) > 0 && respData != nil {
 | |
| 		if err := json.Unmarshal(respBody, respData); err != nil {
 | |
| 			return err
 | |
| 		}
 | |
| 	}
 | |
| 	return nil
 | |
| }
 | |
| 
 | |
| const maxBufferSize = 512 * format.KiloByte
 | |
| 
 | |
| func (c *Client) stream(ctx context.Context, method, path string, data any, fn func([]byte) error) error {
 | |
| 	var buf io.Reader
 | |
| 	if data != nil {
 | |
| 		bts, err := json.Marshal(data)
 | |
| 		if err != nil {
 | |
| 			return err
 | |
| 		}
 | |
| 
 | |
| 		buf = bytes.NewBuffer(bts)
 | |
| 	}
 | |
| 
 | |
| 	requestURL := c.base.JoinPath(path)
 | |
| 
 | |
| 	var token string
 | |
| 	if envconfig.UseAuth() || c.base.Hostname() == "ollama.com" {
 | |
| 		var err error
 | |
| 		now := strconv.FormatInt(time.Now().Unix(), 10)
 | |
| 		chal := fmt.Sprintf("%s,%s?ts=%s", method, path, now)
 | |
| 		token, err = getAuthorizationToken(ctx, chal)
 | |
| 		if err != nil {
 | |
| 			return err
 | |
| 		}
 | |
| 
 | |
| 		q := requestURL.Query()
 | |
| 		q.Set("ts", now)
 | |
| 		requestURL.RawQuery = q.Encode()
 | |
| 	}
 | |
| 
 | |
| 	request, err := http.NewRequestWithContext(ctx, method, requestURL.String(), buf)
 | |
| 	if err != nil {
 | |
| 		return err
 | |
| 	}
 | |
| 
 | |
| 	request.Header.Set("Content-Type", "application/json")
 | |
| 	request.Header.Set("Accept", "application/x-ndjson")
 | |
| 	request.Header.Set("User-Agent", fmt.Sprintf("ollama/%s (%s %s) Go/%s", version.Version, runtime.GOARCH, runtime.GOOS, runtime.Version()))
 | |
| 
 | |
| 	if token != "" {
 | |
| 		request.Header.Set("Authorization", token)
 | |
| 	}
 | |
| 
 | |
| 	response, err := c.http.Do(request)
 | |
| 	if err != nil {
 | |
| 		return err
 | |
| 	}
 | |
| 	defer response.Body.Close()
 | |
| 
 | |
| 	scanner := bufio.NewScanner(response.Body)
 | |
| 	// increase the buffer size to avoid running out of space
 | |
| 	scanBuf := make([]byte, 0, maxBufferSize)
 | |
| 	scanner.Buffer(scanBuf, maxBufferSize)
 | |
| 	for scanner.Scan() {
 | |
| 		var errorResponse struct {
 | |
| 			Error string `json:"error,omitempty"`
 | |
| 		}
 | |
| 
 | |
| 		bts := scanner.Bytes()
 | |
| 		if err := json.Unmarshal(bts, &errorResponse); err != nil {
 | |
| 			return fmt.Errorf("unmarshal: %w", err)
 | |
| 		}
 | |
| 
 | |
| 		if errorResponse.Error != "" {
 | |
| 			return errors.New(errorResponse.Error)
 | |
| 		}
 | |
| 
 | |
| 		if response.StatusCode >= http.StatusBadRequest {
 | |
| 			return StatusError{
 | |
| 				StatusCode:   response.StatusCode,
 | |
| 				Status:       response.Status,
 | |
| 				ErrorMessage: errorResponse.Error,
 | |
| 			}
 | |
| 		}
 | |
| 
 | |
| 		if err := fn(bts); err != nil {
 | |
| 			return err
 | |
| 		}
 | |
| 	}
 | |
| 
 | |
| 	return nil
 | |
| }
 | |
| 
 | |
| // GenerateResponseFunc is a function that [Client.Generate] invokes every time
 | |
| // a response is received from the service. If this function returns an error,
 | |
| // [Client.Generate] will stop generating and return this error.
 | |
| type GenerateResponseFunc func(GenerateResponse) error
 | |
| 
 | |
| // Generate generates a response for a given prompt. The req parameter should
 | |
| // be populated with prompt details. fn is called for each response (there may
 | |
| // be multiple responses, e.g. in case streaming is enabled).
 | |
| func (c *Client) Generate(ctx context.Context, req *GenerateRequest, fn GenerateResponseFunc) error {
 | |
| 	return c.stream(ctx, http.MethodPost, "/api/generate", req, func(bts []byte) error {
 | |
| 		var resp GenerateResponse
 | |
| 		if err := json.Unmarshal(bts, &resp); err != nil {
 | |
| 			return err
 | |
| 		}
 | |
| 
 | |
| 		return fn(resp)
 | |
| 	})
 | |
| }
 | |
| 
 | |
| // ChatResponseFunc is a function that [Client.Chat] invokes every time
 | |
| // a response is received from the service. If this function returns an error,
 | |
| // [Client.Chat] will stop generating and return this error.
 | |
| type ChatResponseFunc func(ChatResponse) error
 | |
| 
 | |
| // Chat generates the next message in a chat. [ChatRequest] may contain a
 | |
| // sequence of messages which can be used to maintain chat history with a model.
 | |
| // fn is called for each response (there may be multiple responses, e.g. if case
 | |
| // streaming is enabled).
 | |
| func (c *Client) Chat(ctx context.Context, req *ChatRequest, fn ChatResponseFunc) error {
 | |
| 	return c.stream(ctx, http.MethodPost, "/api/chat", req, func(bts []byte) error {
 | |
| 		var resp ChatResponse
 | |
| 		if err := json.Unmarshal(bts, &resp); err != nil {
 | |
| 			return err
 | |
| 		}
 | |
| 
 | |
| 		return fn(resp)
 | |
| 	})
 | |
| }
 | |
| 
 | |
| // PullProgressFunc is a function that [Client.Pull] invokes every time there
 | |
| // is progress with a "pull" request sent to the service. If this function
 | |
| // returns an error, [Client.Pull] will stop the process and return this error.
 | |
| type PullProgressFunc func(ProgressResponse) error
 | |
| 
 | |
| // Pull downloads a model from the ollama library. fn is called each time
 | |
| // progress is made on the request and can be used to display a progress bar,
 | |
| // etc.
 | |
| func (c *Client) Pull(ctx context.Context, req *PullRequest, fn PullProgressFunc) error {
 | |
| 	return c.stream(ctx, http.MethodPost, "/api/pull", req, func(bts []byte) error {
 | |
| 		var resp ProgressResponse
 | |
| 		if err := json.Unmarshal(bts, &resp); err != nil {
 | |
| 			return err
 | |
| 		}
 | |
| 
 | |
| 		return fn(resp)
 | |
| 	})
 | |
| }
 | |
| 
 | |
| // PushProgressFunc is a function that [Client.Push] invokes when progress is
 | |
| // made.
 | |
| // It's similar to other progress function types like [PullProgressFunc].
 | |
| type PushProgressFunc func(ProgressResponse) error
 | |
| 
 | |
| // Push uploads a model to the model library; requires registering for ollama.ai
 | |
| // and adding a public key first. fn is called each time progress is made on
 | |
| // the request and can be used to display a progress bar, etc.
 | |
| func (c *Client) Push(ctx context.Context, req *PushRequest, fn PushProgressFunc) error {
 | |
| 	return c.stream(ctx, http.MethodPost, "/api/push", req, func(bts []byte) error {
 | |
| 		var resp ProgressResponse
 | |
| 		if err := json.Unmarshal(bts, &resp); err != nil {
 | |
| 			return err
 | |
| 		}
 | |
| 
 | |
| 		return fn(resp)
 | |
| 	})
 | |
| }
 | |
| 
 | |
| // CreateProgressFunc is a function that [Client.Create] invokes when progress
 | |
| // is made.
 | |
| // It's similar to other progress function types like [PullProgressFunc].
 | |
| type CreateProgressFunc func(ProgressResponse) error
 | |
| 
 | |
| // Create creates a model from a [Modelfile]. fn is a progress function that
 | |
| // behaves similarly to other methods (see [Client.Pull]).
 | |
| //
 | |
| // [Modelfile]: https://github.com/ollama/ollama/blob/main/docs/modelfile.md
 | |
| func (c *Client) Create(ctx context.Context, req *CreateRequest, fn CreateProgressFunc) error {
 | |
| 	return c.stream(ctx, http.MethodPost, "/api/create", req, func(bts []byte) error {
 | |
| 		var resp ProgressResponse
 | |
| 		if err := json.Unmarshal(bts, &resp); err != nil {
 | |
| 			return err
 | |
| 		}
 | |
| 
 | |
| 		return fn(resp)
 | |
| 	})
 | |
| }
 | |
| 
 | |
| // List lists models that are available locally.
 | |
| func (c *Client) List(ctx context.Context) (*ListResponse, error) {
 | |
| 	var lr ListResponse
 | |
| 	if err := c.do(ctx, http.MethodGet, "/api/tags", nil, &lr); err != nil {
 | |
| 		return nil, err
 | |
| 	}
 | |
| 	return &lr, nil
 | |
| }
 | |
| 
 | |
| // ListRunning lists running models.
 | |
| func (c *Client) ListRunning(ctx context.Context) (*ProcessResponse, error) {
 | |
| 	var lr ProcessResponse
 | |
| 	if err := c.do(ctx, http.MethodGet, "/api/ps", nil, &lr); err != nil {
 | |
| 		return nil, err
 | |
| 	}
 | |
| 	return &lr, nil
 | |
| }
 | |
| 
 | |
| // Copy copies a model - creating a model with another name from an existing
 | |
| // model.
 | |
| func (c *Client) Copy(ctx context.Context, req *CopyRequest) error {
 | |
| 	if err := c.do(ctx, http.MethodPost, "/api/copy", req, nil); err != nil {
 | |
| 		return err
 | |
| 	}
 | |
| 	return nil
 | |
| }
 | |
| 
 | |
| // Delete deletes a model and its data.
 | |
| func (c *Client) Delete(ctx context.Context, req *DeleteRequest) error {
 | |
| 	if err := c.do(ctx, http.MethodDelete, "/api/delete", req, nil); err != nil {
 | |
| 		return err
 | |
| 	}
 | |
| 	return nil
 | |
| }
 | |
| 
 | |
| // Show obtains model information, including details, modelfile, license etc.
 | |
| func (c *Client) Show(ctx context.Context, req *ShowRequest) (*ShowResponse, error) {
 | |
| 	var resp ShowResponse
 | |
| 	if err := c.do(ctx, http.MethodPost, "/api/show", req, &resp); err != nil {
 | |
| 		return nil, err
 | |
| 	}
 | |
| 	return &resp, nil
 | |
| }
 | |
| 
 | |
| // Heartbeat checks if the server has started and is responsive; if yes, it
 | |
| // returns nil, otherwise an error.
 | |
| func (c *Client) Heartbeat(ctx context.Context) error {
 | |
| 	if err := c.do(ctx, http.MethodHead, "/", nil, nil); err != nil {
 | |
| 		return err
 | |
| 	}
 | |
| 	return nil
 | |
| }
 | |
| 
 | |
| // Embed generates embeddings from a model.
 | |
| func (c *Client) Embed(ctx context.Context, req *EmbedRequest) (*EmbedResponse, error) {
 | |
| 	var resp EmbedResponse
 | |
| 	if err := c.do(ctx, http.MethodPost, "/api/embed", req, &resp); err != nil {
 | |
| 		return nil, err
 | |
| 	}
 | |
| 	return &resp, nil
 | |
| }
 | |
| 
 | |
| // Embeddings generates an embedding from a model.
 | |
| func (c *Client) Embeddings(ctx context.Context, req *EmbeddingRequest) (*EmbeddingResponse, error) {
 | |
| 	var resp EmbeddingResponse
 | |
| 	if err := c.do(ctx, http.MethodPost, "/api/embeddings", req, &resp); err != nil {
 | |
| 		return nil, err
 | |
| 	}
 | |
| 	return &resp, nil
 | |
| }
 | |
| 
 | |
| // CreateBlob creates a blob from a file on the server. digest is the
 | |
| // expected SHA256 digest of the file, and r represents the file.
 | |
| func (c *Client) CreateBlob(ctx context.Context, digest string, r io.Reader) error {
 | |
| 	return c.do(ctx, http.MethodPost, fmt.Sprintf("/api/blobs/%s", digest), r, nil)
 | |
| }
 | |
| 
 | |
| // Version returns the Ollama server version as a string.
 | |
| func (c *Client) Version(ctx context.Context) (string, error) {
 | |
| 	var version struct {
 | |
| 		Version string `json:"version"`
 | |
| 	}
 | |
| 
 | |
| 	if err := c.do(ctx, http.MethodGet, "/api/version", nil, &version); err != nil {
 | |
| 		return "", err
 | |
| 	}
 | |
| 
 | |
| 	return version.Version, nil
 | |
| }
 |