Ollama Provider
The Ollama provider integrates with a local Ollama instance for LLM text generation, multi-turn chat, and embedding generation.
Installation
```bash
go get github.com/resolute/resolute/providers/ollama
```

Configuration
OllamaConfig
```go
type OllamaConfig struct {
    Host    string        // Ollama server host (default: "http://localhost:11434")
    Timeout time.Duration // Request timeout (default: 5m)
}
```

Environment Variables
| Variable | Description | Default |
|---|---|---|
| OLLAMA_HOST | Ollama server URL | http://localhost:11434 |
| OLLAMA_TIMEOUT | Request timeout | 5m |
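If your build of the provider does not read these variables automatically, the same defaults can be applied by hand. A minimal sketch; the time.ParseDuration convention for OLLAMA_TIMEOUT is an assumption here, not documented behavior:

```go
import (
    "os"
    "time"

    "github.com/resolute/resolute/providers/ollama"
)

// configFromEnv builds an OllamaConfig from the environment, falling back
// to the documented defaults. Assumes OLLAMA_TIMEOUT holds a Go duration
// string such as "5m".
func configFromEnv() ollama.OllamaConfig {
    cfg := ollama.OllamaConfig{
        Host:    "http://localhost:11434",
        Timeout: 5 * time.Minute,
    }
    if host := os.Getenv("OLLAMA_HOST"); host != "" {
        cfg.Host = host
    }
    if raw := os.Getenv("OLLAMA_TIMEOUT"); raw != "" {
        if d, err := time.ParseDuration(raw); err == nil {
            cfg.Timeout = d
        }
    }
    return cfg
}
```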
Provider Constructor
NewProvider
```go
func NewProvider(cfg OllamaConfig) *OllamaProvider
```

Creates a new Ollama provider.
Parameters:
- cfg - Ollama configuration
Returns: *OllamaProvider implementing core.Provider
Example:
```go
provider := ollama.NewProvider(ollama.OllamaConfig{
    Host:    "http://localhost:11434",
    Timeout: 10 * time.Minute,
})
```

Types
Message
```go
type Message struct {
    Role    string `json:"role"`    // "system", "user", or "assistant"
    Content string `json:"content"` // Message content
}
```

GenerateOptions
```go
type GenerateOptions struct {
    Temperature   float64  `json:"temperature"`    // Sampling temperature (0.0-1.0)
    TopP          float64  `json:"top_p"`          // Nucleus sampling threshold
    TopK          int      `json:"top_k"`          // Top-k sampling
    NumPredict    int      `json:"num_predict"`    // Max tokens to generate
    Stop          []string `json:"stop"`           // Stop sequences
    RepeatPenalty float64  `json:"repeat_penalty"` // Repetition penalty
}
```
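These options trade determinism for variety. As an illustration only (the values below are generic starting points, not recommendations from this provider):

```go
// Near-deterministic settings, useful for extraction or classification prompts.
precise := ollama.GenerateOptions{
    Temperature: 0.0,              // always pick the most likely token
    NumPredict:  256,              // cap the output length
    Stop:        []string{"\n\n"}, // stop at the first blank line
}

// Looser settings for brainstorming or creative drafts.
creative := ollama.GenerateOptions{
    Temperature:   0.9,  // sample more broadly
    TopP:          0.95, // keep most of the probability mass
    RepeatPenalty: 1.1,  // discourage verbatim repetition
}
```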
EmbeddingOptions

```go
type EmbeddingOptions struct {
    Truncate bool `json:"truncate"` // Truncate input if too long
}
```

Activities
Generate
Generates text completion using a specified model.
Input:
```go
type GenerateInput struct {
    Model   string          `json:"model"`   // Model name (e.g., "llama3.2")
    Prompt  string          `json:"prompt"`  // Input prompt
    System  string          `json:"system"`  // System prompt
    Options GenerateOptions `json:"options"` // Generation options
    Stream  bool            `json:"stream"`  // Enable streaming (default: false)
}
```

Output:
```go
type GenerateOutput struct {
    Response        string `json:"response"`          // Generated text
    Model           string `json:"model"`             // Model that produced the response
    TotalDuration   int64  `json:"total_duration"`    // Total request time (nanoseconds in the Ollama API)
    LoadDuration    int64  `json:"load_duration"`     // Model load time (nanoseconds in the Ollama API)
    PromptEvalCount int    `json:"prompt_eval_count"` // Tokens evaluated in the prompt
    EvalCount       int    `json:"eval_count"`        // Tokens generated
}
```

Node Factory:
```go
func Generate(input GenerateInput) *core.Node[GenerateInput, GenerateOutput]
```

Example:
```go
generateNode := ollama.Generate(ollama.GenerateInput{
    Model:  "llama3.2",
    Prompt: "Explain the concept of workflows in software engineering",
    System: "You are a helpful technical writer.",
    Options: ollama.GenerateOptions{
        Temperature: 0.7,
        NumPredict:  500,
    },
})
```
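The duration fields are plain integers. Assuming the provider passes through Ollama's nanosecond timings unchanged (an assumption about this wrapper, though it matches the Ollama API), they convert cleanly to time.Duration:

```go
// Inside a downstream step: read the Generate result stored under the
// hypothetical step name "generation" and report timing. Requires "fmt"
// and "time"; `state` is the *core.FlowState available in that context.
out := core.Get[ollama.GenerateOutput](state, "generation")
total := time.Duration(out.TotalDuration) // prints as e.g. "2.4s"
load := time.Duration(out.LoadDuration)
fmt.Printf("generated %d tokens in %s (model load %s)\n", out.EvalCount, total, load)
```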
Chat

Conducts a multi-turn chat conversation.
Input:
```go
type ChatInput struct {
    Model    string          `json:"model"`    // Model name
    Messages []Message       `json:"messages"` // Conversation messages in order
    Options  GenerateOptions `json:"options"`  // Generation options
    Stream   bool            `json:"stream"`   // Enable streaming
}
```

Output:
```go
type ChatOutput struct {
    Message         Message `json:"message"`           // Assistant reply
    Model           string  `json:"model"`             // Model that produced the reply
    TotalDuration   int64   `json:"total_duration"`    // Total request time (nanoseconds in the Ollama API)
    PromptEvalCount int     `json:"prompt_eval_count"` // Tokens evaluated in the prompt
    EvalCount       int     `json:"eval_count"`        // Tokens generated
}
```

Node Factory:
```go
func Chat(input ChatInput) *core.Node[ChatInput, ChatOutput]
```

Example:
```go
chatNode := ollama.Chat(ollama.ChatInput{
    Model: "llama3.2",
    Messages: []ollama.Message{
        {Role: "system", Content: "You are a code reviewer."},
        {Role: "user", Content: "Review this function for bugs..."},
    },
    Options: ollama.GenerateOptions{
        Temperature: 0.3,
    },
})
```
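Each Chat call receives the full history in Messages, so to continue a conversation you append the assistant's reply and the next user message before the next call. A sketch, where previousMessages, `state`, and the step name "review" are hypothetical:

```go
// Carry the assistant reply forward so the model sees the full history.
reply := core.Get[ollama.ChatOutput](state, "review")
history := append(previousMessages, reply.Message, ollama.Message{
    Role:    "user",
    Content: "Now suggest a fix for the first issue you found.",
})
nextTurn := ollama.Chat(ollama.ChatInput{
    Model:    "llama3.2",
    Messages: history,
})
```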
Embed

Generates embeddings for text input.
Input:
```go
type EmbedInput struct {
    Model   string           `json:"model"`   // Embedding model (e.g., "nomic-embed-text")
    Input   string           `json:"input"`   // Single text input
    Inputs  []string         `json:"inputs"`  // Multiple text inputs
    Options EmbeddingOptions `json:"options"` // Embedding options
}
```

Output:
```go
type EmbedOutput struct {
    Embeddings [][]float32 `json:"embeddings"` // One vector per input text
    Model      string      `json:"model"`      // Model that produced the embeddings
}
```

Node Factory:
```go
func Embed(input EmbedInput) *core.Node[EmbedInput, EmbedOutput]
```

Example:
```go
// Single text
embedNode := ollama.Embed(ollama.EmbedInput{
    Model: "nomic-embed-text",
    Input: "What is workflow orchestration?",
})

// Batch embedding
batchEmbedNode := ollama.Embed(ollama.EmbedInput{
    Model: "nomic-embed-text",
    Inputs: []string{
        "First document text",
        "Second document text",
        "Third document text",
    },
})
```
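Downstream code usually compares the returned vectors. A small cosine-similarity helper (not part of the provider, and assuming equal-length vectors) looks like this:

```go
import "math"

// cosineSimilarity returns the cosine of the angle between two embedding
// vectors; values near 1.0 indicate semantically similar texts.
func cosineSimilarity(a, b []float32) float64 {
    var dot, normA, normB float64
    for i := range a {
        dot += float64(a[i]) * float64(b[i])
        normA += float64(a[i]) * float64(a[i])
        normB += float64(b[i]) * float64(b[i])
    }
    return dot / (math.Sqrt(normA) * math.Sqrt(normB))
}
```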
EmbedBatch

Generates embeddings for a large set of texts, automatically splitting them into batches.
Input:
```go
type EmbedBatchInput struct {
    Model     string   `json:"model"`
    Texts     []string `json:"texts"`
    BatchSize int      `json:"batch_size"` // Texts per batch (default: 32)
}
```

Output:
```go
type EmbedBatchOutput struct {
    Embeddings [][]float32 `json:"embeddings"`
    Count      int         `json:"count"`
}
```

Node Factory:
```go
func EmbedBatch(input EmbedBatchInput) *core.Node[EmbedBatchInput, EmbedBatchOutput]
```

Example:
```go
embedBatchNode := ollama.EmbedBatch(ollama.EmbedBatchInput{
    Model:     "nomic-embed-text",
    Texts:     documentTexts, // Can be hundreds of texts
    BatchSize: 64,
})
```
ListModels

Lists available models on the Ollama server.
Input:
```go
type ListModelsInput struct{}
```

Output:
```go
type ListModelsOutput struct {
    Models []ModelInfo `json:"models"`
}

type ModelInfo struct {
    Name       string    `json:"name"`        // Model name, e.g. "llama3.2"
    ModifiedAt time.Time `json:"modified_at"` // Last modification time
    Size       int64     `json:"size"`        // Model size in bytes
    Digest     string    `json:"digest"`      // Content digest
}
```

Node Factory:
```go
func ListModels(input ListModelsInput) *core.Node[ListModelsInput, ListModelsOutput]
```
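No example is given for this activity; for symmetry with the others, a minimal sketch. The step name "available" and the surrounding state access are illustrative (see the Model Preparation Flow below for the full pattern):

```go
listNode := ollama.ListModels(ollama.ListModelsInput{})

// In a downstream step or When predicate (requires "fmt"):
models := core.Get[ollama.ListModelsOutput](state, "available")
for _, m := range models.Models {
    fmt.Printf("%s\t%d bytes\n", m.Name, m.Size)
}
```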
PullModel

Pulls (downloads) a model from the Ollama library.
Input:
```go
type PullModelInput struct {
    Name     string `json:"name"`     // Model name to pull
    Insecure bool   `json:"insecure"` // Allow insecure connections
}
```

Output:
```go
type PullModelOutput struct {
    Status string `json:"status"`
}
```

Node Factory:
```go
func PullModel(input PullModelInput) *core.Node[PullModelInput, PullModelOutput]
```
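Likewise, a minimal sketch (the model name is illustrative; large pulls can take minutes, so pair this with a generous provider Timeout):

```go
// Download a model from the Ollama library before first use.
pullNode := ollama.PullModel(ollama.PullModelInput{
    Name: "llama3.2",
})
```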
Usage Patterns

Text Generation Flow
flow := core.NewFlow("text-generator").
TriggeredBy(core.Manual("api")).
Then(ollama.Generate(ollama.GenerateInput{
Model: "llama3.2",
Prompt: core.Output("input.prompt"),
Options: ollama.GenerateOptions{
Temperature: 0.7,
NumPredict: 1000,
},
}).As("generation")).
Build()Embedding Pipeline
flow := core.NewFlow("embedding-pipeline").
TriggeredBy(core.Schedule("0 2 * * *")).
Then(fetchDocumentsNode.As("docs")).
Then(ollama.EmbedBatch(ollama.EmbedBatchInput{
Model: "nomic-embed-text",
Texts: core.Output("docs.texts"),
BatchSize: 32,
}).As("embeddings")).
Then(storeVectorsNode).
Build()RAG (Retrieval-Augmented Generation)
flow := core.NewFlow("rag-query").
TriggeredBy(core.Manual("api")).
// Generate query embedding
Then(ollama.Embed(ollama.EmbedInput{
Model: "nomic-embed-text",
Input: core.Output("input.query"),
}).As("query-embedding")).
// Search vector store
Then(qdrant.Search(qdrant.SearchInput{
Collection: "documents",
Vector: core.Output("query-embedding.Embeddings[0]"),
Limit: 5,
}).As("context")).
// Generate response with context
Then(ollama.Chat(ollama.ChatInput{
Model: "llama3.2",
Messages: []ollama.Message{
{Role: "system", Content: "Answer based on the provided context."},
{Role: "user", Content: core.Output("context.formatted_prompt")},
},
}).As("response")).
Build()Model Preparation Flow
flow := core.NewFlow("model-setup").
TriggeredBy(core.Manual("setup")).
Then(ollama.ListModels(ollama.ListModelsInput{}).As("available")).
When(func(s *core.FlowState) bool {
models := core.Get[ollama.ListModelsOutput](s, "available")
for _, m := range models.Models {
if m.Name == "llama3.2" {
return false // Model already exists
}
}
return true
}).
Then(ollama.PullModel(ollama.PullModelInput{
Name: "llama3.2",
})).
EndWhen().
Build()Complete Example
```go
package main

import (
    "time"

    "github.com/resolute/resolute/core"
    "github.com/resolute/resolute/providers/ollama"
    "github.com/resolute/resolute/providers/qdrant"
)

// fetchNewDocumentsNode, FetchDocsOutput, ProcessDocsActivity, and
// ProcessDocsInput are application-specific and assumed to be defined
// elsewhere in the package.

func main() {
    // Configure providers
    ollamaProvider := ollama.NewProvider(ollama.OllamaConfig{
        Host:    "http://localhost:11434",
        Timeout: 10 * time.Minute,
    })
    qdrantProvider := qdrant.NewProvider(qdrant.QdrantConfig{
        Host: "localhost:6334",
    })

    // Document processing node
    processDocsNode := core.NewNode("process-docs", ProcessDocsActivity, ProcessDocsInput{})

    // Build embedding pipeline
    flow := core.NewFlow("document-embedder").
        TriggeredBy(core.Schedule("0 3 * * *")). // Daily at 03:00
        Then(fetchNewDocumentsNode.As("docs")).
        When(func(s *core.FlowState) bool {
            docs := core.Get[FetchDocsOutput](s, "docs")
            return len(docs.Documents) > 0 // Skip the rest when there is nothing new
        }).
        Then(processDocsNode.As("processed")).
        Then(ollama.EmbedBatch(ollama.EmbedBatchInput{
            Model:     "nomic-embed-text",
            Texts:     core.Output("processed.texts"),
            BatchSize: 32,
        }).As("embeddings")).
        Then(qdrant.Upsert(qdrant.UpsertInput{
            Collection: "documents",
            Points:     core.Output("embeddings.points"),
        })).
        EndWhen().
        Build()

    // Run worker
    err := core.NewWorker().
        WithConfig(core.WorkerConfig{
            TaskQueue: "embeddings",
        }).
        WithFlow(flow).
        WithProviders(ollamaProvider, qdrantProvider).
        Run()
    if err != nil {
        panic(err)
    }
}
```

See Also
- Qdrant Provider - Vector storage
- Embedding Pipeline Example - Complete example
- Rate Limiting - Managing inference load