Changes:
- drizzle/schema.ts: added llmProviders table (AES-256-GCM encrypted API keys)
- drizzle/0004_llm_providers.sql: migration for llmProviders
- server/providers.ts: full CRUD + AES-256-GCM encrypt/decrypt + seedDefaultProvider
- server/routers.ts: replaced hardcoded config.providers with DB-backed providers router; added providers.list/create/update/delete/activate tRPC endpoints
- server/seed.ts: calls seedDefaultProvider() on startup to seed from env if table empty
- server/_core/index.ts: added POST /api/orchestrator/stream SSE proxy route to Go Gateway
- gateway/internal/llm/client.go: added ChatStream (SSE) + UpdateCredentials
- gateway/internal/orchestrator/orchestrator.go: added ChatWithEvents (tool-call callbacks)
- gateway/internal/api/handlers.go: added OrchestratorStream (SSE) + ProvidersReload endpoints
- gateway/internal/db/db.go: added GetActiveProvider from llmProviders table
- gateway/cmd/gateway/main.go: registered /api/orchestrator/stream + /api/providers/reload routes
- client/src/pages/Chat.tsx: full rebuild — 3-panel layout (left: conversation list, centre: messages with SSE streaming + markdown, right: live tool-call console)
- client/src/pages/Settings.tsx: full rebuild — DB-backed provider CRUD (add/edit/activate/delete), no hardcoded keys, key shown masked from DB hint
284 lines
7.1 KiB
Go
284 lines
7.1 KiB
Go
// Package llm provides an OpenAI-compatible client for the Ollama Cloud API.
|
|
package llm
|
|
|
|
import (
|
|
"bufio"
|
|
"bytes"
|
|
"context"
|
|
"encoding/json"
|
|
"fmt"
|
|
"io"
|
|
"net/http"
|
|
"strings"
|
|
"time"
|
|
)
|
|
|
|
// ─── Types ────────────────────────────────────────────────────────────────────
|
|
|
|
type Message struct {
|
|
Role string `json:"role"`
|
|
Content string `json:"content"`
|
|
ToolCallID string `json:"tool_call_id,omitempty"`
|
|
Name string `json:"name,omitempty"`
|
|
ToolCalls []ToolCall `json:"tool_calls,omitempty"`
|
|
}
|
|
|
|
type ToolCall struct {
|
|
ID string `json:"id"`
|
|
Type string `json:"type"`
|
|
Function ToolCallFunction `json:"function"`
|
|
}
|
|
|
|
// ToolCallFunction is the function part of a ToolCall: the function name and
// its arguments. Arguments is kept as a raw string and is not parsed by this
// type.
type ToolCallFunction struct {
	Name      string `json:"name"`
	Arguments string `json:"arguments"`
}
|
|
|
|
type Tool struct {
|
|
Type string `json:"type"`
|
|
Function ToolFunction `json:"function"`
|
|
}
|
|
|
|
// ToolFunction is the function definition carried by a Tool: its name, a
// description, and a free-form parameters object. All three fields are always
// emitted in the JSON encoding (a nil Parameters map encodes as null).
type ToolFunction struct {
	Name        string         `json:"name"`
	Description string         `json:"description"`
	Parameters  map[string]any `json:"parameters"`
}
|
|
|
|
type ChatRequest struct {
|
|
Model string `json:"model"`
|
|
Messages []Message `json:"messages"`
|
|
Stream bool `json:"stream"`
|
|
Temperature *float64 `json:"temperature,omitempty"`
|
|
MaxTokens *int `json:"max_tokens,omitempty"`
|
|
Tools []Tool `json:"tools,omitempty"`
|
|
ToolChoice string `json:"tool_choice,omitempty"`
|
|
}
|
|
|
|
type ChatChoice struct {
|
|
Index int `json:"index"`
|
|
Message Message `json:"message"`
|
|
FinishReason string `json:"finish_reason"`
|
|
}
|
|
|
|
// Usage holds the token counters reported in a ChatResponse.
type Usage struct {
	PromptTokens     int `json:"prompt_tokens"`
	CompletionTokens int `json:"completion_tokens"`
	TotalTokens      int `json:"total_tokens"`
}
|
|
|
|
type ChatResponse struct {
|
|
ID string `json:"id"`
|
|
Object string `json:"object"`
|
|
Created int64 `json:"created"`
|
|
Model string `json:"model"`
|
|
Choices []ChatChoice `json:"choices"`
|
|
Usage *Usage `json:"usage,omitempty"`
|
|
}
|
|
|
|
// Model is one entry of ModelsResponse.Data as returned by the /models
// endpoint.
type Model struct {
	ID      string `json:"id"`
	Object  string `json:"object"`
	Created int64  `json:"created"`
	OwnedBy string `json:"owned_by"`
}
|
|
|
|
type ModelsResponse struct {
|
|
Object string `json:"object"`
|
|
Data []Model `json:"data"`
|
|
}
|
|
|
|
// ─── Client ───────────────────────────────────────────────────────────────────
|
|
|
|
// Client talks to an OpenAI-compatible HTTP API.
//
// baseURL is the API root that endpoint paths such as "/models" and
// "/chat/completions" are appended to, apiKey is sent as a Bearer token when
// non-empty, and httpClient performs the non-streaming requests. Construct a
// Client with NewClient so that httpClient is populated.
type Client struct {
	baseURL    string
	apiKey     string
	httpClient *http.Client
}
|
|
|
|
func NewClient(baseURL, apiKey string) *Client {
|
|
return &Client{
|
|
baseURL: strings.TrimRight(baseURL, "/"),
|
|
apiKey: apiKey,
|
|
httpClient: &http.Client{
|
|
Timeout: 180 * time.Second,
|
|
},
|
|
}
|
|
}
|
|
|
|
// UpdateCredentials updates the LLM client's base URL and API key at runtime.
|
|
// Called when the active provider is changed via the Settings UI.
|
|
func (c *Client) UpdateCredentials(baseURL, apiKey string) {
|
|
c.baseURL = strings.TrimRight(baseURL, "/")
|
|
c.apiKey = apiKey
|
|
}
|
|
|
|
func (c *Client) headers() map[string]string {
|
|
h := map[string]string{
|
|
"Content-Type": "application/json",
|
|
}
|
|
if c.apiKey != "" {
|
|
h["Authorization"] = "Bearer " + c.apiKey
|
|
}
|
|
return h
|
|
}
|
|
|
|
// Health checks if the Ollama API is reachable.
|
|
func (c *Client) Health(ctx context.Context) (bool, int64, error) {
|
|
start := time.Now()
|
|
req, err := http.NewRequestWithContext(ctx, http.MethodGet, c.baseURL+"/models", nil)
|
|
if err != nil {
|
|
return false, 0, err
|
|
}
|
|
for k, v := range c.headers() {
|
|
req.Header.Set(k, v)
|
|
}
|
|
resp, err := c.httpClient.Do(req)
|
|
latency := time.Since(start).Milliseconds()
|
|
if err != nil {
|
|
return false, latency, err
|
|
}
|
|
defer resp.Body.Close()
|
|
return resp.StatusCode == http.StatusOK, latency, nil
|
|
}
|
|
|
|
// ListModels returns available models.
|
|
func (c *Client) ListModels(ctx context.Context) (*ModelsResponse, error) {
|
|
req, err := http.NewRequestWithContext(ctx, http.MethodGet, c.baseURL+"/models", nil)
|
|
if err != nil {
|
|
return nil, err
|
|
}
|
|
for k, v := range c.headers() {
|
|
req.Header.Set(k, v)
|
|
}
|
|
resp, err := c.httpClient.Do(req)
|
|
if err != nil {
|
|
return nil, err
|
|
}
|
|
defer resp.Body.Close()
|
|
if resp.StatusCode != http.StatusOK {
|
|
body, _ := io.ReadAll(resp.Body)
|
|
return nil, fmt.Errorf("ollama API error (%d): %s", resp.StatusCode, string(body))
|
|
}
|
|
var result ModelsResponse
|
|
if err := json.NewDecoder(resp.Body).Decode(&result); err != nil {
|
|
return nil, err
|
|
}
|
|
return &result, nil
|
|
}
|
|
|
|
// ChatStream sends a streaming chat completion request (SSE).
|
|
// It calls the callback for each chunk received.
|
|
func (c *Client) ChatStream(ctx context.Context, req ChatRequest, onChunk func(delta string, done bool)) error {
|
|
req.Stream = true
|
|
|
|
body, err := json.Marshal(req)
|
|
if err != nil {
|
|
return err
|
|
}
|
|
|
|
httpReq, err := http.NewRequestWithContext(ctx, http.MethodPost,
|
|
c.baseURL+"/chat/completions", bytes.NewReader(body))
|
|
if err != nil {
|
|
return err
|
|
}
|
|
for k, v := range c.headers() {
|
|
httpReq.Header.Set(k, v)
|
|
}
|
|
httpReq.Header.Set("Accept", "text/event-stream")
|
|
|
|
// Use a client without timeout for streaming
|
|
streamClient := &http.Client{Timeout: 0}
|
|
resp, err := streamClient.Do(httpReq)
|
|
if err != nil {
|
|
return err
|
|
}
|
|
defer resp.Body.Close()
|
|
|
|
if resp.StatusCode != http.StatusOK {
|
|
respBody, _ := io.ReadAll(resp.Body)
|
|
return fmt.Errorf("ollama stream API error (%d): %s", resp.StatusCode, string(respBody))
|
|
}
|
|
|
|
// Parse SSE stream
|
|
scanner := bufio.NewScanner(resp.Body)
|
|
for scanner.Scan() {
|
|
select {
|
|
case <-ctx.Done():
|
|
return ctx.Err()
|
|
default:
|
|
}
|
|
|
|
line := scanner.Text()
|
|
if !strings.HasPrefix(line, "data: ") {
|
|
continue
|
|
}
|
|
data := strings.TrimPrefix(line, "data: ")
|
|
if data == "[DONE]" {
|
|
onChunk("", true)
|
|
return nil
|
|
}
|
|
|
|
var chunk struct {
|
|
Choices []struct {
|
|
Delta struct {
|
|
Content string `json:"content"`
|
|
} `json:"delta"`
|
|
FinishReason *string `json:"finish_reason"`
|
|
} `json:"choices"`
|
|
}
|
|
if err := json.Unmarshal([]byte(data), &chunk); err != nil {
|
|
continue
|
|
}
|
|
if len(chunk.Choices) > 0 {
|
|
delta := chunk.Choices[0].Delta.Content
|
|
if delta != "" {
|
|
onChunk(delta, false)
|
|
}
|
|
if chunk.Choices[0].FinishReason != nil && *chunk.Choices[0].FinishReason == "stop" {
|
|
onChunk("", true)
|
|
return nil
|
|
}
|
|
}
|
|
}
|
|
if err := scanner.Err(); err != nil {
|
|
return err
|
|
}
|
|
onChunk("", true)
|
|
return nil
|
|
}
|
|
func (c *Client) Chat(ctx context.Context, req ChatRequest) (*ChatResponse, error) {
|
|
req.Stream = false
|
|
|
|
body, err := json.Marshal(req)
|
|
if err != nil {
|
|
return nil, err
|
|
}
|
|
|
|
httpReq, err := http.NewRequestWithContext(ctx, http.MethodPost,
|
|
c.baseURL+"/chat/completions", bytes.NewReader(body))
|
|
if err != nil {
|
|
return nil, err
|
|
}
|
|
for k, v := range c.headers() {
|
|
httpReq.Header.Set(k, v)
|
|
}
|
|
|
|
resp, err := c.httpClient.Do(httpReq)
|
|
if err != nil {
|
|
return nil, err
|
|
}
|
|
defer resp.Body.Close()
|
|
|
|
if resp.StatusCode != http.StatusOK {
|
|
respBody, _ := io.ReadAll(resp.Body)
|
|
return nil, fmt.Errorf("ollama chat API error (%d): %s", resp.StatusCode, string(respBody))
|
|
}
|
|
|
|
var result ChatResponse
|
|
if err := json.NewDecoder(resp.Body).Decode(&result); err != nil {
|
|
return nil, err
|
|
}
|
|
return &result, nil
|
|
}
|