Add AI provider configuration

2026-06-08 13:42:18 +03:00
parent 0081e910ba
commit 0da278a45e
4 changed files with 49 additions and 0 deletions
--- a/README.md
+++ b/README.md
@@ -41,9 +41,23 @@ service.
 - `HTTP_PORT`, default `8080`
 - `DATABASE_URL`, required
 - `MIGRATE_ON_START`, default `true`
 - `LLM_BASE_URL`, primary OpenAI-compatible LLM endpoint
 - `LLM_API_KEY`, primary LLM API key
 - `LLM_MODEL`, default `qwen2.5-14b`
 - `LLM_TIMEOUT`, default `5m`
 - `WHISPERX_URL`, WhisperX endpoint for transcription jobs
 - `OPENCLAW_URL`, optional OpenClaw gateway URL, used if we route LLM traffic
  through OpenClaw instead of calling vLLM directly
 ## Next integration step
 `telephony` should first mirror low-risk analysis jobs into this service while
 continuing local processing. Remote execution can then be enabled by feature
 flag per task type.
 ## OpenClaw note
 Current Portal services call the local AI server directly: vLLM for LLM tasks
 and WhisperX for transcription. OpenClaw is not required for the current
 `ai-service` queue deployment. It becomes useful if we want centralized model
 routing, provider fallback, request policy and cross-model gateway behavior.
--- a/internal/config/config.go
+++ b/internal/config/config.go
@@ -3,6 +3,7 @@ package config
 import (
 	"os"
 	"strconv"
 	"time"
 )
 type Config struct {
@@ -10,6 +11,13 @@ type Config struct {
 	HTTPPort       int
 	DatabaseURL    string
 	MigrateOnStart bool
 	LLMBaseURL  string
 	LLMAPIKey   string
 	LLMModel    string
 	LLMTimeout  time.Duration
 	WhisperXURL string
 	OpenClawURL string
 }
 func Load() Config {
@@ -18,6 +26,13 @@ func Load() Config {
 		HTTPPort:       envInt("HTTP_PORT", 8080),
 		DatabaseURL:    envString("DATABASE_URL", ""),
 		MigrateOnStart: envBool("MIGRATE_ON_START", true),
 		LLMBaseURL:  envString("LLM_BASE_URL", ""),
 		LLMAPIKey:   envString("LLM_API_KEY", ""),
 		LLMModel:    envString("LLM_MODEL", "qwen2.5-14b"),
 		LLMTimeout:  envDuration("LLM_TIMEOUT", 5*time.Minute),
 		WhisperXURL: envString("WHISPERX_URL", ""),
 		OpenClawURL: envString("OPENCLAW_URL", ""),
 	}
 }
@@ -51,3 +66,15 @@ func envBool(key string, fallback bool) bool {
 	}
 	return v
 }
 // envDuration reads the environment variable named key and parses it with
 // time.ParseDuration. It returns fallback when the variable is unset, empty,
 // or not a valid duration string; parse errors are not reported to the caller.
 func envDuration(key string, fallback time.Duration) time.Duration {
 	text, ok := os.LookupEnv(key)
 	if !ok || text == "" {
 		return fallback
 	}
 	if parsed, err := time.ParseDuration(text); err == nil {
 		return parsed
 	}
 	// Unparseable value: use the caller-supplied default.
 	return fallback
 }
--- a/k8s/configmap.yaml
+++ b/k8s/configmap.yaml
@@ -7,3 +7,10 @@ data:
  HTTP_HOST: "0.0.0.0"
  HTTP_PORT: "8080"
  MIGRATE_ON_START: "true"
  # Default direct AI endpoints. OpenClaw can replace LLM_BASE_URL later when
  # we decide to route model traffic through a gateway instead of direct vLLM.
  LLM_BASE_URL: "http://10.2.3.5:8002"
  LLM_MODEL: "qwen2.5-14b"
  LLM_TIMEOUT: "5m"
  WHISPERX_URL: "http://10.2.3.5:8001"
  OPENCLAW_URL: ""
--- a/k8s/secrets.yaml
+++ b/k8s/secrets.yaml
@@ -17,3 +17,4 @@ metadata:
 type: Opaque
 stringData:
  DATABASE_URL: "postgres://ai_service:ai_service@postgres:5432/ai_service?sslmode=disable"
  LLM_API_KEY: "sk-111f838ccec43406e078cd9094b6797307cb895236179f32"