35 lines
1.0 KiB
YAML
35 lines
1.0 KiB
YAML
---
# ConfigMap `ai-service-config` in the `ai-service` namespace.
# Every value is a quoted string: ConfigMap `data` values must be strings, so
# ports, booleans and counts are quoted rather than left as bare YAML scalars.
apiVersion: v1
kind: ConfigMap
metadata:
  name: ai-service-config
  namespace: ai-service
data:
  # HTTP listener and startup settings.
  HTTP_HOST: "0.0.0.0"
  HTTP_PORT: "8080"
  MIGRATE_ON_START: "true"

  # Direct AI endpoints on the local AI server.
  # NOTE(review): every endpoint in this file targets the same address
  # (10.2.3.5) on a different port; update them together if the server moves.
  LLM_BASE_URL: "http://10.2.3.5:8002"
  LLM_MODEL: "qwen2.5-14b"
  LLM_TIMEOUT: "5m"
  TRANSCRIPTION_PROVIDERS: "voxtral-small"
  WHISPERX_URL: "http://10.2.3.5:8001"
  WHISPERX_TIMEOUT: "10m"
  WHISPERX_LEAD_SILENCE: "800ms"

  # Audio-LLM backends, expected to be exposed as OpenAI-compatible
  # chat-completions endpoints on the AI server.
  # VOXTRAL_BASE_URL is already set; QWEN_AUDIO_BASE_URL is still empty and
  # must be filled in once Qwen2-Audio is exposed.
  QWEN_AUDIO_BASE_URL: ""
  QWEN_AUDIO_MODEL: "Qwen/Qwen2-Audio-7B-Instruct"
  QWEN_AUDIO_TIMEOUT: "10m"
  VOXTRAL_BASE_URL: "http://10.2.3.5:8004"
  VOXTRAL_MODEL: "mistralai/Voxtral-Small-24B-2507"
  VOXTRAL_TIMEOUT: "10m"
  AUDIO_LLM_MAX_TOKENS: "4096"

  # Absolute path to the ffmpeg binary.
  # NOTE(review): presumably resolved inside the service container; confirm
  # the image ships ffmpeg at this location.
  FFMPEG_PATH: "/usr/bin/ffmpeg"

  # AI stats sidecar endpoint and its request timeout.
  AI_STATS_SIDECAR_URL: "http://10.2.3.5:9090"
  AI_STATS_TIMEOUT: "8s"

  # Background worker settings. The worker has its own HTTP listener on a
  # port (8081) distinct from HTTP_PORT (8080).
  WORKER_POLL_INTERVAL: "2s"
  WORKER_HTTP_HOST: "0.0.0.0"
  WORKER_HTTP_PORT: "8081"
  WORKER_CLAIM_LIMIT: "4"
  WORKER_LEASE_TIMEOUT: "15m"