Make Voxtral the only transcription provider
This commit is contained in:
@@ -1,60 +1,4 @@
|
||||
services:
|
||||
qwen-audio:
|
||||
build:
|
||||
context: .
|
||||
dockerfile: vllm-audio.Dockerfile
|
||||
image: vllm-audio:local
|
||||
container_name: qwen-audio
|
||||
profiles:
|
||||
- qwen-audio
|
||||
- audio-compare
|
||||
restart: unless-stopped
|
||||
ipc: host
|
||||
runtime: nvidia
|
||||
deploy:
|
||||
resources:
|
||||
reservations:
|
||||
devices:
|
||||
- driver: nvidia
|
||||
count: all
|
||||
capabilities: [gpu]
|
||||
environment:
|
||||
HUGGING_FACE_HUB_TOKEN: ${HF_TOKEN}
|
||||
VLLM_API_KEY: ${VLLM_API_KEY}
|
||||
HF_HOME: /cache
|
||||
volumes:
|
||||
- ./data/vllm-cache:/cache
|
||||
networks:
|
||||
- audio-models
|
||||
ports:
|
||||
- "10.2.3.5:8003:8000"
|
||||
command:
|
||||
- "--model"
|
||||
- "Qwen/Qwen2-Audio-7B-Instruct"
|
||||
- "--served-model-name"
|
||||
- "Qwen/Qwen2-Audio-7B-Instruct"
|
||||
- "--trust-remote-code"
|
||||
- "--host"
|
||||
- "0.0.0.0"
|
||||
- "--port"
|
||||
- "8000"
|
||||
- "--max-model-len"
|
||||
- "8192"
|
||||
- "--gpu-memory-utilization"
|
||||
- "0.25"
|
||||
- "--api-key"
|
||||
- "${VLLM_API_KEY}"
|
||||
- "--max-num-seqs"
|
||||
- "4"
|
||||
- "--max-num-batched-tokens"
|
||||
- "4096"
|
||||
healthcheck:
|
||||
test: ["CMD", "python3", "-c", "import urllib.request; urllib.request.urlopen('http://localhost:8000/health')"]
|
||||
interval: 30s
|
||||
timeout: 5s
|
||||
retries: 5
|
||||
start_period: 900s
|
||||
|
||||
voxtral-small:
|
||||
build:
|
||||
context: .
|
||||
@@ -63,7 +7,6 @@ services:
|
||||
container_name: voxtral-small
|
||||
profiles:
|
||||
- voxtral-small
|
||||
- audio-compare
|
||||
restart: unless-stopped
|
||||
ipc: host
|
||||
runtime: nvidia
|
||||
|
||||
@@ -1,20 +0,0 @@
|
||||
upstream whisperx_upstream {
|
||||
server whisperx-1:8000 max_fails=3 fail_timeout=30s;
|
||||
}
|
||||
|
||||
server {
|
||||
listen 80 default_server;
|
||||
client_max_body_size 200m;
|
||||
|
||||
location / {
|
||||
proxy_pass http://whisperx_upstream;
|
||||
proxy_set_header Host $host;
|
||||
proxy_set_header X-Real-IP $remote_addr;
|
||||
proxy_set_header X-Forwarded-For $proxy_add_x_forwarded_for;
|
||||
proxy_connect_timeout 30s;
|
||||
proxy_send_timeout 10m;
|
||||
proxy_read_timeout 10m;
|
||||
proxy_request_buffering off;
|
||||
proxy_buffering off;
|
||||
}
|
||||
}
|
||||
Reference in New Issue
Block a user