Tune audio model GPU profiles

This commit is contained in:
Grendgi
2026-06-09 12:52:13 +03:00
parent f49ba7abd5
commit cac8d89e64

View File

@@ -36,7 +36,7 @@ services:
- "--max-model-len" - "--max-model-len"
- "8192" - "8192"
- "--gpu-memory-utilization" - "--gpu-memory-utilization"
- "0.45" - "0.25"
- "--api-key" - "--api-key"
- "${VLLM_API_KEY}" - "${VLLM_API_KEY}"
- "--max-num-seqs" - "--max-num-seqs"
@@ -95,7 +95,7 @@ services:
- "--max-model-len" - "--max-model-len"
- "32768" - "32768"
- "--gpu-memory-utilization" - "--gpu-memory-utilization"
- "0.72" - "0.62"
- "--api-key" - "--api-key"
- "${VLLM_API_KEY}" - "${VLLM_API_KEY}"
- "--max-num-seqs" - "--max-num-seqs"