From ae1802dab98287a54367f6c981858a20cb14d17d Mon Sep 17 00:00:00 2001 From: Grendgi Date: Wed, 10 Jun 2026 11:30:08 +0300 Subject: [PATCH] Stop sending prompt to Whisper transcription --- internal/config/config.go | 2 +- internal/transcription/client.go | 3 --- internal/transcription/client_test.go | 6 +++++- 3 files changed, 6 insertions(+), 5 deletions(-) diff --git a/internal/config/config.go b/internal/config/config.go index b991372..bc720fa 100644 --- a/internal/config/config.go +++ b/internal/config/config.go @@ -133,7 +133,7 @@ func envCSVDefault(key string, fallback []string) []string { } func defaultAudioPrompt() string { - return "Расшифруй речь из аудио максимально точно. Сохрани русский язык, имена, телефоны, суммы и смысловые паузы. Не добавляй комментарии, анализ, Markdown или JSON. Верни только чистый текст расшифровки." + return "" } func hostname() string { diff --git a/internal/transcription/client.go b/internal/transcription/client.go index dcba17d..82e9a13 100644 --- a/internal/transcription/client.go +++ b/internal/transcription/client.go @@ -112,9 +112,6 @@ func New(baseURL string, timeout time.Duration, ffmpegPath string, leadSilence t func NewWithOptions(opts Options) *Client { audioPrompt := strings.TrimSpace(opts.AudioPrompt) - if audioPrompt == "" { - audioPrompt = "Transcribe the audio exactly. Return only the transcript text." - } provider := buildAudioProvider(opts, audioPrompt) if provider.BaseURL == "" { return nil diff --git a/internal/transcription/client_test.go b/internal/transcription/client_test.go index 21ab7f1..9a2f6d0 100644 --- a/internal/transcription/client_test.go +++ b/internal/transcription/client_test.go @@ -28,7 +28,7 @@ func TestWhisperUsesAudioTranscriptionsEndpoint(t *testing.T) { })) defer audioSrv.Close() - var gotPath, gotModel, gotResponseFormat string + var gotPath, gotModel, gotResponseFormat, gotPrompt string providerSrv := httptest.NewServer(http.HandlerFunc(func(w http.ResponseWriter, r *http.Request) { gotPath = r.URL.Path if err := r.ParseMultipartForm(16 << 20); err != nil { @@ -36,6 +36,7 @@ func TestWhisperUsesAudioTranscriptionsEndpoint(t *testing.T) { } gotModel = r.FormValue("model") gotResponseFormat = r.FormValue("response_format") + gotPrompt = r.FormValue("prompt") if _, _, err := r.FormFile("file"); err != nil { t.Fatalf("FormFile: %v", err) } @@ -69,6 +70,9 @@ func TestWhisperUsesAudioTranscriptionsEndpoint(t *testing.T) { if gotResponseFormat != "json" { t.Fatalf("response_format = %q, want json", gotResponseFormat) } + if gotPrompt != "" { + t.Fatalf("prompt = %q, want empty", gotPrompt) + } if len(got.Segments) != 2 || got.Segments[0].Text != "Алло, тест." || got.Segments[1].Start != 1.2 { t.Fatalf("segments = %#v", got.Segments) }