fix: handle processor.decode returning a list of strings

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>
2026-05-29 03:00:09 +08:00
parent cf18335235
commit 843ec534d1
1 changed files with 2 additions and 1 deletions
@@ -27,7 +27,8 @@ def transcribe_audio(processor, model, audio, language="en"):
     inputs = processor(audio, sampling_rate=SAMPLE_RATE, return_tensors="pt", language=language)
     inputs.to(model.device, dtype=model.dtype)
     outputs = model.generate(**inputs, max_new_tokens=256)
-    return processor.decode(outputs, skip_special_tokens=True)
+    texts = processor.decode(outputs, skip_special_tokens=True)
+    return " ".join(texts) if isinstance(texts, list) else texts
 def record_audio(duration):