fix: handle processor.decode returning a list of strings
Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>
This commit is contained in:
+2
-1
@@ -27,7 +27,8 @@ def transcribe_audio(processor, model, audio, language="en"):
|
|||||||
inputs = processor(audio, sampling_rate=SAMPLE_RATE, return_tensors="pt", language=language)
|
inputs = processor(audio, sampling_rate=SAMPLE_RATE, return_tensors="pt", language=language)
|
||||||
inputs.to(model.device, dtype=model.dtype)
|
inputs.to(model.device, dtype=model.dtype)
|
||||||
outputs = model.generate(**inputs, max_new_tokens=256)
|
outputs = model.generate(**inputs, max_new_tokens=256)
|
||||||
return processor.decode(outputs, skip_special_tokens=True)
|
texts = processor.decode(outputs, skip_special_tokens=True)
|
||||||
|
return " ".join(texts) if isinstance(texts, list) else texts
|
||||||
|
|
||||||
|
|
||||||
def record_audio(duration):
|
def record_audio(duration):
|
||||||
|
|||||||
Reference in New Issue
Block a user