We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent 01dffe6 · commit abc5d30 · Copy full SHA for abc5d30
api.py
@@ -10,6 +10,8 @@
10
import torchaudio
11
from model import SenseVoiceSmall
12
from funasr.utils.postprocess_utils import rich_transcription_postprocess
13
+from io import BytesIO
14
+
15
16
class Language(str, Enum):
17
auto = "auto"
@@ -49,9 +51,11 @@ async def turn_audio_to_text(files: Annotated[List[bytes], File(description="wav
49
51
audios = []
50
52
audio_fs = 0
53
for file in files:
- data_or_path_or_list, audio_fs = torchaudio.load(file)
54
+ file_io = BytesIO(file)
55
+ data_or_path_or_list, audio_fs = torchaudio.load(file_io)
56
data_or_path_or_list = data_or_path_or_list.mean(0)
57
audios.append(data_or_path_or_list)
58
+ file_io.close()
59
if lang == "":
60
lang = "auto"
61
if keys == "":
0 commit comments