|
|
@ -49,6 +49,8 @@ def stt_bytes(audio_bytes: bytearray, mime_type="audio/wav"):
|
|
|
|
return stt_wav(wav_file_path)
|
|
|
|
return stt_wav(wav_file_path)
|
|
|
|
|
|
|
|
|
|
|
|
def stt_wav(wav_file_path: str):
|
|
|
|
def stt_wav(wav_file_path: str):
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
if os.getenv('ALL_LOCAL') == 'False':
|
|
|
|
audio_file = open(wav_file_path, "rb")
|
|
|
|
audio_file = open(wav_file_path, "rb")
|
|
|
|
try:
|
|
|
|
try:
|
|
|
|
transcript = client.audio.transcriptions.create(
|
|
|
|
transcript = client.audio.transcriptions.create(
|
|
|
@ -62,3 +64,14 @@ def stt_wav(wav_file_path: str):
|
|
|
|
|
|
|
|
|
|
|
|
print("Transcription result:", transcript)
|
|
|
|
print("Transcription result:", transcript)
|
|
|
|
return transcript
|
|
|
|
return transcript
|
|
|
|
|
|
|
|
else:
|
|
|
|
|
|
|
|
# Local whisper here, given `wav_file_path`
|
|
|
|
|
|
|
|
pass
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
def stt(input_data, mime_type="audio/wav"):
    """Transcribe speech given either a WAV file path or raw audio bytes.

    Dispatches on the runtime type of ``input_data``:

    * ``str`` -- treated as a path to a wav file and passed to ``stt_wav``.
    * ``bytearray`` -- treated as audio bytes and passed to ``stt_bytes``
      together with ``mime_type``.

    Args:
        input_data: Path to a wav file (``str``) or audio bytes
            (``bytearray``). Immutable ``bytes`` objects are not accepted.
        mime_type: Forwarded to ``stt_bytes`` for ``bytearray`` input; it is
            not used when ``input_data`` is a ``str``.

    Returns:
        Whatever the selected helper (``stt_wav`` or ``stt_bytes``) returns.

    Raises:
        ValueError: If ``input_data`` is neither a ``str`` nor a
            ``bytearray``.
    """
    # Guard clauses: each supported type returns immediately, so reaching the
    # end of the function means the input type is unsupported.
    if isinstance(input_data, str):
        return stt_wav(input_data)

    if isinstance(input_data, bytearray):
        return stt_bytes(input_data, mime_type)

    raise ValueError("Input data should be either a path to a wav file (str) or audio bytes (bytearray)")
|