Ready for whisper

pull/11/head
killian 11 months ago
parent 6a96670460
commit 375192afe6

@ -26,10 +26,6 @@ SERVER_PORT=$(echo $SERVER_URL | grep -oE "[0-9]+")
if [ -n "$SERVER_PORT" ]; then
lsof -ti tcp:$SERVER_PORT | xargs kill
fi
DEVICE_PORT=$(echo $DEVICE_URL | grep -oE "[0-9]+")
if [ -n "$DEVICE_PORT" ]; then
lsof -ti tcp:$DEVICE_PORT | xargs kill
fi
### START

@ -49,16 +49,29 @@ def stt_bytes(audio_bytes: bytearray, mime_type="audio/wav"):
return stt_wav(wav_file_path)
def stt_wav(wav_file_path: str):
audio_file = open(wav_file_path, "rb")
try:
transcript = client.audio.transcriptions.create(
model="whisper-1",
file=audio_file,
response_format="text"
)
except openai.BadRequestError as e:
print("openai.BadRequestError:", e)
return None
print("Transcription result:", transcript)
return transcript
if os.getenv('ALL_LOCAL') == 'False':
audio_file = open(wav_file_path, "rb")
try:
transcript = client.audio.transcriptions.create(
model="whisper-1",
file=audio_file,
response_format="text"
)
except openai.BadRequestError as e:
print("openai.BadRequestError:", e)
return None
print("Transcription result:", transcript)
return transcript
else:
# Local whisper here, given `wav_file_path`
pass
def stt(input_data, mime_type="audio/wav"):
if isinstance(input_data, str):
return stt_wav(input_data)
elif isinstance(input_data, bytearray):
return stt_bytes(input_data, mime_type)
else:
raise ValueError("Input data should be either a path to a wav file (str) or audio bytes (bytearray)")
Loading…
Cancel
Save