Ready for whisper
This commit is contained in:
parent
6a96670460
commit
375192afe6
|
@ -26,10 +26,6 @@ SERVER_PORT=$(echo $SERVER_URL | grep -oE "[0-9]+")
|
||||||
if [ -n "$SERVER_PORT" ]; then
|
if [ -n "$SERVER_PORT" ]; then
|
||||||
lsof -ti tcp:$SERVER_PORT | xargs kill
|
lsof -ti tcp:$SERVER_PORT | xargs kill
|
||||||
fi
|
fi
|
||||||
DEVICE_PORT=$(echo $DEVICE_URL | grep -oE "[0-9]+")
|
|
||||||
if [ -n "$DEVICE_PORT" ]; then
|
|
||||||
lsof -ti tcp:$DEVICE_PORT | xargs kill
|
|
||||||
fi
|
|
||||||
|
|
||||||
### START
|
### START
|
||||||
|
|
||||||
|
|
37
OS/01/stt.py
37
OS/01/stt.py
|
@ -49,16 +49,29 @@ def stt_bytes(audio_bytes: bytearray, mime_type="audio/wav"):
|
||||||
return stt_wav(wav_file_path)
|
return stt_wav(wav_file_path)
|
||||||
|
|
||||||
def stt_wav(wav_file_path: str):
|
def stt_wav(wav_file_path: str):
|
||||||
audio_file = open(wav_file_path, "rb")
|
|
||||||
try:
|
|
||||||
transcript = client.audio.transcriptions.create(
|
|
||||||
model="whisper-1",
|
|
||||||
file=audio_file,
|
|
||||||
response_format="text"
|
|
||||||
)
|
|
||||||
except openai.BadRequestError as e:
|
|
||||||
print("openai.BadRequestError:", e)
|
|
||||||
return None
|
|
||||||
|
|
||||||
print("Transcription result:", transcript)
|
if os.getenv('ALL_LOCAL') == 'False':
|
||||||
return transcript
|
audio_file = open(wav_file_path, "rb")
|
||||||
|
try:
|
||||||
|
transcript = client.audio.transcriptions.create(
|
||||||
|
model="whisper-1",
|
||||||
|
file=audio_file,
|
||||||
|
response_format="text"
|
||||||
|
)
|
||||||
|
except openai.BadRequestError as e:
|
||||||
|
print("openai.BadRequestError:", e)
|
||||||
|
return None
|
||||||
|
|
||||||
|
print("Transcription result:", transcript)
|
||||||
|
return transcript
|
||||||
|
else:
|
||||||
|
# Local whisper here, given `wav_file_path`
|
||||||
|
pass
|
||||||
|
|
||||||
|
def stt(input_data, mime_type="audio/wav"):
|
||||||
|
if isinstance(input_data, str):
|
||||||
|
return stt_wav(input_data)
|
||||||
|
elif isinstance(input_data, bytearray):
|
||||||
|
return stt_bytes(input_data, mime_type)
|
||||||
|
else:
|
||||||
|
raise ValueError("Input data should be either a path to a wav file (str) or audio bytes (bytearray)")
|
Loading…
Reference in New Issue