Ready for whisper

2024-02-09 23:45:58 -08:00 · 2024-02-09 23:45:58 -08:00 · 375192afe6
parent 6a96670460
commit 375192afe6
2 changed files with 25 additions and 16 deletions
--- a/OS/01/start.sh
+++ b/OS/01/start.sh
@@ -26,10 +26,6 @@ SERVER_PORT=$(echo $SERVER_URL | grep -oE "[0-9]+")
 if [ -n "$SERVER_PORT" ]; then
    lsof -ti tcp:$SERVER_PORT | xargs kill
 fi
 DEVICE_PORT=$(echo $DEVICE_URL | grep -oE "[0-9]+")
 if [ -n "$DEVICE_PORT" ]; then
    lsof -ti tcp:$DEVICE_PORT | xargs kill
 fi
 ### START
--- a/OS/01/stt.py
+++ b/OS/01/stt.py
@@ -49,16 +49,29 @@ def stt_bytes(audio_bytes: bytearray, mime_type="audio/wav"):
        return stt_wav(wav_file_path)
 def stt_wav(wav_file_path: str):
    audio_file = open(wav_file_path, "rb")
    try:
        transcript = client.audio.transcriptions.create(
            model="whisper-1", 
            file=audio_file,
            response_format="text"
        )
    except openai.BadRequestError as e:
        print("openai.BadRequestError:", e)
        return None
-    print("Transcription result:", transcript)
+    if os.getenv('ALL_LOCAL') == 'False':
-    return transcript
+        audio_file = open(wav_file_path, "rb")
        try:
            transcript = client.audio.transcriptions.create(
                model="whisper-1", 
                file=audio_file,
                response_format="text"
            )
        except openai.BadRequestError as e:
            print("openai.BadRequestError:", e)
            return None
        print("Transcription result:", transcript)
        return transcript
    else:
        # Local whisper here, given `wav_file_path`
        pass
 def stt(input_data, mime_type="audio/wav"):
    if isinstance(input_data, str):
        return stt_wav(input_data)
    elif isinstance(input_data, bytearray):
        return stt_bytes(input_data, mime_type)
    else:
        raise ValueError("Input data should be either a path to a wav file (str) or audio bytes (bytearray)")