feat: tts

2024-02-04 00:40:58 -08:00 · 2024-02-04 00:40:58 -08:00 · bb8da14e8a
parent 0fa932cb06
commit bb8da14e8a
1 changed files with 32 additions and 8 deletions
--- a/OS/01/assistant/tts.py
+++ b/OS/01/assistant/tts.py
@ -3,16 +3,40 @@ Defines a function which takes text and returns a path to an audio file.
 """

 from openai import OpenAI
+import pydub
+import pydub.playback
+import tempfile
+import os
+from datetime import datetime
+from io import BytesIO

 client = OpenAI()
+chunk_size = 1024
+read_chunk_size = 4096

-def tts(text, file_path):
+def tts(text):

-    response = client.with_streaming_response.audio.speech.create(
-        model="tts-1",
-        voice="alloy",
-        input=text,
-    )
+    temp_dir = tempfile.gettempdir()
+    output_path = os.path.join(temp_dir, f"output_{datetime.now().strftime('%Y%m%d%H%M%S%f')}.mp3")

-    response.stream_to_file(file_path)
-    
+    try:
+        with (
+            client.with_streaming_response.audio.speech.create(
+            model="tts-1",
+            voice="alloy",
+            input=text,
+            response_format='mp3',
+            speed=1.2)
+        ) as response:
+            with open(output_path, 'wb') as f:
+                for chunk in response.iter_bytes(chunk_size):                    
+                    f.write(chunk)
+        
+        with open(output_path, 'rb') as f:
+            byte_chunk = f.read(read_chunk_size)
+            yield byte_chunk
+
+        seg = pydub.AudioSegment.from_mp3(output_path)
+        pydub.playback.play(seg)
+    finally:
+        os.remove(output_path)