# 01/OS/01/user/user.py

import asyncio
import threading
import websockets
import os
import pyaudio
from queue import Queue
from pynput import keyboard
import json
import pydub
import ast

# --- Audio capture settings ---
CHUNK = 1024  # Frames per microphone read; also the byte count used when re-reading the WAV file
FORMAT = pyaudio.paInt16  # Signed 16-bit samples
CHANNELS = 1  # Single (mono) channel
RATE = 44100  # Samples per second
RECORDING = False  # True while a recording should keep running
SPACEBAR_PRESSED = False  # True while the spacebar is considered held down

# --- WebSocket endpoint ---
# The port is taken from the ASSISTANT_PORT environment variable, defaulting to 8000.
PORT = os.environ.get('ASSISTANT_PORT', '8000')
WS_URL = f"ws://localhost:{PORT}/user"

# Shared PyAudio instance used to open input streams
p = pyaudio.PyAudio()

# Outgoing messages: filled by the recorder, drained by the WebSocket loop
data_queue = Queue()

import wave
import tempfile
from datetime import datetime


def record_audio():
    """Record microphone audio while RECORDING is set, then queue it for sending.

    Frames are read from the input stream in CHUNK-sized reads and written to
    a temporary WAV file until the module-level ``RECORDING`` flag becomes
    false. The finished file is then read back in CHUNK-byte pieces; each
    piece is put on ``data_queue`` as an audio message whose ``content`` is
    ``str()`` of the raw bytes, followed by a final message with ``"end": True``.

    The input stream and the WAV writer are released even if a read or write
    fails, and the temporary file is removed once its contents are queued
    (or the recording failed), so repeated recordings do not pile up files
    in the temp directory.
    """
    # Timestamped name inside the system temp directory
    temp_dir = tempfile.gettempdir()
    wav_path = os.path.join(temp_dir, f"audio_{datetime.now().strftime('%Y%m%d%H%M%S%f')}.wav")

    stream = p.open(format=FORMAT, channels=CHANNELS, rate=RATE, input=True, frames_per_buffer=CHUNK)
    print("Recording started...")

    try:
        try:
            # The context manager closes the WAV writer (finalising the header)
            # even if reading from the stream raises.
            with wave.open(wav_path, 'wb') as wav_file:
                wav_file.setnchannels(CHANNELS)
                wav_file.setsampwidth(p.get_sample_size(FORMAT))
                wav_file.setframerate(RATE)

                # RECORDING is cleared by toggle_recording() on key release.
                while RECORDING:
                    data = stream.read(CHUNK, exception_on_overflow=False)
                    wav_file.writeframes(data)
        finally:
            # Always give the audio device back, whatever happened above.
            stream.stop_stream()
            stream.close()
        print("Recording stopped.")

        # After recording is done, read and stream the audio file in chunks
        with open(wav_path, 'rb') as audio_file:
            for byte_data in iter(lambda: audio_file.read(CHUNK), b""):
                data_queue.put({"role": "user", "type": "audio", "format": "audio/wav", "content": str(byte_data)})

        data_queue.put({"role": "user", "type": "audio", "format": "audio/wav", "end": True})
    finally:
        # The file is only an intermediate buffer; do not leave it behind.
        try:
            os.remove(wav_path)
        except FileNotFoundError:
            pass  # wave.open() failed before the file was created
        except OSError as e:
            print(f"Could not remove temporary recording {wav_path}: {e}")


def toggle_recording(state):
    """Update the recording flags for a spacebar press or release.

    A truthy ``state`` means the key went down, a falsy one means it came up.
    A press only has an effect when the key is not already marked as held:
    it marks the key as held and, unless a recording is already running,
    sets ``RECORDING`` and starts ``record_audio`` on a new thread. A release
    only has an effect when the key is marked as held: it clears both flags,
    which lets the recording loop finish.
    """
    global RECORDING, SPACEBAR_PRESSED

    if state:
        if SPACEBAR_PRESSED:
            # Press reported while the key is already marked as held: ignore.
            return
        SPACEBAR_PRESSED = True
        if RECORDING:
            return
        RECORDING = True
        recorder = threading.Thread(target=record_audio)
        recorder.start()
        return

    if SPACEBAR_PRESSED:
        SPACEBAR_PRESSED = False
        RECORDING = False

def _play_mp3(audio_bytes):
    """Write MP3 bytes to a temporary file, decode them with pydub and play them (blocking)."""
    # ``import pydub`` alone is not guaranteed to load the ``playback``
    # submodule, so import the function explicitly.
    from pydub.playback import play

    with tempfile.NamedTemporaryFile(suffix=".mp3") as f:
        f.write(audio_bytes)
        f.flush()  # make sure the decoder sees the data when opening by name
        seg = pydub.AudioSegment.from_mp3(f.name)
        print("Playing received audio.")
        play(seg)


async def websocket_communication():
    """Exchange messages with the server over a WebSocket, reconnecting on failure.

    Runs forever. While connected it alternates between:

    * sending every message currently waiting in ``data_queue`` as JSON, and
    * waiting briefly for one incoming message.

    Incoming messages are parsed as JSON. For messages whose ``type`` is
    ``"audio"``: a ``start`` key resets the receive buffer, ``content`` is
    appended to it, and ``end`` plays the buffered data as MP3.

    Errors while handling a single message are reported and the loop goes on.
    Any other error (including a closed connection) drops the connection and
    a new one is attempted after one second.
    """
    loop = asyncio.get_running_loop()
    poll_interval = 0.05  # seconds to wait for a server message before re-checking the queue

    while True:
        try:
            async with websockets.connect(WS_URL) as websocket:

                print("Press the spacebar to start/stop recording. Press ESC to exit.")

                # Defined per connection so "content" arriving without a
                # preceding "start" cannot hit an unbound variable.
                audio_chunks = bytearray()

                while True:
                    # Send data from the queue to the server
                    while not data_queue.empty():
                        data = data_queue.get_nowait()
                        print(f"Sending data to the server: {data}")
                        await websocket.send(json.dumps(data))

                    # Wait for a message with a timeout: a bare recv() would
                    # block until the server speaks and starve the send loop.
                    # Connection errors raised here are deliberately NOT caught
                    # locally so the outer handler can reconnect.
                    try:
                        raw = await asyncio.wait_for(websocket.recv(), timeout=poll_interval)
                    except asyncio.TimeoutError:
                        continue

                    print(f"Received from server: {str(raw)[:100]}")

                    try:
                        # recv() yields text/bytes, not a dict; decode it first.
                        chunk = json.loads(raw)

                        if isinstance(chunk, dict) and chunk.get("type") == "audio":
                            print("Received audio data from server.")
                            if "start" in chunk:
                                print("Start of audio data received.")
                                audio_chunks = bytearray()
                            if "content" in chunk:
                                print("Audio content received.")
                                # NOTE(review): presumably the server encodes bytes the same
                                # way this client does (str() of a bytes object) - confirm.
                                # literal_eval only accepts Python literals, not arbitrary code.
                                audio_chunks.extend(bytes(ast.literal_eval(chunk["content"])))
                            if "end" in chunk:
                                print("End of audio data received.")
                                payload = bytes(audio_chunks)
                                audio_chunks = bytearray()
                                # Decoding and playback block; run them off the event
                                # loop so the connection stays serviced meanwhile.
                                await loop.run_in_executor(None, _play_mp3, payload)

                    except Exception as e:
                        # Best effort: one bad message must not end the session.
                        print(f"Error receiving data: {e}")
        except Exception as e:
            print(f"Websocket not ready, retrying... ({e})")
            await asyncio.sleep(1)


def on_press(key):
    """Keyboard-listener press callback: a spacebar press requests recording."""
    if key != keyboard.Key.space:
        return
    toggle_recording(True)

def on_release(key):
    """Keyboard-listener release callback.

    Releasing the spacebar ends the current recording; releasing ESC prints
    a message and terminates the process immediately via ``os._exit(0)``.
    """
    if key == keyboard.Key.esc:
        print("Exiting...")
        os._exit(0)

    if key == keyboard.Key.space:
        toggle_recording(False)

def main():
    """Start the WebSocket worker thread, then block on the keyboard listener.

    The WebSocket coroutine runs in its own event loop on a daemon thread.
    The calling thread waits on the keyboard listener and terminates the
    shared PyAudio instance once the listener has finished.
    """
    def run_websocket_loop():
        # Each call to asyncio.run() creates a fresh event loop for this thread.
        asyncio.run(websocket_communication())

    ws_thread = threading.Thread(target=run_websocket_loop, daemon=True)
    ws_thread.start()

    # Spacebar press/release drives recording; see on_press / on_release.
    listener = keyboard.Listener(on_press=on_press, on_release=on_release)
    with listener:
        print("In a moment, press the spacebar to start/stop recording. Press ESC to exit.")
        listener.join()

    p.terminate()


if __name__ == "__main__":
    main()