From fbc876099050cba12706ba90135eb0b32d6525f6 Mon Sep 17 00:00:00 2001 From: Zohaib Rauf Date: Sat, 10 Feb 2024 22:21:47 -0800 Subject: [PATCH 1/5] Exposed the server with ngrok --- OS/01/.env.example | 5 +++++ OS/01/device.py | 10 +++++----- OS/01/requirements.txt | 3 ++- OS/01/server.py | 23 +++++++++++++++++++++++ OS/01/start.sh | 19 +++++++++++++------ 5 files changed, 48 insertions(+), 12 deletions(-) diff --git a/OS/01/.env.example b/OS/01/.env.example index 01f14df..444c447 100644 --- a/OS/01/.env.example +++ b/OS/01/.env.example @@ -14,9 +14,14 @@ WHISPER_MODEL_NAME="ggml-tiny.en.bin" PIPER_VOICE_URL="https://huggingface.co/rhasspy/piper-voices/resolve/main/en/en_US/lessac/medium/" PIPER_VOICE_NAME="en_US-lessac-medium.onnx" +# Expose through Ngrok +# Uncomment following line with your Ngrok auth token (https://dashboard.ngrok.com/get-started/your-authtoken) +#NGROK_AUTHTOKEN="" + # If SERVER_START, this is where we'll serve the server. # If DEVICE_START, this is where the device expects the server to be. SERVER_URL=ws://localhost:8000/ +SERVER_CONNECTION_URL=ws://localhost:8000/ # Comment if setting up through Ngrok SERVER_START=True DEVICE_START=True diff --git a/OS/01/device.py b/OS/01/device.py index d0c6687..3241532 100644 --- a/OS/01/device.py +++ b/OS/01/device.py @@ -38,11 +38,6 @@ RATE = 44100 # Sample rate RECORDING = False # Flag to control recording state SPACEBAR_PRESSED = False # Flag to track spacebar press state -# Configuration for WebSocket -WS_URL = os.getenv('SERVER_URL') -if not WS_URL: - raise ValueError("The environment variable SERVER_URL is not set. Please set it to proceed.") - # Specify OS current_platform = get_system_info() @@ -203,6 +198,11 @@ async def websocket_communication(WS_URL): if __name__ == "__main__": async def main(): + # Configuration for WebSocket + WS_URL = os.getenv('SERVER_CONNECTION_URL') + if not WS_URL: + raise ValueError("The environment variable SERVER_URL is not set. Please set it to proceed.") + # Start the WebSocket communication asyncio.create_task(websocket_communication(WS_URL)) diff --git a/OS/01/requirements.txt b/OS/01/requirements.txt index 6e70eb4..9fd1aa3 100644 --- a/OS/01/requirements.txt +++ b/OS/01/requirements.txt @@ -9,4 +9,5 @@ playsound python-dotenv ffmpeg-python textual -pydub \ No newline at end of file +pydub +ngrok \ No newline at end of file diff --git a/OS/01/server.py b/OS/01/server.py index cc6cbc9..341e27c 100644 --- a/OS/01/server.py +++ b/OS/01/server.py @@ -14,6 +14,7 @@ import threading import uvicorn import re from fastapi import FastAPI +from fastapi.responses import PlainTextResponse from threading import Thread from starlette.websockets import WebSocket from stt import stt_bytes @@ -24,6 +25,7 @@ import urllib.parse from utils.kernel import put_kernel_messages_into_queue from i import configure_interpreter from interpreter import interpreter +import ngrok from utils.logs import setup_logging from utils.logs import logger @@ -93,6 +95,10 @@ if os.getenv('CODE_RUNNER') == "device": # Configure interpreter interpreter = configure_interpreter(interpreter) +app.get("/ping") +async def ping(): + return PlainTextResponse("pong") + @app.websocket("/") async def websocket_endpoint(websocket: WebSocket): await websocket.accept() @@ -229,6 +235,17 @@ async def stream_or_play_tts(sentence): await to_device.put({"role": "assistant", "type": "audio", "format": "audio/mp3", "content": str(audio_bytes)}) await to_device.put({"role": "assistant", "type": "audio", "format": "audio/mp3", "end": True}) +async def setup_ngrok(ngrok_auth_token, parsed_url): + # Set up Ngrok + logger.info("Setting up Ngrok") + ngrok_listener = await ngrok.forward(f"{parsed_url.hostname}:{parsed_url.port}", authtoken=ngrok_auth_token, domain="project01.ngrok.dev") + ngrok_parsed_url = urllib.parse.urlparse(ngrok_listener.url()) + + # Setup SERVER_URL environment variable for device to use + connection_url = f"wss://{ngrok_parsed_url.hostname}/" + logger.info(f"Ngrok established at {ngrok_parsed_url.geturl()}") + logger.info(f"\033[1mSERVER_CONNECTION_URL should be set to \"{connection_url}\"\033[0m") + from uvicorn import Config, Server @@ -247,6 +264,12 @@ if __name__ == "__main__": if not server_url: raise ValueError("The environment variable SERVER_URL is not set. Please set it to proceed.") parsed_url = urllib.parse.urlparse(server_url) + + # Set up Ngrok + ngrok_auth_token = os.getenv('NGROK_AUTHTOKEN') + if ngrok_auth_token is not None: + await setup_ngrok(ngrok_auth_token, parsed_url) + logger.info("Starting `server.py`...") config = Config(app, host=parsed_url.hostname, port=parsed_url.port, lifespan='on') diff --git a/OS/01/start.sh b/OS/01/start.sh index 5327767..945ea25 100755 --- a/OS/01/start.sh +++ b/OS/01/start.sh @@ -63,6 +63,13 @@ fi start_device() { echo "Starting device..." + if [[ -n $NGROK_AUTHTOKEN ]]; then + echo "Waiting for Ngrok to setup" + sleep 7 + read -p "Enter the Ngrok URL: " ngrok_url + export SERVER_CONNECTION_URL=$ngrok_url + echo "SERVER_CONNECTION_URL set to $SERVER_CONNECTION_URL" + fi python device.py & DEVICE_PID=$! echo "Device started as process $DEVICE_PID" @@ -90,18 +97,18 @@ stop_processes() { # Trap SIGINT and SIGTERM to stop processes when the script is terminated trap stop_processes SIGINT SIGTERM -# DEVICE -# Start device if DEVICE_START is True -if [[ "$DEVICE_START" == "True" ]]; then - start_device -fi - # SERVER # Start server if SERVER_START is True if [[ "$SERVER_START" == "True" ]]; then start_server fi +# DEVICE +# Start device if DEVICE_START is True +if [[ "$DEVICE_START" == "True" ]]; then + start_device +fi + # Wait for device and server processes to exit wait $DEVICE_PID wait $SERVER_PID From be18ac2177de8fb53cf6ec23a90e1d2d48c8720f Mon Sep 17 00:00:00 2001 From: Zohaib Rauf Date: Sun, 11 Feb 2024 04:57:17 -0800 Subject: [PATCH 2/5] Fixed small issue with ping --- OS/01/.env.example | 5 +++-- OS/01/server.py | 2 +- 2 files changed, 4 insertions(+), 3 deletions(-) diff --git a/OS/01/.env.example b/OS/01/.env.example index 444c447..9202db6 100644 --- a/OS/01/.env.example +++ b/OS/01/.env.example @@ -16,12 +16,13 @@ PIPER_VOICE_NAME="en_US-lessac-medium.onnx" # Expose through Ngrok # Uncomment following line with your Ngrok auth token (https://dashboard.ngrok.com/get-started/your-authtoken) -#NGROK_AUTHTOKEN="" +#NGROK_AUTHTOKEN="AUTH TOKEN" # If SERVER_START, this is where we'll serve the server. # If DEVICE_START, this is where the device expects the server to be. SERVER_URL=ws://localhost:8000/ -SERVER_CONNECTION_URL=ws://localhost:8000/ # Comment if setting up through Ngrok +# If you are setting up Ngrok then either change the below to Ngrok URL if running device separately, else comment it +SERVER_CONNECTION_URL=ws://localhost:8000/ SERVER_START=True DEVICE_START=True diff --git a/OS/01/server.py b/OS/01/server.py index 341e27c..d891b65 100644 --- a/OS/01/server.py +++ b/OS/01/server.py @@ -95,7 +95,7 @@ if os.getenv('CODE_RUNNER') == "device": # Configure interpreter interpreter = configure_interpreter(interpreter) -app.get("/ping") +@app.get("/ping") async def ping(): return PlainTextResponse("pong") From e2d39a8c6d84de7374c8b303254792682caa1109 Mon Sep 17 00:00:00 2001 From: Zohaib Rauf Date: Sun, 11 Feb 2024 05:12:20 -0800 Subject: [PATCH 3/5] Fixed an issue from main --- OS/01/i.py | 1 - 1 file changed, 1 deletion(-) diff --git a/OS/01/i.py b/OS/01/i.py index 805bf86..5d0518c 100644 --- a/OS/01/i.py +++ b/OS/01/i.py @@ -9,7 +9,6 @@ from interpreter import OpenInterpreter def configure_interpreter(interpreter: OpenInterpreter): -def configure_interpreter(interpreter): ### SYSTEM MESSAGE # The system message is where most of the 01's behavior is configured. From 5df2baf787bb283732dc090b3439bde4b9d97fcf Mon Sep 17 00:00:00 2001 From: Zohaib Rauf Date: Sun, 11 Feb 2024 05:15:41 -0800 Subject: [PATCH 4/5] Removed domain from ngrok --- OS/01/server.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/OS/01/server.py b/OS/01/server.py index d891b65..6b07877 100644 --- a/OS/01/server.py +++ b/OS/01/server.py @@ -238,7 +238,7 @@ async def stream_or_play_tts(sentence): async def setup_ngrok(ngrok_auth_token, parsed_url): # Set up Ngrok logger.info("Setting up Ngrok") - ngrok_listener = await ngrok.forward(f"{parsed_url.hostname}:{parsed_url.port}", authtoken=ngrok_auth_token, domain="project01.ngrok.dev") + ngrok_listener = await ngrok.forward(f"{parsed_url.hostname}:{parsed_url.port}", authtoken=ngrok_auth_token) ngrok_parsed_url = urllib.parse.urlparse(ngrok_listener.url()) # Setup SERVER_URL environment variable for device to use From 724942e1b4d1dc7c89f863e26d81b5b83398891a Mon Sep 17 00:00:00 2001 From: Zohaib Rauf Date: Sun, 11 Feb 2024 05:32:43 -0800 Subject: [PATCH 5/5] Fixed an error message --- OS/01/device.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/OS/01/device.py b/OS/01/device.py index 3241532..3e71554 100644 --- a/OS/01/device.py +++ b/OS/01/device.py @@ -201,7 +201,7 @@ if __name__ == "__main__": # Configuration for WebSocket WS_URL = os.getenv('SERVER_CONNECTION_URL') if not WS_URL: - raise ValueError("The environment variable SERVER_URL is not set. Please set it to proceed.") + raise ValueError("The environment variable SERVER_CONNECTION_URL is not set. Please set it to proceed.") # Start the WebSocket communication asyncio.create_task(websocket_communication(WS_URL))