01/software/main.py

# Start the spinner before the remaining imports run, so it is already visible
# while they load (presumably because some of them are slow -- confirm).
# `run` calls `spinner.stop()` before it prints anything.
from yaspin import yaspin
spinner = yaspin()
spinner.start()

import typer
import ngrok
import platform
import threading
import os
import importlib
from source.server.server import start_server
import subprocess
import webview
import socket
import json
import segno
from livekit import api
import time
from dotenv import load_dotenv
import signal
from source.server.livekit.worker import main as worker_main
from source.server.livekit.multimodal import main as multimodal_main
import warnings
import requests

# Load variables from a `.env` file into the process environment (python-dotenv).
load_dotenv()

# OS name, computed once; `run` uses it to force the server host to localhost on Windows.
system_type = platform.system()

# Typer application object; commands are registered on it with `@app.command()`.
app = typer.Typer()

def _get_local_ip():
    """Return the local IP address of the interface used for outbound traffic.

    Falls back to 127.0.0.1 when no route is available (for example, offline).
    """
    # Connecting a UDP socket sends no packets; it only makes the OS choose the
    # outbound interface, whose address is then read back with getsockname().
    try:
        with socket.socket(socket.AF_INET, socket.SOCK_DGRAM) as s:
            s.connect(("8.8.8.8", 80))
            return s.getsockname()[0]
    except OSError:
        return "127.0.0.1"


@app.command()
def run(
    server: str = typer.Option(
        None,
        "--server",
        help="Run server (accepts `livekit` or `light`)",
    ),
    server_host: str = typer.Option(
        "0.0.0.0",
        "--server-host",
        help="Specify the server host where the server will deploy",
    ),
    server_port: int = typer.Option(
        10101,
        "--server-port",
        help="Specify the server port where the server will deploy",
    ),
    expose: bool = typer.Option(False, "--expose", help="Expose server over the internet"),
    domain: str = typer.Option(None, "--domain", help="Use `--expose` with a custom ngrok domain"),
    client: str = typer.Option(None, "--client", help="Run client of a particular type. Accepts `light-python`, defaults to `light-python`"),
    server_url: str = typer.Option(
        None,
        "--server-url",
        help="Specify the server URL that the --client should expect. Defaults to server-host and server-port",
    ),
    qr: bool = typer.Option(
        False, "--qr", help="Display QR code containing the server connection information (will be ngrok url if `--expose` is used)"
    ),
    profiles: bool = typer.Option(
        False,
        "--profiles",
        help="Opens the folder where profiles are contained",
    ),
    profile: str = typer.Option(
        "default.py",
        "--profile",
        help="Specify the path to the profile, or the name of the file if it's in the `profiles` directory (run `--profiles` to open the profiles directory)",
    ),
    debug: bool = typer.Option(
        False,
        "--debug",
        help="Print latency measurements and save microphone recordings locally for manual playback",
    ),
    multimodal: bool = typer.Option(
        False,
        "--multimodal",
        help="Run the multimodal agent",
    ),
):
    """Start the 01 server and/or client.

    With neither --server nor --client, the light server and the light-python
    client are both started.
    """
    # NOTE: Typer shows the docstring above in `--help`, so it is kept short.
    # Overall flow: resolve and load the profile -> start the light server
    # (and the livekit server when requested) -> optionally expose it through
    # ngrok -> start the client -> verify the server answers -> optionally show
    # a QR code -> run the livekit worker -> wait for every thread.

    # `import importlib` alone does not guarantee that the `util` submodule is
    # loaded, so the two helpers are imported explicitly.
    from importlib.util import module_from_spec, spec_from_file_location

    threads = []

    # Public URL of the locally started server. Stays None in client-only mode,
    # in which case the health check and the QR code are skipped.
    url = None

    # Handle `01` with no arguments, which should start server + client
    if not server and not client:
        server = "light"
        client = "light-python"

    ### PROFILES

    profiles_dir = os.path.join(os.path.dirname(os.path.realpath(__file__)), "source", "server", "profiles")

    if profiles:
        spinner.stop()
        # `open` is used on macOS and as the fallback for unknown platforms
        folder_opener = {"Windows": "explorer", "Linux": "xdg-open"}.get(platform.system(), "open")
        subprocess.Popen([folder_opener, profiles_dir])
        raise typer.Exit(code=0)

    if profile:
        # Try the path as given, then inside the profiles directory, then
        # inside the profiles directory with a `.py` suffix appended.
        in_profiles_dir = os.path.join(profiles_dir, profile)
        candidates = (profile, in_profiles_dir, in_profiles_dir + ".py")
        resolved = next((path for path in candidates if os.path.isfile(path)), None)
        if resolved is None:
            spinner.stop()
            print(f"Invalid profile path: {candidates[-1]}")
            raise typer.Exit(code=1)
        profile = resolved

    # Load the profile module from the provided path
    spec = spec_from_file_location("profile", profile)
    if spec is None or spec.loader is None:
        # Happens when the file cannot be loaded as Python source (e.g. no `.py` suffix)
        spinner.stop()
        print(f"Invalid profile path: {profile}")
        raise typer.Exit(code=1)
    profile_module = module_from_spec(spec)
    spec.loader.exec_module(profile_module)

    # Get the interpreter from the profile
    interpreter = profile_module.interpreter

    ### SERVER

    if system_type == "Windows":
        server_host = "localhost"

    if not server_url:
        server_url = f"{server_host}:{server_port}"

    if server:

        ### LIGHT SERVER (required by livekit)

        if server == "light":
            light_server_port = server_port
            light_server_host = server_host
            voice = True # The light server will support voice
        elif server == "livekit":
            # The light server should run at a different port if we want to run a livekit server
            spinner.stop()
            print(f"Starting light server (required for livekit server) on localhost, on the port before `--server-port` (port {server_port-1}), unless the `AN_OPEN_PORT` env var is set.")
            print(f"The livekit server will be started on port {server_port}.")
            # os.getenv returns a string when the variable is set; normalise to int
            # so the port has the same type as in the `light` branch.
            light_server_port = int(os.getenv('AN_OPEN_PORT', server_port-1))
            light_server_host = "localhost"
            voice = False # The light server will NOT support voice. It will just run Open Interpreter. The Livekit server will handle voice
        else:
            # Fail with a usage error instead of a NameError further down
            spinner.stop()
            raise typer.BadParameter(
                f"unknown server type {server!r} (expected `light` or `livekit`)",
                param_hint="--server",
            )

        server_thread = threading.Thread(
            target=start_server,
            args=(
                light_server_host,
                light_server_port,
                interpreter,
                voice,
                debug
            ),
        )
        spinner.stop()
        print("Starting server...")
        server_thread.start()
        threads.append(server_thread)

        if server == "livekit":

            ### LIVEKIT SERVER

            # Argument list instead of a shell string: no quoting issues, no
            # `/dev/null` redirection (which does not exist on Windows), and
            # livekit-server becomes a direct child of this process.
            command = ["livekit-server", "--dev", "--bind", server_host, "--port", str(server_port)]
            # Server output is only shown with --debug
            livekit_output = None if debug else subprocess.DEVNULL

            def run_command(command):
                subprocess.run(command, check=True, stdout=livekit_output, stderr=livekit_output)

            livekit_thread = threading.Thread(
                target=run_command, args=(command,)
            )
            # Fixed delay before launching livekit-server (presumably to let the
            # light server come up first -- confirm).
            time.sleep(7)
            livekit_thread.start()
            threads.append(livekit_thread)

            local_livekit_url = f"ws://{server_host}:{server_port}"

        if expose:

            ### EXPOSE OVER INTERNET
            listener = ngrok.forward(f"{server_host}:{server_port}", authtoken_from_env=True, domain=domain)
            url = listener.url()

        else:

            ### GET LOCAL URL
            url = f"http://{_get_local_ip()}:{server_port}"


        if server == "livekit":
            print("Livekit server will run at:", url)


    ### CLIENT

    if client:

        module = importlib.import_module(
            f".clients.{client}.client", package="source"
        )

        client_thread = threading.Thread(target=module.run, args=[server_url, debug])
        spinner.stop()
        print("Starting client...")
        client_thread.start()
        threads.append(client_thread)


    ### WAIT FOR THREADS TO FINISH, HANDLE CTRL-C

    # Signal handler for termination signals
    def signal_handler(sig, frame):
        print("Termination signal received. Shutting down...")
        if any(thread.is_alive() for thread in threads):
            # Kill the child processes of this process (e.g. livekit-server)
            try:
                subprocess.run(["pkill", "-P", str(os.getpid())])
            except OSError:
                # Best effort: `pkill` is unavailable (e.g. on Windows).
                # os._exit below still terminates this process.
                pass
        os._exit(0)

    # Register signal handler for SIGINT and SIGTERM
    signal.signal(signal.SIGINT, signal_handler)
    signal.signal(signal.SIGTERM, signal_handler)

    try:

        # Verify the server is running (only when one was started locally)
        if server:
            for _ in range(10):
                try:
                    # The timeout keeps an unresponsive server from blocking startup forever
                    if requests.get(url, timeout=5).status_code == 200:
                        break
                except requests.RequestException:
                    pass
                time.sleep(1)
            else:
                raise Exception(f"Server at {url} failed to respond after 10 attempts")

        ### DISPLAY QR CODE
        if qr:
            if url is None:
                print("No server was started, so there is no connection URL to display as a QR code.")
            else:
                def display_qr_code():
                    # Delay before printing (presumably so the code appears
                    # after the startup output -- confirm).
                    time.sleep(10)
                    content = json.dumps({"livekit_server": url})
                    qr_code = segno.make(content)
                    qr_code.terminal(compact=True)

                qr_thread = threading.Thread(target=display_qr_code)
                qr_thread.start()
                threads.append(qr_thread)

        ### START LIVEKIT WORKER
        if server == "livekit":
            time.sleep(1)
            # These are needed to communicate with the worker's entrypoint
            os.environ['INTERPRETER_SERVER_HOST'] = light_server_host
            os.environ['INTERPRETER_SERVER_PORT'] = str(light_server_port)
            os.environ['01_TTS'] = interpreter.tts
            os.environ['01_STT'] = interpreter.stt

            # Token built from the hard-coded development credentials below
            grants = api.VideoGrants(
                room_join=True,
                room="my-room",
            )
            token = str(
                api.AccessToken('devkey', 'secret')
                .with_identity("identity")
                .with_name("my name")
                .with_grants(grants)
                .to_jwt()
            )

            # Only the scheme is rewritten (http -> ws, https -> wss)
            livekit_ws_url = url.replace("http", "ws", 1)
            meet_url = f'https://meet.livekit.io/custom?liveKitUrl={livekit_ws_url}&token={token}\n\n'
            print("\n")
            print("For debugging, you can join a video call with your assistant. Click the link below, then send a chat message that says {CONTEXT_MODE_OFF}, then begin speaking:")
            print(meet_url)

            # Run the worker up to 30 times; it is restarted whenever it
            # returns or fails with a non-KeyboardInterrupt exception.
            for _ in range(30):
                try:
                    if multimodal:
                        multimodal_main(local_livekit_url)
                    else:
                        worker_main(local_livekit_url)
                except KeyboardInterrupt:
                    print("Exiting.")
                    raise
                except Exception as e:
                    print(f"Error occurred: {e}")
                print("Retrying...")
                time.sleep(1)

        # Wait for all threads to complete
        for thread in threads:
            thread.join()
    except KeyboardInterrupt:
        # On KeyboardInterrupt, send SIGINT to self
        os.kill(os.getpid(), signal.SIGINT)
01.1 5 months ago			`from yaspin import yaspin`
			`spinner = yaspin()`
			`spinner.start()`

`start.py`, modular architecture, OI flags, mutable items to user dir 10 months ago			`import typer`
support ngrok tunnels on livekit 5 months ago			`import ngrok`
`start.py`, modular architecture, OI flags, mutable items to user dir 10 months ago			`import platform`
			`import threading`
			`import os`
			`import importlib`
01.1 5 months ago			`from source.server.server import start_server`
Implemented `profiles` 6 months ago			`import subprocess`
Meet URL 4 months ago			`import webview`
add livekit command 5 months ago			`import socket`
			`import json`
			`import segno`
Meet URL 4 months ago			`from livekit import api`
add livekit command 5 months ago			`import time`
support ngrok tunnels on livekit 5 months ago			`from dotenv import load_dotenv`
The pythonization of `tunnel` 10 months ago			`import signal`
Change worker to be a python file 4 months ago			`from source.server.livekit.worker import main as worker_main`
init livekit quickstart multimodal worker 3 months ago			`from source.server.livekit.multimodal import main as multimodal_main`
Change worker to be a python file 4 months ago			`import warnings`
			`import requests`
Add updated list of linted files 9 months ago
support ngrok tunnels on livekit 5 months ago			`load_dotenv()`
Add updated list of linted files 9 months ago
Cleaned up starting logic 5 months ago			`system_type = platform.system()`

			`app = typer.Typer()`

`start.py`, modular architecture, OI flags, mutable items to user dir 10 months ago			`@app.command()`
			`def run(`
Cleaned up starting logic 5 months ago			`server: str = typer.Option(`
			`None,`
			`"--server",`
			help="Run server (accepts `livekit` or `light`)",
			`),`
Re-lint after rebase 9 months ago			`server_host: str = typer.Option(`
			`"0.0.0.0",`
			`"--server-host",`
			`help="Specify the server host where the server will deploy",`
			`),`
			`server_port: int = typer.Option(`
Cleaned up starting logic 5 months ago			`10101,`
Re-lint after rebase 9 months ago			`"--server-port",`
			`help="Specify the server port where the server will deploy",`
			`),`
Cleaned up starting logic 5 months ago			`expose: bool = typer.Option(False, "--expose", help="Expose server over the internet"),`
			domain: str = typer.Option(None, "--domain", help="Use `--expose` with a custom ngrok domain"),
			client: str = typer.Option(None, "--client", help="Run client of a particular type. Accepts `light-python`, defaults to `light-python`"),
Re-lint after rebase 9 months ago			`server_url: str = typer.Option(`
			`None,`
			`"--server-url",`
Cleaned up starting logic 5 months ago			`help="Specify the server URL that the --client should expect. Defaults to server-host and server-port",`
Re-lint after rebase 9 months ago			`),`
remove unused cmd-line files 7 months ago			`qr: bool = typer.Option(`
Cleaned up starting logic 5 months ago			False, "--qr", help="Display QR code containing the server connection information (will be ngrok url if `--expose` is used)"
Revert "refactor domain into expose" This reverts commit 7182f10c38547e4be49a3195d36c89cff762e45b. 5 months ago			`),`
Implemented `profiles` 6 months ago			`profiles: bool = typer.Option(`
			`False,`
			`"--profiles",`
Cleaned up starting logic 5 months ago			`help="Opens the folder where profiles are contained",`
Implemented `profiles` 6 months ago			`),`
			`profile: str = typer.Option(`
Cleaned up starting logic 5 months ago			`"default.py",`
Implemented `profiles` 6 months ago			`"--profile",`
			help="Specify the path to the profile, or the name of the file if it's in the `profiles` directory (run `--profiles` to open the profiles directory)",
			`),`
add debug flag 7 months ago			`debug: bool = typer.Option(`
			`False,`
			`"--debug",`
Cleaned up starting logic 5 months ago			`help="Print latency measurements and save microphone recordings locally for manual playback",`
add livekit command 5 months ago			`),`
init livekit quickstart multimodal worker 3 months ago			`multimodal: bool = typer.Option(`
			`False,`
			`"--multimodal",`
			`help="Run the multimodal agent",`
			`),`
Re-lint after rebase 9 months ago			`):`
Cleaned up starting logic 5 months ago
			`threads = []`

			# Handle `01` with no arguments, which should start server + client
			`if not server and not client:`
			`server = "light"`
			`client = "light-python"`

			`### PROFILES`
add async-interpreter 7 months ago
Implemented `profiles` 6 months ago			`profiles_dir = os.path.join(os.path.dirname(os.path.realpath(__file__)), "source", "server", "profiles")`

			`if profiles:`
			`if platform.system() == "Windows":`
			`subprocess.Popen(['explorer', profiles_dir])`
			`elif platform.system() == "Darwin":`
			`subprocess.Popen(['open', profiles_dir])`
			`elif platform.system() == "Linux":`
			`subprocess.Popen(['xdg-open', profiles_dir])`
			`else:`
			`subprocess.Popen(['open', profiles_dir])`
			`exit(0)`

			`if profile:`
			`if not os.path.isfile(profile):`
			`profile = os.path.join(profiles_dir, profile)`
			`if not os.path.isfile(profile):`
			`profile += ".py"`
			`if not os.path.isfile(profile):`
			`print(f"Invalid profile path: {profile}")`
			`exit(1)`

Change tts and stt from profiles for app, set context mode to be True at the start 4 months ago			`# Load the profile module from the provided path`
			`spec = importlib.util.spec_from_file_location("profile", profile)`
			`profile_module = importlib.util.module_from_spec(spec)`
			`spec.loader.exec_module(profile_module)`

			`# Get the interpreter from the profile`
			`interpreter = profile_module.interpreter`
Cleaned up starting logic 5 months ago
			`### SERVER`

Fixed non-connection issue 9 months ago			`if system_type == "Windows":`
			`server_host = "localhost"`
Add updated list of linted files 9 months ago
`start.py`, modular architecture, OI flags, mutable items to user dir 10 months ago			`if not server_url:`
			`server_url = f"{server_host}:{server_port}"`
Add updated list of linted files 9 months ago
`start.py`, modular architecture, OI flags, mutable items to user dir 10 months ago			`if server:`
Added tests 6 months ago
Cleaned up starting logic 5 months ago			`### LIGHT SERVER (required by livekit)`
Added tests 6 months ago
Cleaned up starting logic 5 months ago			`if server == "light":`
			`light_server_port = server_port`
Docs changes, minor fixes 4 months ago			`light_server_host = server_host`
01.1 5 months ago			`voice = True # The light server will support voice`
Cleaned up starting logic 5 months ago			`elif server == "livekit":`
			`# The light server should run at a different port if we want to run a livekit server`
01.1 5 months ago			`spinner.stop()`
Docs changes, minor fixes 4 months ago			print(f"Starting light server (required for livekit server) on localhost, on the port before `--server-port` (port {server_port-1}), unless the `AN_OPEN_PORT` env var is set.")
Cleaned up starting logic 5 months ago			`print(f"The livekit server will be started on port {server_port}.")`
			`light_server_port = os.getenv('AN_OPEN_PORT', server_port-1)`
Docs changes, minor fixes 4 months ago			`light_server_host = "localhost"`
01.1 5 months ago			`voice = False # The light server will NOT support voice. It will just run Open Interpreter. The Livekit server will handle voice`
Added tests 6 months ago
Add updated list of linted files 9 months ago			`server_thread = threading.Thread(`
Use official OI server. 3 second latency. 6 months ago			`target=start_server,`
Add updated list of linted files 9 months ago			`args=(`
Docs changes, minor fixes 4 months ago			`light_server_host,`
Cleaned up starting logic 5 months ago			`light_server_port,`
Change tts and stt from profiles for app, set context mode to be True at the start 4 months ago			`interpreter,`
01.1 5 months ago			`voice,`
Cleaned up starting logic 5 months ago			`debug`
Add updated list of linted files 9 months ago			`),`
			`)`
01.1 5 months ago			`spinner.stop()`
			`print("Starting server...")`
`start.py`, modular architecture, OI flags, mutable items to user dir 10 months ago			`server_thread.start()`
Cleaned up starting logic 5 months ago			`threads.append(server_thread)`
`start.py`, modular architecture, OI flags, mutable items to user dir 10 months ago
Cleaned up starting logic 5 months ago			`if server == "livekit":`
add async interpreter with coqui, openai, elevenlabs tts 7 months ago
Cleaned up starting logic 5 months ago			`### LIVEKIT SERVER`
Added tests 6 months ago
Cleaned up starting logic 5 months ago			`def run_command(command):`
			`subprocess.run(command, shell=True, check=True)`
Removed print statements, better audio playback 6 months ago
Cleaned up starting logic 5 months ago			`# Start the livekit server`
OpenAI TTS and worker retry logic 4 months ago			`if debug:`
			`command = f'livekit-server --dev --bind "{server_host}" --port {server_port}'`
			`else:`
			`command = f'livekit-server --dev --bind "{server_host}" --port {server_port} > /dev/null 2>&1'`
Cleaned up starting logic 5 months ago			`livekit_thread = threading.Thread(`
OpenAI TTS and worker retry logic 4 months ago			`target=run_command, args=(command,)`
Cleaned up starting logic 5 months ago			`)`
			`time.sleep(7)`
			`livekit_thread.start()`
			`threads.append(livekit_thread)`

Meet URL 4 months ago			`local_livekit_url = f"ws://{server_host}:{server_port}"`
`start.py`, modular architecture, OI flags, mutable items to user dir 10 months ago
Cleaned up starting logic 5 months ago			`if expose:`
add livekit command 5 months ago
Cleaned up starting logic 5 months ago			`### EXPOSE OVER INTERNET`
			`listener = ngrok.forward(f"{server_host}:{server_port}", authtoken_from_env=True, domain=domain)`
			`url = listener.url()`
add livekit command 5 months ago
Cleaned up starting logic 5 months ago			`else:`
add livekit command 5 months ago
Cleaned up starting logic 5 months ago			`### GET LOCAL URL`
support ngrok tunnels on livekit 5 months ago			`s = socket.socket(socket.AF_INET, socket.SOCK_DGRAM)`
			`s.connect(("8.8.8.8", 80))`
			`ip_address = s.getsockname()[0]`
			`s.close()`
Cleaned up starting logic 5 months ago			`url = f"http://{ip_address}:{server_port}"`


			`if server == "livekit":`
			`print("Livekit server will run at:", url)`

add livekit command 5 months ago
Cleaned up starting logic 5 months ago			`### CLIENT`

			`if client:`

			`module = importlib.import_module(`
			`f".clients.{client}.client", package="source"`
			`)`
add livekit command 5 months ago
Cleaned up starting logic 5 months ago			`client_thread = threading.Thread(target=module.run, args=[server_url, debug])`
01.1 5 months ago			`spinner.stop()`
			`print("Starting client...")`
Cleaned up starting logic 5 months ago			`client_thread.start()`
			`threads.append(client_thread)`
add livekit command 5 months ago

Cleaned up starting logic 5 months ago			`### WAIT FOR THREADS TO FINISH, HANDLE CTRL-C`

			`# Signal handler for termination signals`
			`def signal_handler(sig, frame):`
			`print("Termination signal received. Shutting down...")`
add livekit command 5 months ago			`for thread in threads:`
Cleaned up starting logic 5 months ago			`if thread.is_alive():`
			`# Kill subprocess associated with thread`
			`subprocess.run(f"pkill -P {os.getpid()}", shell=True)`
			`os._exit(0)`

			`# Register signal handler for SIGINT and SIGTERM`
			`signal.signal(signal.SIGINT, signal_handler)`
			`signal.signal(signal.SIGTERM, signal_handler)`
add livekit command 5 months ago
`start.py`, modular architecture, OI flags, mutable items to user dir 10 months ago			`try:`
Change worker to be a python file 4 months ago
			`# Verify the server is running`
			`for attempt in range(10):`
			`try:`
			`response = requests.get(url)`
			`status = "OK" if response.status_code == 200 else "Not OK"`
			`if status == "OK":`
			`break`
			`except requests.RequestException:`
			`pass`
			`time.sleep(1)`
			`else:`
			`raise Exception(f"Server at {url} failed to respond after 10 attempts")`

Meet URL 4 months ago			`### DISPLAY QR CODE`
			`if qr:`
Better default profile, better QR 4 months ago			`def display_qr_code():`
			`time.sleep(10)`
			`content = json.dumps({"livekit_server": url})`
			`qr_code = segno.make(content)`
			`qr_code.terminal(compact=True)`

			`qr_thread = threading.Thread(target=display_qr_code)`
			`qr_thread.start()`
			`threads.append(qr_thread)`
Meet URL 4 months ago
			`### START LIVEKIT WORKER`
Change worker to be a python file 4 months ago			`if server == "livekit":`
Cartesia 2 months ago			`time.sleep(1)`
Change worker to be a python file 4 months ago			`# These are needed to communicate with the worker's entrypoint`
			`os.environ['INTERPRETER_SERVER_HOST'] = light_server_host`
			`os.environ['INTERPRETER_SERVER_PORT'] = str(light_server_port)`
Change tts and stt from profiles for app, set context mode to be True at the start 4 months ago			`os.environ['01_TTS'] = interpreter.tts`
			`os.environ['01_STT'] = interpreter.stt`
Meet URL 4 months ago
			`token = str(api.AccessToken('devkey', 'secret') \`
			`.with_identity("identity") \`
			`.with_name("my name") \`
			`.with_grants(api.VideoGrants(`
			`room_join=True,`
			`room="my-room",`
			`)).to_jwt())`

Multimodal code execution 3 months ago			`# meet_url = f'http://localhost:3000/custom?liveKitUrl={url.replace("http", "ws")}&token={token}\n\n'`
Cartesia 2 months ago			`meet_url = f'https://meet.livekit.io/custom?liveKitUrl={url.replace("http", "ws")}&token={token}\n\n'`
Change tts and stt from profiles for app, set context mode to be True at the start 4 months ago			`print("\n")`
			`print("For debugging, you can join a video call with your assistant. Click the link below, then send a chat message that says {CONTEXT_MODE_OFF}, then begin speaking:")`
Meet URL 4 months ago			`print(meet_url)`

OpenAI TTS and worker retry logic 4 months ago			`for attempt in range(30):`
			`try:`
init livekit quickstart multimodal worker 3 months ago			`if multimodal:`
			`multimodal_main(local_livekit_url)`
			`else:`
			`worker_main(local_livekit_url)`
OpenAI TTS and worker retry logic 4 months ago			`except KeyboardInterrupt:`
			`print("Exiting.")`
			`raise`
			`except Exception as e:`
			`print(f"Error occurred: {e}")`
			`print("Retrying...")`
			`time.sleep(1)`
Change worker to be a python file 4 months ago
Cleaned up starting logic 5 months ago			`# Wait for all threads to complete`
			`for thread in threads:`
			`thread.join()`
`start.py`, modular architecture, OI flags, mutable items to user dir 10 months ago			`except KeyboardInterrupt:`
Cleaned up starting logic 5 months ago			`# On KeyboardInterrupt, send SIGINT to self`
			`os.kill(os.getpid(), signal.SIGINT)`