parent
f429dac85c
commit
38a0039a8f
@ -0,0 +1,242 @@
|
|||||||
|
from dotenv import load_dotenv
|
||||||
|
load_dotenv() # take environment variables from .env.
|
||||||
|
|
||||||
|
import asyncio
|
||||||
|
import threading
|
||||||
|
import os
|
||||||
|
import pyaudio
|
||||||
|
from starlette.websockets import WebSocket
|
||||||
|
from queue import Queue
|
||||||
|
from pynput import keyboard
|
||||||
|
import json
|
||||||
|
import traceback
|
||||||
|
import websockets
|
||||||
|
import queue
|
||||||
|
import pydub
|
||||||
|
import ast
|
||||||
|
from pydub import AudioSegment
|
||||||
|
from pydub.playback import play
|
||||||
|
import io
|
||||||
|
import time
|
||||||
|
import wave
|
||||||
|
import tempfile
|
||||||
|
from datetime import datetime
|
||||||
|
from interpreter import interpreter # Just for code execution. Maybe we should let people do from interpreter.computer import run?
|
||||||
|
from ..server.utils.kernel import put_kernel_messages_into_queue
|
||||||
|
from ..server.utils.get_system_info import get_system_info
|
||||||
|
from ..server.stt.stt import stt_wav
|
||||||
|
|
||||||
|
from ..server.utils.logs import setup_logging
|
||||||
|
from ..server.utils.logs import logger
|
||||||
|
setup_logging()
|
||||||
|
|
||||||
|
# Configuration for Audio Recording
|
||||||
|
CHUNK = 1024 # Record in chunks of 1024 samples
|
||||||
|
FORMAT = pyaudio.paInt16 # 16 bits per sample
|
||||||
|
CHANNELS = 1 # Mono
|
||||||
|
RATE = 44100 # Sample rate
|
||||||
|
RECORDING = False # Flag to control recording state
|
||||||
|
SPACEBAR_PRESSED = False # Flag to track spacebar press state
|
||||||
|
|
||||||
|
# Specify OS
|
||||||
|
current_platform = get_system_info()
|
||||||
|
|
||||||
|
# Initialize PyAudio
|
||||||
|
p = pyaudio.PyAudio()
|
||||||
|
|
||||||
|
import asyncio
|
||||||
|
|
||||||
|
send_queue = queue.Queue()
|
||||||
|
|
||||||
|
class Device:
|
||||||
|
def __init__(self):
|
||||||
|
pass
|
||||||
|
|
||||||
|
def record_audio(self):
|
||||||
|
|
||||||
|
if os.getenv('STT_RUNNER') == "server":
|
||||||
|
# STT will happen on the server. we're sending audio.
|
||||||
|
send_queue.put({"role": "user", "type": "audio", "format": "audio/wav", "start": True})
|
||||||
|
elif os.getenv('STT_RUNNER') == "client":
|
||||||
|
# STT will happen here, on the client. we're sending text.
|
||||||
|
send_queue.put({"role": "user", "type": "message", "start": True})
|
||||||
|
else:
|
||||||
|
raise Exception("STT_RUNNER must be set to either 'client' or 'server'.")
|
||||||
|
|
||||||
|
"""Record audio from the microphone and add it to the queue."""
|
||||||
|
stream = p.open(format=FORMAT, channels=CHANNELS, rate=RATE, input=True, frames_per_buffer=CHUNK)
|
||||||
|
logger.info("Recording started...")
|
||||||
|
global RECORDING
|
||||||
|
|
||||||
|
# Create a temporary WAV file to store the audio data
|
||||||
|
temp_dir = tempfile.gettempdir()
|
||||||
|
wav_path = os.path.join(temp_dir, f"audio_{datetime.now().strftime('%Y%m%d%H%M%S%f')}.wav")
|
||||||
|
wav_file = wave.open(wav_path, 'wb')
|
||||||
|
wav_file.setnchannels(CHANNELS)
|
||||||
|
wav_file.setsampwidth(p.get_sample_size(FORMAT))
|
||||||
|
wav_file.setframerate(RATE)
|
||||||
|
|
||||||
|
while RECORDING:
|
||||||
|
data = stream.read(CHUNK, exception_on_overflow=False)
|
||||||
|
wav_file.writeframes(data)
|
||||||
|
|
||||||
|
wav_file.close()
|
||||||
|
stream.stop_stream()
|
||||||
|
stream.close()
|
||||||
|
logger.info("Recording stopped.")
|
||||||
|
|
||||||
|
duration = wav_file.getnframes() / RATE
|
||||||
|
if duration < 0.3:
|
||||||
|
# Just pressed it. Send stop message
|
||||||
|
if os.getenv('STT_RUNNER') == "client":
|
||||||
|
send_queue.put({"role": "user", "type": "message", "content": "stop"})
|
||||||
|
send_queue.put({"role": "user", "type": "message", "end": True})
|
||||||
|
else:
|
||||||
|
send_queue.put({"role": "user", "type": "audio", "format": "audio/wav", "content": ""})
|
||||||
|
send_queue.put({"role": "user", "type": "audio", "format": "audio/wav", "end": True})
|
||||||
|
else:
|
||||||
|
if os.getenv('STT_RUNNER') == "client":
|
||||||
|
# Run stt then send text
|
||||||
|
text = stt_wav(wav_path)
|
||||||
|
send_queue.put({"role": "user", "type": "message", "content": text})
|
||||||
|
send_queue.put({"role": "user", "type": "message", "end": True})
|
||||||
|
else:
|
||||||
|
# Stream audio
|
||||||
|
with open(wav_path, 'rb') as audio_file:
|
||||||
|
byte_data = audio_file.read(CHUNK)
|
||||||
|
while byte_data:
|
||||||
|
send_queue.put({"role": "user", "type": "audio", "format": "audio/wav", "content": str(byte_data)})
|
||||||
|
byte_data = audio_file.read(CHUNK)
|
||||||
|
send_queue.put({"role": "user", "type": "audio", "format": "audio/wav", "end": True})
|
||||||
|
|
||||||
|
if os.path.exists(wav_path):
|
||||||
|
os.remove(wav_path)
|
||||||
|
|
||||||
|
def toggle_recording(self, state):
|
||||||
|
"""Toggle the recording state."""
|
||||||
|
global RECORDING, SPACEBAR_PRESSED
|
||||||
|
if state and not SPACEBAR_PRESSED:
|
||||||
|
SPACEBAR_PRESSED = True
|
||||||
|
if not RECORDING:
|
||||||
|
RECORDING = True
|
||||||
|
threading.Thread(target=self.record_audio).start()
|
||||||
|
elif not state and SPACEBAR_PRESSED:
|
||||||
|
SPACEBAR_PRESSED = False
|
||||||
|
RECORDING = False
|
||||||
|
|
||||||
|
def on_press(self, key):
|
||||||
|
"""Detect spacebar press."""
|
||||||
|
if key == keyboard.Key.space:
|
||||||
|
self.toggle_recording(True)
|
||||||
|
|
||||||
|
def on_release(self, key):
|
||||||
|
"""Detect spacebar release and ESC key press."""
|
||||||
|
if key == keyboard.Key.space:
|
||||||
|
self.toggle_recording(False)
|
||||||
|
elif key == keyboard.Key.esc or key == keyboard.Key.ctrl_c:
|
||||||
|
logger.info("Exiting...")
|
||||||
|
os._exit(0)
|
||||||
|
|
||||||
|
async def message_sender(self, websocket):
|
||||||
|
while True:
|
||||||
|
message = await asyncio.get_event_loop().run_in_executor(None, send_queue.get)
|
||||||
|
await websocket.send(json.dumps(message))
|
||||||
|
send_queue.task_done()
|
||||||
|
|
||||||
|
async def websocket_communication(self, WS_URL):
|
||||||
|
while True:
|
||||||
|
try:
|
||||||
|
async with websockets.connect(WS_URL) as websocket:
|
||||||
|
logger.info("Press the spacebar to start/stop recording. Press ESC to exit.")
|
||||||
|
asyncio.create_task(self.message_sender(websocket))
|
||||||
|
|
||||||
|
initial_message = {"role": None, "type": None, "format": None, "content": None}
|
||||||
|
message_so_far = initial_message
|
||||||
|
|
||||||
|
while True:
|
||||||
|
message = await websocket.recv()
|
||||||
|
|
||||||
|
logger.debug(f"Got this message from the server: {type(message)} {message}")
|
||||||
|
|
||||||
|
if type(message) == str:
|
||||||
|
message = json.loads(message)
|
||||||
|
|
||||||
|
if message.get("end"):
|
||||||
|
logger.debug(f"Complete message from the server: {message_so_far}")
|
||||||
|
logger.info("\n")
|
||||||
|
message_so_far = initial_message
|
||||||
|
|
||||||
|
if "content" in message:
|
||||||
|
print(message['content'], end="", flush=True)
|
||||||
|
if any(message_so_far[key] != message[key] for key in message_so_far if key != "content"):
|
||||||
|
message_so_far = message
|
||||||
|
else:
|
||||||
|
message_so_far["content"] += message["content"]
|
||||||
|
|
||||||
|
if message["type"] == "audio" and "content" in message:
|
||||||
|
audio_bytes = bytes(ast.literal_eval(message["content"]))
|
||||||
|
|
||||||
|
# Convert bytes to audio file
|
||||||
|
audio_file = io.BytesIO(audio_bytes)
|
||||||
|
audio = AudioSegment.from_mp3(audio_file)
|
||||||
|
|
||||||
|
# Play the audio
|
||||||
|
play(audio)
|
||||||
|
|
||||||
|
await asyncio.sleep(1)
|
||||||
|
|
||||||
|
# Run the code if that's the client's job
|
||||||
|
if os.getenv('CODE_RUNNER') == "client":
|
||||||
|
if message["type"] == "code" and "end" in message:
|
||||||
|
language = message_so_far["format"]
|
||||||
|
code = message_so_far["content"]
|
||||||
|
result = interpreter.computer.run(language, code)
|
||||||
|
send_queue.put(result)
|
||||||
|
|
||||||
|
|
||||||
|
except:
|
||||||
|
# traceback.print_exc()
|
||||||
|
logger.info(f"Connecting to `{WS_URL}`...")
|
||||||
|
await asyncio.sleep(2)
|
||||||
|
|
||||||
|
async def start_async(self):
|
||||||
|
# Configuration for WebSocket
|
||||||
|
WS_URL = os.getenv('SERVER_URL')
|
||||||
|
if not WS_URL:
|
||||||
|
raise ValueError("The environment variable SERVER_URL is not set. Please set it to proceed.")
|
||||||
|
|
||||||
|
# Start the WebSocket communication
|
||||||
|
asyncio.create_task(self.websocket_communication(WS_URL))
|
||||||
|
|
||||||
|
# Start watching the kernel if it's your job to do that
|
||||||
|
if os.getenv('CODE_RUNNER') == "client":
|
||||||
|
asyncio.create_task(put_kernel_messages_into_queue(send_queue))
|
||||||
|
|
||||||
|
|
||||||
|
# If Raspberry Pi, add the button listener, otherwise use the spacebar
|
||||||
|
if current_platform.startswith("raspberry-pi"):
|
||||||
|
logger.info("Raspberry Pi detected, using button on GPIO pin 15")
|
||||||
|
# Use GPIO pin 15
|
||||||
|
pindef = ["gpiochip4", "15"] # gpiofind PIN15
|
||||||
|
print("PINDEF", pindef)
|
||||||
|
|
||||||
|
# HACK: needs passwordless sudo
|
||||||
|
process = await asyncio.create_subprocess_exec("sudo", "gpiomon", "-brf", *pindef, stdout=asyncio.subprocess.PIPE)
|
||||||
|
while True:
|
||||||
|
line = await process.stdout.readline()
|
||||||
|
if line:
|
||||||
|
line = line.decode().strip()
|
||||||
|
if "FALLING" in line:
|
||||||
|
self.toggle_recording(False)
|
||||||
|
elif "RISING" in line:
|
||||||
|
self.toggle_recording(True)
|
||||||
|
else:
|
||||||
|
break
|
||||||
|
else:
|
||||||
|
# Keyboard listener for spacebar press/release
|
||||||
|
listener = keyboard.Listener(on_press=self.on_press, on_release=self.on_release)
|
||||||
|
listener.start()
|
||||||
|
|
||||||
|
def start(self):
|
||||||
|
asyncio.run(self.start_async())
|
||||||
|
p.terminate()
|
@ -0,0 +1,4 @@
|
|||||||
|
from ..base_device import Device
|
||||||
|
|
||||||
|
desktop_device = Device()
|
||||||
|
desktop_device.start()
|
@ -0,0 +1,4 @@
|
|||||||
|
from ..base_device import Device
|
||||||
|
|
||||||
|
rpi_device = Device()
|
||||||
|
rpi_device.start()
|
@ -0,0 +1,8 @@
|
|||||||
|
DEVICE=$(uname -n)
|
||||||
|
if [[ "$DEVICE" == "rpi" ]]; then
|
||||||
|
cd 01OS
|
||||||
|
python -m 01OS.clients.rpi.device &
|
||||||
|
else
|
||||||
|
cd 01OS
|
||||||
|
python -m 01OS.clients.macos.device &
|
||||||
|
fi
|
Binary file not shown.
@ -1,34 +1,27 @@
|
|||||||
from dotenv import load_dotenv
|
from dotenv import load_dotenv
|
||||||
load_dotenv() # take environment variables from .env.
|
load_dotenv() # take environment variables from .env.
|
||||||
|
|
||||||
from starlette.websockets import WebSocketDisconnect
|
|
||||||
import ast
|
import ast
|
||||||
import json
|
import json
|
||||||
import time
|
|
||||||
import queue
|
import queue
|
||||||
import os
|
import os
|
||||||
import traceback
|
import traceback
|
||||||
from queue import Queue
|
|
||||||
from threading import Thread
|
|
||||||
import threading
|
|
||||||
import uvicorn
|
|
||||||
import re
|
import re
|
||||||
from fastapi import FastAPI
|
from fastapi import FastAPI
|
||||||
from fastapi.responses import PlainTextResponse
|
from fastapi.responses import PlainTextResponse
|
||||||
from threading import Thread
|
|
||||||
from starlette.websockets import WebSocket
|
from starlette.websockets import WebSocket
|
||||||
from stt import stt_bytes
|
from .stt.stt import stt_bytes
|
||||||
from tts import tts
|
from .tts.tts import tts
|
||||||
from pathlib import Path
|
from pathlib import Path
|
||||||
import asyncio
|
import asyncio
|
||||||
import urllib.parse
|
import urllib.parse
|
||||||
from utils.kernel import put_kernel_messages_into_queue
|
from .utils.kernel import put_kernel_messages_into_queue
|
||||||
from i import configure_interpreter
|
from .i import configure_interpreter
|
||||||
from interpreter import interpreter
|
from interpreter import interpreter
|
||||||
import ngrok
|
import ngrok
|
||||||
|
|
||||||
from utils.logs import setup_logging
|
from .utils.logs import setup_logging
|
||||||
from utils.logs import logger
|
from .utils.logs import logger
|
||||||
setup_logging()
|
setup_logging()
|
||||||
|
|
||||||
|
|
Binary file not shown.
File diff suppressed because it is too large
Load Diff
@ -0,0 +1,34 @@
|
|||||||
|
[tool.poetry]
|
||||||
|
name = "01OS"
|
||||||
|
packages = [
|
||||||
|
{include = "01OS"},
|
||||||
|
]
|
||||||
|
include = [".env.example", "start.py", "start.sh"]
|
||||||
|
version = "0.0.1"
|
||||||
|
description = "The open-source language model computer"
|
||||||
|
authors = ["Killian <killian@openinterpreter.com>"]
|
||||||
|
license = "AGPL"
|
||||||
|
readme = "README.md"
|
||||||
|
|
||||||
|
[tool.poetry.dependencies]
|
||||||
|
python = ">=3.9,<3.12"
|
||||||
|
asyncio = "^3.4.3"
|
||||||
|
pyaudio = "^0.2.14"
|
||||||
|
pynput = "^1.7.6"
|
||||||
|
fastapi = "^0.109.2"
|
||||||
|
uvicorn = "^0.27.1"
|
||||||
|
websockets = "^12.0"
|
||||||
|
python-dotenv = "^1.0.1"
|
||||||
|
ffmpeg-python = "^0.2.0"
|
||||||
|
textual = "^0.50.1"
|
||||||
|
pydub = "^0.25.1"
|
||||||
|
ngrok = "^1.0.0"
|
||||||
|
open-interpreter = "^0.2.0"
|
||||||
|
simpleaudio = "^1.0.4"
|
||||||
|
|
||||||
|
[build-system]
|
||||||
|
requires = ["poetry-core"]
|
||||||
|
build-backend = "poetry.core.masonry.api"
|
||||||
|
|
||||||
|
[tool.poetry.scripts]
|
||||||
|
01 = "start:main"
|
@ -0,0 +1,23 @@
|
|||||||
|
"""
|
||||||
|
This is just for the Python package — we need a Python entrypoint.
|
||||||
|
Just starts `start.sh` with all the same command line arguments. Aliased to 01.
|
||||||
|
"""
|
||||||
|
|
||||||
|
import os
|
||||||
|
import subprocess
|
||||||
|
import sys
|
||||||
|
|
||||||
|
def main():
|
||||||
|
|
||||||
|
# Get command line arguments
|
||||||
|
args = sys.argv[1:]
|
||||||
|
|
||||||
|
# Get the directory of the current script
|
||||||
|
dir_path = os.path.dirname(os.path.realpath(__file__))
|
||||||
|
|
||||||
|
# Prepare the command
|
||||||
|
command = [os.path.join(dir_path, 'start.sh')] + args
|
||||||
|
|
||||||
|
# Start start.sh with the command line arguments
|
||||||
|
subprocess.run(command, check=True)
|
||||||
|
|
@ -0,0 +1,172 @@
|
|||||||
|
#!/usr/bin/env bash
|
||||||
|
|
||||||
|
### Import Environment Variables from .env
|
||||||
|
SCRIPT_DIR="$(dirname "$0")"
|
||||||
|
if [ ! -f "$SCRIPT_DIR/.env" ]; then
|
||||||
|
echo "No .env file found. Copying from .env.example..."
|
||||||
|
cp "$SCRIPT_DIR/.env.example" "$SCRIPT_DIR/.env"
|
||||||
|
fi
|
||||||
|
set -a; source "$SCRIPT_DIR/.env"; set +a
|
||||||
|
|
||||||
|
### COMMAND LINE ARGUMENTS
|
||||||
|
|
||||||
|
# Set both SERVER_START and CLIENT_START to False if "--server" or "--client" is passed as an argument
|
||||||
|
# (This way, --server runs only the server, --client runs only the client.)
|
||||||
|
if [[ "$@" == *"--server"* ]] || [[ "$@" == *"--client"* ]]; then
|
||||||
|
export SERVER_START="False"
|
||||||
|
export CLIENT_START="False"
|
||||||
|
fi
|
||||||
|
|
||||||
|
# Check if "--local" is passed as an argument
|
||||||
|
if [[ "$@" == *"--local"* ]]; then
|
||||||
|
# If "--local" is passed, set ALL_LOCAL to True
|
||||||
|
export ALL_LOCAL="True"
|
||||||
|
fi
|
||||||
|
|
||||||
|
# Check if "--server" is passed as an argument
|
||||||
|
if [[ "$@" == *"--server"* ]]; then
|
||||||
|
# If "--server" is passed, set SERVER_START to True
|
||||||
|
export SERVER_START="True"
|
||||||
|
fi
|
||||||
|
|
||||||
|
# Check if "--client" is passed as an argument
|
||||||
|
if [[ "$@" == *"--client"* ]]; then
|
||||||
|
# If "--client" is passed, set CLIENT_START to True
|
||||||
|
export CLIENT_START="True"
|
||||||
|
# Extract the client type from the arguments
|
||||||
|
CLIENT_TYPE=$(echo "$@" | sed -n -e 's/^.*--client //p' | awk '{print $1}')
|
||||||
|
# If client type is not empty, export it
|
||||||
|
if [[ ! -z "$CLIENT_TYPE" ]]; then
|
||||||
|
export CLIENT_TYPE
|
||||||
|
fi
|
||||||
|
fi
|
||||||
|
|
||||||
|
# Check if "--expose" is passed as an argument
|
||||||
|
if [[ "$@" == *"--expose"* ]]; then
|
||||||
|
# If "--expose" is passed, set SERVER_EXPOSE_PUBLICALLY to True
|
||||||
|
export SERVER_EXPOSE_PUBLICALLY="True"
|
||||||
|
fi
|
||||||
|
|
||||||
|
### SETUP
|
||||||
|
|
||||||
|
if [[ "$ALL_LOCAL" == "True" ]]; then
|
||||||
|
# if using local models, install the models / executables
|
||||||
|
|
||||||
|
## WHISPER
|
||||||
|
|
||||||
|
WHISPER_MODEL_URL="https://huggingface.co/ggerganov/whisper.cpp/resolve/main/"
|
||||||
|
WHISPER_PATH="$SCRIPT_DIR/01OS/server/stt/local_service"
|
||||||
|
if [[ ! -f "${WHISPER_PATH}/${WHISPER_MODEL_NAME}" ]]; then
|
||||||
|
mkdir -p "${WHISPER_PATH}"
|
||||||
|
curl -L "${WHISPER_MODEL_URL}${WHISPER_MODEL_NAME}" -o "${WHISPER_PATH}/${WHISPER_MODEL_NAME}"
|
||||||
|
fi
|
||||||
|
|
||||||
|
## PIPER
|
||||||
|
|
||||||
|
PIPER_FILE_PATH="$SCRIPT_DIR/01OS/server/tts/local_service${PIPER_URL}${PIPER_ASSETNAME}"
|
||||||
|
if [[ ! -f "$PIPER_FILE_PATH" ]]; then
|
||||||
|
|
||||||
|
mkdir -p "${PIPER_FILE_PATH}"
|
||||||
|
|
||||||
|
OS=$(uname -s)
|
||||||
|
ARCH=$(uname -m)
|
||||||
|
if [ "$OS" = "Darwin" ]; then
|
||||||
|
OS="macos"
|
||||||
|
if [ "$ARCH" = "arm64" ]; then
|
||||||
|
ARCH="aarch64"
|
||||||
|
elif [ "$ARCH" = "x86_64" ]; then
|
||||||
|
ARCH="x64"
|
||||||
|
else
|
||||||
|
echo "Piper: unsupported architecture"
|
||||||
|
fi
|
||||||
|
fi
|
||||||
|
PIPER_ASSETNAME="piper_${OS}_${ARCH}.tar.gz"
|
||||||
|
PIPER_URL="https://github.com/rhasspy/piper/releases/latest/download/"
|
||||||
|
|
||||||
|
# Save the current working directory
|
||||||
|
CWD=$(pwd)
|
||||||
|
|
||||||
|
# Navigate to SCRIPT_DIR/01OS/server/tts/local_service
|
||||||
|
cd $SCRIPT_DIR/01OS/server/tts/local_service
|
||||||
|
|
||||||
|
curl -L "${PIPER_URL}${PIPER_ASSETNAME}" -o "${PIPER_ASSETNAME}"
|
||||||
|
tar -xvzf $PIPER_ASSETNAME
|
||||||
|
cd piper
|
||||||
|
if [ "$OS" = "macos" ]; then
|
||||||
|
if [ "$ARCH" = "x64" ]; then
|
||||||
|
softwareupdate --install-rosetta --agree-to-license
|
||||||
|
fi
|
||||||
|
PIPER_PHONEMIZE_ASSETNAME="piper-phonemize_${OS}_${ARCH}.tar.gz"
|
||||||
|
PIPER_PHONEMIZE_URL="https://github.com/rhasspy/piper-phonemize/releases/latest/download/"
|
||||||
|
|
||||||
|
curl -OL "${PIPER_PHONEMIZE_URL}${PIPER_PHONEMIZE_ASSETNAME}"
|
||||||
|
tar -xvzf $PIPER_PHONEMIZE_ASSETNAME
|
||||||
|
curl -OL "${PIPER_VOICE_URL}${PIPER_VOICE_NAME}"
|
||||||
|
curl -OL "${PIPER_VOICE_URL}${PIPER_VOICE_NAME}.json"
|
||||||
|
PIPER_DIR=`pwd`
|
||||||
|
install_name_tool -change @rpath/libespeak-ng.1.dylib "${PIPER_DIR}/piper-phonemize/lib/libespeak-ng.1.dylib" "${PIPER_DIR}/piper"
|
||||||
|
install_name_tool -change @rpath/libonnxruntime.1.14.1.dylib "${PIPER_DIR}/piper-phonemize/lib/libonnxruntime.1.14.1.dylib" "${PIPER_DIR}/piper"
|
||||||
|
install_name_tool -change @rpath/libpiper_phonemize.1.dylib "${PIPER_DIR}/piper-phonemize/lib/libpiper_phonemize.1.dylib" "${PIPER_DIR}/piper"
|
||||||
|
fi
|
||||||
|
|
||||||
|
# Navigate back to the current working directory
|
||||||
|
cd $CWD
|
||||||
|
fi
|
||||||
|
fi
|
||||||
|
|
||||||
|
### START
|
||||||
|
|
||||||
|
start_client() {
|
||||||
|
echo "Starting client..."
|
||||||
|
bash 01OS/clients/start.sh &
|
||||||
|
CLIENT_PID=$!
|
||||||
|
echo "client started as process $CLIENT_PID"
|
||||||
|
}
|
||||||
|
|
||||||
|
# Function to start server
|
||||||
|
start_server() {
|
||||||
|
echo "Starting server..."
|
||||||
|
python -m 01OS.server.server &
|
||||||
|
SERVER_PID=$!
|
||||||
|
echo "Server started as process $SERVER_PID"
|
||||||
|
}
|
||||||
|
|
||||||
|
stop_processes() {
|
||||||
|
if [[ -n $CLIENT_PID ]]; then
|
||||||
|
echo "Stopping client..."
|
||||||
|
kill $CLIENT_PID
|
||||||
|
fi
|
||||||
|
if [[ -n $SERVER_PID ]]; then
|
||||||
|
echo "Stopping server..."
|
||||||
|
kill $SERVER_PID
|
||||||
|
fi
|
||||||
|
}
|
||||||
|
|
||||||
|
# Trap SIGINT and SIGTERM to stop processes when the script is terminated
|
||||||
|
trap stop_processes SIGINT SIGTERM
|
||||||
|
|
||||||
|
# SERVER
|
||||||
|
# Start server if SERVER_START is True
|
||||||
|
if [[ "$SERVER_START" == "True" ]]; then
|
||||||
|
start_server
|
||||||
|
fi
|
||||||
|
|
||||||
|
# CLIENT
|
||||||
|
# Start client if CLIENT_START is True
|
||||||
|
if [[ "$CLIENT_START" == "True" ]]; then
|
||||||
|
start_client
|
||||||
|
fi
|
||||||
|
|
||||||
|
# Wait for client and server processes to exit
|
||||||
|
wait $CLIENT_PID
|
||||||
|
wait $SERVER_PID
|
||||||
|
|
||||||
|
# TTS, STT
|
||||||
|
|
||||||
|
# (todo)
|
||||||
|
# (i think we should start with hosted services)
|
||||||
|
|
||||||
|
# LLM
|
||||||
|
|
||||||
|
# (disabled, we'll start with hosted services)
|
||||||
|
# python core/llm/start.py &
|
@ -1 +0,0 @@
|
|||||||
conversations/user.json
|
|
@ -1,14 +0,0 @@
|
|||||||
git+https://github.com/KillianLucas/open-interpreter.git
|
|
||||||
asyncio
|
|
||||||
PyAudio
|
|
||||||
pynput
|
|
||||||
fastapi
|
|
||||||
uvicorn
|
|
||||||
websockets
|
|
||||||
playsound
|
|
||||||
python-dotenv
|
|
||||||
ffmpeg-python
|
|
||||||
textual
|
|
||||||
pydub
|
|
||||||
python-dotenv
|
|
||||||
ngrok
|
|
@ -1,124 +0,0 @@
|
|||||||
#!/usr/bin/env bash
|
|
||||||
|
|
||||||
### Import Environment Variables from .env
|
|
||||||
if [ ! -f ".env" ]; then
|
|
||||||
echo "Error: .env file does not exist. To create one, see .env.example for an example."
|
|
||||||
exit 1
|
|
||||||
fi
|
|
||||||
set -a; source .env; set +a
|
|
||||||
|
|
||||||
### SETUP
|
|
||||||
|
|
||||||
if [[ "$ALL_LOCAL" == "True" ]]; then
|
|
||||||
# if using local models, install the models / executables
|
|
||||||
WHISPER_MODEL_URL="https://huggingface.co/ggerganov/whisper.cpp/resolve/main/"
|
|
||||||
WHISPER_RUST_PATH="`pwd`/local_stt/whisper-rust"
|
|
||||||
curl -OL "${WHISPER_MODEL_URL}${WHISPER_MODEL_NAME}" --output-dir ${WHISPER_RUST_PATH}
|
|
||||||
OS=$(uname -s)
|
|
||||||
ARCH=$(uname -m)
|
|
||||||
if [ "$OS" = "Darwin" ]; then
|
|
||||||
OS="macos"
|
|
||||||
if [ "$ARCH" = "arm64" ]; then
|
|
||||||
ARCH="aarch64"
|
|
||||||
elif [ "$ARCH" = "x86_64" ]; then
|
|
||||||
ARCH="x64"
|
|
||||||
else
|
|
||||||
echo "Piper: unsupported architecture"
|
|
||||||
fi
|
|
||||||
fi
|
|
||||||
PIPER_ASSETNAME="piper_${OS}_${ARCH}.tar.gz"
|
|
||||||
PIPER_URL="https://github.com/rhasspy/piper/releases/latest/download/"
|
|
||||||
mkdir local_tts
|
|
||||||
cd local_tts
|
|
||||||
curl -OL "${PIPER_URL}${PIPER_ASSETNAME}"
|
|
||||||
tar -xvzf $PIPER_ASSETNAME
|
|
||||||
cd piper
|
|
||||||
if [ "$OS" = "macos" ]; then
|
|
||||||
if [ "$ARCH" = "x64" ]; then
|
|
||||||
softwareupdate --install-rosetta --agree-to-license
|
|
||||||
fi
|
|
||||||
PIPER_PHONEMIZE_ASSETNAME="piper-phonemize_${OS}_${ARCH}.tar.gz"
|
|
||||||
PIPER_PHONEMIZE_URL="https://github.com/rhasspy/piper-phonemize/releases/latest/download/"
|
|
||||||
|
|
||||||
curl -OL "${PIPER_PHONEMIZE_URL}${PIPER_PHONEMIZE_ASSETNAME}"
|
|
||||||
tar -xvzf $PIPER_PHONEMIZE_ASSETNAME
|
|
||||||
curl -OL "${PIPER_VOICE_URL}${PIPER_VOICE_NAME}"
|
|
||||||
curl -OL "${PIPER_VOICE_URL}${PIPER_VOICE_NAME}.json"
|
|
||||||
PIPER_DIR=`pwd`
|
|
||||||
install_name_tool -change @rpath/libespeak-ng.1.dylib "${PIPER_DIR}/piper-phonemize/lib/libespeak-ng.1.dylib" "${PIPER_DIR}/piper"
|
|
||||||
install_name_tool -change @rpath/libonnxruntime.1.14.1.dylib "${PIPER_DIR}/piper-phonemize/lib/libonnxruntime.1.14.1.dylib" "${PIPER_DIR}/piper"
|
|
||||||
install_name_tool -change @rpath/libpiper_phonemize.1.dylib "${PIPER_DIR}/piper-phonemize/lib/libpiper_phonemize.1.dylib" "${PIPER_DIR}/piper"
|
|
||||||
fi
|
|
||||||
cd ../..
|
|
||||||
fi
|
|
||||||
|
|
||||||
# (for dev, reset the ports we were using)
|
|
||||||
|
|
||||||
SERVER_PORT=$(echo $SERVER_URL | grep -oE "[0-9]+")
|
|
||||||
if [ -n "$SERVER_PORT" ]; then
|
|
||||||
lsof -ti tcp:$SERVER_PORT | xargs kill 2>/dev/null || true
|
|
||||||
fi
|
|
||||||
|
|
||||||
### START
|
|
||||||
|
|
||||||
start_device() {
|
|
||||||
echo "Starting device..."
|
|
||||||
if [[ -n $NGROK_AUTHTOKEN ]]; then
|
|
||||||
echo "Waiting for Ngrok to setup"
|
|
||||||
sleep 7
|
|
||||||
read -p "Enter the Ngrok URL: " ngrok_url
|
|
||||||
export SERVER_CONNECTION_URL=$ngrok_url
|
|
||||||
echo "SERVER_CONNECTION_URL set to $SERVER_CONNECTION_URL"
|
|
||||||
fi
|
|
||||||
python device.py &
|
|
||||||
DEVICE_PID=$!
|
|
||||||
echo "Device started as process $DEVICE_PID"
|
|
||||||
}
|
|
||||||
|
|
||||||
# Function to start server
|
|
||||||
start_server() {
|
|
||||||
echo "Starting server..."
|
|
||||||
python server.py &
|
|
||||||
SERVER_PID=$!
|
|
||||||
echo "Server started as process $SERVER_PID"
|
|
||||||
}
|
|
||||||
|
|
||||||
stop_processes() {
|
|
||||||
if [[ -n $DEVICE_PID ]]; then
|
|
||||||
echo "Stopping device..."
|
|
||||||
kill $DEVICE_PID
|
|
||||||
fi
|
|
||||||
if [[ -n $SERVER_PID ]]; then
|
|
||||||
echo "Stopping server..."
|
|
||||||
kill $SERVER_PID
|
|
||||||
fi
|
|
||||||
}
|
|
||||||
|
|
||||||
# Trap SIGINT and SIGTERM to stop processes when the script is terminated
|
|
||||||
trap stop_processes SIGINT SIGTERM
|
|
||||||
|
|
||||||
# SERVER
|
|
||||||
# Start server if SERVER_START is True
|
|
||||||
if [[ "$SERVER_START" == "True" ]]; then
|
|
||||||
start_server
|
|
||||||
fi
|
|
||||||
|
|
||||||
# DEVICE
|
|
||||||
# Start device if DEVICE_START is True
|
|
||||||
if [[ "$DEVICE_START" == "True" ]]; then
|
|
||||||
start_device
|
|
||||||
fi
|
|
||||||
|
|
||||||
# Wait for device and server processes to exit
|
|
||||||
wait $DEVICE_PID
|
|
||||||
wait $SERVER_PID
|
|
||||||
|
|
||||||
# TTS, STT
|
|
||||||
|
|
||||||
# (todo)
|
|
||||||
# (i think we should start with hosted services)
|
|
||||||
|
|
||||||
# LLM
|
|
||||||
|
|
||||||
# (disabled, we'll start with hosted services)
|
|
||||||
# python core/llm/start.py &
|
|
Before Width: | Height: | Size: 470 KiB After Width: | Height: | Size: 470 KiB |
Before Width: | Height: | Size: 702 KiB After Width: | Height: | Size: 702 KiB |
Before Width: | Height: | Size: 1022 KiB After Width: | Height: | Size: 1022 KiB |
Loading…
Reference in new issue