Merge pull request #22 from shivenmian/u/shivenmian/local

fix: download whisper local model directly from huggingface
pull/23/head
killian 12 months ago committed by GitHub
commit 17a477ae7f
No known key found for this signature in database
GPG Key ID: B5690EEEBB952194

@ -1,10 +1,12 @@
### SETTINGS ### SETTINGS
# If ALL_LOCAL is False, we'll use OpenAI's services # If ALL_LOCAL is False, we'll use OpenAI's services
# If setting ALL_LOCAL to true, set the path to the WHISPER local model # else we use whisper.cpp and piper local models
export ALL_LOCAL=False export ALL_LOCAL=False
# export WHISPER_MODEL_PATH=... export WHISPER_MODEL_NAME="ggml-tiny.en.bin"
export OPENAI_API_KEY="sk-..."
# Uncomment and set the OpenAI API key for OpenInterpreter to work
# export OPENAI_API_KEY="sk-..."
# Expose through Ngrok # Expose through Ngrok
# Uncomment following line with your Ngrok auth token (https://dashboard.ngrok.com/get-started/your-authtoken) # Uncomment following line with your Ngrok auth token (https://dashboard.ngrok.com/get-started/your-authtoken)
@ -38,6 +40,11 @@ export LOG_LEVEL="INFO"
### SETUP ### SETUP
# if using local models, install the models / executables # if using local models, install the models / executables
WHISPER_MODEL_URL="https://huggingface.co/ggerganov/whisper.cpp/resolve/main/"
WHISPER_RUST_PATH="`pwd`/local_stt/whisper-rust"
curl -OL "${WHISPER_MODEL_URL}${WHISPER_MODEL_NAME}" --output-dir ${WHISPER_RUST_PATH}
if [[ "$ALL_LOCAL" == "True" ]]; then if [[ "$ALL_LOCAL" == "True" ]]; then
OS=$(uname -s) OS=$(uname -s)
ARCH=$(uname -m) ARCH=$(uname -m)

@ -53,13 +53,14 @@ def run_command(command):
return result.stdout, result.stderr return result.stdout, result.stderr
def get_transcription_file(wav_file_path: str): def get_transcription_file(wav_file_path: str):
model_path = os.getenv("WHISPER_MODEL_PATH") whisper_rust_path = os.path.join(os.path.dirname(__file__), 'local_stt', 'whisper-rust')
if not model_path: model_name = os.getenv('WHISPER_MODEL_NAME')
raise EnvironmentError("WHISPER_MODEL_PATH environment variable is not set.") if not model_name:
raise EnvironmentError("WHISPER_MODEL_NAME environment variable is not set.")
output, error = run_command([ output, error = run_command([
os.path.join(os.path.dirname(__file__), 'local_stt', 'whisper-rust', 'whisper-rust'), os.path.join(whisper_rust_path, 'whisper-rust'),
'--model-path', model_path, '--model-path', os.path.join(whisper_rust_path, model_name),
'--file-path', wav_file_path '--file-path', wav_file_path
]) ])

@ -23,8 +23,6 @@ python -m pip install -r requirements.txt
``` ```
NB: Depending on your local Python version, you may run into [this issue↗](https://github.com/TaylorSMarks/playsound/issues/150) installing playsound. Workarounds are provided in the issue. NB: Depending on your local Python version, you may run into [this issue↗](https://github.com/TaylorSMarks/playsound/issues/150) installing playsound. Workarounds are provided in the issue.
If you want to run local speech-to-text from whisper, download the GGML Whisper model from [Huggingface](https://huggingface.co/ggerganov/whisper.cpp). Then in `OS/01/start.sh`, set `ALL_LOCAL=TRUE` and set `WHISPER_MODEL_PATH` to the path of the model.
## Usage ## Usage
```bash ```bash
@ -32,6 +30,7 @@ cd OS/01
bash start.sh bash start.sh
``` ```
If you want to run local text-to-speech and speech-to-text, set `ALL_LOCAL` in the `start.sh` script to True. This will use the [whisper.cpp](https://github.com/ggerganov/whisper.cpp) and [Piper](https://github.com/rhasspy/piper) models.
<br> <br>
## Background ## Background

Loading…
Cancel
Save