From 473da1b4ecb83fea23492c4515c6114abfd884df Mon Sep 17 00:00:00 2001 From: Dani Date: Mon, 8 May 2023 23:07:33 -0400 Subject: [PATCH] First Commit PocketSphinx Just Barely works to recognize 'Jade' as the wake word Using https://github.com/suno-ai/bark for the TTS part of the code --- .gitignore | 160 +++++++++++++++++++++++++++++++++++++++++++++++++++++ LICENSE | 21 +++++++ README.MD | 1 + intents.py | 7 +++ main.py | 33 +++++++++++ voice.py | 14 +++++ 6 files changed, 236 insertions(+) create mode 100644 .gitignore create mode 100644 LICENSE create mode 100644 README.MD create mode 100644 intents.py create mode 100644 main.py create mode 100644 voice.py diff --git a/.gitignore b/.gitignore new file mode 100644 index 0000000..68bc17f --- /dev/null +++ b/.gitignore @@ -0,0 +1,160 @@ +# Byte-compiled / optimized / DLL files +__pycache__/ +*.py[cod] +*$py.class + +# C extensions +*.so + +# Distribution / packaging +.Python +build/ +develop-eggs/ +dist/ +downloads/ +eggs/ +.eggs/ +lib/ +lib64/ +parts/ +sdist/ +var/ +wheels/ +share/python-wheels/ +*.egg-info/ +.installed.cfg +*.egg +MANIFEST + +# PyInstaller +# Usually these files are written by a python script from a template +# before PyInstaller builds the exe, so as to inject date/other infos into it. 
+*.manifest +*.spec + +# Installer logs +pip-log.txt +pip-delete-this-directory.txt + +# Unit test / coverage reports +htmlcov/ +.tox/ +.nox/ +.coverage +.coverage.* +.cache +nosetests.xml +coverage.xml +*.cover +*.py,cover +.hypothesis/ +.pytest_cache/ +cover/ + +# Translations +*.mo +*.pot + +# Django stuff: +*.log +local_settings.py +db.sqlite3 +db.sqlite3-journal + +# Flask stuff: +instance/ +.webassets-cache + +# Scrapy stuff: +.scrapy + +# Sphinx documentation +docs/_build/ + +# PyBuilder +.pybuilder/ +target/ + +# Jupyter Notebook +.ipynb_checkpoints + +# IPython +profile_default/ +ipython_config.py + +# pyenv +# For a library or package, you might want to ignore these files since the code is +# intended to run in multiple environments; otherwise, check them in: +# .python-version + +# pipenv +# According to pypa/pipenv#598, it is recommended to include Pipfile.lock in version control. +# However, in case of collaboration, if having platform-specific dependencies or dependencies +# having no cross-platform support, pipenv may install dependencies that don't work, or not +# install all needed dependencies. +#Pipfile.lock + +# poetry +# Similar to Pipfile.lock, it is generally recommended to include poetry.lock in version control. +# This is especially recommended for binary packages to ensure reproducibility, and is more +# commonly ignored for libraries. +# https://python-poetry.org/docs/basic-usage/#commit-your-poetrylock-file-to-version-control +#poetry.lock + +# pdm +# Similar to Pipfile.lock, it is generally recommended to include pdm.lock in version control. +#pdm.lock +# pdm stores project-wide configurations in .pdm.toml, but it is recommended to not include it +# in version control. +# https://pdm.fming.dev/#use-with-ide +.pdm.toml + +# PEP 582; used by e.g. 
github.com/David-OConnor/pyflow and github.com/pdm-project/pdm +__pypackages__/ + +# Celery stuff +celerybeat-schedule +celerybeat.pid + +# SageMath parsed files +*.sage.py + +# Environments +.env +.venv +env/ +venv/ +ENV/ +env.bak/ +venv.bak/ + +# Spyder project settings +.spyderproject +.spyproject + +# Rope project settings +.ropeproject + +# mkdocs documentation +/site + +# mypy +.mypy_cache/ +.dmypy.json +dmypy.json + +# Pyre type checker +.pyre/ + +# pytype static type analyzer +.pytype/ + +# Cython debug symbols +cython_debug/ + +# PyCharm +# JetBrains specific template is maintained in a separate JetBrains.gitignore that can +# be found at https://github.com/github/gitignore/blob/main/Global/JetBrains.gitignore +# and can be added to the global gitignore or merged into this file. For a more nuclear +# option (not recommended) you can uncomment the following to ignore the entire idea folder. +#.idea/ diff --git a/LICENSE b/LICENSE new file mode 100644 index 0000000..f7be8ec --- /dev/null +++ b/LICENSE @@ -0,0 +1,21 @@ +MIT License + +Copyright (c) 2023 [fullname] + +Permission is hereby granted, free of charge, to any person obtaining a copy +of this software and associated documentation files (the "Software"), to deal +in the Software without restriction, including without limitation the rights +to use, copy, modify, merge, publish, distribute, sublicense, and/or sell +copies of the Software, and to permit persons to whom the Software is +furnished to do so, subject to the following conditions: + +The above copyright notice and this permission notice shall be included in all +copies or substantial portions of the Software. + +THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR +IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, +FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. 
IN NO EVENT SHALL THE
+AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
+OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
+SOFTWARE.
diff --git a/README.MD b/README.MD
new file mode 100644
index 0000000..330cabe
--- /dev/null
+++ b/README.MD
@@ -0,0 +1 @@
+# Jade - A Voice Assistant
\ No newline at end of file
diff --git a/intents.py b/intents.py
new file mode 100644
index 0000000..4fcc2ef
--- /dev/null
+++ b/intents.py
@@ -0,0 +1,7 @@
+def handle_intent(intent):
+    """Return the canned reply for *intent*, or an apology if it is unknown."""
+    if intent == "greeting":
+        return "Hello, how can I assist you?"
+    if intent == "weather":
+        return "The weather today is sunny."
+    return "I'm sorry, I don't understand that command."
\ No newline at end of file
diff --git a/main.py b/main.py
new file mode 100644
index 0000000..fc775cc
--- /dev/null
+++ b/main.py
@@ -0,0 +1,33 @@
+import speech_recognition as sr
+from voice import say
+from intents import handle_intent
+
+wake_word = "Jade"  # matched case-insensitively anywhere in the transcript
+
+
+def recognize_speech():
+    """Listen once; if the wake word is heard, speak the intent's reply."""
+    r = sr.Recognizer()
+    with sr.Microphone() as source:
+        print("Say something!")
+        audio = r.listen(source)
+    # Keep the try body to the one call whose errors are handled below, so
+    # failures in intent handling or TTS are not mislabeled as Sphinx errors.
+    try:
+        text = r.recognize_sphinx(audio)
+    except sr.UnknownValueError:
+        print("PocketSphinx could not understand audio")
+    except sr.RequestError as e:
+        print(f"PocketSphinx error; {e}")
+    else:
+        print(f"You said: {text}")
+        if wake_word.lower() in text.lower():
+            say(handle_intent(get_intent(text)))
+
+def get_intent(text):
+    """Return the intent name for *text* (stub: always "greeting")."""
+    # TODO: implement intent recognition
+    return "greeting"
+
+if __name__ == "__main__":  # do not open the microphone on import
+    recognize_speech()
diff --git a/voice.py b/voice.py
new file mode 100644
index 0000000..96309df
--- /dev/null
+++ b/voice.py
@@ -0,0 +1,14 @@
+import sounddevice as sd
+import numpy as np
+from bark import generate_audio, SAMPLE_RATE, preload_models
+
+preload_models()
+
+def say(text):
+    """Synthesize *text* with Bark and play it on a mono output stream."""
+    audio_array = generate_audio(text, history_prompt="v2/en_speaker_9")
+    # Add a channel axis (assumes generate_audio returns a 1-D array).
+    audio_array = np.expand_dims(audio_array, axis=1)
+    # The context manager starts the stream and always stops and closes it.
+    with sd.OutputStream(samplerate=SAMPLE_RATE, channels=1) as stream:
+        stream.write(audio_array)
\ No newline at end of file