Upload
commit 15d1a0b58b
ai.py (Normal file, 16 lines)
@@ -0,0 +1,16 @@
from revChatGPT.V1 import Chatbot

chatbot = Chatbot(config={
    "email": "pushes_mouthy_0x@icloud.com",
    "password": "9hCyLiGWUdr9MX2mepTk"
})

prompt = "how many beaches does portugal have?"
response = ""

for data in chatbot.ask(
    prompt
):
    response = data["message"]

print(response)
main.py (Normal file, 24 lines)
@@ -0,0 +1,24 @@
import time
import speech_recognition as sr

def callback(recognizer, audio):
    try:
        print("Processing...")
        text = r.recognize_whisper(audio, language="english")
        print(f"Apollo (Whisper Model) thinks you said: {text}")
    except sr.UnknownValueError:
        print("Could not understand audio.")
    except sr.RequestError as e:
        print("Could not request result from Whisper")

r = sr.Recognizer()
m = sr.Microphone()

with m as source:
    r.adjust_for_ambient_noise(source)

stop_listening = r.listen_in_background(m, callback)

print("Listening...")
while True:
    time.sleep(0.1)
setup.sh (Executable file, 20 lines)
@@ -0,0 +1,20 @@
#!/bin/bash
# Switch to the Python virtual environment
source .venv/bin/activate

# Install Homebrew (https://brew.sh)
/bin/bash -c "$(curl -fsSL https://raw.githubusercontent.com/Homebrew/install/HEAD/install.sh)"

# Install brew dependencies
brew install portaudio
brew install ffmpeg

# Install python dependencies
pip install -U pyaudio # Microphone
pip install numpy
pip install pillow
pip install --pre torch torchvision torchaudio --index-url https://download.pytorch.org/whl/nightly/cpu
pip install -U openai-whisper # Speech to text model (needed by speechrecognition)
pip install -U SpeechRecognition # Speech to text logic
pip install -U revChatGPT # Interacts with OpenAI ChatGPT
pip install speechbrain
talk.py (Normal file, 17 lines)
@@ -0,0 +1,17 @@
import pyttsx3

engine = pyttsx3.init()
voices = engine.getProperty('voices')

# engine.setProperty('voice', voices[3].id)
# engine.say("I will speak this text")

# engine.runAndWait()
# engine = pyttsx3.init()
# voices = engine.getProperty('voices')
# print(voices)
for voice in voices:
    engine.setProperty('voice', voice.id)
    print(voice)
    engine.say('The quick brown fox jumped over the lazy dog.')
    engine.runAndWait()
test.html (Normal file, 14 lines)
@@ -0,0 +1,14 @@
<!DOCTYPE html>
<html>
<head>
    <meta charset="utf-8">
    <meta name="viewport" content="width=device-width, initial-scale=1">
    <title>test</title>
</head>
<body>

    <script type="text/javascript" src="https://files.coinmarketcap.com/static/widget/coinPriceBlock.js"></script>
    <div id="coinmarketcap-widget-coin-price-block" coins="1,1027,1839,52,3890" currency="USD" theme="light" transparent="false" show-symbol-logo="true"></div>

</body>
</html>
tmpdir_tts/hyperparams.yaml (Symbolic link, 1 line)
@@ -0,0 +1 @@
/Users/sam/.cache/huggingface/hub/models--speechbrain--tts-tacotron2-ljspeech/snapshots/f0c9855a337493070f576ef94dacd0ed407e04f2/hyperparams.yaml
tmpdir_tts/model.ckpt (Symbolic link, 1 line)
@@ -0,0 +1 @@
/Users/sam/.cache/huggingface/hub/models--speechbrain--tts-tacotron2-ljspeech/snapshots/f0c9855a337493070f576ef94dacd0ed407e04f2/model.ckpt
tmpdir_vocoder/generator.ckpt (Symbolic link, 1 line)
@@ -0,0 +1 @@
/Users/sam/.cache/huggingface/hub/models--speechbrain--tts-hifigan-ljspeech/snapshots/e0cc1f9be5b65d4612013f26867ca600e98bc1b6/generator.ckpt
tmpdir_vocoder/hyperparams.yaml (Symbolic link, 1 line)
@@ -0,0 +1 @@
/Users/sam/.cache/huggingface/hub/models--speechbrain--tts-hifigan-ljspeech/snapshots/e0cc1f9be5b65d4612013f26867ca600e98bc1b6/hyperparams.yaml
tts.py (Normal file, 20 lines)
@@ -0,0 +1,20 @@
import torchaudio
from speechbrain.pretrained import Tacotron2
from speechbrain.pretrained import HIFIGAN

import sounddevice as sd

# Initialize TTS (Tacotron2) and Vocoder (HiFi-GAN)
tacotron2 = Tacotron2.from_hparams(source="speechbrain/tts-tacotron2-ljspeech", savedir="tmpdir_tts")
hifi_gan = HIFIGAN.from_hparams(source="speechbrain/tts-hifigan-ljspeech", savedir="tmpdir_vocoder")

# Running the TTS
mel_output, mel_length, alignment = tacotron2.encode_text("This is an open-source toolkit for the development of speech technologies.")

# Running the Vocoder (spectrogram-to-waveform)
waveforms = hifi_gan.decode_batch(mel_output)
print(waveforms)
# Audio(waveforms.detach().cpu().squeeze(), rate=22050)
# sd.play(waveforms, 22050)
torchaudio.io.play_audio(waveform=waveforms, sample_rate=22050)
# torchaudio.Audio(waveforms.detach().cpu().squeeze(), rate=22050)
untitled.py (Normal file, 28 lines)
@@ -0,0 +1,28 @@
import time
import speech_recognition as sr

#TODO: Check for Apollo

def callback(recognizer, audio):
    try:
        print("Processing...")
        text = r.recognize_whisper(audio, language="english")
        print(f"Whisper thinks you said {text}")
    except sr.UnknownValueError:
        print("Whisper could not understand audio")
    except sr.RequestError as e:
        print("Could not request results from Whisper")



r = sr.Recognizer()
m = sr.Microphone()
with m as source:
    r.adjust_for_ambient_noise(source)  # we only need to calibrate once, before we start listening

stop_listening = r.listen_in_background(m, callback)

print("Listening...")
while True:
    time.sleep(0.1)  # keep the main thread alive while the background listener runs
    # print('1')
voice.py (Normal file, 39 lines)
@@ -0,0 +1,39 @@
#!/usr/bin/env python3
import time
import speech_recognition as sr

# this is called from the background thread
def callback(recognizer, audio):
    # received audio data, now we'll recognize it using the Whisper model
    try:
        print("Processing...")
        text = r.recognize_whisper(audio, language="english")
        print(f"Whisper thinks you said {text}")




    except sr.UnknownValueError:
        print("Whisper could not understand audio")
    except sr.RequestError as e:
        print("Could not request results from Whisper")

r = sr.Recognizer()
m = sr.Microphone()
with m as source:
    r.adjust_for_ambient_noise(source)  # we only need to calibrate once, before we start listening

# start listening in the background (note that we don't have to do this inside a `with` statement)
stop_listening = r.listen_in_background(m, callback)
# `stop_listening` is now a function that, when called, stops background listening
# do some unrelated computations for 5 seconds
# for _ in range(50):
#     time.sleep(0.1)  # we're still listening even though the main thread is doing other things
#     print('0')
# calling this function requests that the background listener stop listening
# stop_listening(wait_for_stop=False)
# do some more unrelated things
print("Listening...")
while True:
    time.sleep(0.1)  # keep the main loop alive while the background listener runs
    # print('1')