diff --git a/ai_voice_assistant.py b/ai_voice_assistant.py
new file mode 100644
index 0000000..5e756ba
--- /dev/null
+++ b/ai_voice_assistant.py
@@ -0,0 +1,31 @@
+import subprocess
+from playsound import playsound
+import os
+
+def get_ai_response(prompt):
+    """Return the assistant's reply to *prompt* (currently a plain echo)."""
+    # Replace this later with LLaMA integration
+    return f"Echo: {prompt}"
+
+def generate_voice(text):
+    """Run tortoise/do_tts.py on *text* with ``--voice random``."""
+    # Pass an argument list instead of a shell string so quotes, `$` or `;`
+    # in the text reach do_tts.py verbatim and are never run as shell code.
+    subprocess.run(
+        ["python", "tortoise/do_tts.py", "--text", text, "--voice", "random"]
+    )
+
+def play_response():
+    """Play the audio file at tortoise/results/generated_audio.wav."""
+    playsound("tortoise/results/generated_audio.wav")
+
+if __name__ == "__main__":
+    # Prompt loop: read a line, answer it, speak the answer; "exit" quits.
+    while True:
+        user_input = input("\nYou: ")
+        if user_input.lower() == "exit":
+            break
+        response = get_ai_response(user_input)
+        print("AI:", response)
+        generate_voice(response)
+        play_response()
diff --git a/requirements.txt b/requirements.txt
index fd8d538..28e648f 100644
--- a/requirements.txt
+++ b/requirements.txt
@@ -18,7 +18,7 @@ appdirs
 nbconvert==5.3.1
 tornado==4.2
 pydantic==1.9.1
-deepspeed==0.8.3
+#deepspeed==0.17.0
 py-cpuinfo
 hjson
 psutil
diff --git a/setup.py b/setup.py
index 807670a..085175c 100644
--- a/setup.py
+++ b/setup.py
@@ -28,7 +28,7 @@ setuptools.setup(
         'scipy',
         'librosa',
         'transformers==4.31.0',
-        'tokenizers==0.14.0',
+        'tokenizers==0.13.0',
         'scipy==1.13.1'
         # 'deepspeed==0.8.3',
     ],
diff --git a/tortoise/do_tts.py b/tortoise/do_tts.py
index c6e2b17..bbbd39f 100644
--- a/tortoise/do_tts.py
+++ b/tortoise/do_tts.py
@@ -4,8 +4,8 @@ import os
 import torch
 import torchaudio
 
-from api import TextToSpeech, MODELS_DIR
-from utils.audio import load_voices
+from tortoise.api import TextToSpeech, MODELS_DIR
+from tortoise.utils.audio import load_voice, load_voices
 
 if __name__ == '__main__':
     parser = argparse.ArgumentParser()
diff --git a/tortoise/voices/armaan/1.wav b/tortoise/voices/armaan/1.wav
new file mode 100644
index 0000000..e3c1512
Binary files /dev/null and b/tortoise/voices/armaan/1.wav differ
diff --git a/tortoise/voices/armaan/2.wav b/tortoise/voices/armaan/2.wav
new file mode 100644
index 0000000..c04fb36
Binary files /dev/null and b/tortoise/voices/armaan/2.wav differ
diff --git a/tortoise/voices/armaan/3.wav b/tortoise/voices/armaan/3.wav
new file mode 100644
index 0000000..370abc6
Binary files /dev/null and b/tortoise/voices/armaan/3.wav differ
diff --git a/tortoise/voices/armaan/4.wav b/tortoise/voices/armaan/4.wav
new file mode 100644
index 0000000..e6666a4
Binary files /dev/null and b/tortoise/voices/armaan/4.wav differ
diff --git a/tortoise/voices/armaan/5.wav b/tortoise/voices/armaan/5.wav
new file mode 100644
index 0000000..ac43904
Binary files /dev/null and b/tortoise/voices/armaan/5.wav differ
diff --git a/tortoise/voices/armaan/armaan.pth b/tortoise/voices/armaan/armaan.pth
new file mode 100644
index 0000000..59f25fe
Binary files /dev/null and b/tortoise/voices/armaan/armaan.pth differ