Spaces:

aar2dee2
/

chatty_vader

Runtime error

App Files Files Community

aar2dee2 committed on Apr 7, 2023

Commit

838a92b

1 Parent(s): 2930d08

add audio files

Browse files

Files changed (40) hide show

README.md +1 -1
app.ipynb +138 -0
data/metadata.csv +3 -0
data/wavs/wav1.wav +3 -0
data/wavs/wav10.wav +3 -0
data/wavs/wav11.wav +3 -0
data/wavs/wav12.wav +3 -0
data/wavs/wav13.wav +3 -0
data/wavs/wav14.wav +3 -0
data/wavs/wav15.wav +3 -0
data/wavs/wav16.wav +3 -0
data/wavs/wav17.wav +3 -0
data/wavs/wav18.wav +3 -0
data/wavs/wav19.wav +3 -0
data/wavs/wav2.wav +3 -0
data/wavs/wav20.wav +3 -0
data/wavs/wav21.wav +3 -0
data/wavs/wav22.wav +3 -0
data/wavs/wav23.wav +3 -0
data/wavs/wav24.wav +3 -0
data/wavs/wav25.wav +3 -0
data/wavs/wav26.wav +3 -0
data/wavs/wav27.wav +3 -0
data/wavs/wav28.wav +3 -0
data/wavs/wav29.mp3 +0 -0
data/wavs/wav3.wav +3 -0
data/wavs/wav30.mp3 +0 -0
data/wavs/wav31.mp3 +0 -0
data/wavs/wav32.mp3 +0 -0
data/wavs/wav33.mp3 +0 -0
data/wavs/wav34.wav +3 -0
data/wavs/wav4.wav +3 -0
data/wavs/wav5.wav +3 -0
data/wavs/wav6.wav +3 -0
data/wavs/wav7.wav +3 -0
data/wavs/wav8.wav +3 -0
data/wavs/wav9.wav +3 -0
gpt-data.md +43 -0
resources.md +18 -0
test.py +31 -0

README.md CHANGED Viewed

@@ -1,6 +1,6 @@
 ---
 title: Chatty Vader
-emoji: 👀
 colorFrom: indigo
 colorTo: yellow
 sdk: gradio

 ---
 title: Chatty Vader
+emoji: 💣
 colorFrom: indigo
 colorTo: yellow
 sdk: gradio

app.ipynb ADDED Viewed

	@@ -0,0 +1,138 @@

+{
+  "cells": [
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": ["# Import required libraries"]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "import requests\n",
+        "import json\n",
+        "from gtts import gTTS\n",
+        "import os\n",
+        "from pydub import AudioSegment"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": ["# 1. Function to take in audio input and return text output"]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "def transcribe_audio_to_text(file_path):\n",
+        "    # Replace with your implementation for transcribing audio to text\n",
+        "    pass"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "# 2. Function to call the ChatGPT API with a text and system prompt and return the response"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "def call_chatgpt_api(prompt, system_prompt):\n",
+        "    # Replace with your OpenAI API Key\n",
+        "    api_key = 'your-api-key'\n",
+        "\n",
+        "    headers = {\n",
+        "        'Content-Type': 'application/json',\n",
+        "        'Authorization': f'Bearer {api_key}',\n",
+        "    }\n",
+        "\n",
+        "    data = json.dumps({\n",
+        "        'model': 'text-davinci-002',\n",
+        "        'prompt': f'{system_prompt} {prompt}',\n",
+        "        'max_tokens': 150,\n",
+        "        'n': 1,\n",
+        "        'stop': None,\n",
+        "        'temperature': 0.5,\n",
+        "    })\n",
+        "\n",
+        "    response = requests.post('https://api.openai.com/v1/engines/davinci-codex/completions', headers=headers, data=data)\n",
+        "    response_text = response.json()['choices'][0]['text'].strip()\n",
+        "\n",
+        "    return response_text"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "# 3. Function to convert text to speech using a suitable library and add intonation for Yoda's voice"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "def text_to_speech_yoda(text, output_file):\n",
+        "    tts = gTTS(text, lang='en')\n",
+        "    tts.save(output_file)\n",
+        "\n",
+        "    # Add intonation for Yoda voice (you may need to customize this for better results)\n",
+        "    audio = AudioSegment.from_file(output_file, format=\"mp3\")\n",
+        "    audio = audio.speedup(playback_speed=1.2)\n",
+        "    audio.export(output_file, format=\"mp3\")"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "# 4. Wrapper function that calls all of these functions in order"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "def process_audio(input_audio_file, output_audio_file, system_prompt):\n",
+        "    transcribed_text = transcribe_audio_to_text(input_audio_file)\n",
+        "    chatgpt_response = call_chatgpt_api(transcribed_text, system_prompt)\n",
+        "    text_to_speech_yoda(chatgpt_response, output_audio_file)"
+      ]
+    }
+  ],
+  "metadata": {
+    "kernelspec": {
+      "display_name": "Python 3",
+      "language": "python",
+      "name": "python3"
+    },
+    "language_info": {
+      "codemirror_mode": {
+        "name": "ipython",
+        "version": 3
+      },
+      "file_extension": ".py",
+      "mimetype": "text/x-python",
+      "name": "python",
+      "nbconvert_exporter": "python",
+      "pygments_lexer": "ipython3",
+      "version": "3.8.5"
+    }
+  },
+  "nbformat": 4,
+  "nbformat_minor": 4
+}

data/metadata.csv ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:cbc2bf511a6f46b0c195ac5cc6ad82ef2762c0258a9a50b25f9ca0ac55657d36
+size 1966

data/wavs/wav1.wav ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:f1ab36530b9abdf0ef53a932c04915c325eeeecc576a1d4265e4fa4d30d4c5d4
+size 17734

data/wavs/wav10.wav ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:cfad8f3e36b9bf2a743646ecadf503382bfc213a690a37f103c2639348cb02cb
+size 12030

data/wavs/wav11.wav ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:b03bd0d9cbaa7e385466ce541c75ba22d89fd75aaf65f402d2db5a2e68ab9d71
+size 8650

data/wavs/wav12.wav ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:de0347db8880d5cb40d11f67b7c4ecfeb6630f6e2cd4dc16af53d866493bc9bf
+size 6830

data/wavs/wav13.wav ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:a761d63251887e5481cca23f0eb2cefd51d3158db8101402ccd0fedb0a14a4e0
+size 14370

data/wavs/wav14.wav ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:b3d08743983001498860a1e9830a7ddcb28b8d3217ce1cab41eb672a1f8184b3
+size 34304

data/wavs/wav15.wav ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:064415dbd40fe447b618d328c5fc93d58651f6b1bc1b975b113c97bbbc3c9c38
+size 74834

data/wavs/wav16.wav ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:6181e0fafc34deb20ee74d3e2f7c9811975fe12a2a3bb5577bf0affea3e2c83c
+size 23006

data/wavs/wav17.wav ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:c5dee5a713f8a4b62ccd2ec32b10c950f455d8f7a9d8435f4f8b201d701152ae
+size 43472

data/wavs/wav18.wav ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:7fd77a6d3e15aea495745c518f33f4a125511001611616b82039a1c1c97cb8cc
+size 83258

data/wavs/wav19.wav ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:920acc4cda72c697d72e6030f0568b75ab0da79efed1df8f3a8b0f62b31f8119
+size 41826

data/wavs/wav2.wav ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:48656c12ef9a556aad43a8a1c6e289f0afb1f5b3283d83a72e2648e464845d51
+size 46146

data/wavs/wav20.wav ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:10f6de671c0daeaf7189902aa694d0f8ef5d108b361b9250d6a67a6981335111
+size 78474

data/wavs/wav21.wav ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:3aceca45bbe69f717346ab25063d801ae07fe530d5ff8b7a7fdc86646c50b2e0
+size 50536

data/wavs/wav22.wav ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:ccd832488f585aa852b22061c11c9a251595aed4a9b62c46025387af2b901988
+size 38170

data/wavs/wav23.wav ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:a7d3bdb55e029cc5cce78ac03edc9de459d4757a23aa895f21a1be0e5ba8aa45
+size 77422

data/wavs/wav24.wav ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:9253767d354b1aa484498ba013c1f981fa166b83025620173bcd37c29e096f64
+size 51398

data/wavs/wav25.wav ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:831108ab28494e7d36438a04eb527a1c05cd14c769218f5f5f8d01ef8f39c8e3
+size 6310

data/wavs/wav26.wav ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:00bf0d0defa342786883d7c5ef444d76329bca499e356fcc1c2f7d1649fddd48
+size 7350

data/wavs/wav27.wav ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:62cf76057721d42234f616947c0ae5aeaa7deac1667d79cb57e2cd8fee1a1844
+size 9170

data/wavs/wav28.wav ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:441101a2d56838fa952aaeeb78f4a5ad55ce7b4fcdb4199d5648e4aea6d4ad52
+size 18230

data/wavs/wav29.mp3 ADDED Viewed

Binary file (114 kB). View file

data/wavs/wav3.wav ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:5049fb7e23db05081275a9c94f8d7056993b3b929125d7f30758d1e05f3ea187
+size 28066

data/wavs/wav30.mp3 ADDED Viewed

Binary file (48.1 kB). View file

data/wavs/wav31.mp3 ADDED Viewed

Binary file (17.1 kB). View file

data/wavs/wav32.mp3 ADDED Viewed

Binary file (96.1 kB). View file

data/wavs/wav33.mp3 ADDED Viewed

Binary file (27.6 kB). View file

data/wavs/wav34.wav ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:eeb545563ca25dcea2c0e6cf83aeb096a6198b7b10976ff0af305297028c3f29
+size 9690

data/wavs/wav4.wav ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:d07f6e5fd84f2f83ccb0b9069deed1e512099d7ffa870233bde0bf9673d326e5
+size 5530

data/wavs/wav5.wav ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:17da780707c66bc4297a11cd0fc1be80cef0cd3e8559519ff4404acf264070f4
+size 529964

data/wavs/wav6.wav ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:4af156d450349d48672f160fc817906a9b9928fd3135451b747738317e3533c0
+size 19162

data/wavs/wav7.wav ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:a891200cd5a05a382caa265d81b9567bbfc8129e6aed524ef512f587624b0087
+size 11510

data/wavs/wav8.wav ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:f5346a94429fdf19eb9721c133203022dcb479f7adeaa65a3ea7213bb242946f
+size 8390

data/wavs/wav9.wav ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:9a0e839cf656d25867ef2c3d1977173e465917804ce51d5acabd6c07b505878c
+size 9170

gpt-data.md ADDED Viewed

	@@ -0,0 +1,43 @@

+[Audio link](https://www.drodd.com/star-wars-soundboard/bickering.wav)
+Admiral Motti: "This station is now the ultimate power in the universe. I suggest we use it!"
+Darth Vader: "Don't be too proud of this technological terror you've constructed. The ability to destroy a planet is insignificant next to the power of the Force."
+Admiral Motti: "Don't try to frighten us with your sorcerer's ways, Lord Vader. Your sad devotion to that ancient religion has not helped you conjure up the stolen data tapes, or given you clairvoyance enough to find the Rebel's hidden fortre..."
+Darth Vader: "(Vader chokes Motti with the Force) I find your lack of faith disturbing."
+Grand Moff Tarkin: "Enough of this! Vader, release him!"
+Darth Vader: "As you wish."
+Grand Moff Tarkin: "This bickering is pointless. Now, Lord Vader will provide us with the location of the Rebel fortress by the time this station is operational. We will then crush the Rebellion with one swift stroke."
+[Audio link](https://www.drodd.com/star-wars-soundboard/sorcerersways.wav)
+Admiral Motti: "Don't try to frighten us with your sorcerer's ways, Lord Vader. Your sad devotion to that ancient religion has not helped you conjure up the stolen data tapes, or given you clairvoyance enough to find the Rebel's hidden fortre..."
+Darth Vader: "(Vader chokes Motti with the Force) I find your lack of faith disturbing."
+Grand Moff Tarkin: "Enough of this! Vader, release him!"
+Darth Vader: "As you wish."
+[Audio link](https://www.drodd.com/star-wars-soundboard/mindprobe.wav)
+Darth Vader: "Her resistance to the mind probe is considerable. It will be some time before we can extract any information from her."
+Imperial Officer: "The final check-out is complete. All systems are operational. What course shall we set?"
+Grand Moff Tarkin: "Perhaps she would respond to an alternative form of persuasion."
+Darth Vader: "What do you mean?"
+Grand Moff Tarkin: "I think it is time we demonstrate the full power of this station. Set your course for Alderaan."
+Imperial Officer: "With pleasure."
+[Audio link](https://www.drodd.com/star-wars-soundboard/thoseplans.wav)
+Stormtrooper: "The Death Star plans are not in the main computer."
+Darth Vader (James Earl Jones): "Where are those transmissions you intercepted? What have you done with those plans?"
+Rebel (???): "We intercepted no transmissions. This is a consular ship. We're on a diplomatic mission."
+Darth Vader: "If this is a consular ship, where is the ambassador? (He throws him against the wall) Commander, tear this ship apart until you've found those plans and bring me the passengers! I want them alive!"
+[Audio link](https://www.drodd.com/star-wars-soundboard/diplomatic.wav)
+Princess Leia Organa: "Darth Vader, only you could be so bold. The imperial senate will not sit still for this. When they hear you've attacked a diplomatic--"
+Darth Vader: "Don't act so surprised, your highness. You weren't on any mercy mission this time. Several transmissions were beamed to this ship by rebel spies. I want to know what happened to the plans they sent you."
+Leia: "I don't know what you're talking about. I'm a member of the imperial senate on a diplomatic mission to Alderaan."
+Darth Vader: "You are part of the Rebel Alliance and a traitor. Take her away!"
+[Audio link](https://www.drodd.com/star-wars-soundboard/takeheraway.wav)
+Leia: "I'm a member of the imperial senate on a diplomatic mission to Alderaan."
+Darth Vader: "You are part of the Rebel Alliance and a traitor. Take her away!"
+[Audio link](https://www.drodd.com/star-wars-soundboard/notaboard.wav)
+Imperial Officer Commander (???): "Lord Vader, the battle station plans are not aboard this ship and no transmissions were made. An escape pod was jettisoned during the fighting but no life forms were aboard."
+Darth Vader: "She must have hidden the plans in the escape pod. Send a detachment down to retrieve them. See to it personally, Commander. There'll be no one to stop us this time."
+Imperial Officer Commander: "Yes, sir."

resources.md ADDED Viewed

	@@ -0,0 +1,18 @@

+### Star Wars Audio Files
+[Very clear audio](http://www.moviesoundclips.net/sound.php?id=137) - check for the [other movies](http://www.moviesoundclips.net/movies.php?page=3) also
+[1.](https://www.drodd.com/star-wars-soundboard/)
+[2.](http://www.galaxyfaraway.com/gfa/1998/12/star-wars-sounds-archive/#episode%20i%20sounds)
+[3.](https://www.wavsource.com/movies/star_wars.htm)
+[4.](https://www.thesoundarchive.com/star-wars.asp)
+[5.]()
+[Whisper API Reference](https://platform.openai.com/docs/api-reference/audio)
+[Voice training with Resemble.ai](https://www.resemble.ai/api/)
+[Resemble API reference](https://docs.app.resemble.ai/docs/resource_voice/create)
+[Resemble.ai Dataset reference](https://resemble.notion.site/resemble/Resemble-AI-Supported-Datasets-64e94dffc7fe4f518989df48d815879f)

test.py ADDED Viewed

	@@ -0,0 +1,31 @@

+import app
+def test_transcribe_audio_to_text():
+    input_audio_file = "test_audio_input.wav"
+    expected_transcribed_text = "your expected transcription"
+    result = app.transcribe_audio_to_text(input_audio_file)
+    assert result == expected_transcribed_text
+def test_call_chatgpt_api():
+    prompt = "What is the meaning of life?"
+    system_prompt = "Yoda:"
+    expected_response = "your expected chatgpt response"
+    result = app.call_chatgpt_api(prompt, system_prompt)
+    assert result == expected_response
+def test_text_to_speech_yoda():
+    input_text = "Do or do not, there is no try."
+    output_audio_file = "test_audio_output.mp3"
+    app.text_to_speech_yoda(input_text, output_audio_file)
+    assert os.path.exists(output_audio_file)
+def test_process_audio():
+    input_audio_file = "test_audio_input.wav"
+    output_audio_file = "test_audio_output.mp3"
+    system_prompt = "Yoda:"
+    app.process_audio(input_audio_file, output_audio_file, system_prompt)
+    assert os.path.exists(output_audio_file)