Spaces:

datascientist22
/

real-robot-speaking

Running

App Files Community

datascientist22 committed on Sep 9

Commit

1b365e4

•

1 Parent(s): 2368c75

Update app.py

Browse files

Files changed (1) hide show

app.py +24 -12

app.py CHANGED Viewed

@@ -1,13 +1,12 @@
 import streamlit as st
 import speech_recognition as sr
 from transformers import pipeline
-from tts import TTS  # Hugging Face TTS model
 import requests
-# Load the chatbot model
 chatbot = pipeline("conversational", model="facebook/blenderbot-400M-distill")
-# Function to convert speech to text
 def speech_to_text():
     recognizer = sr.Recognizer()
     with sr.Microphone() as source:
@@ -21,28 +20,41 @@ def speech_to_text():
         except sr.RequestError:
             return "Speech recognition service is not available."
-# Function to generate avatar video
 def generate_avatar_video(text_response):
-    # Call the API of an avatar service (e.g., D-ID, Synthesia)
-    api_url = "https://api.example.com/generate-avatar"
-    payload = {"text": text_response}
-    response = requests.post(api_url, json=payload)
-    video_url = response.json().get("video_url")
     return video_url
-st.title("🗣️ Live Video Chatbot")
 # Button to start recording
 if st.button("Speak"):
     user_input = speech_to_text()
     if user_input:
         st.write(f"**You:** {user_input}")
-        # Generate chatbot response
         bot_response = chatbot(user_input)
         response_text = bot_response[0]["generated_text"]
         st.write(f"**Bot:** {response_text}")
-        # Generate avatar video
         video_url = generate_avatar_video(response_text)
         # Display the video response

 import streamlit as st
 import speech_recognition as sr
 from transformers import pipeline
 import requests
+# Load the chatbot model from Hugging Face
 chatbot = pipeline("conversational", model="facebook/blenderbot-400M-distill")
+# Function to convert speech to text using SpeechRecognition
 def speech_to_text():
     recognizer = sr.Recognizer()
     with sr.Microphone() as source:
         except sr.RequestError:
             return "Speech recognition service is not available."
+# Function to generate avatar video using D-ID API
 def generate_avatar_video(text_response):
+    api_url = "https://api.d-id.com/talk"
+    headers = {
+        "Authorization": "Bearer YOUR_API_KEY",  # Replace with your D-ID API Key
+        "Content-Type": "application/json"
+    }
+    payload = {
+        "script": {
+            "type": "text",
+            "input": text_response
+        },
+        "source": {
+            "avatar_id": "your_avatar_id"  # Replace with the desired avatar ID
+        }
+    }
+    response = requests.post(api_url, headers=headers, json=payload)
+    video_url = response.json().get("result_url")
     return video_url
+# Streamlit app interface
+st.title("🗣️ Voice-Enabled Live Video Chatbot")
 # Button to start recording
 if st.button("Speak"):
     user_input = speech_to_text()
     if user_input:
         st.write(f"**You:** {user_input}")
+        # Generate chatbot response using NLP model
         bot_response = chatbot(user_input)
         response_text = bot_response[0]["generated_text"]
         st.write(f"**Bot:** {response_text}")
+        # Generate avatar video with the bot's response
         video_url = generate_avatar_video(response_text)
         # Display the video response