Spaces:

Mubin1917
/

Chat_With_Youtube_Videos

Sleeping

App Files Files Community

Mubin1917 committed on Jul 16, 2024

Commit

857dbaf

1 Parent(s): 17e8e9f

Update_1

Browse files

Files changed (3) hide show

app.py +97 -59
requirements.txt +12 -1
youtube_FC_14.py +443 -0

app.py CHANGED Viewed

@@ -1,63 +1,101 @@
 import gradio as gr
-from huggingface_hub import InferenceClient
-"""
-For more information on `huggingface_hub` Inference API support, please check the docs: https://huggingface.co/docs/huggingface_hub/v0.22.2/en/guides/inference
-"""
-client = InferenceClient("HuggingFaceH4/zephyr-7b-beta")
-def respond(
-    message,
-    history: list[tuple[str, str]],
-    system_message,
-    max_tokens,
-    temperature,
-    top_p,
-):
-    messages = [{"role": "system", "content": system_message}]
-    for val in history:
-        if val[0]:
-            messages.append({"role": "user", "content": val[0]})
-        if val[1]:
-            messages.append({"role": "assistant", "content": val[1]})
-    messages.append({"role": "user", "content": message})
-    response = ""
-    for message in client.chat_completion(
-        messages,
-        max_tokens=max_tokens,
-        stream=True,
-        temperature=temperature,
-        top_p=top_p,
-    ):
-        token = message.choices[0].delta.content
-        response += token
-        yield response
-"""
-For information on how to customize the ChatInterface, peruse the gradio docs: https://www.gradio.app/docs/chatinterface
-"""
-demo = gr.ChatInterface(
-    respond,
-    additional_inputs=[
-        gr.Textbox(value="You are a friendly Chatbot.", label="System message"),
-        gr.Slider(minimum=1, maximum=2048, value=512, step=1, label="Max new tokens"),
-        gr.Slider(minimum=0.1, maximum=4.0, value=0.7, step=0.1, label="Temperature"),
-        gr.Slider(
-            minimum=0.1,
-            maximum=1.0,
-            value=0.95,
-            step=0.05,
-            label="Top-p (nucleus sampling)",
-        ),
-    ],
-)
 if __name__ == "__main__":
-    demo.launch()

+import os
+import openai
 import gradio as gr
+from youtube_transcript_api import YouTubeTranscriptApi
+from langchain_openai import ChatOpenAI
+from langchain.agents import AgentExecutor
+from langchain.memory import ConversationBufferWindowMemory
+from youtube_FC_14 import YouTubeTranscriptTool, MainPointsExtractor, SummaryExtractor, YouTubeAgent
+import logging
+logging.getLogger().setLevel(logging.ERROR)
+import warnings
+warnings.filterwarnings("ignore")
+class ChatBot:
+    def __init__(self):
+        self.youtube_agent = None
+        self.api_key = None
+    def initialize_agent(self, api_key):
+        if api_key:
+            os.environ['OPENAI_API_KEY'] = api_key
+            openai.api_key = api_key
+            self.api_key = api_key
+            self.youtube_agent = YouTubeAgent()
+            return "API key set successfully. Agent initialized."
+        else:
+            return "Please provide a valid API key."
+    def chat(self, message, history):
+        if not self.youtube_agent:
+            return "Please set your OpenAI API key first."
+        try:
+            response = self.youtube_agent.invoke(message)
+            return response
+        except Exception as e:
+            return f"An error occurred: {str(e)}"
+chatbot = ChatBot()  # Create an instance of ChatBot
+def set_api_key(api_key):
+    return chatbot.initialize_agent(api_key)
+def user_message(message, history):
+    return "", history + [[message, None]]
+def bot_message(history):
+    user_message = history[-1][0]
+    bot_response = chatbot.chat(user_message, history)
+    history[-1][1] = bot_response
+    return history
+def use_example(example, text_input):
+    return example
+# Example messages
+example_messages = [
+    "What tools are available for use?",
+    "What is the following video about? https://www.youtube.com/watch?v=dZxbVGhpEkI",
+    "Can you summarize this video? https://www.youtube.com/watch?v=hM8unyUM6KA",
+    "Extract the main points from this video: https://www.youtube.com/watch?v=UF8uR6Z6KLc"
+]
+with gr.Blocks() as demo:
+    gr.Markdown("# YouTube Video Analysis Chatbot")
+    with gr.Row():
+        api_key_input = gr.Textbox(type="password", label="Enter your OpenAI API key")
+        api_key_button = gr.Button("Set API Key")
+    api_key_status = gr.Textbox(label="API Key Status", interactive=False)
+    chatbot_interface = gr.Chatbot()
+    msg = gr.Textbox(label="Message")
+    with gr.Row():
+        submit_btn = gr.Button("Submit")
+        clear_btn = gr.Button("Clear")
+    gr.Markdown("## Example Messages")
+    example_btns = [gr.Button(i) for i in example_messages]
+    api_key_button.click(set_api_key, inputs=api_key_input, outputs=api_key_status)
+    submit_btn.click(user_message, [msg, chatbot_interface], [msg, chatbot_interface], queue=False).then(
+        bot_message, chatbot_interface, chatbot_interface
+    )
+    msg.submit(user_message, [msg, chatbot_interface], [msg, chatbot_interface], queue=False).then(
+        bot_message, chatbot_interface, chatbot_interface
+    )
+    clear_btn.click(lambda: None, None, chatbot_interface, queue=False)
+    for btn, example in zip(example_btns, example_messages):
+        btn.click(use_example, inputs=[gr.Textbox(value=example, visible=False)], outputs=msg)
 if __name__ == "__main__":
+    demo.launch()

requirements.txt CHANGED Viewed

	@@ -1 +1,12 @@
1	- huggingface_hub==0.22.2

+huggingface_hub==0.22.2
+youtube-transcript-api==0.6.2
+gradio==4.38.1
+tiktoken==0.7.0
+pytube==15.0.0
+langchain==0.2.8
+langchain-community==0.2.7
+langchain-core==0.2.19
+langchain-openai==0.1.16
+langchain-text-splitters==0.2.2
+pyperclip==1.9.0
+openai==1.35.13

youtube_FC_14.py ADDED Viewed

	@@ -0,0 +1,443 @@

+"""
+YouTube Video Analysis Module
+This module provides tools for analyzing YouTube videos, including transcript extraction
+and main points summarization. It uses the LangChain library for natural language
+processing tasks and the YouTube Transcript API for fetching video transcripts.
+Classes:
+    YouTubeTranscriptTool: Handles fetching and processing of YouTube video transcripts.
+    MainPointsExtractor: Extracts and formats main points from YouTube video transcripts.
+    YouTubeAgent: Manages the overall agent setup for interacting with YouTube videos.
+    SummaryExtractor: Extracts summaries from YouTube video transcripts.
+Usage:
+    youtube_agent = YouTubeAgent()
+    video_link = "https://www.youtube.com/watch?v=VIDEO_ID"
+    response = youtube_agent.invoke(f"Can you summarize this video? {video_link}")
+"""
+import os
+import openai
+from typing import List, Dict, Any
+from youtube_transcript_api import YouTubeTranscriptApi
+from langchain_core.pydantic_v1 import BaseModel, Field
+from langchain.prompts import ChatPromptTemplate, MessagesPlaceholder
+from langchain_openai import ChatOpenAI
+from langchain.schema.runnable import RunnableLambda, RunnablePassthrough
+from langchain.agents import tool, AgentExecutor
+from langchain.output_parsers.openai_functions import JsonKeyOutputFunctionsParser
+from langchain.text_splitter import RecursiveCharacterTextSplitter
+from langchain_core.utils.function_calling import convert_to_openai_function
+from langchain.agents.output_parsers import OpenAIFunctionsAgentOutputParser
+from langchain.agents.format_scratchpad import format_to_openai_functions
+from langchain.memory import ConversationBufferWindowMemory
+from functools import wraps
+import functools
+import logging
+import traceback
+# Set up logging with more detailed format
+logging.basicConfig(level=logging.INFO,
+                    format='%(asctime)s - %(levelname)s - %(name)s - %(filename)s:%(lineno)d - %(message)s')
+logger = logging.getLogger(__name__)
+# Define a decorator for error logging
+def log_errors(func):
+    @wraps(func)
+    def wrapper(*args, **kwargs):
+        try:
+            return func(*args, **kwargs)
+        except Exception as e:
+            logger.error(f"Error in {func.__name__}: {str(e)}")
+            logger.error(f"Traceback: {traceback.format_exc()}")
+            raise
+    return wrapper
+class YouTubeTranscriptTool:
+    """
+    A tool for fetching and processing YouTube video transcripts.
+    This class provides methods to retrieve transcripts with or without timestamps,
+    and to split transcripts into manageable chunks.
+    """
+    @staticmethod
+    @tool(return_direct=True)
+    def get_transcript_with_timestamps(youtube_video_id: str, chunk_number: int = 0) -> str:
+        """
+        Retrieves a YouTube video transcript with timestamps.
+        Args:
+            youtube_video_id (str): The ID of the YouTube video.
+            chunk_number (int): The index of the transcript chunk to retrieve.
+        Returns:
+            str: The requested transcript chunk with timestamps.
+        """
+        return YouTubeTranscriptTool._get_transcript(youtube_video_id, chunk_number, include_timestamps=True)
+    @staticmethod
+    @tool(return_direct=True)
+    def get_transcript_without_timestamps(youtube_video_id: str, chunk_number: int = 0) -> str:
+        """
+        Retrieves a YouTube video transcript without timestamps.
+        Args:
+            youtube_video_id (str): The ID of the YouTube video.
+            chunk_number (int): The index of the transcript chunk to retrieve.
+        Returns:
+            str: The requested transcript chunk without timestamps.
+        """
+        return YouTubeTranscriptTool._get_transcript(youtube_video_id, chunk_number, include_timestamps=False)
+    @staticmethod
+    @log_errors
+    def _get_transcript(youtube_video_id: str, chunk_number: int, include_timestamps: bool) -> str:
+        """
+        Internal method to fetch and process the transcript.
+        Args:
+            youtube_video_id (str): The ID of the YouTube video.
+            chunk_number (int): The index of the transcript chunk to retrieve.
+            include_timestamps (bool): Whether to include timestamps in the transcript.
+        Returns:
+            str: The processed transcript chunk.
+        Raises:
+            ValueError: If the requested chunk number is out of range.
+        """
+        try:
+            transcript_json = YouTubeTranscriptApi.get_transcript(youtube_video_id)
+            text_splitter = RecursiveCharacterTextSplitter(
+                chunk_size=8192,
+                chunk_overlap=0,
+                separators=[f" {char}" for char in "ABCDEFGHIJKLMNOPQRSTUVWXYZ"]
+            )
+            if include_timestamps:
+                transcript_data = [f"{entry['start']:.2f}: {entry['text']} " for entry in transcript_json]
+            else:
+                transcript_data = [entry['text'] for entry in transcript_json]
+            transcript_text = " ".join(transcript_data)
+            transcript_splits = text_splitter.split_text(transcript_text)
+            if chunk_number >= len(transcript_splits):
+                raise ValueError(f"Chunk number {chunk_number} is out of range. Total chunks: {len(transcript_splits)}")
+            chunked_text = transcript_splits[chunk_number]
+            return YouTubeTranscriptTool._format_response(transcript_splits, chunk_number, chunked_text)
+        except Exception as e:
+            logger.error(f"Error in _get_transcript: {str(e)}")
+            return f"Error fetching transcript: {str(e)}"
+    @staticmethod
+    def _format_response(transcript_splits: List[str], chunk_number: int, chunked_text: str) -> str:
+        """
+        Formats the transcript chunk response.
+        Args:
+            transcript_splits (List[str]): All transcript chunks.
+            chunk_number (int): The index of the current chunk.
+            chunked_text (str): The text of the current chunk.
+        Returns:
+            str: Formatted response string.
+        """
+        if len(transcript_splits) == 1:
+            return f"Note: Complete subtitles returned.\n\nSubtitles:{chunked_text}"
+        elif chunk_number == len(transcript_splits) - 1:
+            return f"Note: Last chunk of subtitles returned.\n\nSubtitles:{chunked_text}"
+        else:
+            return f"Note: Partial subtitles returned. To get the next chunk, use chunk_number = {chunk_number + 1}.\n\nSubtitles:{chunked_text}"
+class Points(BaseModel):
+    """Pydantic model for representing extracted points."""
+    point: str = Field(description="The main topic, theme, or subject extracted from the subtitle.")
+    context: str = Field(description="The context or brief explanation of the main point.")
+    emoji: str = Field(description="An emoji that represents or summarizes the main point.")
+    timestamp: float = Field(description="The timestamp (in floating-point number) from the video where the main point is mentioned.")
+class MainPointsExtractor:
+    """
+    A tool for extracting and formatting main points from YouTube video transcripts.
+    This class provides methods to process transcripts and identify key points
+    using natural language processing techniques.
+    """
+    class Info(BaseModel):
+        """Pydantic model for representing a collection of points."""
+        points: List[Points]
+    @staticmethod
+    @tool(return_direct=True)
+    @log_errors
+    def get_youtube_video_main_points(youtube_video_id: str) -> str:
+        """
+        Extracts and formats main points from a YouTube video transcript.
+        Args:
+            youtube_video_id (str): The ID of the YouTube video.
+        Returns:
+            str: Formatted string of main points extracted from the video.
+        """
+        try:
+            transcript = MainPointsExtractor._get_youtube_video_transcript(youtube_video_id)
+            main_points = MainPointsExtractor._extract_main_points(transcript)
+            return MainPointsExtractor._format_youtube_comment(main_points)
+        except Exception as e:
+            logger.error(f"Error in get_youtube_video_main_points: {str(e)}")
+            return f"Error extracting main points: {str(e)}"
+    @staticmethod
+    @log_errors
+    def _get_youtube_video_transcript(youtube_video_id: str) -> str:
+        """
+        Fetches the transcript for a YouTube video.
+        Args:
+            youtube_video_id (str): The ID of the YouTube video.
+        Returns:
+            str: The full transcript of the video.
+        Raises:
+            Exception: If there's an error fetching the transcript.
+        """
+        try:
+            transcript_json = YouTubeTranscriptApi.get_transcript(youtube_video_id)
+            transcript_data = [f"{entry['start']:.2f}: {entry['text']} " for entry in transcript_json]
+            return "".join(transcript_data)
+        except Exception as e:
+            logger.error(f"Error fetching transcript: {str(e)}")
+            raise
+    @staticmethod
+    @functools.lru_cache(maxsize=16)
+    def _extract_main_points(transcript: str) -> List[Dict[str, Any]]:
+        """
+        Extracts main points from the transcript using NLP techniques.
+        This method is cached to improve performance for repeated calls.
+        Args:
+            transcript (str): The full transcript of the video.
+        Returns:
+            List[Dict[str, Any]]: A list of dictionaries containing extracted main points.
+        """
+        main_points_extraction_function = [convert_to_openai_function(MainPointsExtractor.Info)]
+        model = ChatOpenAI(temperature=0)
+        extraction_model = model.bind(functions=main_points_extraction_function, function_call={"name": "Info"})
+        prompt = ChatPromptTemplate.from_messages([("human", "{input}")])
+        extraction_chain = prompt | extraction_model | JsonKeyOutputFunctionsParser(key_name="points")
+        text_splitter = RecursiveCharacterTextSplitter(chunk_overlap=0, chunk_size=8192, separators=[f" {char}" for char in "123456789"])
+        prep = RunnableLambda(lambda x: [{"input": doc} for doc in text_splitter.split_text(x)])
+        chain = prep | extraction_chain.map() | MainPointsExtractor._flatten
+        return chain.invoke(transcript)
+    @staticmethod
+    @log_errors
+    def _flatten(matrix):
+        """Flattens a 2D list into a 1D list."""
+        return [item for row in matrix for item in row]
+    @staticmethod
+    @log_errors
+    def _format_youtube_comment(json_data: List[Dict[str, Any]]) -> str:
+        """
+        Formats extracted main points into a YouTube-style comment.
+        Args:
+            json_data (List[Dict[str, Any]]): List of dictionaries containing main points.
+        Returns:
+            str: Formatted string representing the main points as a YouTube comment.
+        """
+        def _format_timestamp(seconds):
+            hours = int(seconds // 3600)
+            minutes = int((seconds % 3600) // 60)
+            seconds = int(seconds % 60)
+            return f"{hours:02}:{minutes:02}:{seconds:02}"
+        formatted_comment = ""
+        for entry in json_data:
+            timestamp = _format_timestamp(entry['timestamp'])
+            emoji = entry['emoji']
+            point = entry['point']
+            context = entry['context']
+            formatted_comment += f"{timestamp} {emoji} {point}: {context}\n"
+        return formatted_comment.strip()
+class Summary(BaseModel):
+    """Pydantic model for representing extracted summary."""
+    summary: str = Field(description="Extract detailed information from the content.")
+class SummaryExtractor:
+    """
+    A tool for extracting and formatting summaries from YouTube video transcripts.
+    This class provides methods to process transcripts and generate concise summaries
+    using natural language processing techniques.
+    """
+    class Info(BaseModel):
+        """Pydantic model for representing a collection of summaries."""
+        summary: List[Summary]
+    @staticmethod
+    @tool(return_direct=False)
+    @log_errors
+    def get_youtube_video_summary(youtube_video_id: str) -> str:
+        """
+        Extracts and formats a summary from a YouTube video transcript.
+        Args:
+            youtube_video_id (str): The ID of the YouTube video.
+        Returns:
+            str: Formatted string of the summary extracted from the video.
+        """
+        try:
+            transcript = SummaryExtractor._get_youtube_video_transcript(youtube_video_id)
+            summary = SummaryExtractor._extract_summary(transcript)
+            return SummaryExtractor._format_summary(summary)
+        except Exception as e:
+            logger.error(f"Error in get_youtube_video_summary: {str(e)}")
+            return f"Error extracting summary: {str(e)}"
+    @staticmethod
+    @log_errors
+    def _get_youtube_video_transcript(youtube_video_id: str) -> str:
+        """
+        Fetches the transcript for a YouTube video.
+        Args:
+            youtube_video_id (str): The ID of the YouTube video.
+        Returns:
+            str: The full transcript of the video.
+        Raises:
+            Exception: If there's an error fetching the transcript.
+        """
+        try:
+            transcript_json = YouTubeTranscriptApi.get_transcript(youtube_video_id)
+            transcript_data = [entry['text'] for entry in transcript_json]
+            return " ".join(transcript_data)
+        except Exception as e:
+            logger.error(f"Error fetching transcript: {str(e)}")
+            raise
+    @staticmethod
+    @functools.lru_cache(maxsize=16)
+    def _extract_summary(transcript: str) -> List[Summary]:
+        """
+        Extracts a summary from a YouTube video transcript.
+        Args:
+            transcript (str): The full transcript of the video.
+        Returns:
+            Summary: A Summary object containing the extracted summary.
+        """
+        summary_extraction_function = [convert_to_openai_function(SummaryExtractor.Info)]
+        model = ChatOpenAI(temperature=0)
+        extraction_model = model.bind(functions=summary_extraction_function, function_call={"name": "Info"})
+        prompt = ChatPromptTemplate.from_messages([("human", "{input}")])
+        extraction_chain = prompt | extraction_model | JsonKeyOutputFunctionsParser(key_name="summary")
+        text_splitter = RecursiveCharacterTextSplitter(chunk_overlap=0, chunk_size=8192, separators=[f" {char}" for char in "ABCDEFGHIJKLMNOPQRSTUVWXYZ"])
+        prep = RunnableLambda(lambda x: [{"input": doc} for doc in text_splitter.split_text(x)])
+        chain = prep | extraction_chain.map() | MainPointsExtractor._flatten
+        return chain.invoke(transcript)
+    @staticmethod
+    def _format_summary(summaries: List[Summary]) -> str:
+        """
+        Formats the list of summaries into a single string.
+        Args:
+            summaries (List[Summary]): List of Summary objects.
+        Returns:
+            str: A formatted string containing all summaries.
+        """
+        return "\n\n".join([s["summary"] for s in summaries])
+class YouTubeAgent:
+    """
+    An agent for interacting with YouTube videos and processing user queries.
+    This class sets up the necessary components for an AI agent that can understand
+    and respond to user queries about YouTube videos.
+    """
+    def __init__(self):
+        """Initializes the YouTubeAgent with necessary tools and components."""
+        self.tools = [
+            YouTubeTranscriptTool.get_transcript_with_timestamps,
+            YouTubeTranscriptTool.get_transcript_without_timestamps,
+            MainPointsExtractor.get_youtube_video_main_points,
+            SummaryExtractor.get_youtube_video_summary
+        ]
+        self.sys_message = "You are a helpful assistant."
+        self.functions = [convert_to_openai_function(f) for f in self.tools]
+        self.model = ChatOpenAI(temperature=0).bind(functions=self.functions)
+        self.prompt = ChatPromptTemplate.from_messages([
+            ("system", self.sys_message),
+            MessagesPlaceholder(variable_name="history"),
+            ("user", "{input}"),
+            MessagesPlaceholder(variable_name="agent_scratchpad")
+        ])
+        self.agent_chain = RunnablePassthrough.assign(
+            agent_scratchpad= lambda x: format_to_openai_functions(x["intermediate_steps"])
+        ) | self.prompt | self.model | OpenAIFunctionsAgentOutputParser()
+        self.memory = ConversationBufferWindowMemory(k=3, return_messages=True, memory_key="history")
+        self.agent_executor = AgentExecutor(agent=self.agent_chain, tools=self.tools, memory=self.memory)
+    @log_errors
+    def invoke(self, input_text: str) -> str:
+        """
+        Processes a user input and returns the agent's response.
+        Args:
+            input_text (str): The user's input query.
+        Returns:
+            str: The agent's response to the user's query.
+        """
+        try:
+            result = self.agent_executor.invoke({"input": input_text})
+            return result['output']
+        except Exception as e:
+            logger.error(f"Error in YouTubeAgent.invoke: {str(e)}")
+            return f"An error occurred: {str(e)}"
+# # Usage example
+# if __name__ == "__main__":
+#     youtube_agent = YouTubeAgent()
+#     video_link = "https://www.youtube.com/watch?v=dZxbVGhpEkI"
+#     try:
+#         main_points = youtube_agent.invoke(f"Can you get summary of the following video {video_link}")
+#     except Exception as e:
+#         logger.error(f"An error occurred during processing: {str(e)}")
+#         print(f"An error occurred: {str(e)}")