Spaces:

girishwangikar
/

SmolAgent_News_Analysis

Running

App Files Community

girishwangikar committed on 14 days ago

Commit

d8a9363

verified ·

1 Parent(s): 45896a6

Update app.py

Browse files

Files changed (1) hide show

app.py +134 -222

app.py CHANGED Viewed

@@ -1,250 +1,162 @@
 import streamlit as st
 import pandas as pd
-from smolagents import CodeAgent, tool
-from typing import Union, List, Dict, Optional
-from duckduckgo_search import DDGS
-import requests
-from bs4 import BeautifulSoup
-from datetime import datetime
 from groq import Groq
 import os
-import re
-from dataclasses import dataclass
-@dataclass
-class SearchResult:
-    """Data class to store search results from news searches"""
-    title: str
-    link: str
-    date: str
 class GroqLLM:
     """Compatible LLM interface for smolagents CodeAgent"""
-    def __init__(self, model_name: str = "llama-3.1-8B-Instant"):
         self.client = Groq(api_key=os.environ.get("GROQ_API_KEY"))
         self.model_name = model_name
     def __call__(self, prompt: Union[str, dict, List[Dict]]) -> str:
-        """Process the prompt and return the LLM's response"""
         try:
-            prompt_str = str(prompt) if isinstance(prompt, (dict, list)) else prompt
             completion = self.client.chat.completions.create(
                 model=self.model_name,
-                messages=[{"role": "user", "content": prompt_str}],
                 temperature=0.7,
                 max_tokens=1024,
                 stream=False
             )
             return completion.choices[0].message.content if completion.choices else "Error: No response generated"
         except Exception as e:
-            return f"Error generating response: {str(e)}"
-class NewsAnalysisAgent(CodeAgent):
-    """Extended CodeAgent with news search and analysis capabilities"""
-    def __init__(self, *args, **kwargs):
-        super().__init__(*args, **kwargs)
-        self._articles = []
-        self._search_results = []
-    @property
-    def articles(self) -> List[Dict]:
-        """Access stored article data"""
-        return self._articles
-    @property
-    def search_results(self) -> List[SearchResult]:
-        """Access stored search results"""
-        return self._search_results
-    def run(self, prompt: str) -> str:
-        """Execute the agent with the given prompt"""
-        enhanced_prompt = f"""
-        You are a news analysis assistant that can:
-        - Search for recent news articles
-        - Extract and analyze article content
-        - Summarize key points
-        - Identify trends and patterns
-        Task: {prompt}
-        Use the provided tools to search and analyze news content.
-        """
-        return super().run(enhanced_prompt)
-def extract_text_from_url(url: str) -> str:
-    """Extract main text content from a given URL using BeautifulSoup.
-    Args:
-        url: The URL of the webpage to extract text from
-    Returns:
-        str: Extracted and cleaned text content from the webpage
-    """
-    try:
-        headers = {
-            'User-Agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36'
-        }
-        response = requests.get(url, headers=headers, timeout=10)
-        response.raise_for_status()
-        soup = BeautifulSoup(response.text, 'html.parser')
-        # Remove unwanted elements
-        for element in soup(['script', 'style', 'nav', 'header', 'footer']):
-            element.decompose()
-        # Extract text from paragraphs
-        paragraphs = soup.find_all('p')
-        text = ' '.join(p.get_text().strip() for p in paragraphs if p.get_text().strip())
-        return re.sub(r'\s+', ' ', text)
-    except Exception as e:
-        return f"Error extracting text: {str(e)}"
-@tool
-def search_news(query: str, max_results: Optional[int] = 5) -> str:
-    """Search for recent news articles using DuckDuckGo.
-    Args:
-        query: Search query string to find relevant news articles
-        max_results: Maximum number of results to return (default: 5)
-    Returns:
-        str: Formatted string containing search results with titles and URLs
-    """
-    try:
-        with DDGS() as ddgs:
-            search_results = list(ddgs.news(
-                query,
-                max_results=max_results or 5,
-                timeframe='d'
-            ))
-        # Store results in agent
-        tool.agent._search_results = [
-            SearchResult(title=r['title'], link=r['link'], date=r['date'])
-            for r in search_results
-        ]
-        # Format results
-        formatted_results = []
-        for idx, result in enumerate(search_results, 1):
-            formatted_results.append(
-                f"{idx}. {result['title']}\n   URL: {result['link']}\n   Date: {result['date']}\n"
-            )
-        return "\n".join(formatted_results)
-    except Exception as e:
-        return f"Error searching news: {str(e)}"
-@tool
-def analyze_article(url: str) -> str:
-    """Extract and analyze content from a news article URL.
-    Args:
-        url: URL of the news article to analyze
-    Returns:
-        str: Analysis of the article including summary, key points, and main themes
-    """
-    try:
-        content = extract_text_from_url(url)
-        analysis_prompt = f"""
-        Please analyze this article content and provide:
-        1. A brief summary (2-3 sentences)
-        2. Key points (3-5 main takeaways)
-        3. Main topics/themes discussed
-        Article content:
-        {content[:3000]}
-        """
-        analysis = tool.agent.model(analysis_prompt)
-        # Store article data
-        article_data = {
-            'url': url,
-            'content': content[:1000],
-            'analysis': analysis,
-            'date': datetime.now().strftime('%Y-%m-%d')
-        }
-        tool.agent._articles.append(article_data)
-        return analysis
-    except Exception as e:
-        return f"Error analyzing article: {str(e)}"
-@tool
-def identify_trends(articles: Optional[List[Dict]] = None) -> str:
-    """Identify common themes and trends across analyzed articles.
-    Args:
-        articles: Optional list of analyzed article data. If None, uses stored articles.
-    Returns:
-        str: Analysis of trends and patterns found across the articles
-    """
-    articles = articles or tool.agent._articles
-    if not articles:
-        return "No articles available for trend analysis"
-    combined_analyses = "\n".join(article['analysis'] for article in articles)
-    trend_prompt = f"""
-    Based on the analyses of {len(articles)} articles, please identify:
-    1. Common themes or topics across articles
-    2. Any notable patterns or trends
-    3. Different perspectives or viewpoints presented
-    Combined analyses:
-    {combined_analyses}
-    """
-    return tool.agent.model(trend_prompt)
-def main():
-    st.title("News Analysis Assistant")
-    st.write("Search and analyze recent news articles with natural language interaction.")
-    # Initialize session state
-    if 'agent' not in st.session_state:
-        st.session_state['agent'] = NewsAnalysisAgent(
-            tools=[search_news, analyze_article, identify_trends],
-            model=GroqLLM(),
-            additional_authorized_imports=[
-                "requests", "bs4", "duckduckgo_search", "pandas"
-            ]
         )
-    # News search interface
-    search_query = st.text_input("Enter news search query:")
-    if search_query:
-        with st.spinner('Searching news...'):
-            search_results = st.session_state['agent'].run(
-                f"Use the search_news tool to find recent articles about: {search_query}"
-            )
-            st.write(search_results)
-    # Article analysis interface
-    st.subheader("Article Analysis")
-    article_url = st.text_input("Enter article URL to analyze:")
-    if article_url:
-        with st.spinner('Analyzing article...'):
-            analysis = st.session_state['agent'].run(
-                f"Use the analyze_article tool to analyze this article: {article_url}"
-            )
-            st.write(analysis)
-    # Trend analysis interface
-    if st.button("Analyze Trends"):
-        with st.spinner('Identifying trends...'):
-            trends = st.session_state['agent'].run(
-                "Use the identify_trends tool to analyze patterns across all articles"
-            )
-            st.write(trends)
-if __name__ == "__main__":
-    main()

 import streamlit as st
 import pandas as pd
+from smolagents import CodeAgent, DuckDuckGoSearchTool
+from typing import Union, List, Dict
 from groq import Groq
 import os
 class GroqLLM:
     """Compatible LLM interface for smolagents CodeAgent"""
+    def __init__(self, model_name="llama-3.1-8B-Instant"):
         self.client = Groq(api_key=os.environ.get("GROQ_API_KEY"))
         self.model_name = model_name
     def __call__(self, prompt: Union[str, dict, List[Dict]]) -> str:
         try:
+            # Handle different prompt formats
+            if isinstance(prompt, (dict, list)):
+                prompt_str = str(prompt)
+            else:
+                prompt_str = str(prompt)
+            # Create a properly formatted message
             completion = self.client.chat.completions.create(
                 model=self.model_name,
+                messages=[{
+                    "role": "user",
+                    "content": prompt_str
+                }],
                 temperature=0.7,
                 max_tokens=1024,
                 stream=False
             )
             return completion.choices[0].message.content if completion.choices else "Error: No response generated"
         except Exception as e:
+            error_msg = f"Error generating response: {str(e)}"
+            print(error_msg)
+            return error_msg
+def create_analysis_prompt(topic: str, search_results: str) -> str:
+    """Creates a structured prompt for news analysis"""
+    return f"""Analyze the following news information about {topic}.
+    Search Results: {search_results}
+    Please provide:
+    1. Summary of key points
+    2. Main stakeholders involved
+    3. Potential implications
+    4. Analysis of different perspectives
+    5. Fact-check of major claims (if applicable)
+    Format the analysis in a clear, journalistic style."""
+def log_agent_activity(prompt: str, result: str, agent_name: str):
+    """Logs agent activities in the Streamlit interface"""
+    with st.expander("View Agent Activity Log"):
+        st.write(f"### Agent Activity ({agent_name}):")
+        st.write("**Input Prompt:**")
+        st.code(prompt, language="text")
+        st.write("**Analysis Output:**")
+        st.code(result, language="text")
+# Initialize Streamlit app
+st.set_page_config(page_title="News Analysis Tool", layout="wide")
+# Title and description
+st.title("🔍 AI News Analysis Tool")
+st.write("""
+This tool uses advanced AI to analyze news topics, providing comprehensive insights
+and analysis using real-time data from the web. Powered by Groq's LLama 3.1 8B
+Instant model and DuckDuckGo search.
+""")
+# Initialize the agents
+try:
+    # Initialize LLM and tools
+    llm = GroqLLM()
+    search_tool = DuckDuckGoSearchTool()
+    # Create the analysis agent
+    news_agent = CodeAgent(
+        tools=[search_tool],
+        model=llm
+    )
+    # Input section
+    news_topic = st.text_input(
+        "Enter News Topic or Query:",
+        placeholder="E.g., Recent developments in renewable energy"
+    )
+    # Analysis options
+    col1, col2 = st.columns(2)
+    with col1:
+        search_depth = st.slider(
+            "Search Depth (number of results)",
+            min_value=3,
+            max_value=10,
+            value=5
+        )
+    with col2:
+        analysis_type = st.selectbox(
+            "Analysis Type",
+            ["Comprehensive", "Quick Summary", "Technical", "Simplified"]
         )
+    # Generate analysis button
+    if st.button("Analyze News"):
+        if news_topic:
+            with st.spinner("Gathering information and analyzing..."):
+                try:
+                    # First, get search results
+                    search_results = search_tool.run(
+                        f"Latest news about {news_topic} last 7 days"
+                    )
+                    # Create analysis prompt
+                    analysis_prompt = create_analysis_prompt(news_topic, search_results)
+                    # Get analysis from the agent
+                    analysis_result = news_agent.run(analysis_prompt)
+                    # Display results
+                    st.subheader("📊 Analysis Results")
+                    st.markdown(analysis_result)
+                    # Log the activity
+                    log_agent_activity(
+                        analysis_prompt,
+                        analysis_result,
+                        "News Analysis Agent"
+                    )
+                except Exception as e:
+                    st.error(f"An error occurred during analysis: {str(e)}")
+        else:
+            st.warning("Please enter a news topic to analyze.")
+    # Add helpful tips
+    with st.expander("💡 Tips for Better Results"):
+        st.write("""
+        - Be specific with your topic for more focused analysis
+        - Use keywords related to recent events for timely information
+        - Consider including timeframes in your query
+        - Try different analysis types for various perspectives
+        """)
+except Exception as e:
+    st.error(f"""
+    Failed to initialize the application: {str(e)}
+    Please ensure:
+    1. Your GROQ_API_KEY is properly set in environment variables
+    2. All required packages are installed
+    3. You have internet connectivity for DuckDuckGo searches
+    """)
+# Footer
+st.markdown("---")
+st.caption(
+    "Powered by Groq LLama 3.1 8B Instant, DuckDuckGo, and Streamlit | "
+    "Created for news analysis and research purposes"
+)