Spaces:

proKBD
/

news-summarization

Sleeping

App Files Files Community

proKBD committed on Mar 23

Commit

71f0750

verified ·

1 Parent(s): ada2f0f

Update api.py

Browse files

Files changed (1) hide show

api.py +182 -72

api.py CHANGED Viewed

@@ -1,72 +1,182 @@
-"""FastAPI backend for the News Summarization application."""
-from fastapi import FastAPI, HTTPException
-from fastapi.staticfiles import StaticFiles
-from pydantic import BaseModel
-from typing import List, Dict, Any
-import uvicorn
-from utils import NewsExtractor, SentimentAnalyzer, TextToSpeechConverter, ComparativeAnalyzer
-import os
-from config import API_PORT, AUDIO_OUTPUT_DIR
-import time
-app = FastAPI(title="News Summarization API")
-# Mount static directory for audio files
-os.makedirs(AUDIO_OUTPUT_DIR, exist_ok=True)
-app.mount("/audio", StaticFiles(directory=AUDIO_OUTPUT_DIR), name="audio")
-# Initialize components
-news_extractor = NewsExtractor()
-sentiment_analyzer = SentimentAnalyzer()
-tts_converter = TextToSpeechConverter()
-comparative_analyzer = ComparativeAnalyzer()
-class CompanyRequest(BaseModel):
-    name: str
-class AnalysisResponse(BaseModel):
-    company: str
-    articles: List[Dict[str, Any]]
-    comparative_sentiment_score: Dict[str, Any]
-    final_sentiment_analysis: str
-    audio_url: str = None
-@app.post("/api/analyze", response_model=AnalysisResponse)
-async def analyze_company(request: CompanyRequest):
-    """Analyze news articles for a given company.
-
-    Searches for articles about ``request.name``, runs the sentiment analyzer
-    on each one, builds the comparative report and generates an audio file
-    from the final sentiment text.
-
-    Returns:
-        A dict with the company name, the analyzed articles, the comparison
-        result, the final sentiment text and the URL of the generated audio.
-
-    Raises:
-        HTTPException: 404 when the search yields no articles; 500 for any
-            other failure, with the original error text as the detail.
-    """
-    try:
-        # Extract news articles
-        articles = news_extractor.search_news(request.name)
-        if not articles:
-            raise HTTPException(status_code=404, detail="No articles found for the company")
-        # Analyze each article
-        analyzed_articles = []
-        for article in articles:
-            analysis = sentiment_analyzer.analyze_article(article)
-            # Add company name to each article
-            analysis['company'] = request.name
-            analyzed_articles.append(analysis)
-        # Perform comparative analysis
-        comparison = comparative_analyzer.analyze_coverage(analyzed_articles, company_name=request.name)
-        final_analysis = comparison["final_sentiment"]
-        # Generate Hindi audio for final analysis
-        audio_filename = f"{request.name.lower().replace(' ', '_')}_{int(time.time())}"
-        audio_path = tts_converter.generate_audio(final_analysis, audio_filename)
-        audio_url = f"/audio/{os.path.basename(audio_path)}"
-        return {
-            "company": request.name,
-            "articles": analyzed_articles,
-            "comparative_sentiment_score": comparison,
-            "final_sentiment_analysis": final_analysis,
-            "audio_url": audio_url
-        }
-    except HTTPException:
-        # Deliberate HTTP errors (such as the 404 above) must reach the client
-        # unchanged instead of being rewrapped as a 500 by the handler below.
-        raise
-    except Exception as e:
-        raise HTTPException(status_code=500, detail=str(e)) from e
-if __name__ == "__main__":
-    uvicorn.run(app, host="0.0.0.0", port=API_PORT)

+"""Streamlit frontend for the News Summarization application."""
+import streamlit as st
+import pandas as pd
+import json
+import os
+import plotly.express as px
+import altair as alt
+from utils import analyze_company_data  # Import the analysis function directly
+# Page-level settings: browser tab title, icon and wide layout
+st.set_page_config(page_title="News Summarization App", page_icon="📰", layout="wide")
+# Keep a spinner on screen while the helper classes are imported
+with st.spinner("Initializing the application... Please wait while we load the models."):
+    try:
+        # Importing here lets an import failure be reported in the UI
+        from utils import NewsExtractor, SentimentAnalyzer, TextSummarizer, TextToSpeechConverter
+        st.success("Application initialized successfully!")
+    except Exception as init_error:
+        st.error(f"Error initializing application: {init_error!s}")
+        st.info("Please try refreshing the page.")
+def process_company(company_name):
+    """Analyze a company and attach a spoken summary when one is available.
+
+    Args:
+        company_name: Company name forwarded to ``analyze_company_data`` and
+            used to build the audio file name.
+
+    Returns:
+        The analysis result. When it contains a ``'summary'`` entry, an MP3 of
+        that summary is written under ``audio_output`` and its path is stored
+        under ``'audio_path'``. If anything fails, the error is shown in the
+        UI and an empty placeholder result is returned instead.
+    """
+    try:
+        # Call the analysis function directly from utils
+        data = analyze_company_data(company_name)
+        # Generate audio only when there is a summary to read out
+        if 'summary' in data:
+            from gtts import gTTS
+            tts = gTTS(text=data['summary'], lang='en')
+            # NOTE(review): company_name goes into the file name unsanitized;
+            # a name containing a path separator would point outside this
+            # directory -- confirm whether callers can pass such input.
+            audio_path = os.path.join('audio_output', f'{company_name}_summary.mp3')
+            os.makedirs('audio_output', exist_ok=True)
+            tts.save(audio_path)
+            data['audio_path'] = audio_path
+        # Return the analysis whether or not audio was generated; returning
+        # only inside the branch above made the function yield None otherwise.
+        return data
+    except Exception as e:
+        st.error(f"Error processing company: {str(e)}")
+        return {"articles": [], "comparative_sentiment_score": {}, "final_sentiment_analysis": "", "audio_path": None}
+def _render_fine_grained_tab(articles, key, heading, column, unavailable_message):
+    """Show one fine-grained sentiment table, or a notice when no article has ``key``."""
+    st.write(heading)
+    rows = [
+        {"Article": article["title"], column: article[key]}
+        for article in articles
+        if key in article
+    ]
+    if rows:
+        st.dataframe(pd.DataFrame(rows))
+    else:
+        st.info(unavailable_message)
+def main():
+    """Render the page: company input, sentiment chart, fine-grained tabs and article list.
+
+    Nothing is analyzed until the "Analyze" button is pressed. Any exception
+    raised while analyzing or rendering is shown in the UI and printed.
+    """
+    st.title("News Summarization App")
+    st.write("Analyze news articles and get sentiment analysis for any company.")
+    # User input
+    company_name = st.text_input("Enter company name:", "Tesla")
+    if st.button("Analyze"):
+        with st.spinner("Analyzing news articles..."):
+            try:
+                # Process company data
+                # NOTE(review): this calls analyze_company_data directly, so
+                # process_company (and its audio generation) is never used
+                # from this page -- confirm that is intended.
+                data = analyze_company_data(company_name)
+                if not data["articles"]:
+                    st.error("No articles found for analysis.")
+                    return
+                # Display overall sentiment
+                st.subheader("Overall Sentiment Analysis")
+                st.write(data["final_sentiment_analysis"])
+                # Create DataFrame for sentiment scores
+                sentiment_df = pd.DataFrame(data["comparative_sentiment_score"])
+                # Display sentiment distribution by source
+                st.subheader("Sentiment Distribution by Source")
+                # Convert sentiment labels to numeric values for visualization
+                sentiment_map = {'positive': 1, 'neutral': 0, 'negative': -1}
+                numeric_df = sentiment_df.replace(sentiment_map)
+                # Calculate sentiment distribution (one dict of shares per column)
+                sentiment_dist = numeric_df.apply(lambda x: x.value_counts(normalize=True).to_dict())
+                # Flatten the per-column shares into one row per (source, sentiment)
+                viz_data = []
+                for source in sentiment_df.columns:
+                    dist = sentiment_dist[source]
+                    for sentiment, percentage in dist.items():
+                        viz_data.append({
+                            'Source': source,
+                            'Sentiment': sentiment,
+                            'Percentage': percentage * 100
+                        })
+                viz_df = pd.DataFrame(viz_data)
+                # Create stacked bar chart
+                fig = px.bar(viz_df,
+                           x='Source',
+                           y='Percentage',
+                           color='Sentiment',
+                           title='Sentiment Distribution by Source',
+                           barmode='stack')
+                fig.update_layout(
+                    yaxis_title='Percentage',
+                    xaxis_title='News Source',
+                    legend_title='Sentiment'
+                )
+                st.plotly_chart(fig)
+                # Display fine-grained sentiment analysis
+                st.subheader("Fine-grained Sentiment Analysis")
+                # One entry per fine-grained analysis:
+                # (article key, tab title, tab heading, column label, fallback notice)
+                fine_grained = (
+                    ("financial_sentiment", "Financial Sentiment",
+                     "Financial Market Impact Analysis", "Financial Impact",
+                     "Financial sentiment analysis not available for these articles."),
+                    ("emotional_sentiment", "Emotional Sentiment",
+                     "Emotional Sentiment Analysis", "Emotional Impact",
+                     "Emotional sentiment analysis not available for these articles."),
+                    ("esg_sentiment", "ESG Sentiment",
+                     "ESG (Environmental, Social, Governance) Analysis", "ESG Impact",
+                     "ESG sentiment analysis not available for these articles."),
+                )
+                # Create tabs for different fine-grained analyses
+                tabs = st.tabs([title for _, title, _, _, _ in fine_grained])
+                for tab, (key, _, heading, column, unavailable) in zip(tabs, fine_grained):
+                    with tab:
+                        _render_fine_grained_tab(data["articles"], key, heading, column, unavailable)
+                # Display articles with detailed sentiment analysis
+                st.subheader("Recent Articles")
+                for article in data["articles"]:
+                    with st.expander(article["title"]):
+                        st.write(f"**Source:** {article['source']}")
+                        st.write(f"**Summary:** {article['summary']}")
+                        st.write(f"**Overall Sentiment:** {article['sentiment']}")
+                        # Display fine-grained sentiment if available
+                        for key, _, _, column, _ in fine_grained:
+                            if key in article:
+                                st.write(f"**{column}:** {article[key]}")
+                        st.write(f"**URL:** [{article['url']}]({article['url']})")
+            except Exception as e:
+                st.error(f"Error analyzing company data: {str(e)}")
+                print(f"Error: {str(e)}")
+if __name__ == "__main__":
+    main()