Spaces:
Sleeping
Sleeping
File size: 5,127 Bytes
6c3cf43 b420fee 38c2418 6c3cf43 38c2418 6c3cf43 38c2418 6c3cf43 38c2418 6c3cf43 38c2418 6c3cf43 38c2418 a285409 b25e082 38c2418 6c3cf43 38c2418 b25e082 38c2418 b420fee 38c2418 b25e082 6c3cf43 38c2418 6c3cf43 b420fee 38c2418 b420fee bda744e b420fee b25e082 a285409 38c2418 b25e082 38c2418 6c3cf43 38c2418 b420fee |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 |
import gradio as gr
import requests
from bs4 import BeautifulSoup
import pandas as pd
from transformers import pipeline
import plotly.express as px
from datetime import datetime, timedelta
# Sentiment Analysis Model
# Loaded once at import time; NOTE(review): first run will fetch the model
# weights from the HuggingFace hub — confirm the deployment allows that.
sentiment_model = pipeline(model="finiteautomata/bertweet-base-sentiment-analysis")
# Function to encode special characters in the search query
def encode_special_characters(text):
    """Lower-case *text* and percent-encode the characters the Google News
    query string treats specially (&, =, +, space).

    Args:
        text: Raw search query.

    Returns:
        Lower-cased query with special characters percent-encoded.
    """
    # str.translate performs the whole substitution in one C-level pass,
    # replacing the original quadratic `+=` concatenation loop.
    table = str.maketrans({'&': '%26', '=': '%3D', '+': '%2B', ' ': '%20'})
    return text.lower().translate(table)
# Function to fetch news articles
def fetch_news(query, num_articles=10):
    """Scrape Google News search results for *query*.

    Args:
        query: Search phrase; percent-encoded via encode_special_characters.
        num_articles: Maximum number of articles to return.

    Returns:
        pandas.DataFrame with Title/Source/Time/Author/Link columns,
        or an empty DataFrame on any network failure.
    """
    encoded_query = encode_special_characters(query)
    url = f"https://news.google.com/search?q={encoded_query}&hl=en-US&gl=in&ceid=US%3Aen&num={num_articles}"
    try:
        # timeout keeps a stalled connection from hanging the UI forever
        response = requests.get(url, timeout=10)
        response.raise_for_status()
    except requests.RequestException as e:
        print(f"Error fetching news: {e}")
        return pd.DataFrame()
    soup = BeautifulSoup(response.text, 'html.parser')
    articles = soup.find_all('article')
    news_data = []
    for article in articles[:num_articles]:
        # An <article> with no anchor would make ['href'] raise TypeError;
        # skip such entries instead of crashing the whole fetch.
        anchor = article.find('a')
        if anchor is None or not anchor.get('href'):
            continue
        link = anchor['href'].replace("./articles/", "https://news.google.com/articles/")
        # Positional parsing of the article text; layout-dependent, hence
        # the 'Missing' fallbacks for short entries.
        text_parts = article.get_text(separator='\n').split('\n')
        news_data.append({
            'Title': text_parts[2] if len(text_parts) > 2 else 'Missing',
            'Source': text_parts[0] if len(text_parts) > 0 else 'Missing',
            'Time': text_parts[3] if len(text_parts) > 3 else 'Missing',
            'Author': text_parts[4].split('By ')[-1] if len(text_parts) > 4 else 'Missing',
            'Link': link
        })
    return pd.DataFrame(news_data)
# Function to perform sentiment analysis
def analyze_sentiment(text):
    """Classify *text* with the module-level BERTweet sentiment pipeline.

    Returns:
        Tuple of (label, score) for the pipeline's top prediction.
    """
    prediction = sentiment_model(text)[0]
    label, score = prediction['label'], prediction['score']
    return label, score
# Function to fetch stock data from Alpha Vantage API
def fetch_stock_data(company_name):
    """Fetch compact daily price history for *company_name* from the
    Alpha Vantage API (via RapidAPI).

    Args:
        company_name: Value passed as the API's `symbol` parameter.
            NOTE(review): the API expects a ticker symbol; a full company
            name like "Apple Inc." will likely return no data — confirm
            what callers pass here.

    Returns:
        Float-typed DataFrame indexed by date, or None on any failure
        (network error, rate limit, unknown symbol).
    """
    url = "https://alpha-vantage.p.rapidapi.com/query"
    querystring = {"function": "TIME_SERIES_DAILY", "symbol": company_name, "outputsize": "compact", "datatype": "json"}
    # SECURITY: API key hard-coded in source — move to an environment
    # variable / secrets store and rotate this credential.
    headers = {
        "x-rapidapi-key": "e078dae417mshb13ddc2d8149768p1608e9jsn888ce49e8554",
        "x-rapidapi-host": "alpha-vantage.p.rapidapi.com"
    }
    try:
        # timeout keeps a stalled API call from blocking the UI forever
        response = requests.get(url, headers=headers, params=querystring, timeout=10)
        response.raise_for_status()
        data = response.json()
    except (requests.RequestException, ValueError) as e:
        # ValueError covers a non-JSON body on requests versions where
        # JSONDecodeError does not subclass RequestException.
        print(f"Error fetching stock data: {e}")
        return None
    # The API reports errors and rate limits as JSON without this key.
    if "Time Series (Daily)" not in data:
        return None
    stock_data = data["Time Series (Daily)"]
    df = pd.DataFrame.from_dict(stock_data, orient='index')
    df.index = pd.to_datetime(df.index)
    df = df.astype(float)
    return df
# Main function to process news and perform analysis
def news_and_analysis(query):
    """Fetch news for *query*, score each headline's sentiment, and —
    for multi-word queries — also chart the stock price.

    Returns:
        Tuple of (DataFrame or message string, sentiment figure or None,
        stock figure or None), matching the three Gradio outputs.
    """
    news_df = fetch_news(query)
    if news_df.empty:
        return "No news articles found.", None, None

    # Score every headline and attach label/score columns.
    scored = news_df['Title'].apply(analyze_sentiment)
    news_df['Sentiment'] = [label for label, _ in scored]
    news_df['Sentiment_Score'] = [score for _, score in scored]

    # Bar chart of sentiment score per publication time.
    sentiment_fig = px.bar(
        news_df,
        x='Time',
        y='Sentiment_Score',
        color='Sentiment',
        color_discrete_map={'positive': 'green', 'neutral': 'gray', 'negative': 'red'},
        title='News Sentiment Over Time',
        labels={'Time': 'Publication Time', 'Sentiment_Score': 'Sentiment Score'}
    )

    # Heuristic: treat a multi-word query as a company name and attempt a
    # stock chart as well; otherwise (or on API failure) return no chart.
    stock_fig = None
    if len(query.split()) > 1:
        stock_df = fetch_stock_data(query)
        if stock_df is not None:
            stock_fig = px.line(
                stock_df,
                x=stock_df.index,
                y='4. close',
                title=f'{query} Stock Price Over Time',
                labels={'index': 'Date', '4. close': 'Closing Price'}
            )
    return news_df, sentiment_fig, stock_fig
# Gradio interface
# Two-column layout: query input + button on the left, the three analysis
# outputs (table, sentiment chart, stock chart) on the right.
with gr.Blocks() as demo:
    gr.Markdown(
        """
# Financial News Sentiment Analysis
Analyze the sentiment of news articles related to financial topics or companies.
Enter a topic or company name to get started.
"""
    )
    with gr.Row():
        with gr.Column():
            # Free-text query; a multi-word entry also triggers the stock chart.
            topic = gr.Textbox(label="Enter a financial topic or company name", placeholder="e.g., Apple Inc.")
            analyze_btn = gr.Button(value="Analyze")
        with gr.Column():
            # Outputs map 1:1 to news_and_analysis's three return values.
            news_output = gr.DataFrame(label="News and Sentiment Analysis")
            sentiment_plot = gr.Plot(label="Sentiment Analysis")
            stock_plot = gr.Plot(label="Stock Price Analysis")
    # Wire the button click to the full pipeline.
    analyze_btn.click(
        news_and_analysis,
        inputs=[topic],
        outputs=[news_output, sentiment_plot, stock_plot]
    )
# Launch only when run as a script.
if __name__ == "__main__":
    demo.launch()
|