Spaces:
Sleeping
Sleeping
Commit
·
7443219
1
Parent(s):
7384066
1.61 +decluster
Browse files
- app.py +10 -12
- requirements.txt +5 -1
app.py
CHANGED
@@ -2,7 +2,7 @@ import gradio as gr
|
|
2 |
import spaces
|
3 |
import pandas as pd
|
4 |
import torch
|
5 |
-
from transformers import pipeline, AutoModelForSeq2SeqLM, AutoTokenizer
|
6 |
import plotly.graph_objects as go
|
7 |
import logging
|
8 |
import io
|
@@ -14,7 +14,10 @@ from langchain_openai import ChatOpenAI
|
|
14 |
from langchain.prompts import PromptTemplate
|
15 |
from openpyxl import load_workbook
|
16 |
from openpyxl.utils.dataframe import dataframe_to_rows
|
17 |
-
|
|
|
|
|
|
|
18 |
|
19 |
def fuzzy_deduplicate(df, column, threshold=55):
|
20 |
"""Deduplicate rows based on fuzzy matching of text content"""
|
@@ -731,7 +734,7 @@ def create_interface():
|
|
731 |
# Create state for file data
|
732 |
current_file = gr.State(None)
|
733 |
|
734 |
-
gr.Markdown("# AI-анализ мониторинга новостей v.1.
|
735 |
|
736 |
with gr.Row():
|
737 |
file_input = gr.File(
|
@@ -793,12 +796,14 @@ def create_interface():
|
|
793 |
control.request_stop()
|
794 |
return "Остановка обработки..."
|
795 |
|
|
|
796 |
@spaces.GPU(duration=300)
|
797 |
def process_and_download(file_bytes):
|
798 |
if file_bytes is None:
|
799 |
gr.Warning("Пожалуйста, загрузите файл")
|
800 |
return (pd.DataFrame(), None, None, None, "Ожидание файла...", "")
|
801 |
-
|
|
|
802 |
try:
|
803 |
file_obj = io.BytesIO(file_bytes)
|
804 |
logger.info("File loaded into BytesIO successfully")
|
@@ -906,14 +911,7 @@ def create_interface():
|
|
906 |
error_msg = f"Ошибка анализа: {str(e)}"
|
907 |
logger.error(error_msg)
|
908 |
gr.Error(error_msg)
|
909 |
-
return (
|
910 |
-
pd.DataFrame(),
|
911 |
-
None,
|
912 |
-
None,
|
913 |
-
None,
|
914 |
-
error_msg,
|
915 |
-
""
|
916 |
-
)
|
917 |
finally:
|
918 |
if detector:
|
919 |
detector.cleanup()
|
|
|
2 |
import spaces
|
3 |
import pandas as pd
|
4 |
import torch
|
5 |
+
from transformers import pipeline, AutoModelForSeq2SeqLM, AutoTokenizer, AutoModel
|
6 |
import plotly.graph_objects as go
|
7 |
import logging
|
8 |
import io
|
|
|
14 |
from langchain.prompts import PromptTemplate
|
15 |
from openpyxl import load_workbook
|
16 |
from openpyxl.utils.dataframe import dataframe_to_rows
|
17 |
+
import torch.nn.functional as F
|
18 |
+
import numpy as np
|
19 |
+
import logging
|
20 |
+
from typing import List, Set, Tuple
|
21 |
|
22 |
def fuzzy_deduplicate(df, column, threshold=55):
|
23 |
"""Deduplicate rows based on fuzzy matching of text content"""
|
|
|
734 |
# Create state for file data
|
735 |
current_file = gr.State(None)
|
736 |
|
737 |
+
gr.Markdown("# AI-анализ мониторинга новостей v.1.61 + добавка")
|
738 |
|
739 |
with gr.Row():
|
740 |
file_input = gr.File(
|
|
|
796 |
control.request_stop()
|
797 |
return "Остановка обработки..."
|
798 |
|
799 |
+
|
800 |
@spaces.GPU(duration=300)
|
801 |
def process_and_download(file_bytes):
|
802 |
if file_bytes is None:
|
803 |
gr.Warning("Пожалуйста, загрузите файл")
|
804 |
return (pd.DataFrame(), None, None, None, "Ожидание файла...", "")
|
805 |
+
|
806 |
+
detector = None
|
807 |
try:
|
808 |
file_obj = io.BytesIO(file_bytes)
|
809 |
logger.info("File loaded into BytesIO successfully")
|
|
|
911 |
error_msg = f"Ошибка анализа: {str(e)}"
|
912 |
logger.error(error_msg)
|
913 |
gr.Error(error_msg)
|
914 |
+
return (pd.DataFrame(), None, None, None, error_msg, "")
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
915 |
finally:
|
916 |
if detector:
|
917 |
detector.cleanup()
|
requirements.txt
CHANGED
@@ -23,4 +23,8 @@ plotly
|
|
23 |
datetime
|
24 |
langchain_openai
|
25 |
langchain
|
26 |
-
langchain-community
|
|
|
|
|
|
|
|
|
|
23 |
datetime
|
24 |
langchain_openai
|
25 |
langchain
|
26 |
+
langchain-community
|
27 |
+
numpy
|
28 |
+
spacy
|
29 |
+
pymorphy2
|
30 |
+
https://github.com/explosion/spacy-models/releases/download/en_core_web_sm-3.7.0/en_core_web_sm-3.7.0.tar.gz
|