pentarosarium committed on
Commit
7443219
·
1 Parent(s): 7384066

1.61 +decluster

Browse files
Files changed (2) hide show
  1. app.py +10 -12
  2. requirements.txt +5 -1
app.py CHANGED
@@ -2,7 +2,7 @@ import gradio as gr
2
  import spaces
3
  import pandas as pd
4
  import torch
5
- from transformers import pipeline, AutoModelForSeq2SeqLM, AutoTokenizer
6
  import plotly.graph_objects as go
7
  import logging
8
  import io
@@ -14,7 +14,10 @@ from langchain_openai import ChatOpenAI
14
  from langchain.prompts import PromptTemplate
15
  from openpyxl import load_workbook
16
  from openpyxl.utils.dataframe import dataframe_to_rows
17
-
 
 
 
18
 
19
  def fuzzy_deduplicate(df, column, threshold=55):
20
  """Deduplicate rows based on fuzzy matching of text content"""
@@ -731,7 +734,7 @@ def create_interface():
731
  # Create state for file data
732
  current_file = gr.State(None)
733
 
734
- gr.Markdown("# AI-анализ мониторинга новостей v.1.60 + добавка")
735
 
736
  with gr.Row():
737
  file_input = gr.File(
@@ -793,12 +796,14 @@ def create_interface():
793
  control.request_stop()
794
  return "Остановка обработки..."
795
 
 
796
  @spaces.GPU(duration=300)
797
  def process_and_download(file_bytes):
798
  if file_bytes is None:
799
  gr.Warning("Пожалуйста, загрузите файл")
800
  return (pd.DataFrame(), None, None, None, "Ожидание файла...", "")
801
-
 
802
  try:
803
  file_obj = io.BytesIO(file_bytes)
804
  logger.info("File loaded into BytesIO successfully")
@@ -906,14 +911,7 @@ def create_interface():
906
  error_msg = f"Ошибка анализа: {str(e)}"
907
  logger.error(error_msg)
908
  gr.Error(error_msg)
909
- return (
910
- pd.DataFrame(),
911
- None,
912
- None,
913
- None,
914
- error_msg,
915
- ""
916
- )
917
  finally:
918
  if detector:
919
  detector.cleanup()
 
2
  import spaces
3
  import pandas as pd
4
  import torch
5
+ from transformers import pipeline, AutoModelForSeq2SeqLM, AutoTokenizer, AutoModel
6
  import plotly.graph_objects as go
7
  import logging
8
  import io
 
14
  from langchain.prompts import PromptTemplate
15
  from openpyxl import load_workbook
16
  from openpyxl.utils.dataframe import dataframe_to_rows
17
+ import torch.nn.functional as F
18
+ import numpy as np
19
+ import logging
20
+ from typing import List, Set, Tuple
21
 
22
  def fuzzy_deduplicate(df, column, threshold=55):
23
  """Deduplicate rows based on fuzzy matching of text content"""
 
734
  # Create state for file data
735
  current_file = gr.State(None)
736
 
737
+ gr.Markdown("# AI-анализ мониторинга новостей v.1.61 + добавка")
738
 
739
  with gr.Row():
740
  file_input = gr.File(
 
796
  control.request_stop()
797
  return "Остановка обработки..."
798
 
799
+
800
  @spaces.GPU(duration=300)
801
  def process_and_download(file_bytes):
802
  if file_bytes is None:
803
  gr.Warning("Пожалуйста, загрузите файл")
804
  return (pd.DataFrame(), None, None, None, "Ожидание файла...", "")
805
+
806
+ detector = None
807
  try:
808
  file_obj = io.BytesIO(file_bytes)
809
  logger.info("File loaded into BytesIO successfully")
 
911
  error_msg = f"Ошибка анализа: {str(e)}"
912
  logger.error(error_msg)
913
  gr.Error(error_msg)
914
+ return (pd.DataFrame(), None, None, None, error_msg, "")
 
 
 
 
 
 
 
915
  finally:
916
  if detector:
917
  detector.cleanup()
requirements.txt CHANGED
@@ -23,4 +23,8 @@ plotly
23
  datetime
24
  langchain_openai
25
  langchain
26
- langchain-community
 
 
 
 
 
23
  datetime
24
  langchain_openai
25
  langchain
26
+ langchain-community
27
+ numpy
28
+ spacy
29
+ pymorphy2
30
+ https://github.com/explosion/spacy-models/releases/download/en_core_web_sm-3.7.0/en_core_web_sm-3.7.0.tar.gz