Spaces:
Build error
Build error
Commit ·
7443219
1
Parent(s): 7384066
1.61 +decluster
Browse files
- app.py +10 -12
- requirements.txt +5 -1
app.py
CHANGED
|
@@ -2,7 +2,7 @@ import gradio as gr
|
|
| 2 |
import spaces
|
| 3 |
import pandas as pd
|
| 4 |
import torch
|
| 5 |
-
from transformers import pipeline, AutoModelForSeq2SeqLM, AutoTokenizer
|
| 6 |
import plotly.graph_objects as go
|
| 7 |
import logging
|
| 8 |
import io
|
|
@@ -14,7 +14,10 @@ from langchain_openai import ChatOpenAI
|
|
| 14 |
from langchain.prompts import PromptTemplate
|
| 15 |
from openpyxl import load_workbook
|
| 16 |
from openpyxl.utils.dataframe import dataframe_to_rows
|
| 17 |
-
|
|
|
|
|
|
|
|
|
|
| 18 |
|
| 19 |
def fuzzy_deduplicate(df, column, threshold=55):
|
| 20 |
"""Deduplicate rows based on fuzzy matching of text content"""
|
|
@@ -731,7 +734,7 @@ def create_interface():
|
|
| 731 |
# Create state for file data
|
| 732 |
current_file = gr.State(None)
|
| 733 |
|
| 734 |
-
gr.Markdown("# AI-анализ мониторинга новостей v.1.
|
| 735 |
|
| 736 |
with gr.Row():
|
| 737 |
file_input = gr.File(
|
|
@@ -793,12 +796,14 @@ def create_interface():
|
|
| 793 |
control.request_stop()
|
| 794 |
return "Остановка обработки..."
|
| 795 |
|
|
|
|
| 796 |
@spaces.GPU(duration=300)
|
| 797 |
def process_and_download(file_bytes):
|
| 798 |
if file_bytes is None:
|
| 799 |
gr.Warning("Пожалуйста, загрузите файл")
|
| 800 |
return (pd.DataFrame(), None, None, None, "Ожидание файла...", "")
|
| 801 |
-
|
|
|
|
| 802 |
try:
|
| 803 |
file_obj = io.BytesIO(file_bytes)
|
| 804 |
logger.info("File loaded into BytesIO successfully")
|
|
@@ -906,14 +911,7 @@ def create_interface():
|
|
| 906 |
error_msg = f"Ошибка анализа: {str(e)}"
|
| 907 |
logger.error(error_msg)
|
| 908 |
gr.Error(error_msg)
|
| 909 |
-
return (
|
| 910 |
-
pd.DataFrame(),
|
| 911 |
-
None,
|
| 912 |
-
None,
|
| 913 |
-
None,
|
| 914 |
-
error_msg,
|
| 915 |
-
""
|
| 916 |
-
)
|
| 917 |
finally:
|
| 918 |
if detector:
|
| 919 |
detector.cleanup()
|
|
|
|
| 2 |
import spaces
|
| 3 |
import pandas as pd
|
| 4 |
import torch
|
| 5 |
+
from transformers import pipeline, AutoModelForSeq2SeqLM, AutoTokenizer, AutoModel
|
| 6 |
import plotly.graph_objects as go
|
| 7 |
import logging
|
| 8 |
import io
|
|
|
|
| 14 |
from langchain.prompts import PromptTemplate
|
| 15 |
from openpyxl import load_workbook
|
| 16 |
from openpyxl.utils.dataframe import dataframe_to_rows
|
| 17 |
+
import torch.nn.functional as F
|
| 18 |
+
import numpy as np
|
| 19 |
+
import logging
|
| 20 |
+
from typing import List, Set, Tuple
|
| 21 |
|
| 22 |
def fuzzy_deduplicate(df, column, threshold=55):
|
| 23 |
"""Deduplicate rows based on fuzzy matching of text content"""
|
|
|
|
| 734 |
# Create state for file data
|
| 735 |
current_file = gr.State(None)
|
| 736 |
|
| 737 |
+
gr.Markdown("# AI-анализ мониторинга новостей v.1.61 + добавка")
|
| 738 |
|
| 739 |
with gr.Row():
|
| 740 |
file_input = gr.File(
|
|
|
|
| 796 |
control.request_stop()
|
| 797 |
return "Остановка обработки..."
|
| 798 |
|
| 799 |
+
|
| 800 |
@spaces.GPU(duration=300)
|
| 801 |
def process_and_download(file_bytes):
|
| 802 |
if file_bytes is None:
|
| 803 |
gr.Warning("Пожалуйста, загрузите файл")
|
| 804 |
return (pd.DataFrame(), None, None, None, "Ожидание файла...", "")
|
| 805 |
+
|
| 806 |
+
detector = None
|
| 807 |
try:
|
| 808 |
file_obj = io.BytesIO(file_bytes)
|
| 809 |
logger.info("File loaded into BytesIO successfully")
|
|
|
|
| 911 |
error_msg = f"Ошибка анализа: {str(e)}"
|
| 912 |
logger.error(error_msg)
|
| 913 |
gr.Error(error_msg)
|
| 914 |
+
return (pd.DataFrame(), None, None, None, error_msg, "")
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 915 |
finally:
|
| 916 |
if detector:
|
| 917 |
detector.cleanup()
|
requirements.txt
CHANGED
|
@@ -23,4 +23,8 @@ plotly
|
|
| 23 |
datetime
|
| 24 |
langchain_openai
|
| 25 |
langchain
|
| 26 |
-
langchain-community
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 23 |
datetime
|
| 24 |
langchain_openai
|
| 25 |
langchain
|
| 26 |
+
langchain-community
|
| 27 |
+
numpy
|
| 28 |
+
spacy
|
| 29 |
+
pymorphy2
|
| 30 |
+
https://github.com/explosion/spacy-models/releases/download/en_core_web_sm-3.7.0/en_core_web_sm-3.7.0.tar.gz
|