Spaces:

Yazi3333
/

reviewsmart

Sleeping

App Files Community

Yazi3333 committed on Jul 27

Commit

6493d76

verified ·

1 Parent(s): 11b33e3

Update app.py

Browse files

Files changed (1) hide show

app.py +58 -29

app.py CHANGED Viewed

@@ -1,55 +1,84 @@
 import gradio as gr
 import mimetypes
 import pdfminer.high_level
-from transformers import pipeline
-classifier = pipeline("sentiment-analysis", model="distilbert-base-uncased-finetuned-sst-2-english")
-summarizer = pipeline("summarization", model="facebook/bart-large-cnn")
-def load_content(file, text):
     if text.strip():
         return text
     if file is None:
         return ""
     mime = mimetypes.guess_type(file.name)[0]
-    binary = file.read()
     if mime and "pdf" in mime:
-        return pdfminer.high_level.extract_text(file)
-    return binary.decode("utf-8", errors="ignore")
 def detect_sentiment(file, text):
-    content = load_content(file, text).strip()
     if not content:
-        return "Нет текста"
-    return f"Тональность: {classifier(content)[0]['label']}"
 def summarize_text(file, text):
-    content = load_content(file, text).strip()
     if not content:
-        return "Нет текста"
-    return summarizer(content, max_length=65, min_length=25, do_sample=False)[0]['summary_text']
-def full_analysis(file, text):
-    content = load_content(file, text).strip()
     if not content:
-        return "Нет текста", "Нет текста"
-    sentiment = f"Тональность: {classifier(content)[0]['label']}"
-    summary = summarizer(content, max_length=65, min_length=25, do_sample=False)[0]['summary_text']
-    return sentiment, summary
 def reset_fields():
     return "", None, "", ""
-with gr.Blocks() as demo:
-    gr.Markdown("## ReviewSmart — анализ отзывов с помощью NLP")
     with gr.Row():
-        input_text = gr.Textbox(label="Текст отзыва", lines=8, placeholder="Введите или загрузите отзыв...")
-        input_file = gr.File(label="Файл (.pdf, .txt)", file_types=[".pdf", ".txt"])
     with gr.Row():
-        btn_sentiment = gr.Button("Определить тональность")
-        btn_summary = gr.Button("Создать резюме")
         btn_both = gr.Button("Анализировать оба")
         btn_clear = gr.Button("Очистить")
@@ -57,9 +86,9 @@ with gr.Blocks() as demo:
         sentiment_box = gr.Textbox(label="Результат анализа тональности", lines=2)
         summary_box = gr.Textbox(label="Результат резюмирования", lines=4)
-    btn_sentiment.click(fn=detect_sentiment, inputs=[input_file, input_text], outputs=sentiment_box)
-    btn_summary.click(fn=summarize_text, inputs=[input_file, input_text], outputs=summary_box)
-    btn_both.click(fn=full_analysis, inputs=[input_file, input_text], outputs=[sentiment_box, summary_box])
     btn_clear.click(fn=reset_fields, outputs=[input_text, input_file, sentiment_box, summary_box])
-demo.launch()

+!pip install -q transformers gradio pdfminer.six langdetect
 import gradio as gr
+from transformers import pipeline
 import mimetypes
 import pdfminer.high_level
+from langdetect import detect
+import io
+# Модели
+sentiment_models = {
+    "en": pipeline("sentiment-analysis", model="distilbert-base-uncased-finetuned-sst-2-english"),
+    "ru": pipeline("sentiment-analysis", model="blanchefort/rubert-base-cased-sentiment")
+}
+summary_models = {
+    "en": pipeline("summarization", model="facebook/bart-large-cnn"),
+    "ru": pipeline("summarization", model="csebuetnlp/mT5_multilingual_XLSum")
+}
+# Чтение текста из текстового поля или файла
+def get_text(file, text):
     if text.strip():
         return text
     if file is None:
         return ""
     mime = mimetypes.guess_type(file.name)[0]
     if mime and "pdf" in mime:
+        return pdfminer.high_level.extract_text(io.BytesIO(file.read()))
+    else:
+        return file.read().decode("utf-8", errors="ignore")
+# Язык - модели
+def detect_language_model(text):
+    lang = detect(text)
+    return "ru" if lang.startswith("ru") else "en"
+# Анализ тональности
 def detect_sentiment(file, text):
+    content = get_text(file, text).strip()
     if not content:
+        return "Введите текст или загрузите файл"
+    lang = detect_language_model(content)
+    result = sentiment_models[lang](content)[0]
+    return f"Тональность: {result['label']}"
+# Суммаризация
 def summarize_text(file, text):
+    content = get_text(file, text).strip()
     if not content:
+        return "Введите текст или загрузите файл"
+    lang = detect_language_model(content)
+    result = summary_models[lang](content, max_length=65, min_length=25, do_sample=False)[0]
+    return result['summary_text']
+# Оба анализа
+def analyze_all(file, text):
+    content = get_text(file, text).strip()
     if not content:
+        return "Введите текст или загрузите файл", "Введите текст или загрузите файл"
+    lang = detect_language_model(content)
+    sent = sentiment_models[lang](content)[0]['label']
+    summ = summary_models[lang](content, max_length=65, min_length=25, do_sample=False)[0]['summary_text']
+    return f"Тональность: {sent}", summ
+# Очистка
 def reset_fields():
     return "", None, "", ""
+# Интерфейс
+with gr.Blocks(title="ReviewSmart") as demo:
+    gr.Markdown("## ReviewSmart — анализ отзывов на основе NLP")
     with gr.Row():
+        input_text = gr.Textbox(label="Текст отзыва", lines=8, placeholder="Введите отзыв вручную...")
+        input_file = gr.File(label="Файл (.pdf или .txt)", file_types=[".pdf", ".txt"])
     with gr.Row():
+        btn_sent = gr.Button("Определить тональность")
+        btn_sum = gr.Button("Создать резюме")
         btn_both = gr.Button("Анализировать оба")
         btn_clear = gr.Button("Очистить")
         sentiment_box = gr.Textbox(label="Результат анализа тональности", lines=2)
         summary_box = gr.Textbox(label="Результат резюмирования", lines=4)
+    btn_sent.click(fn=detect_sentiment, inputs=[input_file, input_text], outputs=sentiment_box)
+    btn_sum.click(fn=summarize_text, inputs=[input_file, input_text], outputs=summary_box)
+    btn_both.click(fn=analyze_all, inputs=[input_file, input_text], outputs=[sentiment_box, summary_box])
     btn_clear.click(fn=reset_fields, outputs=[input_text, input_file, sentiment_box, summary_box])
+demo.launch(share=True, debug=True)