Spaces:

nhull
/

reviews-demo

Running

App Files Files Community

nhull committed 20 days ago

Commit

e4627b7

verified ·

1 Parent(s): bdb3169

Update app.py

Browse files

Files changed (1) hide show

app.py +35 -24

app.py CHANGED Viewed

@@ -9,7 +9,6 @@ from huggingface_hub import hf_hub_download
 import torch
 import pickle
 import numpy as np
-from transformers import AutoTokenizer, AutoModelForSequenceClassification
 # Load models and tokenizers
 models = {
@@ -76,13 +75,12 @@ def predict_with_bert_multilingual(text):
 def predict_with_tinybert(text):
     tokenizer = models["TinyBERT"]["tokenizer"]
     model = models["TinyBERT"]["model"]
-    encodings = tokenizer([text], padding=True, truncation=True, max_length=128, return_tensors="pt").to(device)
     with torch.no_grad():
         outputs = model(**encodings)
         logits = outputs.logits
         predictions = logits.argmax(axis=-1).cpu().numpy()
-    return int(predictions[0])
 # Unified function for sentiment analysis and statistics
 def analyze_sentiment_and_statistics(text):
@@ -95,22 +93,28 @@ def analyze_sentiment_and_statistics(text):
     # Calculate statistics
     scores = list(results.values())
-    min_score_model = min(results, key=results.get)
-    max_score_model = max(results, key=results.get)
-    average_score = np.mean(scores)
-    statistics = {
-        "Lowest Score": f"{results[min_score_model]} (Model: {min_score_model})",
-        "Highest Score": f"{results[max_score_model]} (Model: {max_score_model})",
-        "Average Score": f"{average_score:.2f}",
-    }
     return results, statistics
 # Gradio Interface
 with gr.Blocks(css=".gradio-container { max-width: 900px; margin: auto; padding: 20px; }") as demo:
     gr.Markdown("# Sentiment Analysis App")
     gr.Markdown(
-        "This app predicts the sentiment of the input text on a scale from 1 to 5 using multiple models and provides detailed statistics."
     )
     with gr.Row():
@@ -150,7 +154,7 @@ with gr.Blocks(css=".gradio-container { max-width: 900px; margin: auto; padding:
         with gr.Column():
             distilbert_output = gr.Textbox(label="Predicted Sentiment (DistilBERT)", interactive=False)
             log_reg_output = gr.Textbox(label="Predicted Sentiment (Logistic Regression)", interactive=False)
-            bert_output = gr.Textbox(label="Predicted Sentiment (BERT Multilingual)", interactive=False),
             tinybert_output = gr.Textbox(label="Predicted Sentiment (TinyBERT)", interactive=False)
         with gr.Column():
@@ -159,13 +163,22 @@ with gr.Blocks(css=".gradio-container { max-width: 900px; margin: auto; padding:
     # Button to analyze sentiment and show statistics
     def process_input_and_analyze(text_input):
         results, statistics = analyze_sentiment_and_statistics(text_input)
-        return (
-            f"{results['DistilBERT']}",
-            f"{results['Logistic Regression']}",
-            f"{results['BERT Multilingual (NLP Town)']}",
-            f"{results['TinyBERT']}",
-            f"Statistics:\n{statistics['Lowest Score']}\n{statistics['Highest Score']}\nAverage Score: {statistics['Average Score']}"
-        )
     analyze_button.click(
         process_input_and_analyze,
@@ -173,7 +186,5 @@ with gr.Blocks(css=".gradio-container { max-width: 900px; margin: auto; padding:
         outputs=[distilbert_output, log_reg_output, bert_output, tinybert_output, statistics_output]
     )
 # Launch the app
 demo.launch()

 import torch
 import pickle
 import numpy as np
 # Load models and tokenizers
 models = {
 def predict_with_tinybert(text):
     tokenizer = models["TinyBERT"]["tokenizer"]
     model = models["TinyBERT"]["model"]
+    encodings = tokenizer([text], padding=True, truncation=True, max_length=512, return_tensors="pt").to(device)
     with torch.no_grad():
         outputs = model(**encodings)
         logits = outputs.logits
         predictions = logits.argmax(axis=-1).cpu().numpy()
+    return int(predictions[0] + 1)
 # Unified function for sentiment analysis and statistics
 def analyze_sentiment_and_statistics(text):
     # Calculate statistics
     scores = list(results.values())
+    if all(score == scores[0] for score in scores):  # Check if all predictions are the same
+        statistics = {
+            "Message": "All models predict the same score.",
+            "Average Score": f"{scores[0]:.2f}",
+        }
+    else:
+        min_score_model = min(results, key=results.get)
+        max_score_model = max(results, key=results.get)
+        average_score = np.mean(scores)
+        statistics = {
+            "Lowest Score": f"{results[min_score_model]} (Model: {min_score_model})",
+            "Highest Score": f"{results[max_score_model]} (Model: {max_score_model})",
+            "Average Score": f"{average_score:.2f}",
+        }
     return results, statistics
 # Gradio Interface
 with gr.Blocks(css=".gradio-container { max-width: 900px; margin: auto; padding: 20px; }") as demo:
     gr.Markdown("# Sentiment Analysis App")
     gr.Markdown(
+        "This app predicts the sentiment of the input text on a scale from 1 to 5 using multiple models and provides basic statistics."
     )
     with gr.Row():
         with gr.Column():
             distilbert_output = gr.Textbox(label="Predicted Sentiment (DistilBERT)", interactive=False)
             log_reg_output = gr.Textbox(label="Predicted Sentiment (Logistic Regression)", interactive=False)
+            bert_output = gr.Textbox(label="Predicted Sentiment (BERT Multilingual)", interactive=False)
             tinybert_output = gr.Textbox(label="Predicted Sentiment (TinyBERT)", interactive=False)
         with gr.Column():
     # Button to analyze sentiment and show statistics
     def process_input_and_analyze(text_input):
         results, statistics = analyze_sentiment_and_statistics(text_input)
+        if "Message" in statistics:  # All models predicted the same score
+            return (
+                f"{results['DistilBERT']}",
+                f"{results['Logistic Regression']}",
+                f"{results['BERT Multilingual (NLP Town)']}",
+                f"{results['TinyBERT']}",
+                f"Statistics:\n{statistics['Message']}\nAverage Score: {statistics['Average Score']}"
+            )
+        else:  # Min and Max scores are present
+            return (
+                f"{results['DistilBERT']}",
+                f"{results['Logistic Regression']}",
+                f"{results['BERT Multilingual (NLP Town)']}",
+                f"{results['TinyBERT']}",
+                f"Statistics:\n{statistics['Lowest Score']}\n{statistics['Highest Score']}\nAverage Score: {statistics['Average Score']}"
+            )
     analyze_button.click(
         process_input_and_analyze,
         outputs=[distilbert_output, log_reg_output, bert_output, tinybert_output, statistics_output]
     )
 # Launch the app
 demo.launch()