Spaces:

Yi-666
/

aaa

Sleeping

App Files Community

Yi-666 committed on Nov 22, 2024

Commit

cc59fa1

verified ·

1 Parent(s): 59beba1

Update app.py

Browse files

Files changed (1) hide show

app.py +68 -66

app.py CHANGED Viewed

@@ -2,6 +2,10 @@ import streamlit as st
 import numpy as np
 import matplotlib.pyplot as plt
 from sklearn.metrics import precision_recall_curve, auc
 # Sidebar navigation
 st.sidebar.title("App Navigation")
@@ -13,79 +17,77 @@ if page == "Sentiment Analysis":
     st.title("Twitter Sentiment Analysis App")
     # Load sentiment analysis pipeline
-    from transformers import pipeline
-    sentiment_pipe = pipeline("text-classification", model="cardiffnlp/twitter-roberta-base-sentiment-latest")
     # Input box for user to enter a tweet
     user_input = st.text_input("Enter a tweet to analyze:")
     if user_input:
-        # Run sentiment analysis
-        result = sentiment_pipe(user_input)
-        st.write("Sentiment Analysis Result:", result)
 # Model Evaluation Page
 elif page == "Model Evaluation":
     st.title("Model Precision-Recall Evaluation")
-    # Initialize default values for y_true and y_score
-    y_true, y_score = None, None
-    # Option to use actual model predictions
-    st.write("### Evaluate Using Actual Model")
-    model_type = st.selectbox("Choose model type:", ["Scikit-learn", "Transformers"])
-    if model_type == "Scikit-learn":
-        st.write("### Scikit-learn Model")
-        from sklearn.ensemble import RandomForestClassifier
-        from sklearn.datasets import make_classification
-        # Create and train a Scikit-learn model
-        X_train, y_train = make_classification(n_samples=1000, n_features=20, random_state=42)
-        X_test, y_test = make_classification(n_samples=200, n_features=20, random_state=42)
-        model = RandomForestClassifier()
-        model.fit(X_train, y_train)
-        # Generate predictions
-        y_score = model.predict_proba(X_test)[:, 1]  # Predicted probabilities for the positive class
-        y_true = y_test  # True labels
-    elif model_type == "Transformers":
-        st.write("### Transformers Model")
-        from transformers import pipeline
-        # Load a Transformers model
-        model = pipeline("text-classification", model="cardiffnlp/twitter-roberta-base-sentiment-latest")
-        # Simulate a batch of tweets for evaluation
-        tweets = ["I love this!", "This is bad...", "I'm not sure about this."]
-        results = model(tweets)
-        # Simulated true labels (manually defined for simplicity)
-        y_true = [1, 0, 1]  # Manually defined true labels
-        y_score = [res["score"] for res in results]  # Extract probabilities
-    # Validate data and calculate Precision-Recall curve
-    if y_true is not None and y_score is not None and len(y_true) > 0 and len(y_score) > 0:
-        try:
-            # Calculate Precision, Recall, and AUC
-            precision, recall, _ = precision_recall_curve(y_true, y_score)
-            pr_auc = auc(recall, precision)
-            # Plot the PR curve
-            fig, ax = plt.subplots()
-            ax.plot(recall, precision, label=f"PR Curve (AUC = {pr_auc:.2f})")
-            ax.set_xlabel("Recall")
-            ax.set_ylabel("Precision")
-            ax.set_title("Precision-Recall Curve")
-            ax.legend(loc="best")
-            ax.grid()
-            # Display the plot
-            st.pyplot(fig)
-        except Exception as e:
-            st.error(f"An error occurred while generating the PR curve: {e}")
-    else:
-        st.info("Please select a model and ensure it generates valid data.")

 import numpy as np
 import matplotlib.pyplot as plt
 from sklearn.metrics import precision_recall_curve, auc
+from datasets import load_dataset
+from transformers import AutoTokenizer, AutoModelForSequenceClassification
+import torch
+from tqdm import tqdm
 # Sidebar navigation
 st.sidebar.title("App Navigation")
     st.title("Twitter Sentiment Analysis App")
     # Load sentiment analysis pipeline
+    tokenizer = AutoTokenizer.from_pretrained("cardiffnlp/twitter-roberta-base-sentiment-latest")
+    model = AutoModelForSequenceClassification.from_pretrained("cardiffnlp/twitter-roberta-base-sentiment-latest")
     # Input box for user to enter a tweet
     user_input = st.text_input("Enter a tweet to analyze:")
     if user_input:
+        # Tokenize and predict
+        inputs = tokenizer(user_input, return_tensors="pt", truncation=True, padding=True)
+        with torch.no_grad():
+            outputs = model(**inputs)
+            probs = torch.softmax(outputs.logits, dim=-1)
+        sentiment = "POSITIVE" if probs[0][1] > probs[0][0] else "NEGATIVE"
+        st.write(f"Sentiment: {sentiment}")
+        st.write(f"Scores: {probs[0].numpy()}")
 # Model Evaluation Page
 elif page == "Model Evaluation":
     st.title("Model Precision-Recall Evaluation")
+    # Load tweet_eval dataset
+    dataset_name = "cardiffnlp/tweet_eval"
+    task = st.selectbox("Choose a dataset task:", ["emoji", "sentiment"])
+    split = st.selectbox("Choose data split:", ["train", "validation", "test"])
+    # Load dataset
+    with st.spinner("Loading dataset..."):
+        dataset = load_dataset(dataset_name, task, split=split)
+    st.write(f"Loaded {len(dataset)} samples from {dataset_name} ({task}/{split}).")
+    # Load model
+    model_name = f"cardiffnlp/twitter-roberta-base-{task}"
+    tokenizer = AutoTokenizer.from_pretrained(model_name)
+    model = AutoModelForSequenceClassification.from_pretrained(model_name)
+    # Batch predict on dataset
+    batch_size = 16
+    predicted_probs = []
+    true_labels = dataset["label"]
+    texts = dataset["text"]
+    with st.spinner("Running model predictions..."):
+        for i in tqdm(range(0, len(texts), batch_size)):
+            batch = texts[i:i + batch_size]
+            inputs = tokenizer(batch, padding=True, truncation=True, return_tensors="pt")
+            with torch.no_grad():
+                outputs = model(**inputs)
+                probs = torch.softmax(outputs.logits, dim=-1)
+                predicted_probs.extend(probs.cpu().numpy())
+    # Select a class for PR Curve
+    num_classes = model.config.num_labels
+    class_to_evaluate = st.selectbox("Choose a class to evaluate:", list(range(num_classes)))
+    # Calculate Precision-Recall Curve
+    y_true = [1 if label == class_to_evaluate else 0 for label in true_labels]
+    y_score = [probs[class_to_evaluate] for probs in predicted_probs]
+    precision, recall, _ = precision_recall_curve(y_true, y_score)
+    pr_auc = auc(recall, precision)
+    # Plot PR Curve
+    fig, ax = plt.subplots()
+    ax.plot(recall, precision, label=f"PR Curve (AUC = {pr_auc:.2f})")
+    ax.set_xlabel("Recall")
+    ax.set_ylabel("Precision")
+    ax.set_title(f"Precision-Recall Curve for Class {class_to_evaluate}")
+    ax.legend(loc="best")
+    ax.grid()
+    st.pyplot(fig)
+    st.success(f"Precision-Recall AUC: {pr_auc:.2f}")