finiteautomata committed on
Commit
43e2fd9
1 Parent(s): a188b38

Add other datasets

Browse files
Files changed (1) hide show
  1. app.py +16 -6
app.py CHANGED
@@ -4,9 +4,6 @@ import streamlit as st
4
  from datasets import load_dataset
5
  from annotated_text import annotated_text
6
 
7
- # Load data
8
- ds = load_dataset("hs-knowledge/hateval_enriched")
9
-
10
 
11
  # Show highlighted ner entities in a tweet
12
  def display_ner(example):
@@ -69,9 +66,9 @@ def display_ner(example):
69
  annotated_text(*chunks)
70
 
71
 
72
- def display_text(example):
73
  # Use annotated_text to show entities
74
- text = example["text"]
75
 
76
  # Sort entities by start
77
  entities = sorted(example["entities"], key=lambda x: x["start"])
@@ -110,7 +107,20 @@ def display_text(example):
110
  annotated_text(*chunks)
111
 
112
 
113
- # Get first 1000 examples
 
 
 
 
 
 
 
 
 
 
 
 
 
114
 
115
  elements = random.choices(range(len(ds["train"])), k=50)
116
  ds["train"] = ds["train"].select(elements)
 
4
  from datasets import load_dataset
5
  from annotated_text import annotated_text
6
 
 
 
 
7
 
8
  # Show highlighted ner entities in a tweet
9
  def display_ner(example):
 
66
  annotated_text(*chunks)
67
 
68
 
69
+ def display_text(example, text_column):
70
  # Use annotated_text to show entities
71
+ text = example[text_column]
72
 
73
  # Sort entities by start
74
  entities = sorted(example["entities"], key=lambda x: x["start"])
 
107
  annotated_text(*chunks)
108
 
109
 
110
+ # selectbox to choose dataset
111
+
112
+ selected_dataset = st.sidebar.selectbox(
113
+ "Select dataset", ["hateval_enriched", "sbf-enriched", "hatecheck-enriched"]
114
+ )
115
+
116
+ # Load data
117
+ ds = load_dataset(f"hs-knowledge/{selected_dataset}")
118
+
119
+ text_column = {
120
+ "hateval_enriched": "text",
121
+ "sbf-enriched": "post",
122
+ "hatecheck-enriched": "test_case",
123
+ }
124
 
125
  elements = random.choices(range(len(ds["train"])), k=50)
126
  ds["train"] = ds["train"].select(elements)