Spaces:

Hellisotherpeople
/

Interpretable_Text_Classification_And_Clustering

Running

App Files Community

Rainsilves committed on Dec 19, 2021

Commit

ee8a91d

•

1 Parent(s): bd550e0

more performance improvements

Browse files

Files changed (1) hide show

interpretable_text_clustering.py +3 -3

interpretable_text_clustering.py CHANGED Viewed

@@ -40,7 +40,7 @@ task = form.radio("Which task are we solving?", ('Classification', 'Clustering')
 dataset_name = form.text_area("Enter the name of the huggingface Dataset to do analysis of:", value = "Hellisotherpeople/DebateSum")
 dataset_name_2 = form.text_area("Enter the name of the config for the dataset if it has one", value = "")
 split_name = form.text_area("Enter the name of the split of the dataset that you want to use", value = "train")
-number_of_records = form.number_input("Enter the number of documents that you want to analyze from the dataset", value = 200)
 column_name = form.text_area("Enter the name of the column that we are doing analysis on (the X value)", value = "Full-Document")
 if task == "Classification":
@@ -141,7 +141,7 @@ text_example = """Judge Leon last week questioned the effectiveness of the gover
 form_explainer = st.sidebar.form("explainer_form")
 form_explainer.header("Explainer Settings")
 position_dep = form_explainer.checkbox("Check this if you want to take into account the position of a word in the interpretation", value = False)
-number_samples = form_explainer.number_input("Enter the number of explainer peterbuted samples, higher creates a better explanation but takes longer", value = 5000)
 char_based = form_explainer.checkbox("Check this if you want to use a character based explanier", value = False)
 form_explainer.form_submit_button("Submit")
@@ -150,7 +150,7 @@ te = TextExplainer(random_state=42, char_based=char_based, n_samples = number_sa
 input_choice = st.checkbox("Check this if you want to enter your own example to explain", value = False)
 if input_choice == False:
-    record_to_explain = st.number_input("Enter the index of the document from the original dataset to interpret", value = 151)
     te.fit(df[column_name][record_to_explain], text_clf.predict_proba)
     if task == "Classification":
         st.write("Ground truth label")

 dataset_name = form.text_area("Enter the name of the huggingface Dataset to do analysis of:", value = "Hellisotherpeople/DebateSum")
 dataset_name_2 = form.text_area("Enter the name of the config for the dataset if it has one", value = "")
 split_name = form.text_area("Enter the name of the split of the dataset that you want to use", value = "train")
+number_of_records = form.number_input("Enter the number of documents that you want to analyze from the dataset", value = 50)
 column_name = form.text_area("Enter the name of the column that we are doing analysis on (the X value)", value = "Full-Document")
 if task == "Classification":
 form_explainer = st.sidebar.form("explainer_form")
 form_explainer.header("Explainer Settings")
 position_dep = form_explainer.checkbox("Check this if you want to take into account the position of a word in the interpretation", value = False)
+number_samples = form_explainer.number_input("Enter the number of explainer peterbuted samples, higher creates a better explanation but takes longer", value = 1000)
 char_based = form_explainer.checkbox("Check this if you want to use a character based explanier", value = False)
 form_explainer.form_submit_button("Submit")
 input_choice = st.checkbox("Check this if you want to enter your own example to explain", value = False)
 if input_choice == False:
+    record_to_explain = st.number_input("Enter the index of the document from the original dataset to interpret", value = 30)
     te.fit(df[column_name][record_to_explain], text_clf.predict_proba)
     if task == "Classification":
         st.write("Ground truth label")