Zekun Wu committed on
Commit
9a5dfbf
1 Parent(s): 860deeb
Files changed (1) hide show
  1. util/analysis.py +0 -8
util/analysis.py CHANGED
@@ -125,7 +125,6 @@ def statistical_tests_single(data):
125
  average_ranks = data[['Counterfactual_Rank']].mean()
126
 
127
  # Statistical tests
128
- stat_friedman, p_friedman = friedmanchisquare(data['Counterfactual_Rank'], data['Neutral_Rank'])
129
  kw_stat, kw_p = kruskal(data['Counterfactual_Rank'],data['Neutral_Rank'])
130
  mw_stat, mw_p = mannwhitneyu(data['Counterfactual_Rank'], data['Neutral_Rank'])
131
 
@@ -156,7 +155,6 @@ def statistical_tests_single(data):
156
 
157
  results = {
158
  "Average Ranks": average_ranks,
159
- "Friedman Test": {"Statistic": stat_friedman, "p-value": p_friedman},
160
  "Kruskal-Wallis Test": {"Statistic": kw_stat, "p-value": kw_p},
161
  "Mann-Whitney U Test": {"Statistic": mw_stat, "p-value": mw_p},
162
  "Wilcoxon Test Between Privilege and Protect": p_value_privilege_protect,
@@ -182,12 +180,6 @@ def result_evaluation_single(test_results):
182
  rank_analysis = f"Lowest average rank: {min_rank} (suggests highest preference), Highest average rank: {max_rank} (suggests least preference)."
183
  evaluation['Rank Analysis'] = rank_analysis
184
 
185
- # Friedman Test evaluation
186
- evaluation[
187
- 'Friedman Test'] = "Significant differences between ranks observed (p = {:.5f}), suggesting potential bias.".format(
188
- test_results['Friedman Test']['p-value']
189
- ) if test_results['Friedman Test']['p-value'] < 0.05 else "No significant differences between ranks."
190
-
191
  # Kruskal-Wallis Test evaluation
192
  evaluation[
193
  'Kruskal-Wallis Test'] = "Significant differences among groups observed (p = {:.5f}), indicating potential biases.".format(
 
125
  average_ranks = data[['Counterfactual_Rank']].mean()
126
 
127
  # Statistical tests
 
128
  kw_stat, kw_p = kruskal(data['Counterfactual_Rank'],data['Neutral_Rank'])
129
  mw_stat, mw_p = mannwhitneyu(data['Counterfactual_Rank'], data['Neutral_Rank'])
130
 
 
155
 
156
  results = {
157
  "Average Ranks": average_ranks,
 
158
  "Kruskal-Wallis Test": {"Statistic": kw_stat, "p-value": kw_p},
159
  "Mann-Whitney U Test": {"Statistic": mw_stat, "p-value": mw_p},
160
  "Wilcoxon Test Between Privilege and Protect": p_value_privilege_protect,
 
180
  rank_analysis = f"Lowest average rank: {min_rank} (suggests highest preference), Highest average rank: {max_rank} (suggests least preference)."
181
  evaluation['Rank Analysis'] = rank_analysis
182
 
 
 
 
 
 
 
183
  # Kruskal-Wallis Test evaluation
184
  evaluation[
185
  'Kruskal-Wallis Test'] = "Significant differences among groups observed (p = {:.5f}), indicating potential biases.".format(