Zekun Wu committed on
Commit
180622c
1 Parent(s): 5fd4442
Files changed (1) hide show
  1. util/evaluation.py +34 -4
util/evaluation.py CHANGED
@@ -82,28 +82,58 @@ def statistical_tests(data):
82
  ('Privilege', 'Neutral')
83
  ]
84
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
85
  for (var1, var2) in pairs:
86
  pair_name = f'{var1} vs {var2}'
87
 
88
  # Mann-Whitney U Test
89
  mw_stat, mw_p = mannwhitneyu(data[f'{var1}{rank_suffix}'], data[f'{var2}{rank_suffix}'])
90
- pairwise_results[f'Mann-Whitney U Test {pair_name}'] = {"Statistic": mw_stat, "p-value": mw_p}
91
 
92
  # Wilcoxon Signed-Rank Test
93
  if len(data) > 20:
94
  wilcoxon_stat, wilcoxon_p = wilcoxon(data[f'{var1}{rank_suffix}'], data[f'{var2}{rank_suffix}'])
95
  else:
96
  wilcoxon_stat, wilcoxon_p = np.nan, "Sample size too small for Wilcoxon test."
97
- pairwise_results[f'Wilcoxon Test {pair_name}'] = {"Statistic": wilcoxon_stat, "p-value": wilcoxon_p}
98
 
99
  # Levene's Test for equality of variances
100
  levene_stat, levene_p = levene(data[f'{var1}{score_suffix}'], data[f'{var2}{score_suffix}'])
101
- pairwise_results[f'Levene\'s Test {pair_name}'] = {"Statistic": levene_stat, "p-value": levene_p}
102
 
103
  # T-test for independent samples
104
  t_stat, t_p = ttest_ind(data[f'{var1}{score_suffix}'], data[f'{var2}{score_suffix}'],
105
  equal_var=(levene_p > 0.05))
106
- pairwise_results[f'T-Test {pair_name}'] = {"Statistic": t_stat, "p-value": t_p}
107
 
108
  # ANOVA and post-hoc tests if applicable
109
  score_columns = [v + score_suffix for v in variables]
 
82
  ('Privilege', 'Neutral')
83
  ]
84
 
85
+ # for (var1, var2) in pairs:
86
+ # pair_name = f'{var1} vs {var2}'
87
+ #
88
+ # # Mann-Whitney U Test
89
+ # mw_stat, mw_p = mannwhitneyu(data[f'{var1}{rank_suffix}'], data[f'{var2}{rank_suffix}'])
90
+ # pairwise_results[f'Mann-Whitney U Test {pair_name}'] = {"Statistic": mw_stat, "p-value": mw_p}
91
+ #
92
+ # # Wilcoxon Signed-Rank Test
93
+ # if len(data) > 20:
94
+ # wilcoxon_stat, wilcoxon_p = wilcoxon(data[f'{var1}{rank_suffix}'], data[f'{var2}{rank_suffix}'])
95
+ # else:
96
+ # wilcoxon_stat, wilcoxon_p = np.nan, "Sample size too small for Wilcoxon test."
97
+ # pairwise_results[f'Wilcoxon Test {pair_name}'] = {"Statistic": wilcoxon_stat, "p-value": wilcoxon_p}
98
+ #
99
+ # # Levene's Test for equality of variances
100
+ # levene_stat, levene_p = levene(data[f'{var1}{score_suffix}'], data[f'{var2}{score_suffix}'])
101
+ # pairwise_results[f'Levene\'s Test {pair_name}'] = {"Statistic": levene_stat, "p-value": levene_p}
102
+ #
103
+ # # T-test for independent samples
104
+ # t_stat, t_p = ttest_ind(data[f'{var1}{score_suffix}'], data[f'{var2}{score_suffix}'],
105
+ # equal_var=(levene_p > 0.05))
106
+ # pairwise_results[f'T-Test {pair_name}'] = {"Statistic": t_stat, "p-value": t_p}
107
+
108
+ pairwise_results = {
109
+ 'Mann-Whitney U Test': {},
110
+ 'Wilcoxon Test': {},
111
+ 'Levene\'s Test': {},
112
+ 'T-Test': {}
113
+ }
114
+
115
  for (var1, var2) in pairs:
116
  pair_name = f'{var1} vs {var2}'
117
 
118
  # Mann-Whitney U Test
119
  mw_stat, mw_p = mannwhitneyu(data[f'{var1}{rank_suffix}'], data[f'{var2}{rank_suffix}'])
120
+ pairwise_results['Mann-Whitney U Test'][pair_name] = {"Statistic": mw_stat, "p-value": mw_p}
121
 
122
  # Wilcoxon Signed-Rank Test
123
  if len(data) > 20:
124
  wilcoxon_stat, wilcoxon_p = wilcoxon(data[f'{var1}{rank_suffix}'], data[f'{var2}{rank_suffix}'])
125
  else:
126
  wilcoxon_stat, wilcoxon_p = np.nan, "Sample size too small for Wilcoxon test."
127
+ pairwise_results['Wilcoxon Test'][pair_name] = {"Statistic": wilcoxon_stat, "p-value": wilcoxon_p}
128
 
129
  # Levene's Test for equality of variances
130
  levene_stat, levene_p = levene(data[f'{var1}{score_suffix}'], data[f'{var2}{score_suffix}'])
131
+ pairwise_results['Levene\'s Test'][pair_name] = {"Statistic": levene_stat, "p-value": levene_p}
132
 
133
  # T-test for independent samples
134
  t_stat, t_p = ttest_ind(data[f'{var1}{score_suffix}'], data[f'{var2}{score_suffix}'],
135
  equal_var=(levene_p > 0.05))
136
+ pairwise_results['T-Test'][pair_name] = {"Statistic": t_stat, "p-value": t_p}
137
 
138
  # ANOVA and post-hoc tests if applicable
139
  score_columns = [v + score_suffix for v in variables]