Zekun Wu committed on
Commit
5ca3be7
1 Parent(s): 3fe3b4c
Files changed (1) hide show
  1. util/evaluation.py +6 -5
util/evaluation.py CHANGED
@@ -90,27 +90,28 @@ def statistical_tests(data):
90
  }
91
 
92
  for (var1, var2) in pairs:
93
- pair_name = f'{var1} vs {var2}'
 
94
 
95
  # Mann-Whitney U Test
96
  mw_stat, mw_p = mannwhitneyu(data[f'{var1}{rank_suffix}'], data[f'{var2}{rank_suffix}'])
97
- pairwise_results['Mann-Whitney U Test'][pair_name+ rank_suffix] = {"Statistic": mw_stat, "p-value": mw_p}
98
 
99
  # Wilcoxon Signed-Rank Test
100
  if len(data) > 20:
101
  wilcoxon_stat, wilcoxon_p = wilcoxon(data[f'{var1}{rank_suffix}'], data[f'{var2}{rank_suffix}'])
102
  else:
103
  wilcoxon_stat, wilcoxon_p = np.nan, "Sample size too small for Wilcoxon test."
104
- pairwise_results['Wilcoxon Test'][pair_name+ rank_suffix] = {"Statistic": wilcoxon_stat, "p-value": wilcoxon_p}
105
 
106
  # Levene's Test for equality of variances
107
  levene_stat, levene_p = levene(data[f'{var1}{score_suffix}'], data[f'{var2}{score_suffix}'])
108
- pairwise_results['Levene\'s Test'][pair_name+score_suffix] = {"Statistic": levene_stat, "p-value": levene_p}
109
 
110
  # T-test for independent samples
111
  t_stat, t_p = ttest_ind(data[f'{var1}{score_suffix}'], data[f'{var2}{score_suffix}'],
112
  equal_var=(levene_p > 0.05))
113
- pairwise_results['T-Test'][pair_name+score_suffix] = {"Statistic": t_stat, "p-value": t_p}
114
 
115
  # ANOVA and post-hoc tests if applicable
116
  score_columns = [v + score_suffix for v in variables]
 
90
  }
91
 
92
  for (var1, var2) in pairs:
93
+ pair_name_rank = f'{var1}{rank_suffix} vs {var2}{rank_suffix}'
94
+ pair_name_score = f'{var1}{score_suffix} vs {var2}{score_suffix}'
95
 
96
  # Mann-Whitney U Test
97
  mw_stat, mw_p = mannwhitneyu(data[f'{var1}{rank_suffix}'], data[f'{var2}{rank_suffix}'])
98
+ pairwise_results['Mann-Whitney U Test'][pair_name_rank] = {"Statistic": mw_stat, "p-value": mw_p}
99
 
100
  # Wilcoxon Signed-Rank Test
101
  if len(data) > 20:
102
  wilcoxon_stat, wilcoxon_p = wilcoxon(data[f'{var1}{rank_suffix}'], data[f'{var2}{rank_suffix}'])
103
  else:
104
  wilcoxon_stat, wilcoxon_p = np.nan, "Sample size too small for Wilcoxon test."
105
+ pairwise_results['Wilcoxon Test'][pair_name_rank] = {"Statistic": wilcoxon_stat, "p-value": wilcoxon_p}
106
 
107
  # Levene's Test for equality of variances
108
  levene_stat, levene_p = levene(data[f'{var1}{score_suffix}'], data[f'{var2}{score_suffix}'])
109
+ pairwise_results['Levene\'s Test'][pair_name_score] = {"Statistic": levene_stat, "p-value": levene_p}
110
 
111
  # T-test for independent samples
112
  t_stat, t_p = ttest_ind(data[f'{var1}{score_suffix}'], data[f'{var2}{score_suffix}'],
113
  equal_var=(levene_p > 0.05))
114
+ pairwise_results['T-Test'][pair_name_score] = {"Statistic": t_stat, "p-value": t_p}
115
 
116
  # ANOVA and post-hoc tests if applicable
117
  score_columns = [v + score_suffix for v in variables]