Spaces:
Sleeping
Sleeping
Zekun Wu
committed on
Commit
•
180622c
1
Parent(s):
5fd4442
update
Browse files- util/evaluation.py +34 -4
util/evaluation.py
CHANGED
@@ -82,28 +82,58 @@ def statistical_tests(data):
|
|
82 |
('Privilege', 'Neutral')
|
83 |
]
|
84 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
85 |
for (var1, var2) in pairs:
|
86 |
pair_name = f'{var1} vs {var2}'
|
87 |
|
88 |
# Mann-Whitney U Test
|
89 |
mw_stat, mw_p = mannwhitneyu(data[f'{var1}{rank_suffix}'], data[f'{var2}{rank_suffix}'])
|
90 |
-
pairwise_results[f'Mann-Whitney U Test {pair_name}'] = {"Statistic": mw_stat, "p-value": mw_p}
|
91 |
|
92 |
# Wilcoxon Signed-Rank Test
|
93 |
if len(data) > 20:
|
94 |
wilcoxon_stat, wilcoxon_p = wilcoxon(data[f'{var1}{rank_suffix}'], data[f'{var2}{rank_suffix}'])
|
95 |
else:
|
96 |
wilcoxon_stat, wilcoxon_p = np.nan, "Sample size too small for Wilcoxon test."
|
97 |
-
pairwise_results[f'Wilcoxon Test {pair_name}'] = {"Statistic": wilcoxon_stat, "p-value": wilcoxon_p}
|
98 |
|
99 |
# Levene's Test for equality of variances
|
100 |
levene_stat, levene_p = levene(data[f'{var1}{score_suffix}'], data[f'{var2}{score_suffix}'])
|
101 |
-
pairwise_results[f'Levene\'s Test {pair_name}'] = {"Statistic": levene_stat, "p-value": levene_p}
|
102 |
|
103 |
# T-test for independent samples
|
104 |
t_stat, t_p = ttest_ind(data[f'{var1}{score_suffix}'], data[f'{var2}{score_suffix}'],
|
105 |
equal_var=(levene_p > 0.05))
|
106 |
-
pairwise_results[f'T-Test {pair_name}'] = {"Statistic": t_stat, "p-value": t_p}
|
107 |
|
108 |
# ANOVA and post-hoc tests if applicable
|
109 |
score_columns = [v + score_suffix for v in variables]
|
|
|
82 |
('Privilege', 'Neutral')
|
83 |
]
|
84 |
|
85 |
+
# for (var1, var2) in pairs:
|
86 |
+
# pair_name = f'{var1} vs {var2}'
|
87 |
+
#
|
88 |
+
# # Mann-Whitney U Test
|
89 |
+
# mw_stat, mw_p = mannwhitneyu(data[f'{var1}{rank_suffix}'], data[f'{var2}{rank_suffix}'])
|
90 |
+
# pairwise_results[f'Mann-Whitney U Test {pair_name}'] = {"Statistic": mw_stat, "p-value": mw_p}
|
91 |
+
#
|
92 |
+
# # Wilcoxon Signed-Rank Test
|
93 |
+
# if len(data) > 20:
|
94 |
+
# wilcoxon_stat, wilcoxon_p = wilcoxon(data[f'{var1}{rank_suffix}'], data[f'{var2}{rank_suffix}'])
|
95 |
+
# else:
|
96 |
+
# wilcoxon_stat, wilcoxon_p = np.nan, "Sample size too small for Wilcoxon test."
|
97 |
+
# pairwise_results[f'Wilcoxon Test {pair_name}'] = {"Statistic": wilcoxon_stat, "p-value": wilcoxon_p}
|
98 |
+
#
|
99 |
+
# # Levene's Test for equality of variances
|
100 |
+
# levene_stat, levene_p = levene(data[f'{var1}{score_suffix}'], data[f'{var2}{score_suffix}'])
|
101 |
+
# pairwise_results[f'Levene\'s Test {pair_name}'] = {"Statistic": levene_stat, "p-value": levene_p}
|
102 |
+
#
|
103 |
+
# # T-test for independent samples
|
104 |
+
# t_stat, t_p = ttest_ind(data[f'{var1}{score_suffix}'], data[f'{var2}{score_suffix}'],
|
105 |
+
# equal_var=(levene_p > 0.05))
|
106 |
+
# pairwise_results[f'T-Test {pair_name}'] = {"Statistic": t_stat, "p-value": t_p}
|
107 |
+
|
108 |
+
pairwise_results = {
|
109 |
+
'Mann-Whitney U Test': {},
|
110 |
+
'Wilcoxon Test': {},
|
111 |
+
'Levene\'s Test': {},
|
112 |
+
'T-Test': {}
|
113 |
+
}
|
114 |
+
|
115 |
for (var1, var2) in pairs:
|
116 |
pair_name = f'{var1} vs {var2}'
|
117 |
|
118 |
# Mann-Whitney U Test
|
119 |
mw_stat, mw_p = mannwhitneyu(data[f'{var1}{rank_suffix}'], data[f'{var2}{rank_suffix}'])
|
120 |
+
pairwise_results['Mann-Whitney U Test'][pair_name] = {"Statistic": mw_stat, "p-value": mw_p}
|
121 |
|
122 |
# Wilcoxon Signed-Rank Test
|
123 |
if len(data) > 20:
|
124 |
wilcoxon_stat, wilcoxon_p = wilcoxon(data[f'{var1}{rank_suffix}'], data[f'{var2}{rank_suffix}'])
|
125 |
else:
|
126 |
wilcoxon_stat, wilcoxon_p = np.nan, "Sample size too small for Wilcoxon test."
|
127 |
+
pairwise_results['Wilcoxon Test'][pair_name] = {"Statistic": wilcoxon_stat, "p-value": wilcoxon_p}
|
128 |
|
129 |
# Levene's Test for equality of variances
|
130 |
levene_stat, levene_p = levene(data[f'{var1}{score_suffix}'], data[f'{var2}{score_suffix}'])
|
131 |
+
pairwise_results['Levene\'s Test'][pair_name] = {"Statistic": levene_stat, "p-value": levene_p}
|
132 |
|
133 |
# T-test for independent samples
|
134 |
t_stat, t_p = ttest_ind(data[f'{var1}{score_suffix}'], data[f'{var2}{score_suffix}'],
|
135 |
equal_var=(levene_p > 0.05))
|
136 |
+
pairwise_results['T-Test'][pair_name] = {"Statistic": t_stat, "p-value": t_p}
|
137 |
|
138 |
# ANOVA and post-hoc tests if applicable
|
139 |
score_columns = [v + score_suffix for v in variables]
|