aq_bert_gaq_mt / test_results.txt
anlausch's picture
Upload test_results.txt
fad28f0
cogency = {'mae': 0.3592796, 'mse': 0.1983012, 'pearsonr': 0.5809292900460671, 'pearsonp': 1.9064123938873942e-10}
effectiveness = {'mae': 0.42302832, 'mse': 0.2679618, 'pearsonr': 0.6203233528426574, 'pearsonp': 4.571428090457124e-12}
overall = {'mae': 0.38855445, 'mse': 0.22525525, 'pearsonr': 0.5235363955730953, 'pearsonp': 1.9365543006731483e-08}
reasonableness = {'mae': 0.35993263, 'mse': 0.20340253, 'pearsonr': 0.5734174888262382, 'pearsonp': 3.673681326066232e-10}