model update
Browse files- eval_ood/metric.first.sentence.paragraph_answer.question.asahi417_qg_dequad.default.json +1 -0
- eval_ood/metric.first.sentence.paragraph_answer.question.asahi417_qg_esquad.default.json +1 -0
- eval_ood/metric.first.sentence.paragraph_answer.question.asahi417_qg_itquad.default.json +1 -0
- eval_ood/metric.first.sentence.paragraph_answer.question.asahi417_qg_jaquad.default.json +1 -0
- eval_ood/metric.first.sentence.paragraph_answer.question.asahi417_qg_koquad.default.json +1 -0
- eval_ood/metric.first.sentence.paragraph_answer.question.asahi417_qg_ruquad.default.json +1 -0
- eval_ood/samples.test.hyp.paragraph_answer.question.asahi417_qg_dequad.default.txt +0 -0
- eval_ood/samples.test.hyp.paragraph_answer.question.asahi417_qg_esquad.default.txt +0 -0
- eval_ood/samples.test.hyp.paragraph_answer.question.asahi417_qg_itquad.default.txt +0 -0
- eval_ood/samples.test.hyp.paragraph_answer.question.asahi417_qg_jaquad.default.txt +0 -0
- eval_ood/samples.test.hyp.paragraph_answer.question.asahi417_qg_koquad.default.txt +0 -0
- eval_ood/samples.test.hyp.paragraph_answer.question.asahi417_qg_ruquad.default.txt +0 -0
- eval_ood/samples.validation.hyp.paragraph_answer.question.asahi417_qg_dequad.default.txt +0 -0
- eval_ood/samples.validation.hyp.paragraph_answer.question.asahi417_qg_esquad.default.txt +0 -0
- eval_ood/samples.validation.hyp.paragraph_answer.question.asahi417_qg_itquad.default.txt +0 -0
- eval_ood/samples.validation.hyp.paragraph_answer.question.asahi417_qg_jaquad.default.txt +0 -0
- eval_ood/samples.validation.hyp.paragraph_answer.question.asahi417_qg_koquad.default.txt +0 -0
- eval_ood/samples.validation.hyp.paragraph_answer.question.asahi417_qg_ruquad.default.txt +0 -0
eval_ood/metric.first.sentence.paragraph_answer.question.asahi417_qg_dequad.default.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"validation": {"Bleu_1": 0.016563347539712486, "Bleu_2": 0.00164017232799013, "Bleu_3": 5.485931952561731e-09, "Bleu_4": 1.0398886251298505e-11, "METEOR": 0.048242022461103554, "ROUGE_L": 0.016203570372304816, "BERTScore": 0.7371850965299024, "MoverScore": 0.5048791085509114}, "test": {"Bleu_1": 0.0155755658311017, "Bleu_2": 0.0013001277535285665, "Bleu_3": 4.696915431372903e-09, "Bleu_4": 9.242783121165897e-12, "METEOR": 0.04809700451843158, "ROUGE_L": 0.01556150764938016, "BERTScore": 0.7353078946893743, "MoverScore": 0.5036973829954939}}
|
eval_ood/metric.first.sentence.paragraph_answer.question.asahi417_qg_esquad.default.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"validation": {"Bleu_1": 0.06400882359306387, "Bleu_2": 0.028423554237600325, "Bleu_3": 0.013484449091511863, "Bleu_4": 0.006908746027721992, "METEOR": 0.0580261757943717, "ROUGE_L": 0.05725959048259657, "BERTScore": 0.739460686351553, "MoverScore": 0.503132819197482}, "test": {"Bleu_1": 0.05698384656966584, "Bleu_2": 0.024183325154997555, "Bleu_3": 0.011520527213918438, "Bleu_4": 0.0059191752064594125, "METEOR": 0.06021086135293597, "ROUGE_L": 0.05208940592236566, "BERTScore": 0.7494422899749911, "MoverScore": 0.5062373132800192}}
|
eval_ood/metric.first.sentence.paragraph_answer.question.asahi417_qg_itquad.default.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"validation": {"Bleu_1": 0.055887226950777295, "Bleu_2": 0.023797780823067778, "Bleu_3": 0.011418151261135904, "Bleu_4": 0.005907310966943627, "METEOR": 0.06478583217280727, "ROUGE_L": 0.04971947524396246, "BERTScore": 0.7357749120412369, "MoverScore": 0.5055480082720634}, "test": {"Bleu_1": 0.05627130996069784, "Bleu_2": 0.023968061444368343, "Bleu_3": 0.01119607925884517, "Bleu_4": 0.005438910607183992, "METEOR": 0.05890828426558759, "ROUGE_L": 0.05010570221421983, "BERTScore": 0.7260160158030385, "MoverScore": 0.5023119088393686}}
|
eval_ood/metric.first.sentence.paragraph_answer.question.asahi417_qg_jaquad.default.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"validation": {"Bleu_1": 0.03783346772233188, "Bleu_2": 0.0015411816247711597, "Bleu_3": 3.4629325178281635e-09, "Bleu_4": 5.350206732357571e-12, "METEOR": 0.005292131929790666, "ROUGE_L": 0.061958614759464875, "BERTScore": 0.6608086721605609, "MoverScore": 0.4648730149566324}, "test": {"Bleu_1": 0.03623832670553565, "Bleu_2": 0.0024163606906520323, "Bleu_3": 0.0006233487833399195, "Bleu_4": 4.4114578660129224e-08, "METEOR": 0.005149267426183168, "ROUGE_L": 0.06084267343290677, "BERTScore": 0.6608093198082075, "MoverScore": 0.46526108687696893}}
|
eval_ood/metric.first.sentence.paragraph_answer.question.asahi417_qg_koquad.default.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"validation": {"Bleu_1": 0.0006134969325153261, "Bleu_2": 0.0002227838918347579, "Bleu_3": 0.00010324678023422135, "Bleu_4": 1.2819708463917865e-08, "METEOR": 0.007516731424749895, "ROUGE_L": 0.0007456867598022614, "BERTScore": 0.6650788443154896, "MoverScore": 0.45807532117648786}, "test": {"Bleu_1": 0.0004947136314807415, "Bleu_2": 0.00012325032170095948, "Bleu_3": 6.343141508957129e-10, "Bleu_4": 1.4750917137316939e-12, "METEOR": 0.007310046912436679, "ROUGE_L": 0.0006466767450454226, "BERTScore": 0.6634288882769679, "MoverScore": 0.4586124640357038}}
|
eval_ood/metric.first.sentence.paragraph_answer.question.asahi417_qg_ruquad.default.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"validation": {"Bleu_1": 0.009066924306045688, "Bleu_2": 0.0008615643170394829, "Bleu_3": 0.0002566749503857388, "Bleu_4": 2.5671907994227123e-08, "METEOR": 0.017725042642279257, "ROUGE_L": 0.009948558551829344, "BERTScore": 0.7102904897794929, "MoverScore": 0.4913488465255146}, "test": {"Bleu_1": 0.008929234424890308, "Bleu_2": 0.0007401163336141037, "Bleu_3": 2.3187462841659724e-09, "Bleu_4": 4.229109829516021e-12, "METEOR": 0.017796529053904556, "ROUGE_L": 0.009881091250723615, "BERTScore": 0.7089446693028568, "MoverScore": 0.49098728551715626}}
|
eval_ood/samples.test.hyp.paragraph_answer.question.asahi417_qg_dequad.default.txt
ADDED
The diff for this file is too large to render.
See raw diff
|
|
eval_ood/samples.test.hyp.paragraph_answer.question.asahi417_qg_esquad.default.txt
ADDED
The diff for this file is too large to render.
See raw diff
|
|
eval_ood/samples.test.hyp.paragraph_answer.question.asahi417_qg_itquad.default.txt
ADDED
The diff for this file is too large to render.
See raw diff
|
|
eval_ood/samples.test.hyp.paragraph_answer.question.asahi417_qg_jaquad.default.txt
ADDED
The diff for this file is too large to render.
See raw diff
|
|
eval_ood/samples.test.hyp.paragraph_answer.question.asahi417_qg_koquad.default.txt
ADDED
The diff for this file is too large to render.
See raw diff
|
|
eval_ood/samples.test.hyp.paragraph_answer.question.asahi417_qg_ruquad.default.txt
ADDED
The diff for this file is too large to render.
See raw diff
|
|
eval_ood/samples.validation.hyp.paragraph_answer.question.asahi417_qg_dequad.default.txt
ADDED
The diff for this file is too large to render.
See raw diff
|
|
eval_ood/samples.validation.hyp.paragraph_answer.question.asahi417_qg_esquad.default.txt
ADDED
The diff for this file is too large to render.
See raw diff
|
|
eval_ood/samples.validation.hyp.paragraph_answer.question.asahi417_qg_itquad.default.txt
ADDED
The diff for this file is too large to render.
See raw diff
|
|
eval_ood/samples.validation.hyp.paragraph_answer.question.asahi417_qg_jaquad.default.txt
ADDED
The diff for this file is too large to render.
See raw diff
|
|
eval_ood/samples.validation.hyp.paragraph_answer.question.asahi417_qg_koquad.default.txt
ADDED
The diff for this file is too large to render.
See raw diff
|
|
eval_ood/samples.validation.hyp.paragraph_answer.question.asahi417_qg_ruquad.default.txt
ADDED
The diff for this file is too large to render.
See raw diff
|
|