model update
Browse files- eval_ood/metric.first.sentence.paragraph_answer.question.asahi417_qg_squadshifts.amazon.json +1 -1
- eval_ood/metric.first.sentence.paragraph_answer.question.asahi417_qg_squadshifts.default.json +1 -1
- eval_ood/metric.first.sentence.paragraph_answer.question.asahi417_qg_squadshifts.new_wiki.json +1 -1
- eval_ood/metric.first.sentence.paragraph_answer.question.asahi417_qg_squadshifts.nyt.json +1 -1
- eval_ood/metric.first.sentence.paragraph_answer.question.asahi417_qg_squadshifts.reddit.json +1 -1
- eval_ood/samples.test.hyp.paragraph_answer.question.asahi417_qg_squadshifts.amazon.txt +0 -0
- eval_ood/samples.test.hyp.paragraph_answer.question.asahi417_qg_squadshifts.default.txt +0 -0
- eval_ood/samples.test.hyp.paragraph_answer.question.asahi417_qg_squadshifts.new_wiki.txt +0 -0
- eval_ood/samples.test.hyp.paragraph_answer.question.asahi417_qg_squadshifts.nyt.txt +0 -0
- eval_ood/samples.test.hyp.paragraph_answer.question.asahi417_qg_squadshifts.reddit.txt +0 -0
- eval_ood/samples.validation.hyp.paragraph_answer.question.asahi417_qg_squadshifts.amazon.txt +0 -0
- eval_ood/samples.validation.hyp.paragraph_answer.question.asahi417_qg_squadshifts.default.txt +0 -0
- eval_ood/samples.validation.hyp.paragraph_answer.question.asahi417_qg_squadshifts.new_wiki.txt +0 -0
- eval_ood/samples.validation.hyp.paragraph_answer.question.asahi417_qg_squadshifts.nyt.txt +0 -0
- eval_ood/samples.validation.hyp.paragraph_answer.question.asahi417_qg_squadshifts.reddit.txt +0 -0
eval_ood/metric.first.sentence.paragraph_answer.question.asahi417_qg_squadshifts.amazon.json
CHANGED
@@ -1 +1 @@
|
|
1 |
-
{"test": {"Bleu_1": 0.
|
|
|
1 |
+
{"validation": {"Bleu_1": 0.22807172771780135, "Bleu_2": 0.14302875909058343, "Bleu_3": 0.0943267118225361, "Bleu_4": 0.06397573073460441, "METEOR": 0.2200658878298197, "ROUGE_L": 0.24511379765662356, "BERTScore": 0.9079008184234665, "MoverScore": 0.606714651117478}, "test": {"Bleu_1": 0.2323498314281678, "Bleu_2": 0.14533654718622838, "Bleu_3": 0.09566220123845202, "Bleu_4": 0.06530369842068952, "METEOR": 0.2229994442645732, "ROUGE_L": 0.25030985091008146, "BERTScore": 0.9092814804525936, "MoverScore": 0.6086538514008419}}
|
eval_ood/metric.first.sentence.paragraph_answer.question.asahi417_qg_squadshifts.default.json
CHANGED
@@ -1 +1 @@
|
|
1 |
-
{"test": {"Bleu_1": 0.
|
|
|
1 |
+
{"validation": {"Bleu_1": 0.24343317972350043, "Bleu_2": 0.15816218902595877, "Bleu_3": 0.10917347021786453, "Bleu_4": 0.07824175435643511, "METEOR": 0.2383924625046418, "ROUGE_L": 0.2502527693569991, "BERTScore": 0.9174469174829358, "MoverScore": 0.6262604968663966}, "test": {"Bleu_1": 0.24615529618749774, "Bleu_2": 0.15963407302487692, "Bleu_3": 0.10978933228979144, "Bleu_4": 0.07839941048417529, "METEOR": 0.24046838149047955, "ROUGE_L": 0.25357667226247294, "BERTScore": 0.9182198703598111, "MoverScore": 0.6274693859765924}}
|
eval_ood/metric.first.sentence.paragraph_answer.question.asahi417_qg_squadshifts.new_wiki.json
CHANGED
@@ -1 +1 @@
|
|
1 |
-
{"test": {"Bleu_1": 0.
|
|
|
1 |
+
{"validation": {"Bleu_1": 0.29548978153628275, "Bleu_2": 0.20339994285369517, "Bleu_3": 0.14792639521090523, "Bleu_4": 0.11153987956921331, "METEOR": 0.2685051155769907, "ROUGE_L": 0.291721694521888, "BERTScore": 0.9303727465348341, "MoverScore": 0.6578535040761879}, "test": {"Bleu_1": 0.3007592217366819, "Bleu_2": 0.20544724608294512, "Bleu_3": 0.14867543544025819, "Bleu_4": 0.11118273173452982, "METEOR": 0.27315087810722966, "ROUGE_L": 0.2967546690273089, "BERTScore": 0.9322739617807421, "MoverScore": 0.6623000084761579}}
|
eval_ood/metric.first.sentence.paragraph_answer.question.asahi417_qg_squadshifts.nyt.json
CHANGED
@@ -1 +1 @@
|
|
1 |
-
{"test": {"Bleu_1": 0.
|
|
|
1 |
+
{"validation": {"Bleu_1": 0.24126775080164223, "Bleu_2": 0.1576880718998448, "Bleu_3": 0.11025568243123894, "Bleu_4": 0.07933611543656821, "METEOR": 0.25016737508611303, "ROUGE_L": 0.24744850178029204, "BERTScore": 0.9239760153976859, "MoverScore": 0.6400083650749762}, "test": {"Bleu_1": 0.24531707979889658, "Bleu_2": 0.16092958631387722, "Bleu_3": 0.1122699742387424, "Bleu_4": 0.08117757543966063, "METEOR": 0.25254205113198686, "ROUGE_L": 0.25292097720734297, "BERTScore": 0.9249009759439454, "MoverScore": 0.6406329128556304}}
|
eval_ood/metric.first.sentence.paragraph_answer.question.asahi417_qg_squadshifts.reddit.json
CHANGED
@@ -1 +1 @@
|
|
1 |
-
{"test": {"Bleu_1": 0.
|
|
|
1 |
+
{"validation": {"Bleu_1": 0.21672830897956055, "Bleu_2": 0.13458583690303294, "Bleu_3": 0.0885694934055027, "Bleu_4": 0.06124778357220166, "METEOR": 0.21629531044944675, "ROUGE_L": 0.22542144780446666, "BERTScore": 0.9102946136638357, "MoverScore": 0.6071781933330372}, "test": {"Bleu_1": 0.21511267314450663, "Bleu_2": 0.13363404569075632, "Bleu_3": 0.08756326944274698, "Bleu_4": 0.059525104157825456, "METEOR": 0.21499800504546457, "ROUGE_L": 0.22365090580055863, "BERTScore": 0.9095144685254328, "MoverScore": 0.6059332247878408}}
|
eval_ood/samples.test.hyp.paragraph_answer.question.asahi417_qg_squadshifts.amazon.txt
CHANGED
The diff for this file is too large to render.
See raw diff
|
|
eval_ood/samples.test.hyp.paragraph_answer.question.asahi417_qg_squadshifts.default.txt
CHANGED
The diff for this file is too large to render.
See raw diff
|
|
eval_ood/samples.test.hyp.paragraph_answer.question.asahi417_qg_squadshifts.new_wiki.txt
CHANGED
The diff for this file is too large to render.
See raw diff
|
|
eval_ood/samples.test.hyp.paragraph_answer.question.asahi417_qg_squadshifts.nyt.txt
CHANGED
The diff for this file is too large to render.
See raw diff
|
|
eval_ood/samples.test.hyp.paragraph_answer.question.asahi417_qg_squadshifts.reddit.txt
CHANGED
The diff for this file is too large to render.
See raw diff
|
|
eval_ood/samples.validation.hyp.paragraph_answer.question.asahi417_qg_squadshifts.amazon.txt
ADDED
The diff for this file is too large to render.
See raw diff
|
|
eval_ood/samples.validation.hyp.paragraph_answer.question.asahi417_qg_squadshifts.default.txt
ADDED
The diff for this file is too large to render.
See raw diff
|
|
eval_ood/samples.validation.hyp.paragraph_answer.question.asahi417_qg_squadshifts.new_wiki.txt
ADDED
The diff for this file is too large to render.
See raw diff
|
|
eval_ood/samples.validation.hyp.paragraph_answer.question.asahi417_qg_squadshifts.nyt.txt
ADDED
The diff for this file is too large to render.
See raw diff
|
|
eval_ood/samples.validation.hyp.paragraph_answer.question.asahi417_qg_squadshifts.reddit.txt
ADDED
The diff for this file is too large to render.
See raw diff
|
|