asahi417 committed on
Commit
620ed38
1 Parent(s): 76c68b1

model update

Browse files
eval_ood/metric.first.sentence.paragraph_answer.question.asahi417_qg_squadshifts.amazon.json CHANGED
@@ -1 +1 @@
1
- {"test": {"Bleu_1": 0.23478930923830185, "Bleu_2": 0.1470683817289908, "Bleu_3": 0.09687166236849479, "Bleu_4": 0.06591939807481897, "METEOR": 0.22302475776082759, "ROUGE_L": 0.25109091232896347, "BERTScore": 0.9089399299362496, "MoverScore": 0.6082623762984268}}
 
1
+ {"validation": {"Bleu_1": 0.22807172771780135, "Bleu_2": 0.14302875909058343, "Bleu_3": 0.0943267118225361, "Bleu_4": 0.06397573073460441, "METEOR": 0.2200658878298197, "ROUGE_L": 0.24511379765662356, "BERTScore": 0.9079008184234665, "MoverScore": 0.606714651117478}, "test": {"Bleu_1": 0.2323498314281678, "Bleu_2": 0.14533654718622838, "Bleu_3": 0.09566220123845202, "Bleu_4": 0.06530369842068952, "METEOR": 0.2229994442645732, "ROUGE_L": 0.25030985091008146, "BERTScore": 0.9092814804525936, "MoverScore": 0.6086538514008419}}
eval_ood/metric.first.sentence.paragraph_answer.question.asahi417_qg_squadshifts.default.json CHANGED
@@ -1 +1 @@
1
- {"test": {"Bleu_1": 0.24961893211984934, "Bleu_2": 0.16224827348484944, "Bleu_3": 0.11189327527628831, "Bleu_4": 0.08018033757402318, "METEOR": 0.2415579184277559, "ROUGE_L": 0.2552366436867511, "BERTScore": 0.9180997168082414, "MoverScore": 0.6275456813517103}}
 
1
+ {"validation": {"Bleu_1": 0.24343317972350043, "Bleu_2": 0.15816218902595877, "Bleu_3": 0.10917347021786453, "Bleu_4": 0.07824175435643511, "METEOR": 0.2383924625046418, "ROUGE_L": 0.2502527693569991, "BERTScore": 0.9174469174829358, "MoverScore": 0.6262604968663966}, "test": {"Bleu_1": 0.24615529618749774, "Bleu_2": 0.15963407302487692, "Bleu_3": 0.10978933228979144, "Bleu_4": 0.07839941048417529, "METEOR": 0.24046838149047955, "ROUGE_L": 0.25357667226247294, "BERTScore": 0.9182198703598111, "MoverScore": 0.6274693859765924}}
eval_ood/metric.first.sentence.paragraph_answer.question.asahi417_qg_squadshifts.new_wiki.json CHANGED
@@ -1 +1 @@
1
- {"test": {"Bleu_1": 0.3069051037723495, "Bleu_2": 0.21124403131423797, "Bleu_3": 0.15382059116535382, "Bleu_4": 0.1158431914489352, "METEOR": 0.2761422239981249, "ROUGE_L": 0.30019623715409394, "BERTScore": 0.9322687200707555, "MoverScore": 0.6625598086909308}}
 
1
+ {"validation": {"Bleu_1": 0.29548978153628275, "Bleu_2": 0.20339994285369517, "Bleu_3": 0.14792639521090523, "Bleu_4": 0.11153987956921331, "METEOR": 0.2685051155769907, "ROUGE_L": 0.291721694521888, "BERTScore": 0.9303727465348341, "MoverScore": 0.6578535040761879}, "test": {"Bleu_1": 0.3007592217366819, "Bleu_2": 0.20544724608294512, "Bleu_3": 0.14867543544025819, "Bleu_4": 0.11118273173452982, "METEOR": 0.27315087810722966, "ROUGE_L": 0.2967546690273089, "BERTScore": 0.9322739617807421, "MoverScore": 0.6623000084761579}}
eval_ood/metric.first.sentence.paragraph_answer.question.asahi417_qg_squadshifts.nyt.json CHANGED
@@ -1 +1 @@
1
- {"test": {"Bleu_1": 0.24796297638398285, "Bleu_2": 0.16248797271179893, "Bleu_3": 0.11351554864896994, "Bleu_4": 0.08224137833073777, "METEOR": 0.2537118945936586, "ROUGE_L": 0.2533059879938537, "BERTScore": 0.9247776169969026, "MoverScore": 0.6414352251279016}}
 
1
+ {"validation": {"Bleu_1": 0.24126775080164223, "Bleu_2": 0.1576880718998448, "Bleu_3": 0.11025568243123894, "Bleu_4": 0.07933611543656821, "METEOR": 0.25016737508611303, "ROUGE_L": 0.24744850178029204, "BERTScore": 0.9239760153976859, "MoverScore": 0.6400083650749762}, "test": {"Bleu_1": 0.24531707979889658, "Bleu_2": 0.16092958631387722, "Bleu_3": 0.1122699742387424, "Bleu_4": 0.08117757543966063, "METEOR": 0.25254205113198686, "ROUGE_L": 0.25292097720734297, "BERTScore": 0.9249009759439454, "MoverScore": 0.6406329128556304}}
eval_ood/metric.first.sentence.paragraph_answer.question.asahi417_qg_squadshifts.reddit.json CHANGED
@@ -1 +1 @@
1
- {"test": {"Bleu_1": 0.21878514571481367, "Bleu_2": 0.13599900424688438, "Bleu_3": 0.08922012763962954, "Bleu_4": 0.06100378824252892, "METEOR": 0.2160021098025375, "ROUGE_L": 0.22646405222542731, "BERTScore": 0.9097197203173146, "MoverScore": 0.6060461610454748}}
 
1
+ {"validation": {"Bleu_1": 0.21672830897956055, "Bleu_2": 0.13458583690303294, "Bleu_3": 0.0885694934055027, "Bleu_4": 0.06124778357220166, "METEOR": 0.21629531044944675, "ROUGE_L": 0.22542144780446666, "BERTScore": 0.9102946136638357, "MoverScore": 0.6071781933330372}, "test": {"Bleu_1": 0.21511267314450663, "Bleu_2": 0.13363404569075632, "Bleu_3": 0.08756326944274698, "Bleu_4": 0.059525104157825456, "METEOR": 0.21499800504546457, "ROUGE_L": 0.22365090580055863, "BERTScore": 0.9095144685254328, "MoverScore": 0.6059332247878408}}
eval_ood/samples.test.hyp.paragraph_answer.question.asahi417_qg_squadshifts.amazon.txt CHANGED
The diff for this file is too large to render. See raw diff
 
eval_ood/samples.test.hyp.paragraph_answer.question.asahi417_qg_squadshifts.default.txt CHANGED
The diff for this file is too large to render. See raw diff
 
eval_ood/samples.test.hyp.paragraph_answer.question.asahi417_qg_squadshifts.new_wiki.txt CHANGED
The diff for this file is too large to render. See raw diff
 
eval_ood/samples.test.hyp.paragraph_answer.question.asahi417_qg_squadshifts.nyt.txt CHANGED
The diff for this file is too large to render. See raw diff
 
eval_ood/samples.test.hyp.paragraph_answer.question.asahi417_qg_squadshifts.reddit.txt CHANGED
The diff for this file is too large to render. See raw diff
 
eval_ood/samples.validation.hyp.paragraph_answer.question.asahi417_qg_squadshifts.amazon.txt ADDED
The diff for this file is too large to render. See raw diff
 
eval_ood/samples.validation.hyp.paragraph_answer.question.asahi417_qg_squadshifts.default.txt ADDED
The diff for this file is too large to render. See raw diff
 
eval_ood/samples.validation.hyp.paragraph_answer.question.asahi417_qg_squadshifts.new_wiki.txt ADDED
The diff for this file is too large to render. See raw diff
 
eval_ood/samples.validation.hyp.paragraph_answer.question.asahi417_qg_squadshifts.nyt.txt ADDED
The diff for this file is too large to render. See raw diff
 
eval_ood/samples.validation.hyp.paragraph_answer.question.asahi417_qg_squadshifts.reddit.txt ADDED
The diff for this file is too large to render. See raw diff