asahi417 commited on
Commit
aa7d710
·
1 Parent(s): e3fe9b5
eval/metric.first.answer.paragraph.questions_answers.lmqg_qg_esquad.default.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"test": {"QAAlignedF1Score (BERTScore)": 0.7857923031588016, "QAAlignedRecall (BERTScore)": 0.818131573057886, "QAAlignedPrecision (BERTScore)": 0.7568131812989265, "QAAlignedF1Score (MoverScore)": 0.5440632238208617, "QAAlignedRecall (MoverScore)": 0.5618051323423495, "QAAlignedPrecision (MoverScore)": 0.5283062579624821, "Bleu_1": 0.10501883932940846, "Bleu_2": 0.051857270646380425, "Bleu_3": 0.02803650656253214, "Bleu_4": 0.017165238393884483, "METEOR": 0.21575500905397338, "ROUGE_L": 0.1487928695440393, "BERTScore": 0.6843389849589524, "MoverScore": 0.5146346425030268}, "validation": {"QAAlignedF1Score (BERTScore)": 0.8032872538956043, "QAAlignedRecall (BERTScore)": 0.8111814216179581, "QAAlignedPrecision (BERTScore)": 0.7962710874037519, "QAAlignedF1Score (MoverScore)": 0.5574670262241981, "QAAlignedRecall (MoverScore)": 0.5575099542400072, "QAAlignedPrecision (MoverScore)": 0.5578893666250195, "Bleu_1": 0.28325854393030314, "Bleu_2": 0.17247610295182422, "Bleu_3": 0.10459432676426662, "Bleu_4": 0.06747249112375009, "METEOR": 0.26440140936059636, "ROUGE_L": 0.2624044175106968, "BERTScore": 0.7650593423474279, "MoverScore": 0.5476046077960683}}
eval/metric.first.answer.paragraph_sentence.answer.lmqg_qg_esquad.default.json CHANGED
@@ -1 +1 @@
1
- {"validation": {"Bleu_1": 0.34949431413767984, "Bleu_2": 0.3010229742085597, "Bleu_3": 0.2639999790761519, "Bleu_4": 0.23271776861985005, "METEOR": 0.42325361488349056, "ROUGE_L": 0.4850041207368862, "BERTScore": 0.8886451057279121, "MoverScore": 0.7908526230591614, "AnswerF1Score": 72.70064220866507, "AnswerExactMatch": 54.049195837275306}, "test": {"Bleu_1": 0.37687591745099086, "Bleu_2": 0.3288681680368388, "Bleu_3": 0.2922838291013312, "Bleu_4": 0.26115782792391073, "METEOR": 0.43971011092759443, "ROUGE_L": 0.49502711426653784, "BERTScore": 0.9006049837243929, "MoverScore": 0.8097034022051106, "AnswerF1Score": 75.5304511018074, "AnswerExactMatch": 58.0321665089877}}
 
1
+ {"validation": {"Bleu_1": 0.34949431413767984, "Bleu_2": 0.3010229742085597, "Bleu_3": 0.2639999790761519, "Bleu_4": 0.23271776861985005, "METEOR": 0.42325361488349056, "ROUGE_L": 0.4850041207368862, "BERTScore": 0.8886451051978425, "MoverScore": 0.7908529461541517, "AnswerF1Score": 72.70064220866507, "AnswerExactMatch": 54.049195837275306}, "test": {"Bleu_1": 0.37687591745099086, "Bleu_2": 0.3288681680368388, "Bleu_3": 0.2922838291013312, "Bleu_4": 0.26115782792391073, "METEOR": 0.43971011092759443, "ROUGE_L": 0.49502711426653784, "BERTScore": 0.9006049827911319, "MoverScore": 0.8097033911598629, "AnswerF1Score": 75.5304511018074, "AnswerExactMatch": 58.0321665089877}}
eval/metric.first.sentence.paragraph_answer.question.lmqg_qg_esquad.default.json CHANGED
@@ -1 +1 @@
1
- {"validation": {"Bleu_1": 0.2630273591706407, "Bleu_2": 0.17885668635674512, "Bleu_3": 0.12930667088677536, "Bleu_4": 0.09605197073242909, "METEOR": 0.2253147036513889, "ROUGE_L": 0.24877448667847044, "BERTScore": 0.8271475026557433, "MoverScore": 0.5805841566299468}, "test": {"Bleu_1": 0.25560696329914556, "Bleu_2": 0.17392220789339444, "Bleu_3": 0.12613075725776055, "Bleu_4": 0.09427744154220405, "METEOR": 0.22756934349784053, "ROUGE_L": 0.24617098484475786, "BERTScore": 0.8316794754989838, "MoverScore": 0.5866009300701224}}
 
1
+ {"validation": {"Bleu_1": 0.2630273591706407, "Bleu_2": 0.17885668635674512, "Bleu_3": 0.12930667088677536, "Bleu_4": 0.09605197073242909, "METEOR": 0.2253147036513889, "ROUGE_L": 0.24877448667847044, "BERTScore": 0.8271475028363823, "MoverScore": 0.5805841441070194}, "test": {"Bleu_1": 0.25560696329914556, "Bleu_2": 0.17392220789339444, "Bleu_3": 0.12613075725776055, "Bleu_4": 0.09427744154220405, "METEOR": 0.22756934349784053, "ROUGE_L": 0.24617098484475786, "BERTScore": 0.8316794749517861, "MoverScore": 0.5866010303436665}}
eval/samples.test.hyp.paragraph.questions_answers.lmqg_qg_esquad.default.txt ADDED
The diff for this file is too large to render. See raw diff
 
eval/samples.validation.hyp.paragraph.questions_answers.lmqg_qg_esquad.default.txt ADDED
The diff for this file is too large to render. See raw diff