OmniEval / eval-results /demo-leaderboard /qwen2-72b_bge-m3 /results_2023-12-08 15:46:20.425378.json
zstanjj's picture
add open-source
921b8ba
raw
history blame
926 Bytes
{
"results": {
"retrieval": {
"mrr": 0.3527809415337889,
"map": 0.3458855353075171
},
"generation": {
"em": 0.0017084282460136675,
"f1": 0.38645032979631466,
"rouge1": 0.3467267951634575,
"rouge2": 0.1930581604826183,
"rougeL": 0.24141093461883717,
"accuracy": 0.4271070615034169,
"completeness": 0.6119287374128582,
"hallucination": 0.0005847953216374269,
"utilization": 0.5400116822429907,
"numerical_accuracy": 0.3372093023255814
}
},
"config": {
"eval_name": "qwen2-72b_bge-m3",
"generative_model": "Qwen/Qwen2.5-72B-Instruct",
"generative_model_args": {
"name": "Qwen/Qwen2.5-72B-Instruct",
"num_params": 72.7,
"open_source": true
},
"retrieval_model": "BAAI/bge-m3",
"retrieval_model_args": {
"name": "BAAI/bge-m3",
"num_params": 0.5,
"open_source": true
}
}
}