OmniEval / eval-results /demo-leaderboard /qwen2-72b_gte-qwen2-1.5b /results_2023-12-08 15:46:20.425378.json
zstanjj's picture
add open source
0bf5b80
{
"results": {
"retrieval": {
"mrr": 0.36173120728929387,
"map": 0.3512338648443432
},
"generation": {
"em": 0.002277904328018223,
"f1": 0.3804001391052641,
"rouge1": 0.34576336184459094,
"rouge2": 0.1928778762677512,
"rougeL": 0.2383694455084706,
"accuracy": 0.4145785876993166,
"completeness": 0.598297213622291,
"hallucination": 0.0011627906976744186,
"utilization": 1.13922942206655,
"numerical_accuracy": 0.3218694885361552
}
},
"config": {
"eval_name": "gte-qwen2-1.5b_gte-qwen2-1.5b",
"generation_model": "Alibaba-NLP/gte-Qwen2-1.5B-instruct",
"generation_model_args": {
"name": "Alibaba-NLP/gte-Qwen2-1.5B-instruct",
"num_params": 1.5,
"open_source": true
},
"retrieval_model": "Alibaba-NLP/gte-Qwen2-1.5B-instruct",
"retrieval_model_args": {
"name": "Alibaba-NLP/gte-Qwen2-1.5B-instruct",
"num_params": 1.5,
"open_source": true
}
}
}