Mezura / result /evalmix /detail_eb3d798c.json
nmmursit's picture
initial commit
3232d64 verified
{
"model_name": "meta-llama/Meta-Llama-3.1-70B-Instruct",
"openai_accuracy": 0.65,
"openai_relevance": 0.76,
"openai_coherence": 0.72,
"total_samples": 1100.0,
"avg_input_length": 172.17,
"avg_prediction_length": 1562.17,
"avg_reference_length": 2202.03,
"bleu mean": 0.08,
"rouge1 mean": 0.42,
"rouge2 mean": 0.23,
"rougeL mean": 0.26,
"bert_score precision mean": 0.7,
"bert_score recall mean": 0.6,
"bert_score f1 mean": 0.64,
"turkish_semantic_mean": 0.84,
"multilingual_semantic_mean": 0.81,
"dtype": "unknown",
"license": "Llama 3.1",
"run_id": "eb3d798c"
}