File size: 497 Bytes
8d4c52c
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
[
    {
        "agent_name": "GenericAgent-AgentTrek-1.0-32b",
        "study_id": "ed14232c-cd7e-4708-b334-ebaf1f220000", 
        "date_time": "2025-01-12 00:37:04",
        "benchmark": "WorkArena-L1",
        "score": 38.29,
        "std_err": 2.70,
        "benchmark_specific": "No",
        "benchmark_tuned": "No",
        "followed_evaluation_protocol": "Yes", 
        "reproducible": "Yes",
        "comments": "Additional details",
        "original_or_reproduced": "Original"
    }
]