Spaces:
Running
on
CPU Upgrade
Running
on
CPU Upgrade
Pratik Bhavsar
committed on
Commit
·
30c00c1
1
Parent(s):
0c0ca73
added 4.1, o3, o4-mini
Browse files
This view is limited to 50 files because it contains too many changes.
See raw diff
- data_loader.py +2 -2
- output/gpt-4.1-2025-04-14/BFCL_v3_irrelevance.parquet +3 -0
- output/gpt-4.1-2025-04-14/BFCL_v3_multi_turn_base_multi_func_call.parquet +3 -0
- output/gpt-4.1-2025-04-14/BFCL_v3_multi_turn_base_single_func_call.parquet +3 -0
- output/gpt-4.1-2025-04-14/BFCL_v3_multi_turn_composite.parquet +3 -0
- output/gpt-4.1-2025-04-14/BFCL_v3_multi_turn_long_context.parquet +3 -0
- output/gpt-4.1-2025-04-14/BFCL_v3_multi_turn_miss_func.parquet +3 -0
- output/gpt-4.1-2025-04-14/BFCL_v3_multi_turn_miss_param.parquet +3 -0
- output/gpt-4.1-2025-04-14/tau_long_context.parquet +3 -0
- output/gpt-4.1-2025-04-14/toolace_single_func_call_1.parquet +3 -0
- output/gpt-4.1-2025-04-14/toolace_single_func_call_2.parquet +3 -0
- output/gpt-4.1-2025-04-14/xlam_multiple_tool_multiple_call.parquet +3 -0
- output/gpt-4.1-2025-04-14/xlam_multiple_tool_single_call.parquet +3 -0
- output/gpt-4.1-2025-04-14/xlam_single_tool_multiple_call.parquet +3 -0
- output/gpt-4.1-2025-04-14/xlam_single_tool_single_call.parquet +3 -0
- output/gpt-4.1-2025-04-14/xlam_tool_miss.parquet +3 -0
- output/gpt-4.1-mini-2025-04-14/BFCL_v3_irrelevance.parquet +3 -0
- output/gpt-4.1-mini-2025-04-14/BFCL_v3_multi_turn_base_multi_func_call.parquet +3 -0
- output/gpt-4.1-mini-2025-04-14/BFCL_v3_multi_turn_base_single_func_call.parquet +3 -0
- output/gpt-4.1-mini-2025-04-14/BFCL_v3_multi_turn_composite.parquet +3 -0
- output/gpt-4.1-mini-2025-04-14/BFCL_v3_multi_turn_long_context.parquet +3 -0
- output/gpt-4.1-mini-2025-04-14/BFCL_v3_multi_turn_miss_func.parquet +3 -0
- output/gpt-4.1-mini-2025-04-14/BFCL_v3_multi_turn_miss_param.parquet +3 -0
- output/gpt-4.1-mini-2025-04-14/tau_long_context.parquet +3 -0
- output/gpt-4.1-mini-2025-04-14/toolace_single_func_call_1.parquet +3 -0
- output/gpt-4.1-mini-2025-04-14/toolace_single_func_call_2.parquet +3 -0
- output/gpt-4.1-mini-2025-04-14/xlam_multiple_tool_multiple_call.parquet +3 -0
- output/gpt-4.1-mini-2025-04-14/xlam_multiple_tool_single_call.parquet +3 -0
- output/gpt-4.1-mini-2025-04-14/xlam_single_tool_multiple_call.parquet +3 -0
- output/gpt-4.1-mini-2025-04-14/xlam_single_tool_single_call.parquet +3 -0
- output/gpt-4.1-mini-2025-04-14/xlam_tool_miss.parquet +3 -0
- output/gpt-4.1-nano-2025-04-14/BFCL_v3_irrelevance.parquet +3 -0
- output/gpt-4.1-nano-2025-04-14/BFCL_v3_multi_turn_base_multi_func_call.parquet +3 -0
- output/gpt-4.1-nano-2025-04-14/BFCL_v3_multi_turn_base_single_func_call.parquet +3 -0
- output/gpt-4.1-nano-2025-04-14/BFCL_v3_multi_turn_composite.parquet +3 -0
- output/gpt-4.1-nano-2025-04-14/BFCL_v3_multi_turn_long_context.parquet +3 -0
- output/gpt-4.1-nano-2025-04-14/BFCL_v3_multi_turn_miss_func.parquet +3 -0
- output/gpt-4.1-nano-2025-04-14/BFCL_v3_multi_turn_miss_param.parquet +3 -0
- output/gpt-4.1-nano-2025-04-14/tau_long_context.parquet +3 -0
- output/gpt-4.1-nano-2025-04-14/toolace_single_func_call_1.parquet +3 -0
- output/gpt-4.1-nano-2025-04-14/toolace_single_func_call_2.parquet +3 -0
- output/gpt-4.1-nano-2025-04-14/xlam_multiple_tool_multiple_call.parquet +3 -0
- output/gpt-4.1-nano-2025-04-14/xlam_multiple_tool_single_call.parquet +3 -0
- output/gpt-4.1-nano-2025-04-14/xlam_single_tool_multiple_call.parquet +3 -0
- output/gpt-4.1-nano-2025-04-14/xlam_single_tool_single_call.parquet +3 -0
- output/gpt-4.1-nano-2025-04-14/xlam_tool_miss.parquet +3 -0
- output/o3-2025-04-16/BFCL_v3_irrelevance.parquet +3 -0
- output/o3-2025-04-16/BFCL_v3_multi_turn_base_multi_func_call.parquet +3 -0
- output/o3-2025-04-16/BFCL_v3_multi_turn_base_single_func_call.parquet +3 -0
- output/o3-2025-04-16/BFCL_v3_multi_turn_composite.parquet +3 -0
data_loader.py
CHANGED
@@ -648,7 +648,7 @@ CARDS = """ <div class="metrics-grid">
|
|
648 |
<div class="metric-card">
|
649 |
<div class="metric-number metric-blue">28</div>
|
650 |
<div class="metric-label">Total Models</div>
|
651 |
-
<div class="metric-detail primary">
|
652 |
<div class="metric-detail primary">8 Open Source</div>
|
653 |
</div>
|
654 |
|
@@ -1320,7 +1320,7 @@ evaluate_handler.finish()
|
|
1320 |
</div>
|
1321 |
<h3 class="feature-title">Updated Periodically</h3>
|
1322 |
<ul class="feature-list">
|
1323 |
-
<li>
|
1324 |
<li>8 open source models included</li>
|
1325 |
<li>Monthly model additions</li>
|
1326 |
</ul>
|
|
|
648 |
<div class="metric-card">
|
649 |
<div class="metric-number metric-blue">28</div>
|
650 |
<div class="metric-label">Total Models</div>
|
651 |
+
<div class="metric-detail primary">25 Private</div>
|
652 |
<div class="metric-detail primary">8 Open Source</div>
|
653 |
</div>
|
654 |
|
|
|
1320 |
</div>
|
1321 |
<h3 class="feature-title">Updated Periodically</h3>
|
1322 |
<ul class="feature-list">
|
1323 |
+
<li>25 private models evaluated</li>
|
1324 |
<li>8 open source models included</li>
|
1325 |
<li>Monthly model additions</li>
|
1326 |
</ul>
|
output/gpt-4.1-2025-04-14/BFCL_v3_irrelevance.parquet
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a9657391d41255ffdbd4de7780e9dfe6a451bb5c6677606ac80bcbaef79541ef
|
3 |
+
size 38852
|
output/gpt-4.1-2025-04-14/BFCL_v3_multi_turn_base_multi_func_call.parquet
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e0e7de17ae41587385da3d6f94ee3eed970796a4adf471ff1c44880dd6947ec4
|
3 |
+
size 23592
|
output/gpt-4.1-2025-04-14/BFCL_v3_multi_turn_base_single_func_call.parquet
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9f160b5db157355d39eb9dd59d3bb49251f673d1ca9cca1cfee676bc7ed43cde
|
3 |
+
size 21766
|
output/gpt-4.1-2025-04-14/BFCL_v3_multi_turn_composite.parquet
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:34943b87685bb6952d23fad943423a814b395c162f2348a04424f68a2a8a0410
|
3 |
+
size 43934
|
output/gpt-4.1-2025-04-14/BFCL_v3_multi_turn_long_context.parquet
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a5a910bf072b19ea7efab56bd124b1a76be0eefd17184c703a130a5e712103eb
|
3 |
+
size 36945
|
output/gpt-4.1-2025-04-14/BFCL_v3_multi_turn_miss_func.parquet
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e28f5fc8daf93f8d1918f064b39e8844e3f6b0890d8c542fa771cb7d0b079884
|
3 |
+
size 39152
|
output/gpt-4.1-2025-04-14/BFCL_v3_multi_turn_miss_param.parquet
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:966faf2bf7cb8ddcdab6cf9713143252726b0020ea04063bf61f6b403214cbd7
|
3 |
+
size 43237
|
output/gpt-4.1-2025-04-14/tau_long_context.parquet
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:64532303dd7e812fb5ef38d72608d0968c5bb09bd50b010b585c294eb366d54e
|
3 |
+
size 44540
|
output/gpt-4.1-2025-04-14/toolace_single_func_call_1.parquet
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:49a80caba95af5acbdb1cad1980ae21b35268d46165a956052080697757cee33
|
3 |
+
size 14854
|
output/gpt-4.1-2025-04-14/toolace_single_func_call_2.parquet
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0a9060eddc7e91f8fdbc8ba9baaa0410cf73ed254dc6f94c1a98d4991a37cdb3
|
3 |
+
size 11794
|
output/gpt-4.1-2025-04-14/xlam_multiple_tool_multiple_call.parquet
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e5b899c060909ba19a23a5fa609fa17cd55113f4aaf1ad2b2f71a5d07645f216
|
3 |
+
size 100417
|
output/gpt-4.1-2025-04-14/xlam_multiple_tool_single_call.parquet
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:17d725be681561ab7a1172be69e5239dd772a2ca698b79e7ee00f7c2a82083ae
|
3 |
+
size 40235
|
output/gpt-4.1-2025-04-14/xlam_single_tool_multiple_call.parquet
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d003963d351f1d8a7ee789ea7d6955c17c9a37c0356204d323e11e9267708327
|
3 |
+
size 31058
|
output/gpt-4.1-2025-04-14/xlam_single_tool_single_call.parquet
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1970fc916291eafe5514a84c1cb0b074901dc2f76183fce13a059b28bbe5d6aa
|
3 |
+
size 44787
|
output/gpt-4.1-2025-04-14/xlam_tool_miss.parquet
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8167ac2915b4e33c18126edbb38389cd65584326884b7aa779559e1580b10c19
|
3 |
+
size 51042
|
output/gpt-4.1-mini-2025-04-14/BFCL_v3_irrelevance.parquet
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fccfcd1ac0cad9fc1f1d59de1d4ed4d898900609a2334026c6ee32c3e6ba8f9f
|
3 |
+
size 44676
|
output/gpt-4.1-mini-2025-04-14/BFCL_v3_multi_turn_base_multi_func_call.parquet
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6e12a309e4e7e26ef831397543b247441f737d3356184f84747f032eb45258e0
|
3 |
+
size 23552
|
output/gpt-4.1-mini-2025-04-14/BFCL_v3_multi_turn_base_single_func_call.parquet
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:535415d1dba1bb7db819c159e8f94328084fc0476e1ae323802489d7a6d3d04a
|
3 |
+
size 22540
|
output/gpt-4.1-mini-2025-04-14/BFCL_v3_multi_turn_composite.parquet
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:735629b98e55fdaf7c303f86b7cef03a8e2bda647f924cc34c329d9d6f546bdf
|
3 |
+
size 44786
|
output/gpt-4.1-mini-2025-04-14/BFCL_v3_multi_turn_long_context.parquet
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:34742abfaf1b7c2d026ace161d64a31ac9b70e8ed40b5759349448e5df1adae8
|
3 |
+
size 38675
|
output/gpt-4.1-mini-2025-04-14/BFCL_v3_multi_turn_miss_func.parquet
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f3bf3f9733aa82be34ffe0ed70ce18d8c71760db125ef4dab4d0b83370c807bd
|
3 |
+
size 43312
|
output/gpt-4.1-mini-2025-04-14/BFCL_v3_multi_turn_miss_param.parquet
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:80f6a75b1d8f5b3850fb9203e3118211e40e10f3b29ecfa07acc76105d8ff0fc
|
3 |
+
size 41539
|
output/gpt-4.1-mini-2025-04-14/tau_long_context.parquet
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1bf4a3bc10994592e948b32fe969104166452a700f41b5eacee93543368f4fd1
|
3 |
+
size 40845
|
output/gpt-4.1-mini-2025-04-14/toolace_single_func_call_1.parquet
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:03b0c4739d04f758e2b19002bccbb7e458d2003ad5d2064cd71fe0f5149de6a8
|
3 |
+
size 18332
|
output/gpt-4.1-mini-2025-04-14/toolace_single_func_call_2.parquet
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:680d12f42944f33d23986fb9ef3d09a7c58032598ca07a99357f567ca0dc39f7
|
3 |
+
size 12367
|
output/gpt-4.1-mini-2025-04-14/xlam_multiple_tool_multiple_call.parquet
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1bf98a01341a4f2bd7c2a045db5c16f692d76833222bd55688ff321d9f535d6a
|
3 |
+
size 102460
|
output/gpt-4.1-mini-2025-04-14/xlam_multiple_tool_single_call.parquet
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5c31ac0a4d91c91a6702d2f0cadea80e4245a1b19bc1565409465da2b13fe083
|
3 |
+
size 40289
|
output/gpt-4.1-mini-2025-04-14/xlam_single_tool_multiple_call.parquet
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7f1f7ebefc694dc464a505617dc5daf2fda4421635fdeaad189d2e4de8abdd85
|
3 |
+
size 30261
|
output/gpt-4.1-mini-2025-04-14/xlam_single_tool_single_call.parquet
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:18aa8fc4d1511927ee404e5eeea9006d18c4a20738c3d64471dbaec99b76563d
|
3 |
+
size 43614
|
output/gpt-4.1-mini-2025-04-14/xlam_tool_miss.parquet
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e1e7f4023b92c464d248d77fcf950dc16f1b9d77528bfa72f1975a3ac0812763
|
3 |
+
size 54881
|
output/gpt-4.1-nano-2025-04-14/BFCL_v3_irrelevance.parquet
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4d085185382e506e8780b60a6eceaac6b6bc26f3d1cfdfe88f9c73ade8f6a6f2
|
3 |
+
size 28700
|
output/gpt-4.1-nano-2025-04-14/BFCL_v3_multi_turn_base_multi_func_call.parquet
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5c1484a10affc86ba086949da5e3ba6f4dd01eea27b1c9253e662aa8cf32b782
|
3 |
+
size 23233
|
output/gpt-4.1-nano-2025-04-14/BFCL_v3_multi_turn_base_single_func_call.parquet
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9c8d3eb0d857fd78b5b9c30a0ac6cf230515cad9a7fa87551fb165d3870b2a4f
|
3 |
+
size 23672
|
output/gpt-4.1-nano-2025-04-14/BFCL_v3_multi_turn_composite.parquet
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:50978eaf60ca133ce128a33fd4177c8f8dbd950226b2020b784adc54965e0995
|
3 |
+
size 40604
|
output/gpt-4.1-nano-2025-04-14/BFCL_v3_multi_turn_long_context.parquet
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8806fca6974028bd80dd947a0bed74f85cc21e708cc79242d1f433706aaf119c
|
3 |
+
size 38518
|
output/gpt-4.1-nano-2025-04-14/BFCL_v3_multi_turn_miss_func.parquet
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4e64dd6f4dfa2f9a5c6baa832d133784010996666b393268e8c2f9a773c8d880
|
3 |
+
size 39577
|
output/gpt-4.1-nano-2025-04-14/BFCL_v3_multi_turn_miss_param.parquet
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:48f0bcadd582afbe243186384d30c48d67986c852d51ed5cf2874cb5c316989a
|
3 |
+
size 40730
|
output/gpt-4.1-nano-2025-04-14/tau_long_context.parquet
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ec16220b59b3a8a36deff0f0bc200a8b693a2a719f817615bf11478b08c47447
|
3 |
+
size 40606
|
output/gpt-4.1-nano-2025-04-14/toolace_single_func_call_1.parquet
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:22bdc58ad908b88fac7d1e6eb6263596b6d0f8cf3ca1ee9a34fa2c250cbed6a8
|
3 |
+
size 15891
|
output/gpt-4.1-nano-2025-04-14/toolace_single_func_call_2.parquet
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8dcc1ead32b72b83b86f7811f0eccfc2fee69aa30e64feb0095b362acfd20d44
|
3 |
+
size 11274
|
output/gpt-4.1-nano-2025-04-14/xlam_multiple_tool_multiple_call.parquet
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a8316f6de7d0f141aa4543642b78962fd30c7edf52a4092ac82f7e4a52af93ab
|
3 |
+
size 101127
|
output/gpt-4.1-nano-2025-04-14/xlam_multiple_tool_single_call.parquet
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2589cec4f2cc428155d7a6386dc707935fe7e0f5e70554550ff3cb9664ace8fb
|
3 |
+
size 42309
|
output/gpt-4.1-nano-2025-04-14/xlam_single_tool_multiple_call.parquet
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2c549fd43116a5ed343c5829e080c70f1a5b9475eb8bb4b978be27551edcf9eb
|
3 |
+
size 31369
|
output/gpt-4.1-nano-2025-04-14/xlam_single_tool_single_call.parquet
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:97872c5db138fd78c790030526253f7437e522df850d2fa26c722dbe44abb696
|
3 |
+
size 45933
|
output/gpt-4.1-nano-2025-04-14/xlam_tool_miss.parquet
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:80720e28be58215851a00a1437bcb1a02032321ee99f497771248ff605285541
|
3 |
+
size 53185
|
output/o3-2025-04-16/BFCL_v3_irrelevance.parquet
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:792d5f48891b2d40be615d33b2b78381610e7b8a776f13f0794ab687523fd3d6
|
3 |
+
size 61887
|
output/o3-2025-04-16/BFCL_v3_multi_turn_base_multi_func_call.parquet
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dcdd60cc53f3bb310004c3fc584d345921f75106040a66423e3171f45e54ef86
|
3 |
+
size 24231
|
output/o3-2025-04-16/BFCL_v3_multi_turn_base_single_func_call.parquet
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:27606cdd3aa865a4f79fdd0287e0578b2b74f2b3e9cdce307507d06b01da6814
|
3 |
+
size 23076
|
output/o3-2025-04-16/BFCL_v3_multi_turn_composite.parquet
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5fbc0feb6b0a719b02c17f9cbd947bcc4ef5ae4e7c0f5cbe4e4cb0c2021a548f
|
3 |
+
size 47481
|