HoneyTian commited on
Commit
48b7537
·
1 Parent(s): 4464055
Files changed (41) hide show
  1. .gitignore +1 -1
  2. data/dataset/agent-lingoace-zh-400-choice.jsonl +3 -0
  3. data/dataset/agent-lingoace-zh-80-chat.jsonl +3 -0
  4. data/dataset/arc-easy-1000-choice.jsonl +3 -0
  5. data/eval_data/aws_claude/anthropic/anthropic.claude-instant-v1/us_west(47.88.76.239)/aws_us_east/20250722_173400/arc-easy-1000-choice.jsonl +3 -0
  6. data/eval_data/aws_claude/anthropic/anthropic.claude-instant-v1/us_west(47.88.76.239)/aws_us_east/20250722_192100/agent-lingoace-zh-400-choice.jsonl +3 -0
  7. data/eval_data/aws_claude/anthropic/anthropic.claude-instant-v1/us_west(47.88.76.239)/aws_us_east/20250724-interval-1/agent-lingoace-zh-80-chat.jsonl +3 -0
  8. data/eval_data/aws_claude/anthropic/anthropic.claude-instant-v1/us_west(47.88.76.239)/aws_us_east/20250724-interval-1/agent-lingoace-zh-80-chat.jsonl.raw +0 -0
  9. data/eval_data/aws_claude/anthropic/anthropic.claude-v2/us_west(47.88.76.239)/aws_us_east/20250722_151719/arc-easy-1000-choice.jsonl +3 -0
  10. data/eval_data/aws_claude/anthropic/anthropic.claude-v2/us_west(47.88.76.239)/aws_us_east/20250722_182800/agent-lingoace-zh-400-choice.jsonl +3 -0
  11. data/eval_data/aws_claude/anthropic/anthropic.claude-v2/us_west(47.88.76.239)/aws_us_east/20250723-interval-10/agent-lingoace-zh-400-choice.jsonl +3 -0
  12. data/eval_data/aws_claude/anthropic/anthropic.claude-v2/us_west(47.88.76.239)/aws_us_east/20250724-interval-1/agent-lingoace-zh-80-chat.jsonl +3 -0
  13. data/eval_data/aws_claude/anthropic/anthropic.claude-v2/us_west(47.88.76.239)/aws_us_east/20250724-interval-1/agent-lingoace-zh-80-chat.jsonl.raw +0 -0
  14. data/eval_data/azure_openai/azure/gpt-4o-mini/shenzhen_sase/west_us_chatgpt_openai_azure_com/20250716_171155/arc-easy-1000-choice.jsonl +3 -0
  15. data/eval_data/azure_openai/azure/gpt-4o-mini/shenzhen_sase/west_us_chatgpt_openai_azure_com/20250716_174538/arc-easy-1000-choice.jsonl +3 -0
  16. data/eval_data/azure_openai/azure/gpt-4o-mini/shenzhen_sase/west_us_chatgpt_openai_azure_com/20250717_085617/arc-easy-1000-choice.jsonl +3 -0
  17. data/eval_data/azure_openai/azure/gpt-4o-mini/shenzhen_sase/west_us_chatgpt_openai_azure_com/20250721_094653/agent-lingoace-zh-400-choice.jsonl +3 -0
  18. data/eval_data/azure_openai/azure/gpt-4o-mini/us_west(47.88.76.239)/west_us_chatgpt_openai_azure_com/20250723-interval-10/agent-lingoace-zh-400-choice.jsonl +3 -0
  19. data/eval_data/azure_openai/azure/gpt-4o-mini/us_west(47.88.76.239)/west_us_chatgpt_openai_azure_com/20250723-interval-10/arc-easy-1000-choice.jsonl +3 -0
  20. data/eval_data/azure_openai/azure/gpt-4o/shenzhen_sase/west_us_chatgpt_openai_azure_com/20250716_173707/arc-easy-1000-choice.jsonl +3 -0
  21. data/eval_data/azure_openai/azure/gpt-4o/shenzhen_sase/west_us_chatgpt_openai_azure_com/20250721_101634/agent-lingoace-zh-400-choice.jsonl +3 -0
  22. data/eval_data/azure_openai/azure/gpt-4o/shenzhen_sase/west_us_chatgpt_openai_azure_com/20250723_170505/agent-lingoace-zh-80-chat.jsonl +3 -0
  23. data/eval_data/azure_openai/azure/gpt-4o/shenzhen_sase/west_us_chatgpt_openai_azure_com/20250723_170505/agent-lingoace-zh-80-chat.jsonl.raw +0 -0
  24. data/eval_data/gemini_google/google/gemini-2.5-flash-lite-preview-06-17/shenzhen_sase/google_potent_veld_462405_t3/20250716_181105/arc-easy-1000-choice.jsonl +3 -0
  25. data/eval_data/gemini_google/google/gemini-2.5-flash-lite-preview-06-17/shenzhen_sase/google_potent_veld_462405_t3/20250721_102753/agent-lingoace-zh-400-choice.jsonl +3 -0
  26. data/eval_data/gemini_google/google/gemini-2.5-flash/shenzhen_sase/google_potent_veld_462405_t3/20250716_171804/arc-easy-1000-choice.jsonl +3 -0
  27. data/eval_data/gemini_google/google/gemini-2.5-flash/shenzhen_sase/google_potent_veld_462405_t3/20250721_103307/agent-lingoace-zh-400-choice.jsonl +3 -0
  28. data/eval_data/gemini_google/google/gemini-2.5-flash/shenzhen_sase/google_potent_veld_462405_t3/20250723_170948/agent-lingoace-zh-80-chat.jsonl +3 -0
  29. data/eval_data/gemini_google/google/gemini-2.5-flash/shenzhen_sase/google_potent_veld_462405_t3/20250723_170948/agent-lingoace-zh-80-chat.jsonl.raw +0 -0
  30. data/eval_data/siliconflow/siliconflow/Qwen#Qwen3-8B/shenzhen_sase/siliconflow_api_key/20250724_110654/agent-lingoace-zh-400-choice.jsonl +3 -0
  31. data/eval_data/siliconflow/siliconflow/Qwen#Qwen3-8B/shenzhen_sase/siliconflow_api_key/20250724_110654/agent-lingoace-zh-80-chat.jsonl +3 -0
  32. data/eval_data/siliconflow/siliconflow/Qwen#Qwen3-8B/shenzhen_sase/siliconflow_api_key/20250724_110654/agent-lingoace-zh-80-chat.jsonl.raw +0 -0
  33. data/eval_data/siliconflow/siliconflow/deepseek-ai#DeepSeek-R1-0528-Qwen3-8B/shenzhen_sase/siliconflow_api_key/20250716_194011/arc-easy-1000-choice.jsonl +3 -0
  34. data/eval_data/siliconflow/siliconflow/deepseek-ai#DeepSeek-R1-0528-Qwen3-8B/shenzhen_sase/siliconflow_api_key/20250723-interval-10/agent-lingoace-zh-400-choice.jsonl +3 -0
  35. data/eval_data/siliconflow/siliconflow/deepseek-ai#DeepSeek-R1-0528-Qwen3-8B/shenzhen_sase/siliconflow_api_key/20250724_134934/agent-lingoace-zh-80-chat.jsonl +3 -0
  36. data/eval_data/siliconflow/siliconflow/deepseek-ai#DeepSeek-R1-0528-Qwen3-8B/shenzhen_sase/siliconflow_api_key/20250724_134934/agent-lingoace-zh-80-chat.jsonl.raw +0 -0
  37. data/eval_data/siliconflow/siliconflow/deepseek-ai#DeepSeek-R1-Distill-Qwen-7B/shenzhen_sase/siliconflow_api_key/20250724_090615/agent-lingoace-zh-400-choice.jsonl +3 -0
  38. data/eval_data/siliconflow/siliconflow/deepseek-ai#DeepSeek-R1-Distill-Qwen-7B/shenzhen_sase/siliconflow_api_key/20250724_135543/agent-lingoace-zh-80-chat.jsonl +3 -0
  39. data/eval_data/siliconflow/siliconflow/deepseek-ai#DeepSeek-R1-Distill-Qwen-7B/shenzhen_sase/siliconflow_api_key/20250724_135543/agent-lingoace-zh-80-chat.jsonl.raw +0 -0
  40. data/eval_data/siliconflow/siliconflow/tencent#Hunyuan-A13B-Instruct/shenzhen_sase/siliconflow_api_key/20250721_113725/arc-easy-1000-choice.jsonl +3 -0
  41. data/eval_data/siliconflow/siliconflow/tencent#Hunyuan-A13B-Instruct/shenzhen_sase/siliconflow_api_key/20250723_114555/agent-lingoace-zh-400-choice.jsonl +3 -0
.gitignore CHANGED
@@ -2,7 +2,7 @@
2
  .git/
3
  .idea/
4
 
5
- /data/
6
  #/data/eval_data
7
  /data/raw_dataset
8
  /dotenv/
 
2
  .git/
3
  .idea/
4
 
5
+ #/data/
6
  #/data/eval_data
7
  /data/raw_dataset
8
  /dotenv/
data/dataset/agent-lingoace-zh-400-choice.jsonl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:abced9a04efc60d5aeeb457232ae81f6f0574da2fa560951a4705096674a4594
3
+ size 1159751
data/dataset/agent-lingoace-zh-80-chat.jsonl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:14fe4734e7e34bef9b0eab1fa7b4b92fa7dcd38194ec5271dde2b3bdbcbb2b32
3
+ size 812921
data/dataset/arc-easy-1000-choice.jsonl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fcd9e4ecb932119e4d40d252957c88beab57cf5c322e8dfb4f865f750d9b9a66
3
+ size 590755
data/eval_data/aws_claude/anthropic/anthropic.claude-instant-v1/us_west(47.88.76.239)/aws_us_east/20250722_173400/arc-easy-1000-choice.jsonl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d51627656a7d843562cf8196e683a74fec778f6cbedb3db1e6fc12b0f0d96849
3
+ size 716827
data/eval_data/aws_claude/anthropic/anthropic.claude-instant-v1/us_west(47.88.76.239)/aws_us_east/20250722_192100/agent-lingoace-zh-400-choice.jsonl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0d0bb578d6140790c8a0a1156f1cbf9dd4f4f09b9b3d32eca4bad2683c11b6f0
3
+ size 1206112
data/eval_data/aws_claude/anthropic/anthropic.claude-instant-v1/us_west(47.88.76.239)/aws_us_east/20250724-interval-1/agent-lingoace-zh-80-chat.jsonl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3e43169d2f4370086055765f9f6d7a9483d8d4d718483a7d94a18816af376113
3
+ size 883128
data/eval_data/aws_claude/anthropic/anthropic.claude-instant-v1/us_west(47.88.76.239)/aws_us_east/20250724-interval-1/agent-lingoace-zh-80-chat.jsonl.raw ADDED
The diff for this file is too large to render. See raw diff
 
data/eval_data/aws_claude/anthropic/anthropic.claude-v2/us_west(47.88.76.239)/aws_us_east/20250722_151719/arc-easy-1000-choice.jsonl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d3ca4e43701e7c5d4e10cc514c70657dca2f74d1d7c7cadc7362437036ebbe6c
3
+ size 867187
data/eval_data/aws_claude/anthropic/anthropic.claude-v2/us_west(47.88.76.239)/aws_us_east/20250722_182800/agent-lingoace-zh-400-choice.jsonl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:31d0a0ace57b48d62f88e6a35bdb58aad11c13ba195367349971f71b550980c6
3
+ size 1240130
data/eval_data/aws_claude/anthropic/anthropic.claude-v2/us_west(47.88.76.239)/aws_us_east/20250723-interval-10/agent-lingoace-zh-400-choice.jsonl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4d837cffd8b66a66d830159d82e1854bdc4e0485614439ffb06bb4c6750f4393
3
+ size 1241812
data/eval_data/aws_claude/anthropic/anthropic.claude-v2/us_west(47.88.76.239)/aws_us_east/20250724-interval-1/agent-lingoace-zh-80-chat.jsonl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8bdd17b65ebcd3e23894a3cd6025ab076dc6077c2f6930ef22e6bd8426f75c68
3
+ size 893796
data/eval_data/aws_claude/anthropic/anthropic.claude-v2/us_west(47.88.76.239)/aws_us_east/20250724-interval-1/agent-lingoace-zh-80-chat.jsonl.raw ADDED
The diff for this file is too large to render. See raw diff
 
data/eval_data/azure_openai/azure/gpt-4o-mini/shenzhen_sase/west_us_chatgpt_openai_azure_com/20250716_171155/arc-easy-1000-choice.jsonl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:413042e2111ed57e8ec284a73ab35ea0b37827dd035f6ec3612f1e9ae7067ced
3
+ size 720530
data/eval_data/azure_openai/azure/gpt-4o-mini/shenzhen_sase/west_us_chatgpt_openai_azure_com/20250716_174538/arc-easy-1000-choice.jsonl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:203ac4e5c7ac5b957b044148ce9ce21621bb991c958a9bd991631043d87322f4
3
+ size 720499
data/eval_data/azure_openai/azure/gpt-4o-mini/shenzhen_sase/west_us_chatgpt_openai_azure_com/20250717_085617/arc-easy-1000-choice.jsonl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:03f2394ae278458219d25b7933ab11925582425ee68796d83b826b58b7445cb4
3
+ size 720480
data/eval_data/azure_openai/azure/gpt-4o-mini/shenzhen_sase/west_us_chatgpt_openai_azure_com/20250721_094653/agent-lingoace-zh-400-choice.jsonl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c860f01b9898a1dcb7ccabdd38201d907db4a3777e78f2c8bcda1f79aef633ec
3
+ size 1211356
data/eval_data/azure_openai/azure/gpt-4o-mini/us_west(47.88.76.239)/west_us_chatgpt_openai_azure_com/20250723-interval-10/agent-lingoace-zh-400-choice.jsonl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:624c7384e1f90591448730b002ac294a54e8f21050620527e4511507558f57cc
3
+ size 1211359
data/eval_data/azure_openai/azure/gpt-4o-mini/us_west(47.88.76.239)/west_us_chatgpt_openai_azure_com/20250723-interval-10/arc-easy-1000-choice.jsonl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fbbe71941ac12af3678be85fd0dd2205503ccc44c1950a6b6b1dde721e15ba32
3
+ size 720520
data/eval_data/azure_openai/azure/gpt-4o/shenzhen_sase/west_us_chatgpt_openai_azure_com/20250716_173707/arc-easy-1000-choice.jsonl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8162c32ebd325a130057583dbbb19748e7b80f801d7cdd8fd2c5d45de715ee57
3
+ size 721025
data/eval_data/azure_openai/azure/gpt-4o/shenzhen_sase/west_us_chatgpt_openai_azure_com/20250721_101634/agent-lingoace-zh-400-choice.jsonl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5ecbb0cc0e1321b018ac0a1319b4038f6ab552f589a1e871a3b1c873c92b995e
3
+ size 1211398
data/eval_data/azure_openai/azure/gpt-4o/shenzhen_sase/west_us_chatgpt_openai_azure_com/20250723_170505/agent-lingoace-zh-80-chat.jsonl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a7ad13e353f4db5a95c5fa2c293324c7e526a5a09230c60ef48437056f9613b4
3
+ size 228210
data/eval_data/azure_openai/azure/gpt-4o/shenzhen_sase/west_us_chatgpt_openai_azure_com/20250723_170505/agent-lingoace-zh-80-chat.jsonl.raw ADDED
The diff for this file is too large to render. See raw diff
 
data/eval_data/gemini_google/google/gemini-2.5-flash-lite-preview-06-17/shenzhen_sase/google_potent_veld_462405_t3/20250716_181105/arc-easy-1000-choice.jsonl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b16f83e9824813bfb72e313ae88f10a773aa81b8124bca5400bbab3132be2898
3
+ size 721162
data/eval_data/gemini_google/google/gemini-2.5-flash-lite-preview-06-17/shenzhen_sase/google_potent_veld_462405_t3/20250721_102753/agent-lingoace-zh-400-choice.jsonl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:65bbc20c79103eadb3fc43a2b3db1faa56eb51a5c8ef443a91775e331ab39727
3
+ size 1211276
data/eval_data/gemini_google/google/gemini-2.5-flash/shenzhen_sase/google_potent_veld_462405_t3/20250716_171804/arc-easy-1000-choice.jsonl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2d0c8ed975dae2fb78271878f7ebf319967a48476e90394c6bd9c7e7413a5635
3
+ size 720952
data/eval_data/gemini_google/google/gemini-2.5-flash/shenzhen_sase/google_potent_veld_462405_t3/20250721_103307/agent-lingoace-zh-400-choice.jsonl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:058a61627c0738e053540d98c15fd023035e042dea9015d3ca1a55ef9677eeec
3
+ size 1211348
data/eval_data/gemini_google/google/gemini-2.5-flash/shenzhen_sase/google_potent_veld_462405_t3/20250723_170948/agent-lingoace-zh-80-chat.jsonl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c2a98c5dc25e015fd820e67f4296facbd0d8a382302e1d4398d3e9f4e6ac62fd
3
+ size 880693
data/eval_data/gemini_google/google/gemini-2.5-flash/shenzhen_sase/google_potent_veld_462405_t3/20250723_170948/agent-lingoace-zh-80-chat.jsonl.raw ADDED
The diff for this file is too large to render. See raw diff
 
data/eval_data/siliconflow/siliconflow/Qwen#Qwen3-8B/shenzhen_sase/siliconflow_api_key/20250724_110654/agent-lingoace-zh-400-choice.jsonl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:52d752394961a9a1f088d4f133eadecba9218d8711771d7bd7f35479f563de90
3
+ size 1211203
data/eval_data/siliconflow/siliconflow/Qwen#Qwen3-8B/shenzhen_sase/siliconflow_api_key/20250724_110654/agent-lingoace-zh-80-chat.jsonl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e7999d255ece2a0ba50cc1b78001f9cb90c8a85bf79a614e3b3079d3620582ac
3
+ size 874540
data/eval_data/siliconflow/siliconflow/Qwen#Qwen3-8B/shenzhen_sase/siliconflow_api_key/20250724_110654/agent-lingoace-zh-80-chat.jsonl.raw ADDED
The diff for this file is too large to render. See raw diff
 
data/eval_data/siliconflow/siliconflow/deepseek-ai#DeepSeek-R1-0528-Qwen3-8B/shenzhen_sase/siliconflow_api_key/20250716_194011/arc-easy-1000-choice.jsonl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2aab73da5402bf444935803fefd19e0e2498cdf437e2abea10702f656023d3f5
3
+ size 721209
data/eval_data/siliconflow/siliconflow/deepseek-ai#DeepSeek-R1-0528-Qwen3-8B/shenzhen_sase/siliconflow_api_key/20250723-interval-10/agent-lingoace-zh-400-choice.jsonl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c8c7a5bcf39b74d282d2844da7b9c110dfb41ee4b6afec2483c09d5a8d1dfdda
3
+ size 1211471
data/eval_data/siliconflow/siliconflow/deepseek-ai#DeepSeek-R1-0528-Qwen3-8B/shenzhen_sase/siliconflow_api_key/20250724_134934/agent-lingoace-zh-80-chat.jsonl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f738d447fea73e42f14b847244efbb77feb875743d6c3cd64e26d3ef2a268152
3
+ size 881721
data/eval_data/siliconflow/siliconflow/deepseek-ai#DeepSeek-R1-0528-Qwen3-8B/shenzhen_sase/siliconflow_api_key/20250724_134934/agent-lingoace-zh-80-chat.jsonl.raw ADDED
The diff for this file is too large to render. See raw diff
 
data/eval_data/siliconflow/siliconflow/deepseek-ai#DeepSeek-R1-Distill-Qwen-7B/shenzhen_sase/siliconflow_api_key/20250724_090615/agent-lingoace-zh-400-choice.jsonl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b72dda25861a7cac263586a74da2e28d2ba7c01858428f5429c5b2384ab4fc65
3
+ size 1211475
data/eval_data/siliconflow/siliconflow/deepseek-ai#DeepSeek-R1-Distill-Qwen-7B/shenzhen_sase/siliconflow_api_key/20250724_135543/agent-lingoace-zh-80-chat.jsonl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:319d3dc5d1bb00d972da47061549fc7641c0255e52dc1ae4f216e0bd96954521
3
+ size 943891
data/eval_data/siliconflow/siliconflow/deepseek-ai#DeepSeek-R1-Distill-Qwen-7B/shenzhen_sase/siliconflow_api_key/20250724_135543/agent-lingoace-zh-80-chat.jsonl.raw ADDED
The diff for this file is too large to render. See raw diff
 
data/eval_data/siliconflow/siliconflow/tencent#Hunyuan-A13B-Instruct/shenzhen_sase/siliconflow_api_key/20250721_113725/arc-easy-1000-choice.jsonl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ac93884932e258557cb04adddff72c08d4ffda751752a7eec3a2a52573ed9c7b
3
+ size 721973
data/eval_data/siliconflow/siliconflow/tencent#Hunyuan-A13B-Instruct/shenzhen_sase/siliconflow_api_key/20250723_114555/agent-lingoace-zh-400-choice.jsonl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a4d412724af09ed3316e4af8690bba64161374c3329c3b98d88b94f9b9f70066
3
+ size 1211488