Add metadata (library name, pipeline tag, license)
Browse files
This PR adds `library_name`, `pipeline_tag`, and `license` metadata to improve the model card, since this is a text-generation model that can be used with the Transformers library.
README.md
CHANGED
@@ -3,7 +3,11 @@ base_model:
|
|
3 |
- deepseek-ai/DeepSeek-R1-Distill-Qwen-32B
|
4 |
datasets:
|
5 |
- Skywork/Skywork-OR1-RL-Data
|
|
|
|
|
|
|
6 |
---
|
|
|
7 |
<div align="center">
|
8 |
|
9 |
# 🤔 Skywork-OR1 (Open Reasoner 1)
|
@@ -64,12 +68,11 @@ We include the detailed results in the following table.
|
|
64 |
|-------|---------|---------|--------------|
|
65 |
| DeepSeek-R1-Distill-Qwen-7B | 55.5 | 39.2| 37.6 |
|
66 |
| Light-R1-7B-DS | 59.1 | 44.3| 39.5 |
|
|
|
|
|
67 |
| DeepSeek-R1-Distill-Qwen-32B | 72.9 | 59.0| 57.2 |
|
68 |
| TinyR1-32B-Preview | 78.1| 65.3| 61.6 |
|
69 |
| QwQ-32B | 79.5 | 65.3| 61.6 |
|
70 |
-
| DeepSeek-R1 | 79.8 | 70.0| 65.9 |
|
71 |
-
| **Skywork-OR1-Math-7B** | 69.8 | 52.3 | 43.6 |
|
72 |
-
| **Skywork-OR1-7B-Preview** | 63.6 | 45.8 | 43.9 |
|
73 |
| **Skywork-OR1-32B-Preview** | 79.7 | 69.0 | 63.9 |
|
74 |
|
75 |
## ⚙️ Training Recipe
|
@@ -111,7 +114,7 @@ Please cite the following:
|
|
111 |
|
112 |
@misc{skywork-or1-2025,
|
113 |
title={Skywork Open Reasoner Series},
|
114 |
-
author = {He, Jujie and Liu, Jiacai and Liu, Chris Yuhao and Yan, Rui and Wang, Chaojie and Cheng, Peng and Zhang, Xiaoyu and Zhang, Fuxiang and Xu, Jiacheng and Shen, Wei and Li, Siyuan and Zeng, Liang and Wei, Tianwen and Cheng, Cheng and Liu, Yang and Zhou, Yahui},
|
115 |
howpublished={\url{https://capricious-hydrogen-41c.notion.site/Skywork-Open-Reaonser-Series-1d0bc9ae823a80459b46c149e4f51680}},
|
116 |
note={Notion Blog},
|
117 |
year={2025}
|
|
|
3 |
- deepseek-ai/DeepSeek-R1-Distill-Qwen-32B
|
4 |
datasets:
|
5 |
- Skywork/Skywork-OR1-RL-Data
|
6 |
+
library_name: transformers
|
7 |
+
pipeline_tag: text-generation
|
8 |
+
license: apache-2.0
|
9 |
---
|
10 |
+
|
11 |
<div align="center">
|
12 |
|
13 |
# 🤔 Skywork-OR1 (Open Reasoner 1)
|
|
|
68 |
|-------|---------|---------|--------------|
|
69 |
| DeepSeek-R1-Distill-Qwen-7B | 55.5 | 39.2| 37.6 |
|
70 |
| Light-R1-7B-DS | 59.1 | 44.3| 39.5 |
|
71 |
+
| **Skywork-OR1-Math-7B** | 69.8 | 52.3 | 43.6 |
|
72 |
+
| **Skywork-OR1-7B-Preview** | 63.6 | 45.8 | 43.9 |
|
73 |
| DeepSeek-R1-Distill-Qwen-32B | 72.9 | 59.0| 57.2 |
|
74 |
| TinyR1-32B-Preview | 78.1| 65.3| 61.6 |
|
75 |
| QwQ-32B | 79.5 | 65.3| 61.6 |
|
|
|
|
|
|
|
76 |
| **Skywork-OR1-32B-Preview** | 79.7 | 69.0 | 63.9 |
|
77 |
|
78 |
## ⚙️ Training Recipe
|
|
|
114 |
|
115 |
@misc{skywork-or1-2025,
|
116 |
title={Skywork Open Reasoner Series},
|
117 |
+
author = {He, Jujie and Liu, Jiacai and Liu, Chris Yuhao and Yan, Rui and Wang, Chaojie and Cheng, Peng and Zhang, Xiaoyu and Zhang, Fuxiang and Xu, Jiacheng and Shen, Wei and Li, Siyuan and Zeng, Liang and Wei, Tianwen and Cheng, Cheng and An, Bo and Liu, Yang and Zhou, Yahui},
|
118 |
howpublished={\url{https://capricious-hydrogen-41c.notion.site/Skywork-Open-Reaonser-Series-1d0bc9ae823a80459b46c149e4f51680}},
|
119 |
note={Notion Blog},
|
120 |
year={2025}
|