Add question-answering pipeline tag and link to Hugging Face paper
Browse files
This PR updates the model card by:
- Adding `pipeline_tag: question-answering`, which is relevant to this model and makes it easier to discover on the Hub.
- Updating the paper link to the Hugging Face papers URL.
README.md
CHANGED
@@ -1,15 +1,16 @@
|
|
1 |
---
|
2 |
-
library_name: transformers
|
3 |
-
license: apache-2.0
|
4 |
base_model:
|
5 |
- Qwen/Qwen2.5-Math-7B
|
|
|
|
|
|
|
6 |
---
|
7 |
|
8 |
# Qwen2.5-Math-7B-Oat-Zero
|
9 |
|
10 |
## Links
|
11 |
|
12 |
-
- π [Paper](https://
|
13 |
- 💻 [GitHub](https://github.com/sail-sg/understand-r1-zero)
|
14 |
- 🤗 [Oat-Zero Collection](https://huggingface.co/collections/sail/oat-zero-understanding-r1-zero-like-training-67dcdb07b9f3eb05f1501c4a)
|
15 |
|
@@ -33,17 +34,24 @@ import vllm
|
|
33 |
|
34 |
def apply_qwen_math_template(question: str):
|
35 |
return (
|
36 |
-
"<|im_start|>system
|
|
|
|
|
|
|
37 |
+ question
|
38 |
-
+ "<|im_end
|
|
|
|
|
39 |
)
|
40 |
|
41 |
def apply_r1_template(question: str):
|
42 |
return (
|
43 |
"A conversation between User and Assistant. The User asks a question, and the Assistant solves it. The Assistant first thinks about the reasoning process in the mind and then provides the User with the answer. "
|
44 |
-
"The reasoning process is enclosed within <think> </think> and answer is enclosed within <answer> </answer> tags, respectively, i.e., <think> reasoning process here </think> <answer> answer here </answer
|
|
|
45 |
+ question
|
46 |
-
+ "
|
|
|
47 |
)
|
48 |
|
49 |
model_name = "sail/Qwen2.5-Math-7B-Oat-Zero"
|
@@ -85,4 +93,4 @@ print(outputs)
|
|
85 |
year={2025},
|
86 |
howpublished={\url{https://github.com/sail-sg/understand-r1-zero}},
|
87 |
}
|
88 |
-
```
|
|
|
1 |
---
|
|
|
|
|
2 |
base_model:
|
3 |
- Qwen/Qwen2.5-Math-7B
|
4 |
+
library_name: transformers
|
5 |
+
license: apache-2.0
|
6 |
+
pipeline_tag: question-answering
|
7 |
---
|
8 |
|
9 |
# Qwen2.5-Math-7B-Oat-Zero
|
10 |
|
11 |
## Links
|
12 |
|
13 |
+
- 📄 [Paper](https://huggingface.co/papers/2503.20783)
|
14 |
- 💻 [GitHub](https://github.com/sail-sg/understand-r1-zero)
|
15 |
- 🤗 [Oat-Zero Collection](https://huggingface.co/collections/sail/oat-zero-understanding-r1-zero-like-training-67dcdb07b9f3eb05f1501c4a)
|
16 |
|
|
|
34 |
|
35 |
def apply_qwen_math_template(question: str):
|
36 |
return (
|
37 |
+
"<|im_start|>system
|
38 |
+
Please reason step by step, and put your final answer within \\boxed{}.<|im_end|>
|
39 |
+
<|im_start|>user
|
40 |
+
"
|
41 |
+ question
|
42 |
+
+ "<|im_end|>
|
43 |
+
<|im_start|>assistant
|
44 |
+
"
|
45 |
)
|
46 |
|
47 |
def apply_r1_template(question: str):
|
48 |
return (
|
49 |
"A conversation between User and Assistant. The User asks a question, and the Assistant solves it. The Assistant first thinks about the reasoning process in the mind and then provides the User with the answer. "
|
50 |
+
"The reasoning process is enclosed within <think> </think> and answer is enclosed within <answer> </answer> tags, respectively, i.e., <think> reasoning process here </think> <answer> answer here </answer>.
|
51 |
+
User: "
|
52 |
+ question
|
53 |
+
+ "
|
54 |
+
Assistant: <think>"
|
55 |
)
|
56 |
|
57 |
model_name = "sail/Qwen2.5-Math-7B-Oat-Zero"
|
|
|
93 |
year={2025},
|
94 |
howpublished={\url{https://github.com/sail-sg/understand-r1-zero}},
|
95 |
}
|
96 |
+
```
|