Update README.md
Browse files
README.md
CHANGED
@@ -9,18 +9,18 @@ tags:
|
|
9 |
licence: license
|
10 |
datasets:
|
11 |
- microsoft/orca-math-word-problems-200k
|
12 |
-
|
13 |
-
|
14 |
-
|
15 |
-
|
16 |
-
|
17 |
-
|
18 |
-
|
19 |
-
|
20 |
-
|
21 |
-
|
22 |
-
|
23 |
-
|
24 |
# - name: GSM8k (Few-Shot)
|
25 |
# type: GSM8k (Few-Shot)
|
26 |
# value: 63.31%
|
@@ -39,13 +39,12 @@ This model is a fine-tuned version of [Qwen/Qwen2.5-1.5B-Instruct](https://huggi
|
|
39 |
It has been trained using [TRL](https://github.com/huggingface/trl).
|
40 |
|
41 |
|
42 |
-
|
43 |
|
44 |
| Model | GSM8k 0-Shot | GSM8k Few-Shot |
|
45 |
|------------------------------------------|------------------|-------------------|
|
46 |
-
| Mistral-7B-v0.1 | 10 | 41 |
|
47 |
-
| Qwen2.5-1.5B-Thinking |
|
48 |
-
-->
|
49 |
|
50 |
## Training procedure
|
51 |
|
|
|
9 |
licence: license
|
10 |
datasets:
|
11 |
- microsoft/orca-math-word-problems-200k
|
12 |
+
model-index:
|
13 |
+
- name: Qwen2.5-1.5B-Thinking-v1.1
|
14 |
+
results:
|
15 |
+
- task:
|
16 |
+
type: text-generation
|
17 |
+
dataset:
|
18 |
+
name: GradeSchoolMath8K
|
19 |
+
type: openai/gsm8k
|
20 |
+
metrics:
|
21 |
+
- name: GSM8k (0-Shot)
|
22 |
+
type: GSM8k (0-Shot)
|
23 |
+
value: 17%
|
24 |
# - name: GSM8k (Few-Shot)
|
25 |
# type: GSM8k (Few-Shot)
|
26 |
# value: 63.31%
|
|
|
39 |
It has been trained using [TRL](https://github.com/huggingface/trl).
|
40 |
|
41 |
|
42 |
+
## Evals
|
43 |
|
44 |
| Model | GSM8k 0-Shot | GSM8k Few-Shot |
|
45 |
|------------------------------------------|------------------|-------------------|
|
46 |
+
| Mistral-7B-v0.1 | 10% | 41% |
|
47 |
+
| Qwen2.5-1.5B-Thinking | 17% | N/A |
|
|
|
48 |
|
49 |
## Training procedure
|
50 |
|