Model save
Browse files
- README.md +3 -6
- all_results.json +4 -4
- runs/Jun04_13-49-16_cn-d004.server.mila.quebec/events.out.tfevents.1749059573.cn-d004.server.mila.quebec.3254818.0 +3 -0
- train_results.json +4 -4
- trainer_state.json +4 -4
- training_DATA/plots/barycenters_delta.png +0 -0
- training_DATA/plots/distribution_step_18.png +0 -0
- training_DATA/plots/distribution_step_24.png +0 -0
- training_DATA/plots/distribution_step_6.png +0 -0
- training_DATA/plots/log_ratios_evolution.png +0 -0
- training_DATA/plots/loss_evolution.png +0 -0
- training_DATA/plots/qq_plots_evolution.png +2 -2
- training_DATA/plots/qq_plots_step_24.png +0 -0
- training_DATA/plots/quantile_percentile_all_step_24.png +0 -0
- training_args.bin +1 -1
README.md
CHANGED
@@ -1,20 +1,17 @@
|
|
1 |
---
|
2 |
base_model: mistralai/Mistral-7B-v0.1
|
3 |
-
datasets: HuggingFaceH4/ultrafeedback_binarized
|
4 |
library_name: transformers
|
5 |
-
model_name:
|
6 |
tags:
|
7 |
- generated_from_trainer
|
8 |
-
- alignment-handbook
|
9 |
-
- HuggingFaceH4/ultrafeedback_binarized
|
10 |
- trl
|
11 |
- dpo
|
12 |
licence: license
|
13 |
---
|
14 |
|
15 |
-
# Model Card for
|
16 |
|
17 |
-
This model is a fine-tuned version of [mistralai/Mistral-7B-v0.1](https://huggingface.co/mistralai/Mistral-7B-v0.1)
|
18 |
It has been trained using [TRL](https://github.com/huggingface/trl).
|
19 |
|
20 |
## Quick start
|
|
|
1 |
---
|
2 |
base_model: mistralai/Mistral-7B-v0.1
|
|
|
3 |
library_name: transformers
|
4 |
+
model_name: math_ultrachatmistral32_4_3
|
5 |
tags:
|
6 |
- generated_from_trainer
|
|
|
|
|
7 |
- trl
|
8 |
- dpo
|
9 |
licence: license
|
10 |
---
|
11 |
|
12 |
+
# Model Card for math_ultrachatmistral32_4_3
|
13 |
|
14 |
+
This model is a fine-tuned version of [mistralai/Mistral-7B-v0.1](https://huggingface.co/mistralai/Mistral-7B-v0.1).
|
15 |
It has been trained using [TRL](https://github.com/huggingface/trl).
|
16 |
|
17 |
## Quick start
|
all_results.json
CHANGED
@@ -14,9 +14,9 @@
|
|
14 |
"eval_samples_per_second": 17.291,
|
15 |
"eval_steps_per_second": 0.139,
|
16 |
"total_flos": 0.0,
|
17 |
-
"train_loss": 0.
|
18 |
-
"train_runtime":
|
19 |
"train_samples": 5776,
|
20 |
-
"train_samples_per_second":
|
21 |
-
"train_steps_per_second":
|
22 |
}
|
|
|
14 |
"eval_samples_per_second": 17.291,
|
15 |
"eval_steps_per_second": 0.139,
|
16 |
"total_flos": 0.0,
|
17 |
+
"train_loss": 0.0,
|
18 |
+
"train_runtime": 0.0144,
|
19 |
"train_samples": 5776,
|
20 |
+
"train_samples_per_second": 1249870.973,
|
21 |
+
"train_steps_per_second": 1671.509
|
22 |
}
|
runs/Jun04_13-49-16_cn-d004.server.mila.quebec/events.out.tfevents.1749059573.cn-d004.server.mila.quebec.3254818.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dbedf723673ea5b0c9cf2b54b0ed8e90169a0a88308d9eff97076c66c64d3955
|
3 |
+
size 6427
|
train_results.json
CHANGED
@@ -1,9 +1,9 @@
|
|
1 |
{
|
2 |
"epoch": 1.0,
|
3 |
"total_flos": 0.0,
|
4 |
-
"train_loss": 0.
|
5 |
-
"train_runtime":
|
6 |
"train_samples": 5776,
|
7 |
-
"train_samples_per_second":
|
8 |
-
"train_steps_per_second":
|
9 |
}
|
|
|
1 |
{
|
2 |
"epoch": 1.0,
|
3 |
"total_flos": 0.0,
|
4 |
+
"train_loss": 0.0,
|
5 |
+
"train_runtime": 0.0144,
|
6 |
"train_samples": 5776,
|
7 |
+
"train_samples_per_second": 1249870.973,
|
8 |
+
"train_steps_per_second": 1671.509
|
9 |
}
|
trainer_state.json
CHANGED
@@ -43,10 +43,10 @@
|
|
43 |
"epoch": 1.0,
|
44 |
"step": 24,
|
45 |
"total_flos": 0.0,
|
46 |
-
"train_loss": 0.
|
47 |
-
"train_runtime":
|
48 |
-
"train_samples_per_second":
|
49 |
-
"train_steps_per_second":
|
50 |
}
|
51 |
],
|
52 |
"logging_steps": 20,
|
|
|
43 |
"epoch": 1.0,
|
44 |
"step": 24,
|
45 |
"total_flos": 0.0,
|
46 |
+
"train_loss": 0.0,
|
47 |
+
"train_runtime": 0.0144,
|
48 |
+
"train_samples_per_second": 1249870.973,
|
49 |
+
"train_steps_per_second": 1671.509
|
50 |
}
|
51 |
],
|
52 |
"logging_steps": 20,
|
training_DATA/plots/barycenters_delta.png
CHANGED
![]() |
![]() |
training_DATA/plots/distribution_step_18.png
ADDED
![]() |
training_DATA/plots/distribution_step_24.png
ADDED
![]() |
training_DATA/plots/distribution_step_6.png
ADDED
![]() |
training_DATA/plots/log_ratios_evolution.png
CHANGED
![]() |
![]() |
training_DATA/plots/loss_evolution.png
CHANGED
![]() |
![]() |
training_DATA/plots/qq_plots_evolution.png
CHANGED
![]() |
Git LFS Details
|
![]() |
Git LFS Details
|
training_DATA/plots/qq_plots_step_24.png
ADDED
![]() |
training_DATA/plots/quantile_percentile_all_step_24.png
ADDED
![]() |
training_args.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 8209
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4ce2a6f13889d9d9ddb9f2427b82c40679930850515e595db3187099f489153a
|
3 |
size 8209
|