oabi committed on
Commit
5d78f2a
·
verified ·
1 Parent(s): 5fa3e67

Model save

Browse files
README.md CHANGED
@@ -1,20 +1,17 @@
1
  ---
2
  base_model: mistralai/Mistral-7B-v0.1
3
- datasets: HuggingFaceH4/ultrafeedback_binarized
4
  library_name: transformers
5
- model_name: mistralai/Mistral-7B-v0.1
6
  tags:
7
  - generated_from_trainer
8
- - alignment-handbook
9
- - HuggingFaceH4/ultrafeedback_binarized
10
  - trl
11
  - dpo
12
  licence: license
13
  ---
14
 
15
- # Model Card for mistralai/Mistral-7B-v0.1
16
 
17
- This model is a fine-tuned version of [mistralai/Mistral-7B-v0.1](https://huggingface.co/mistralai/Mistral-7B-v0.1) on the [HuggingFaceH4/ultrafeedback_binarized](https://huggingface.co/datasets/HuggingFaceH4/ultrafeedback_binarized) dataset.
18
  It has been trained using [TRL](https://github.com/huggingface/trl).
19
 
20
  ## Quick start
 
1
  ---
2
  base_model: mistralai/Mistral-7B-v0.1
 
3
  library_name: transformers
4
+ model_name: math_ultrachatmistral32_4_3
5
  tags:
6
  - generated_from_trainer
 
 
7
  - trl
8
  - dpo
9
  licence: license
10
  ---
11
 
12
+ # Model Card for math_ultrachatmistral32_4_3
13
 
14
+ This model is a fine-tuned version of [mistralai/Mistral-7B-v0.1](https://huggingface.co/mistralai/Mistral-7B-v0.1).
15
  It has been trained using [TRL](https://github.com/huggingface/trl).
16
 
17
  ## Quick start
all_results.json CHANGED
@@ -14,9 +14,9 @@
14
  "eval_samples_per_second": 17.291,
15
  "eval_steps_per_second": 0.139,
16
  "total_flos": 0.0,
17
- "train_loss": 0.676513671875,
18
- "train_runtime": 3055.0984,
19
  "train_samples": 5776,
20
- "train_samples_per_second": 5.874,
21
- "train_steps_per_second": 0.008
22
  }
 
14
  "eval_samples_per_second": 17.291,
15
  "eval_steps_per_second": 0.139,
16
  "total_flos": 0.0,
17
+ "train_loss": 0.0,
18
+ "train_runtime": 0.0144,
19
  "train_samples": 5776,
20
+ "train_samples_per_second": 1249870.973,
21
+ "train_steps_per_second": 1671.509
22
  }
runs/Jun04_13-49-16_cn-d004.server.mila.quebec/events.out.tfevents.1749059573.cn-d004.server.mila.quebec.3254818.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dbedf723673ea5b0c9cf2b54b0ed8e90169a0a88308d9eff97076c66c64d3955
3
+ size 6427
train_results.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "epoch": 1.0,
3
  "total_flos": 0.0,
4
- "train_loss": 0.676513671875,
5
- "train_runtime": 3055.0984,
6
  "train_samples": 5776,
7
- "train_samples_per_second": 5.874,
8
- "train_steps_per_second": 0.008
9
  }
 
1
  {
2
  "epoch": 1.0,
3
  "total_flos": 0.0,
4
+ "train_loss": 0.0,
5
+ "train_runtime": 0.0144,
6
  "train_samples": 5776,
7
+ "train_samples_per_second": 1249870.973,
8
+ "train_steps_per_second": 1671.509
9
  }
trainer_state.json CHANGED
@@ -43,10 +43,10 @@
43
  "epoch": 1.0,
44
  "step": 24,
45
  "total_flos": 0.0,
46
- "train_loss": 0.676513671875,
47
- "train_runtime": 3055.0984,
48
- "train_samples_per_second": 5.874,
49
- "train_steps_per_second": 0.008
50
  }
51
  ],
52
  "logging_steps": 20,
 
43
  "epoch": 1.0,
44
  "step": 24,
45
  "total_flos": 0.0,
46
+ "train_loss": 0.0,
47
+ "train_runtime": 0.0144,
48
+ "train_samples_per_second": 1249870.973,
49
+ "train_steps_per_second": 1671.509
50
  }
51
  ],
52
  "logging_steps": 20,
training_DATA/plots/barycenters_delta.png CHANGED
training_DATA/plots/distribution_step_18.png ADDED
training_DATA/plots/distribution_step_24.png ADDED
training_DATA/plots/distribution_step_6.png ADDED
training_DATA/plots/log_ratios_evolution.png CHANGED
training_DATA/plots/loss_evolution.png CHANGED
training_DATA/plots/qq_plots_evolution.png CHANGED

Git LFS Details

  • SHA256: eef8afc5554b9292dcaa8a02e6feb3f49d14582be29c3eefb3d52429db9fd4b5
  • Pointer size: 131 Bytes
  • Size of remote file: 107 kB

Git LFS Details

  • SHA256: 7d46a24ffc0692fb39913276c4b5821582e0b1e5e212537beb0ec1d9f0233438
  • Pointer size: 131 Bytes
  • Size of remote file: 112 kB
training_DATA/plots/qq_plots_step_24.png ADDED
training_DATA/plots/quantile_percentile_all_step_24.png ADDED
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6303bdf060efe7d91327d9dd58b2614aa6f548519c1a96381816ba3e68d68547
3
  size 8209
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4ce2a6f13889d9d9ddb9f2427b82c40679930850515e595db3187099f489153a
3
  size 8209