ezzaldeen committed on
Commit
1d67b54
·
verified ·
1 Parent(s): 94d15da

End of training

Browse files
README.md CHANGED
@@ -16,7 +16,7 @@ should probably proofread and complete it, then remove this comment. -->
16
 
17
  # Qwen2.5-1.5B-Instruct-AraNews
18
 
19
- This model is a fine-tuned version of [Qwen/Qwen2.5-1.5B-Instruct](https://huggingface.co/Qwen/Qwen2.5-1.5B-Instruct) on an unknown dataset.
20
 
21
  ## Model description
22
 
 
16
 
17
  # Qwen2.5-1.5B-Instruct-AraNews
18
 
19
+ This model is a fine-tuned version of [Qwen/Qwen2.5-1.5B-Instruct](https://huggingface.co/Qwen/Qwen2.5-1.5B-Instruct) on the arabic_news_sammary_train dataset.
20
 
21
  ## Model description
22
 
all_results.json CHANGED
@@ -1,12 +1,12 @@
1
  {
2
  "epoch": 2.0,
3
  "eval_arabic_news_sammary_test_loss": 1.4771952629089355,
4
- "eval_arabic_news_sammary_test_runtime": 1.4541,
5
- "eval_arabic_news_sammary_test_samples_per_second": 6.877,
6
- "eval_arabic_news_sammary_test_steps_per_second": 6.877,
7
  "total_flos": 168628741816320.0,
8
- "train_loss": 1.7585566838582356,
9
- "train_runtime": 19.6571,
10
- "train_samples_per_second": 1.526,
11
- "train_steps_per_second": 0.305
12
  }
 
1
  {
2
  "epoch": 2.0,
3
  "eval_arabic_news_sammary_test_loss": 1.4771952629089355,
4
+ "eval_arabic_news_sammary_test_runtime": 1.7003,
5
+ "eval_arabic_news_sammary_test_samples_per_second": 5.881,
6
+ "eval_arabic_news_sammary_test_steps_per_second": 5.881,
7
  "total_flos": 168628741816320.0,
8
+ "train_loss": 0.0,
9
+ "train_runtime": 1.3096,
10
+ "train_samples_per_second": 7.636,
11
+ "train_steps_per_second": 1.527
12
  }
eval_results.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
  "epoch": 2.0,
3
  "eval_arabic_news_sammary_test_loss": 1.4771952629089355,
4
- "eval_arabic_news_sammary_test_runtime": 1.4541,
5
- "eval_arabic_news_sammary_test_samples_per_second": 6.877,
6
- "eval_arabic_news_sammary_test_steps_per_second": 6.877
7
  }
 
1
  {
2
  "epoch": 2.0,
3
  "eval_arabic_news_sammary_test_loss": 1.4771952629089355,
4
+ "eval_arabic_news_sammary_test_runtime": 1.7003,
5
+ "eval_arabic_news_sammary_test_samples_per_second": 5.881,
6
+ "eval_arabic_news_sammary_test_steps_per_second": 5.881
7
  }
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "epoch": 2.0,
3
  "total_flos": 168628741816320.0,
4
- "train_loss": 1.7585566838582356,
5
- "train_runtime": 19.6571,
6
- "train_samples_per_second": 1.526,
7
- "train_steps_per_second": 0.305
8
  }
 
1
  {
2
  "epoch": 2.0,
3
  "total_flos": 168628741816320.0,
4
+ "train_loss": 0.0,
5
+ "train_runtime": 1.3096,
6
+ "train_samples_per_second": 7.636,
7
+ "train_steps_per_second": 1.527
8
  }
trainer_state.json CHANGED
@@ -12,16 +12,16 @@
12
  "epoch": 2.0,
13
  "step": 6,
14
  "total_flos": 168628741816320.0,
15
- "train_loss": 1.7585566838582356,
16
- "train_runtime": 19.6571,
17
- "train_samples_per_second": 1.526,
18
- "train_steps_per_second": 0.305
19
  }
20
  ],
21
  "logging_steps": 10,
22
- "max_steps": 6,
23
  "num_input_tokens_seen": 0,
24
- "num_train_epochs": 3,
25
  "save_steps": 500,
26
  "stateful_callbacks": {
27
  "TrainerControl": {
 
12
  "epoch": 2.0,
13
  "step": 6,
14
  "total_flos": 168628741816320.0,
15
+ "train_loss": 0.0,
16
+ "train_runtime": 1.3096,
17
+ "train_samples_per_second": 7.636,
18
+ "train_steps_per_second": 1.527
19
  }
20
  ],
21
  "logging_steps": 10,
22
+ "max_steps": 2,
23
  "num_input_tokens_seen": 0,
24
+ "num_train_epochs": 1,
25
  "save_steps": 500,
26
  "stateful_callbacks": {
27
  "TrainerControl": {