blue-onuii committed on
Commit
23acac0
·
verified ·
1 Parent(s): 09a026c

Upload training_args.json with huggingface_hub

Browse files
Files changed (1) hide show
  1. training_args.json +30 -0
training_args.json ADDED
@@ -0,0 +1,30 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "run_name": "kanana-cpt-qlora-sft-lora-concrete-250409",
3
+ "model_name": "Onuii/DAMI-base-merge-0408",
4
+ "dataset_name": "Onuii/DAMI-lecture-DB-Dataset-0408-concrete",
5
+ "max_seq_length": 8192,
6
+ "dtype": "bfloat16",
7
+ "load_in_4bit": true,
8
+ "r": 16,
9
+ "lora_alpha": 32,
10
+ "lora_dropout": 0.1,
11
+ "use_rslora": true,
12
+ "batch_size": 16,
13
+ "gradient_accumulation_steps": 2,
14
+ "learning_rate": 1e-05,
15
+ "warmup_ratio": 0.05,
16
+ "num_train_epochs": 4,
17
+ "optimizer": "adamw_8bit",
18
+ "weight_decay": 0.01,
19
+ "lr_scheduler_type": "linear",
20
+ "output_dir": "../outputs/kanana-cpt-qlora-sft-lora-concrete-250409",
21
+ "logging_dir": "../logs",
22
+ "logging_steps": 1,
23
+ "save_steps": 200,
24
+ "save_total_limit": 2,
25
+ "report_to": "wandb",
26
+ "use_gradient_checkpointing": true,
27
+ "save_strategy": "steps",
28
+ "random_seed": 562,
29
+ "hyperparameter_dir": "../hyperparameters"
30
+ }