Luigi committed on
Commit
976c215
·
1 Parent(s): 38e2b45

adjust hyper-parameters

Browse files
Files changed (1) hide show
  1. train_with_unsloth.py +2 -2
train_with_unsloth.py CHANGED
@@ -92,8 +92,8 @@ class LoggingSFTTrainer(SFTTrainer):
92
  PROJECT_NAME = 'SmolLM2-360M-Instruct-TaiwanChat'
93
  BASE_MODEL_ID = "unsloth/SmolLM2-360M-Instruct"
94
  DATASET_ID = "yentinglin/TaiwanChat"
95
- N_SAMPLES = 800000
96
- MAX_LEN = 2048
97
 
98
  # CUDA and W&B setup
99
  os.environ["PYTORCH_CUDA_ALLOC_CONF"] = "expandable_segments:True,max_split_size_mb:128"
 
92
  PROJECT_NAME = 'SmolLM2-360M-Instruct-TaiwanChat'
93
  BASE_MODEL_ID = "unsloth/SmolLM2-360M-Instruct"
94
  DATASET_ID = "yentinglin/TaiwanChat"
95
+ N_SAMPLES = 600000
96
+ MAX_LEN = 512
97
 
98
  # CUDA and W&B setup
99
  os.environ["PYTORCH_CUDA_ALLOC_CONF"] = "expandable_segments:True,max_split_size_mb:128"