adjust hyper-parameters
Browse files
- train_with_unsloth.py +2 -2
train_with_unsloth.py
CHANGED
|
@@ -92,8 +92,8 @@ class LoggingSFTTrainer(SFTTrainer):
|
|
| 92 |
PROJECT_NAME = 'SmolLM2-360M-Instruct-TaiwanChat'
|
| 93 |
BASE_MODEL_ID = "unsloth/SmolLM2-360M-Instruct"
|
| 94 |
DATASET_ID = "yentinglin/TaiwanChat"
|
| 95 |
-
N_SAMPLES =
|
| 96 |
-
MAX_LEN =
|
| 97 |
|
| 98 |
# CUDA and W&B setup
|
| 99 |
os.environ["PYTORCH_CUDA_ALLOC_CONF"] = "expandable_segments:True,max_split_size_mb:128"
|
|
|
|
| 92 |
PROJECT_NAME = 'SmolLM2-360M-Instruct-TaiwanChat'
|
| 93 |
BASE_MODEL_ID = "unsloth/SmolLM2-360M-Instruct"
|
| 94 |
DATASET_ID = "yentinglin/TaiwanChat"
|
| 95 |
+
N_SAMPLES = 600000
|
| 96 |
+
MAX_LEN = 512
|
| 97 |
|
| 98 |
# CUDA and W&B setup
|
| 99 |
os.environ["PYTORCH_CUDA_ALLOC_CONF"] = "expandable_segments:True,max_split_size_mb:128"
|