daresearch committed on
Commit
a35a06c
·
verified ·
1 Parent(s): a244f90

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +3 -3
app.py CHANGED
@@ -12,7 +12,7 @@ from transformers import TrainingArguments
12
  from unsloth import is_bfloat16_supported
13
 
14
  # 1. Configuration
15
- max_seq_length = 2048
16
  dtype = None
17
  load_in_4bit = True
18
 
@@ -127,8 +127,8 @@ trainer = SFTTrainer(
127
  dataset_num_proc=2,
128
  packing=False, # Can make training 5x faster for short sequences.
129
  args=TrainingArguments(
130
- per_device_train_batch_size=8,
131
- gradient_accumulation_steps=4,
132
  warmup_steps=5,
133
  max_steps=-1,
134
  num_train_epochs=3,
 
12
  from unsloth import is_bfloat16_supported
13
 
14
  # 1. Configuration
15
+ max_seq_length = 1024
16
  dtype = None
17
  load_in_4bit = True
18
 
 
127
  dataset_num_proc=2,
128
  packing=False, # Can make training 5x faster for short sequences.
129
  args=TrainingArguments(
130
+ per_device_train_batch_size=32,
131
+ gradient_accumulation_steps=2,
132
  warmup_steps=5,
133
  max_steps=-1,
134
  num_train_epochs=3,