cpt core 4
Browse files
scripts/cpt_core_model_4.py
CHANGED
|
@@ -82,7 +82,7 @@ trainer = UnslothTrainer(
|
|
| 82 |
max_seq_length=max_seq_length,
|
| 83 |
dataset_num_proc=32,
|
| 84 |
max_steps=len(litgpt_streaming_dataset),
|
| 85 |
-
packing
|
| 86 |
|
| 87 |
args = UnslothTrainingArguments(
|
| 88 |
per_device_train_batch_size=16,
|
|
|
|
| 82 |
max_seq_length=max_seq_length,
|
| 83 |
dataset_num_proc=32,
|
| 84 |
max_steps=len(litgpt_streaming_dataset),
|
| 85 |
+
packing=False, # Can make training 5x faster for short sequences.
|
| 86 |
|
| 87 |
args = UnslothTrainingArguments(
|
| 88 |
per_device_train_batch_size=16,
|