Skip to content

Commit 1e5b0b7

Browse files
committed
update data collator swap logic (?)
1 parent 42a0a25 commit 1e5b0b7

File tree

1 file changed

+6
-2
lines changed

1 file changed

+6
-2
lines changed

unsloth_zoo/dataset_utils.py

Lines changed: 6 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -364,8 +364,12 @@ def _train_on_responses_only(examples):
364364

365365
# Edit data collator as well if not DataCollatorForSeq2Seq
366366
from transformers import DataCollatorForSeq2Seq
367-
if hasattr(trainer, "data_collator") and \
368-
not isinstance(trainer.data_collator, DataCollatorForSeq2Seq):
367+
packing_enabled = getattr(trainer.args, "packing", False)
368+
if (
369+
hasattr(trainer, "data_collator")
370+
and not isinstance(trainer.data_collator, DataCollatorForSeq2Seq)
371+
and not packing_enabled
372+
):
369373
trainer.data_collator = DataCollatorForSeq2Seq(tokenizer = tokenizer)
370374

371375
# Check if all labels randomly got masked to nothing - maybe wrong chat template?

0 commit comments

Comments
 (0)