This commit is contained in:
Jake Poznanski 2024-09-27 01:19:21 +00:00
parent c00e40d1c4
commit 37f10051f6

View File

@@ -144,7 +144,7 @@ def run_train(config: TrainConfig):
validation_ds = dataset["validation"]
train_ds = train_ds.map(partial(prepare_data_for_qwen2_training, processor=processor, add_batch_dim=True), remove_columns=train_ds.column_names).filter(filter_by_max_seq_len)
-validation_ds = validation_ds.map(partial(prepare_data_for_qwen2_training, processor=processor, add_batch_dim=True)), remove_columns=validation_ds.column_names)
+validation_ds = validation_ds.map(partial(prepare_data_for_qwen2_training, processor=processor, add_batch_dim=True), remove_columns=validation_ds.column_names)
print(train_ds)
print(validation_ds)