diff --git a/olmocr/train/train.py b/olmocr/train/train.py index d5fd5b4..26e6843 100644 --- a/olmocr/train/train.py +++ b/olmocr/train/train.py @@ -276,6 +276,7 @@ def main(): if len(dataset) > 0: eval_datasets[dataset_name] = dataset + # Log total evaluation samples across all datasets total_eval_samples = sum(len(dataset) for dataset in eval_datasets.values()) logger.info(f"Total evaluation samples across {len(eval_datasets)} datasets: {total_eval_samples}")