# Data configuration: shared dataset parameters plus the datamodule that
# consumes them.

# Values defined once here and pulled into every dataset entry below through
# `${data.shared_params.*}` interpolation.
# NOTE(review): the `data.` prefix in those interpolations implies this file
# is mounted under the `data` key of the composed config - confirm.
shared_params:
  passages_path: null
  max_passage_length: 64
  prefetch_batches: true
  use_topics: false

datamodule:
  _target_: goldenretriever.lightning_modules.pl_data_modules.PLDataModule
  # Resolved from the `model` section of the composed config.
  tokenizer: ${model.language_model}
  datasets:
    # `train` is a single dataset mapping; `val` and `test` are lists of
    # dataset mappings (one entry each here).
    train:
      _target_: goldenretriever.data.dpr.datasets.InBatchNegativesDPRDataset
      name: "train"
      path: null
      passages_path: ${data.shared_params.passages_path}
      max_passage_length: ${data.shared_params.max_passage_length}
      prefetch_batches: ${data.shared_params.prefetch_batches}
      subsample: null
      shuffle: true
      use_topics: ${data.shared_params.use_topics}
    val:
      - _target_: goldenretriever.data.dpr.datasets.InBatchNegativesDPRDataset
        name: "val"
        path: null
        passages_path: ${data.shared_params.passages_path}
        max_passage_length: ${data.shared_params.max_passage_length}
        prefetch_batches: ${data.shared_params.prefetch_batches}
        use_topics: ${data.shared_params.use_topics}
    test:
      - _target_: goldenretriever.data.dpr.datasets.InBatchNegativesDPRDataset
        name: "test"
        path: null
        passages_path: ${data.shared_params.passages_path}
        max_passage_length: ${data.shared_params.max_passage_length}
        prefetch_batches: ${data.shared_params.prefetch_batches}
        use_topics: ${data.shared_params.use_topics}

  # NOTE(review): `batch_sizes` and `num_workers` are placed under
  # `datamodule` on the assumption that they are constructor arguments of the
  # `_target_` class, keyed by split name - confirm against PLDataModule.
  batch_sizes:
    train: 64
    val: 64
    test: 64

  num_workers:
    train: 4
    val: 4
    test: 4