relik-entity-linking / relik /retriever /conf /data /in_batch_negatives.yaml
riccorl's picture
first commit
626eca0
raw
history blame
No virus
1.51 kB
# Values shared by the train/val/test dataset entries in this file. Those
# entries read them through `${data.shared_params.<key>}` interpolations
# instead of repeating the literals, so changing a value here changes it for
# every split at once.
shared_params:
  # Left null here; presumably supplied by an override — TODO confirm.
  passages_path: null
  max_passage_length: 64
  prefetch_batches: true
  use_topics: false
# Data module configuration. Each `_target_` holds the dotted path of the
# class that node describes (Hydra-style instantiation — confirm against the
# loader); the sibling keys are the settings passed along with it.
datamodule:
  _target_: goldenretriever.lightning_modules.pl_data_modules.PLDataModule
  # Resolved from the `model` config, which is defined outside this file.
  tokenizer: ${model.language_model}

  datasets:
    # Training split: a single dataset mapping (not a list). It is the only
    # split that sets `subsample` and `shuffle`.
    train:
      _target_: goldenretriever.data.dpr.datasets.InBatchNegativesDPRDataset
      name: "train"
      path: null
      passages_path: ${data.shared_params.passages_path}
      max_passage_length: ${data.shared_params.max_passage_length}
      prefetch_batches: ${data.shared_params.prefetch_batches}
      subsample: null
      shuffle: true
      use_topics: ${data.shared_params.use_topics}

    # Validation split: a one-item list of dataset mappings.
    val:
      - _target_: goldenretriever.data.dpr.datasets.InBatchNegativesDPRDataset
        name: "val"
        path: null
        passages_path: ${data.shared_params.passages_path}
        max_passage_length: ${data.shared_params.max_passage_length}
        prefetch_batches: ${data.shared_params.prefetch_batches}
        use_topics: ${data.shared_params.use_topics}

    # Test split: a one-item list of dataset mappings, same fields as `val`.
    test:
      - _target_: goldenretriever.data.dpr.datasets.InBatchNegativesDPRDataset
        name: "test"
        path: null
        passages_path: ${data.shared_params.passages_path}
        max_passage_length: ${data.shared_params.max_passage_length}
        prefetch_batches: ${data.shared_params.prefetch_batches}
        use_topics: ${data.shared_params.use_topics}

  # NOTE(review): `batch_sizes` and `num_workers` are assumed to be settings of
  # the data module alongside `datasets`, keyed by split name — confirm against
  # the PLDataModule constructor signature.
  batch_sizes:
    train: 64
    val: 64
    test: 64

  num_workers:
    train: 4
    val: 4
    test: 4