# riccorl's picture
# first commit
# 626eca0
# raw
# history blame
# 1.66 kB
# Data configuration for the retriever.
# NOTE(review): the nesting below was reconstructed from a copy whose
# indentation had been lost; confirm it against the consumer's schema,
# in particular that `num_workers` belongs under `datamodule`.

# Values shared by the dataset entries below through
# `${data.shared_params.*}` interpolations.
shared_params:
  # Not referenced elsewhere in this file.
  passages_path: null
  max_passage_length: 64
  passage_batch_size: 64
  question_batch_size: 64
  use_topics: false

datamodule:
  _target_: relik.retriever.lightning_modules.pl_data_modules.GoldenRetrieverPLDataModule
  datasets:
    # `train` is a single dataset mapping; `val` and `test` are lists.
    train:
      _target_: relik.retriever.data.datasets.AidaInBatchNegativesDataset
      name: "train"
      # Left null here; presumably supplied by an override -- TODO confirm.
      path: null
      # Resolved from the `model` config, which is outside this file.
      tokenizer: ${model.language_model}
      max_passage_length: ${data.shared_params.max_passage_length}
      question_batch_size: ${data.shared_params.question_batch_size}
      passage_batch_size: ${data.shared_params.passage_batch_size}
      subsample_strategy: null
      subsample_portion: 0.1
      shuffle: true
      use_topics: ${data.shared_params.use_topics}

    val:
      - _target_: relik.retriever.data.datasets.AidaInBatchNegativesDataset
        name: "val"
        path: null
        tokenizer: ${model.language_model}
        max_passage_length: ${data.shared_params.max_passage_length}
        question_batch_size: ${data.shared_params.question_batch_size}
        passage_batch_size: ${data.shared_params.passage_batch_size}
        use_topics: ${data.shared_params.use_topics}

    test:
      - _target_: relik.retriever.data.datasets.AidaInBatchNegativesDataset
        name: "test"
        path: null
        tokenizer: ${model.language_model}
        max_passage_length: ${data.shared_params.max_passage_length}
        question_batch_size: ${data.shared_params.question_batch_size}
        passage_batch_size: ${data.shared_params.passage_batch_size}
        use_topics: ${data.shared_params.use_topics}

  # One worker count per dataset split.
  num_workers:
    train: 4
    val: 4
    test: 4