# Data configuration for retriever training.
# The interpolations below address this file as `data.*`, so it is expected to
# be composed under the `data` key of the root config.

# Values referenced by the dataset definitions below through
# ${data.shared_params.*} interpolation, so they only need changing here.
shared_params:
  # Not referenced elsewhere in this file; presumably set by an override or
  # read by another config group -- TODO confirm.
  passages_path: null
  max_passage_length: 64
  passage_batch_size: 64
  question_batch_size: 64
  use_topics: false

# NOTE(review): nesting was reconstructed from a flattened copy of this file;
# confirm that `num_workers` is a sibling of `datasets` under `datamodule`.
datamodule:
  # Dotted class path; presumably instantiated via Hydra's `_target_`
  # convention.
  _target_: relik.retriever.lightning_modules.pl_data_modules.GoldenRetrieverPLDataModule
  datasets:
    # `train` is a single dataset mapping, whereas `val` and `test` are lists
    # of dataset mappings (one entry each here).
    train:
      _target_: relik.retriever.data.datasets.AidaInBatchNegativesDataset
      name: "train"
      # Left null here; presumably supplied by an override -- TODO confirm.
      path: null
      # Resolved from the `model` section of the composed config.
      tokenizer: ${model.language_model}
      max_passage_length: ${data.shared_params.max_passage_length}
      question_batch_size: ${data.shared_params.question_batch_size}
      passage_batch_size: ${data.shared_params.passage_batch_size}
      # Subsampling options are set only for the training split.
      subsample_strategy: null
      subsample_portion: 0.1
      shuffle: true
      use_topics: ${data.shared_params.use_topics}

    val:
      - _target_: relik.retriever.data.datasets.AidaInBatchNegativesDataset
        name: "val"
        # Left null here; presumably supplied by an override -- TODO confirm.
        path: null
        tokenizer: ${model.language_model}
        max_passage_length: ${data.shared_params.max_passage_length}
        question_batch_size: ${data.shared_params.question_batch_size}
        passage_batch_size: ${data.shared_params.passage_batch_size}
        use_topics: ${data.shared_params.use_topics}

    test:
      - _target_: relik.retriever.data.datasets.AidaInBatchNegativesDataset
        name: "test"
        # Left null here; presumably supplied by an override -- TODO confirm.
        path: null
        tokenizer: ${model.language_model}
        max_passage_length: ${data.shared_params.max_passage_length}
        question_batch_size: ${data.shared_params.question_batch_size}
        passage_batch_size: ${data.shared_params.passage_batch_size}
        use_topics: ${data.shared_params.use_topics}

  # One worker count per split.
  num_workers:
    train: 4
    val: 4
    test: 4