---
# Training run configuration: model identifiers, validation settings,
# training dataset list, and optimisation hyperparameters.
# NOTE(review): the meaning of each key is inferred from its name only;
# confirm against the training script that consumes this file.

# Trainer selection and model identifiers.
trainer: "gist"
model_name: "albertina-900m-ptpt-mmarco-pairs-gist1-v1"
base_model_name: "albertina-900m-ptpt-europarl-eubookshop-ted2020-tatoeba-ct1-nli-gist10-sts-cosent20-v1"
guide_model_name: "bertimbau-100m-europarl-eubookshop-ted2020-tatoeba-ct1-nli-gist10-sts-cosent20-v1"

# Validation settings.
validation_ir: true
validation_ir_corpus_size: 50000

# Training datasets, one list entry per dataset. The fields of an entry must
# be indented under its `-` marker; at column 0 they would be read as
# top-level keys instead of belonging to the entry.
train_dataset_configs:
  - alias: "mmarco"
    path: "unicamp-dl/mmarco"
    name: "portuguese"
    split: "train"

# NOTE(review): these two flags are kept as top-level keys; confirm they are
# not meant to be fields of the dataset entry above.
examples_are_triples: false
examples_are_labelled: false

# Optimisation hyperparameters.
seed: 1
# Written with an explicit decimal point: YAML 1.1 loaders such as PyYAML
# resolve a bare `1e-6` to a string rather than a float.
learning_rate: 1.0e-6
warmup_ratio: 0.1
weight_decay: 0.01
batch_size: 40
use_amp: true
epochs: 1

validations_per_epoch: 100