luismsgomes's picture
added model
472e467
raw
history blame
803 Bytes
trainer: "gist"
model_name: "albertina-900m-ptpt-mmarco-pairs-gist1-v1"
base_model_name: "albertina-900m-ptpt-europarl-eubookshop-ted2020-tatoeba-ct1-nli-gist10-sts-cosent20-v1"
guide_model_name: "bertimbau-100m-europarl-eubookshop-ted2020-tatoeba-ct1-nli-gist10-sts-cosent20-v1"
validation_ir: True
validation_ir_corpus_size: 50000
# validation_ir_corpus_size: 500
# see https://huggingface.co/docs/datasets/v2.18.0/en/about_dataset_load
train_dataset_configs:
- alias: "mmarco"
path: "unicamp-dl/mmarco"
name: "portuguese"
split: "train"
# split: "train[1000:2000]"
examples_are_triples: False
examples_are_labelled: False
seed: 1
learning_rate: 1e-6
warmup_ratio: 0.1
weight_decay: 0.01
batch_size: 40
use_amp: True
epochs: 1
# validations_per_epoch: 1
validations_per_epoch: 100