# Extraction residue from a file viewer, kept as comments so the document parses:
# File size: 1,144 Bytes
# Short hashes shown beside the listing (presumably revisions): d055e04, 3b4f698
---
# Bi-encoder model settings.
#
# The two encoder sections carry the same six keys (base_model_id,
# max_seq_len, pretrained, norm, shift_vocab_num, prefix). Written at a single
# level they are duplicate keys and a parser keeps only one value for each, so
# each set is nested under its own encoder mapping.
# NOTE(review): the nesting was reconstructed from the repeated key sets and
# the `encoder_q.` / `encoder_p.` prefixes; placing both encoders under
# `biencoder` is an assumption -- confirm against the consumer's schema.
biencoder:
  alias: vdr
  sequence_length: 512
  dropout: 0.1
  shared_encoder: false
  semiparametric: true
  device: null
  # Query-side encoder.
  encoder_q:
    base_model_id: bert-base-uncased
    max_seq_len: 128
    pretrained: true
    norm: false
    shift_vocab_num: 1000
    prefix: encoder_q.
  # Passage-side encoder; differs from encoder_q in max_seq_len and prefix.
  encoder_p:
    base_model_id: bert-base-uncased
    max_seq_len: 256
    pretrained: true
    norm: false
    shift_vocab_num: 1000
    prefix: encoder_p.
# Dataset selection. Each entry is a dataset identifier string.
train_datasets:
  - dl
  - cm
dev_datasets:
  - marco_dev_30neg

# Left unset (null) in this file.
datastore: null
output_dir: null
train_sampling_rates: null
# Batch size and epoch-based schedule.
batch_size: 256
num_train_epochs: 5
num_warmup_epochs: 1
num_save_epochs: 1
num_eval_epochs: 1

# Negative-sample counts; all zero in this configuration.
hard_negatives: 0
other_negatives: 0
ret_negatives: 0

train_insert_title: true
valid_insert_title: false

# Optimiser settings.
# Written with an explicit fractional digit; same float value as `1.e-8`.
adam_eps: 1.0e-8
# A parenthesised pair is not YAML collection syntax, so this loads as the
# string "(0.9, 0.999)". Quoted to make the string type explicit.
# NOTE(review): if the consumer wants two floats, `[0.9, 0.999]` would be the
# YAML-native form -- confirm how this value is parsed before changing it.
adam_betas: '(0.9, 0.999)'
learning_rate: 0.00002
max_grad_norm: 2
weight_decay: 0

# Step intervals for logging and the rolling training loss.
log_batch_step: 100
train_rolling_loss_step: 100

sym_loss: true
do_lower_case: true
seed: 12345
# Checkpoint naming and runtime / distributed settings.
checkpoint_file_name: vdr
model_file: null
local_rank: -1
# NOTE(review): `local-rank` differs from `local_rank` above only in its
# separator, yet holds a different value (2 vs -1). Which key the consumer
# reads is not visible here -- confirm, then drop the unused one.
local-rank: 2
# NOTE(review): `device` also appears among the bi-encoder settings earlier in
# the file. If both entries sit at the same mapping level this is a duplicate
# key and most parsers silently keep the last one; both are null here.
device: null
distributed_world_size: null
distributed_port: null
no_cuda: false
n_gpu: null
fp16: true
# License identifier stored alongside the configuration.
license: mit
---