---
# Training arguments, one top-level key per argument.
# NOTE(review): the key names look like a Sockeye `args.yaml` dump — confirm
# against the tool that consumes this file before hand-editing values.
allow_missing_params: false
amp: false
apex_amp: false
batch_sentences_multiple_of: 8
batch_size: 1025
batch_type: word
bow_task_pos_weight: 10
bow_task_weight: 1.0
bucket_scaling: false
bucket_width: 8
cache_last_best_params: 0
cache_metric: perplexity
cache_strategy: best
checkpoint_improvement_threshold: 0.0
checkpoint_interval: 1000
clamp_to_dtype: false
config: null
decode_and_evaluate: 1000
decoder: transformer
deepspeed_bf16: false
deepspeed_fp16: false
device_id: 0
dist: false
dry_run: false
dtype: float32
embed_dropout:
- 0.5
- 0.5
encoder: transformer
end_of_prepending_tag: null
env: null
fixed_param_names: []
fixed_param_strategy: null
gradient_clipping_threshold: 1.0
gradient_clipping_type: none
ignore_extra_params: false
initial_learning_rate: 0.0002
keep_initializations: false
keep_last_params: -1
label_smoothing: 0.2
label_smoothing_impl: torch
learning_rate_reduce_factor: 0.7
learning_rate_reduce_num_not_improved: 8
learning_rate_scheduler_type: plateau-reduce
learning_rate_warmup: 1000
length_task: null
length_task_layers: 1
length_task_weight: 1.0
lhuc: null
local_rank: null
loglevel: INFO
loglevel_secondary_workers: INFO
max_checkpoints: null
max_num_checkpoint_not_improved: 100
max_num_epochs: null
max_samples: null
max_seconds: null
max_seq_len:
- 512
- 512
max_updates: null
min_num_epochs: 10
min_samples: null
min_updates: null
momentum: 0.0
neural_vocab_selection: null
neural_vocab_selection_block_loss: false
no_bucketing: true
no_logfile: false
no_reload_on_learning_rate_reduce: false
num_embed:
- null
- null
num_layers:
- 6
- 6
num_words:
- 0
- 0
optimized_metric: signwriting-similarity
optimizer: adam
optimizer_betas:
- 0.9
- 0.999
optimizer_eps: 1.0e-08
output: /shares/iict-sp2.ebling.cl.uzh/amoryo/checkpoints/signwriting-translation/spoken-to-signed/target-factors-gpt-tuned/model
overwrite_output: false
pad_vocab_to_multiple_of: 8
params: /shares/iict-sp2.ebling.cl.uzh/amoryo/checkpoints/signwriting-translation/spoken-to-signed/target-factors-gpt/model/params.best
prepared_data: /shares/iict-sp2.ebling.cl.uzh/amoryo/checkpoints/signwriting-translation/spoken-to-signed/target-factors-gpt-tuned/train_data
quiet: false
quiet_secondary_workers: false
seed: 1
shared_vocab: false
source: null
source_factor_vocabs: []
source_factors: []
source_factors_combine: []
source_factors_num_embed: []
source_factors_share_embedding: []
source_factors_use_source_vocab: []
source_vocab: null
stop_training_on_decoder_failure: false
target: null
target_factor_vocabs: []
target_factors: []
target_factors_combine:
- sum
- sum
- sum
- sum
target_factors_num_embed: []
target_factors_share_embedding:
- false
- false
- false
- false
target_factors_use_target_vocab: []
target_factors_weight:
- 0.2
target_vocab: null
tf32: true
transformer_activation_type:
- relu
- relu
transformer_attention_heads:
- 8
- 8
transformer_block_prepended_cross_attention: false
transformer_dropout_act:
- 0.2
- 0.2
transformer_dropout_attention:
- 0.2
- 0.2
transformer_dropout_prepost:
- 0.2
- 0.2
transformer_feed_forward_num_hidden:
- 2048
- 2048
transformer_feed_forward_use_glu: false
transformer_model_size:
- 512
- 512
transformer_positional_embedding_type: fixed
transformer_postprocess:
- dr
- dr
transformer_preprocess:
- n
- n
update_interval: 1
use_cpu: false
# NOTE(review): the validation_* paths below all point into a `test/`
# directory — confirm that using this split for validation is intended.
validation_source: /home/amoryo/sign-language/signwriting-translation/parallel-clean/spoken-to-signed/test/source.txt
validation_source_factors: []
validation_target: /home/amoryo/sign-language/signwriting-translation/parallel-clean/spoken-to-signed/test/target_0.txt
validation_target_factors:
- /home/amoryo/sign-language/signwriting-translation/parallel-clean/spoken-to-signed/test/target_1.txt
- /home/amoryo/sign-language/signwriting-translation/parallel-clean/spoken-to-signed/test/target_2.txt
- /home/amoryo/sign-language/signwriting-translation/parallel-clean/spoken-to-signed/test/target_3.txt
- /home/amoryo/sign-language/signwriting-translation/parallel-clean/spoken-to-signed/test/target_4.txt
weight_decay: 0.0
weight_tying_type: trg_softmax
word_min_count:
- 1
- 1