{
  "dataset_reader": {
    "type": "seq2rel",
    "max_length": 512,
    "source_token_indexers": {
      "tokens": {
        "type": "pretrained_transformer",
        "model_name": "microsoft/BiomedNLP-PubMedBERT-base-uncased-abstract-fulltext",
        "tokenizer_kwargs": {
          "additional_special_tokens": [
            "@ARG@",
            "@TRIGGER@"
          ],
          "do_lower_case": true
        }
      }
    },
    "source_tokenizer": {
      "type": "pretrained_transformer",
      "add_special_tokens": true,
      "max_length": 512,
      "model_name": "microsoft/BiomedNLP-PubMedBERT-base-uncased-abstract-fulltext",
      "tokenizer_kwargs": {
        "additional_special_tokens": [
          "@ARG@",
          "@TRIGGER@"
        ],
        "do_lower_case": true
      }
    },
    "target_namespace": "target_tokens",
    "target_tokenizer": {
      "type": "pretrained_transformer",
      "add_special_tokens": false,
      "model_name": "microsoft/BiomedNLP-PubMedBERT-base-uncased-abstract-fulltext",
      "tokenizer_kwargs": {
        "additional_special_tokens": [
          "@ARG@",
          "@TRIGGER@",
          "@OSP@",
          "@start@",
          "@end@",
          ";"
        ],
        "do_lower_case": true
      }
    }
  },
  "model": {
    "type": "copynet_seq2rel",
    "attention": {
      "type": "multihead_attention",
      "dropout": 0.1,
      "num_heads": 6
    },
    "beam_search": {
      "beam_size": 1,
      "final_sequence_scorer": {
        "type": "length-normalized-sequence-log-prob",
        "length_penalty": 1
      },
      "max_steps": 96
    },
    "dropout": 0.1,
    "sequence_based_metrics": [
      {
        "average": "micro",
        "labels": [
          "OSP"
        ],
        "remove_duplicate_ents": true,
        "type": "f1_seq2rel"
      }
    ],
    "source_embedder": {
      "token_embedders": {
        "tokens": {
          "type": "pretrained_transformer",
          "model_name": "microsoft/BiomedNLP-PubMedBERT-base-uncased-abstract-fulltext",
          "reinit_modules": 2,
          "tokenizer_kwargs": {
            "additional_special_tokens": [
              "@ARG@",
              "@TRIGGER@"
            ],
            "do_lower_case": true
          }
        }
      }
    },
    "target_embedding_dim": 256,
    "target_tokenizer": {
      "type": "pretrained_transformer",
      "add_special_tokens": false,
      "model_name": "microsoft/BiomedNLP-PubMedBERT-base-uncased-abstract-fulltext",
      "tokenizer_kwargs": {
        "additional_special_tokens": [
          "@ARG@",
          "@TRIGGER@",
          "@OSP@",
          "@start@",
          "@end@",
          ";"
        ],
        "do_lower_case": true
      }
    },
    "weight_dropout": 0.5
  },
  "train_data_path": "../granular/train_transform.tsv",
  "validation_data_path": "../granular/dev_transform.tsv",
  "trainer": {
    "callbacks": [
      {
        "type": "should_validate_callback",
        "validation_interval": 1,
        "validation_start": 15
      }
    ],
    "checkpointer": {
      "keep_most_recent_by_count": 1
    },
    "grad_norm": 1,
    "learning_rate_scheduler": {
      "type": "linear_with_warmup",
      "warmup_steps": 2906
    },
    "num_epochs": 25,
    "num_gradient_accumulation_steps": 1,
    "optimizer": {
      "type": "huggingface_adamw",
      "correct_bias": true,
      "eps": 1e-08,
      "lr": 0.0004,
      "parameter_groups": [
        [
          [
            "transformer_model(?!.*(?:bias|LayerNorm|layer_norm))"
          ],
          {
            "lr": 2e-05,
            "weight_decay": 0.01
          }
        ],
        [
          [
            "transformer_model(?=.*(?:bias|LayerNorm|layer_norm))"
          ],
          {
            "lr": 2e-05,
            "weight_decay": 0
          }
        ]
      ],
      "weight_decay": 0
    },
    "use_amp": true,
    "validation_metric": "+fscore"
  },
  "vocabulary": {
    "max_vocab_size": {
      "target_tokens": 1
    },
    "tokens_to_add": {
      "target_tokens": [
        "@ARG@",
        "@TRIGGER@",
        "@OSP@",
        "@start@",
        "@end@",
        ";"
      ]
    }
  },
  "data_loader": {
    "batch_sampler": {
      "type": "bucket",
      "batch_size": 4,
      "sorting_keys": [
        "source_tokens"
      ]
    }
  },
  "validation_data_loader": {
    "batch_sampler": {
      "type": "bucket",
      "batch_size": 128,
      "padding_noise": 0,
      "sorting_keys": [
        "source_tokens"
      ]
    }
  }
}