MenahemOz's picture
Upload folder using huggingface_hub
5c058d4
{
  "dataset_reader": {
    "type": "seq2rel",
    "max_length": 512,
    "source_token_indexers": {
      "tokens": {
        "type": "pretrained_transformer",
        "model_name": "microsoft/BiomedNLP-PubMedBERT-base-uncased-abstract-fulltext",
        "tokenizer_kwargs": {
          "additional_special_tokens": ["@ARG@", "@TRIGGER@"],
          "do_lower_case": true
        }
      }
    },
    "source_tokenizer": {
      "type": "pretrained_transformer",
      "add_special_tokens": true,
      "max_length": 512,
      "model_name": "microsoft/BiomedNLP-PubMedBERT-base-uncased-abstract-fulltext",
      "tokenizer_kwargs": {
        "additional_special_tokens": ["@ARG@", "@TRIGGER@"],
        "do_lower_case": true
      }
    },
    "target_namespace": "target_tokens",
    "target_tokenizer": {
      "type": "pretrained_transformer",
      "add_special_tokens": false,
      "model_name": "microsoft/BiomedNLP-PubMedBERT-base-uncased-abstract-fulltext",
      "tokenizer_kwargs": {
        "additional_special_tokens": ["@ARG@", "@TRIGGER@", "@OSP@", "@start@", "@end@", ";"],
        "do_lower_case": true
      }
    }
  },
  "model": {
    "type": "copynet_seq2rel",
    "attention": {
      "type": "multihead_attention",
      "dropout": 0.1,
      "num_heads": 6
    },
    "beam_search": {
      "beam_size": 1,
      "final_sequence_scorer": {
        "type": "length-normalized-sequence-log-prob",
        "length_penalty": 1
      },
      "max_steps": 96
    },
    "dropout": 0.1,
    "sequence_based_metrics": [
      {
        "average": "micro",
        "labels": ["OSP"],
        "remove_duplicate_ents": true,
        "type": "f1_seq2rel"
      }
    ],
    "source_embedder": {
      "token_embedders": {
        "tokens": {
          "type": "pretrained_transformer",
          "model_name": "microsoft/BiomedNLP-PubMedBERT-base-uncased-abstract-fulltext",
          "reinit_modules": 2,
          "tokenizer_kwargs": {
            "additional_special_tokens": ["@ARG@", "@TRIGGER@"],
            "do_lower_case": true
          }
        }
      }
    },
    "target_embedding_dim": 256,
    "target_tokenizer": {
      "type": "pretrained_transformer",
      "add_special_tokens": false,
      "model_name": "microsoft/BiomedNLP-PubMedBERT-base-uncased-abstract-fulltext",
      "tokenizer_kwargs": {
        "additional_special_tokens": ["@ARG@", "@TRIGGER@", "@OSP@", "@start@", "@end@", ";"],
        "do_lower_case": true
      }
    },
    "weight_dropout": 0.5
  },
  "train_data_path": "../granular/train_transform.tsv",
  "validation_data_path": "../granular/dev_transform.tsv",
  "trainer": {
    "callbacks": [
      {
        "type": "should_validate_callback",
        "validation_interval": 1,
        "validation_start": 15
      }
    ],
    "checkpointer": {
      "keep_most_recent_by_count": 1
    },
    "grad_norm": 1,
    "learning_rate_scheduler": {
      "type": "linear_with_warmup",
      "warmup_steps": 2906
    },
    "num_epochs": 25,
    "num_gradient_accumulation_steps": 1,
    "optimizer": {
      "type": "huggingface_adamw",
      "correct_bias": true,
      "eps": 1e-08,
      "lr": 0.0004,
      "parameter_groups": [
        [
          ["transformer_model(?!.*(?:bias|LayerNorm|layer_norm))"],
          {
            "lr": 2e-05,
            "weight_decay": 0.01
          }
        ],
        [
          ["transformer_model(?=.*(?:bias|LayerNorm|layer_norm))"],
          {
            "lr": 2e-05,
            "weight_decay": 0
          }
        ]
      ],
      "weight_decay": 0
    },
    "use_amp": true,
    "validation_metric": "+fscore"
  },
  "vocabulary": {
    "max_vocab_size": {
      "target_tokens": 1
    },
    "tokens_to_add": {
      "target_tokens": ["@ARG@", "@TRIGGER@", "@OSP@", "@start@", "@end@", ";"]
    }
  },
  "data_loader": {
    "batch_sampler": {
      "type": "bucket",
      "batch_size": 4,
      "sorting_keys": ["source_tokens"]
    }
  },
  "validation_data_loader": {
    "batch_sampler": {
      "type": "bucket",
      "batch_size": 128,
      "padding_noise": 0,
      "sorting_keys": ["source_tokens"]
    }
  }
}