{ "dataset_reader": { "type": "conllu", "features": [ "token", "char" ], "lemma_indexers": { "char": { "type": "characters_const_padding", "character_tokenizer": { "end_tokens": [ "__END__" ], "start_tokens": [ "__START__" ] }, "min_padding_length": 32, "namespace": "lemma_characters" } }, "targets": [ "deprel", "feats", "head", "lemma", "upostag", "xpostag" ], "token_indexers": { "char": { "type": "characters_const_padding", "character_tokenizer": { "end_tokens": [ "__END__" ], "start_tokens": [ "__START__" ] }, "min_padding_length": 32 }, "feats": { "type": "feats_indexer" }, "lemma": { "type": "characters_const_padding", "character_tokenizer": { "end_tokens": [ "__END__" ], "start_tokens": [ "__START__" ] }, "min_padding_length": 32 }, "token": { "type": "pretrained_transformer_mismatched_fixed", "model_name": "transformer_models/electra-base-igc-is/", "tokenizer_kwargs": {} }, "upostag": { "type": "single_id", "feature_name": "pos_", "namespace": "upostag" }, "xpostag": { "type": "single_id", "feature_name": "tag_", "namespace": "xpostag" } }, "use_sem": false }, "model": { "type": "semantic_multitask", "dependency_relation": { "type": "combo_dependency_parsing_from_vocab", "dependency_projection_layer": { "activation": "tanh", "dropout_rate": 0.25, "in_features": 1024, "out_features": 128 }, "head_predictor": { "cycle_loss_n": 0, "dependency_projection_layer": { "activation": "tanh", "in_features": 1024, "out_features": 512 }, "head_projection_layer": { "activation": "tanh", "in_features": 1024, "out_features": 512 } }, "head_projection_layer": { "activation": "tanh", "dropout_rate": 0.25, "in_features": 1024, "out_features": 128 }, "vocab_namespace": "deprel_labels" }, "lemmatizer": { "type": "combo_lemma_predictor_from_vocab", "activations": [ "relu", "relu", "relu", "linear" ], "char_vocab_namespace": "token_characters", "dilation": [ 1, 2, 4, 1 ], "embedding_dim": 256, "filters": [ 256, 256, 256 ], "input_projection_layer": { "activation": "tanh", "dropout_rate": 0.25, "in_features": 1024, "out_features": 32 }, "kernel_size": [ 3, 3, 3, 1 ], "lemma_vocab_namespace": "lemma_characters", "padding": [ 1, 2, 4, 0 ], "stride": [ 1, 1, 1, 1 ] }, "loss_weights": { "deprel": 0.8, "feats": 0.2, "head": 0.2, "lemma": 0.05, "semrel": 0.05, "upostag": 0.05, "xpostag": 0.05 }, "morphological_feat": { "type": "combo_morpho_from_vocab", "activations": [ "tanh", "linear" ], "dropout": [ 0.25, 0 ], "hidden_dims": [ 128 ], "input_dim": 1024, "num_layers": 2, "vocab_namespace": "feats_labels" }, "regularizer": { "regexes": [ [ ".*conv1d.*", { "alpha": 1e-06, "type": "l2" } ], [ ".*forward.*", { "alpha": 1e-06, "type": "l2" } ], [ ".*backward.*", { "alpha": 1e-06, "type": "l2" } ], [ ".*char_embed.*", { "alpha": 1e-05, "type": "l2" } ] ] }, "seq_encoder": { "type": "combo_encoder", "layer_dropout_probability": 0.33, "stacked_bilstm": { "hidden_size": 512, "input_size": 164, "layer_dropout_probability": 0.33, "num_layers": 2, "recurrent_dropout_probability": 0.33 } }, "text_field_embedder": { "type": "basic", "token_embedders": { "char": { "type": "char_embeddings_from_config", "dilated_cnn_encoder": { "activations": [ "relu", "relu", "linear" ], "dilation": [ 1, 2, 4 ], "filters": [ 512, 256, 64 ], "input_dim": 64, "kernel_size": [ 3, 3, 3 ], "padding": [ 1, 2, 4 ], "stride": [ 1, 1, 1 ] }, "embedding_dim": 64 }, "token": { "type": "transformers_word_embeddings", "model_name": "transformer_models/electra-base-igc-is/", "projection_dim": 100 } } }, "upos_tagger": { "activations": [ "tanh", "linear" ], "dropout": [ 0.25, 0 ], "hidden_dims": [ 64 ], "input_dim": 1024, "num_layers": 2, "vocab_namespace": "upostag_labels" }, "xpos_tagger": { "activations": [ "tanh", "linear" ], "dropout": [ 0.25, 0 ], "hidden_dims": [ 128 ], "input_dim": 1024, "num_layers": 2, "vocab_namespace": "xpostag_labels" } }, "train_data_path": "is_combined-ud-train.conllu", "validation_data_path": "is_combined-ud-dev.conllu", "trainer": { "type": "gradient_descent_validate_n", "checkpointer": { "type": "finishing_only_checkpointer" }, "cuda_device": 0, "epoch_callbacks": [ { "type": "transfer_patience" } ], "grad_clipping": 5, "learning_rate_scheduler": { "type": "combo_scheduler" }, "num_epochs": 400, "optimizer": { "type": "adam", "betas": [ 0.9, 0.9 ], "lr": 0.002 }, "patience": 1, "validation_metric": "+EM" }, "vocabulary": { "type": "from_instances_extended", "non_padded_namespaces": [ "head_labels" ], "only_include_pretrained_words": true, "oov_token": "_", "padding_token": "__PAD__" }, "type": "default", "data_loader": { "batch_sampler": { "type": "token_count", "word_batch_size": 2500 } }, "datasets_for_vocab_creation": [ "train" ], "numpy_seed": 8787, "pytorch_seed": 8787, "random_seed": 8787 }