Untar

Browse files

Files changed (4)

config.json +111 -0
vocabulary/non_padded_namespaces.txt +2 -0
vocabulary/tokens.txt +0 -0
weights.th +3 -0

config.json ADDED Viewed

	@@ -0,0 +1,111 @@

+{
+    "dataset_reader": {
+        "type": "squad",
+        "token_indexers": {
+            "token_characters": {
+                "type": "characters",
+                "character_tokenizer": {
+                    "byte_encoding": "utf-8",
+                    "end_tokens": [
+                        260
+                    ],
+                    "start_tokens": [
+                        259
+                    ]
+                },
+                "min_padding_length": 5
+            },
+            "tokens": {
+                "type": "single_id",
+                "lowercase_tokens": true
+            }
+        }
+    },
+    "model": {
+        "type": "bidaf",
+        "dropout": 0.2,
+        "matrix_attention": {
+            "type": "linear",
+            "combination": "x,y,x*y",
+            "tensor_1_dim": 200,
+            "tensor_2_dim": 200
+        },
+        "modeling_layer": {
+            "type": "lstm",
+            "bidirectional": true,
+            "dropout": 0.2,
+            "hidden_size": 100,
+            "input_size": 800,
+            "num_layers": 2
+        },
+        "num_highway_layers": 2,
+        "phrase_layer": {
+            "type": "lstm",
+            "bidirectional": true,
+            "hidden_size": 100,
+            "input_size": 200,
+            "num_layers": 1
+        },
+        "span_end_encoder": {
+            "type": "lstm",
+            "bidirectional": true,
+            "hidden_size": 100,
+            "input_size": 1400,
+            "num_layers": 1
+        },
+        "text_field_embedder": {
+            "token_embedders": {
+                "token_characters": {
+                    "type": "character_encoding",
+                    "dropout": 0.2,
+                    "embedding": {
+                        "embedding_dim": 16,
+                        "num_embeddings": 262
+                    },
+                    "encoder": {
+                        "type": "cnn",
+                        "embedding_dim": 16,
+                        "ngram_filter_sizes": [
+                            5
+                        ],
+                        "num_filters": 100
+                    }
+                },
+                "tokens": {
+                    "type": "embedding",
+                    "embedding_dim": 100,
+                    "pretrained_file": "https://allennlp.s3.amazonaws.com/datasets/glove/glove.6B.100d.txt.gz",
+                    "trainable": false
+                }
+            }
+        }
+    },
+    "train_data_path": "https://allennlp.s3.amazonaws.com/datasets/squad/squad-train-v1.1.json",
+    "validation_data_path": "https://allennlp.s3.amazonaws.com/datasets/squad/squad-dev-v1.1.json",
+    "trainer": {
+        "cuda_device": 0,
+        "grad_norm": 5,
+        "learning_rate_scheduler": {
+            "type": "reduce_on_plateau",
+            "factor": 0.5,
+            "mode": "max",
+            "patience": 2
+        },
+        "num_epochs": 20,
+        "optimizer": {
+            "type": "adam",
+            "betas": [
+                0.9,
+                0.9
+            ]
+        },
+        "patience": 10,
+        "validation_metric": "+em"
+    },
+    "data_loader": {
+        "batch_sampler": {
+            "type": "bucket",
+            "batch_size": 40
+        }
+    }
+}

vocabulary/non_padded_namespaces.txt ADDED Viewed

	@@ -0,0 +1,2 @@


+*labels
+*tags

vocabulary/tokens.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

weights.th ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:cd30ae4bacc172504f44f2b21d1fa50cf71855818316a40028025d36058bc7c7
+size 49249265