Update repository
- .gitattributes +1 -0
- README.md +6 -0
- config.json +110 -0
- metrics.json +27 -0
- model.th +3 -0
- vocabulary/.lock +0 -0
- vocabulary/non_padded_namespaces.txt +2 -0
- vocabulary/tokens.txt +0 -0
.gitattributes
CHANGED
@@ -25,3 +25,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
 *.zip filter=lfs diff=lfs merge=lfs -text
 *.zstandard filter=lfs diff=lfs merge=lfs -text
 *tfevents* filter=lfs diff=lfs merge=lfs -text
+*.th filter=lfs diff=lfs merge=lfs -text
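This new pattern puts PyTorch `.th` checkpoint files under Git LFS, so `model.th` below is committed as a small pointer file rather than the full ~49 MB weights blob; locally, the equivalent command is `git lfs track "*.th"`, which appends exactly this line to `.gitattributes`.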
README.md
ADDED
@@ -0,0 +1,6 @@
+---
+tags:
+- allennlp
+---
+
+# TODO: Fill this model card
config.json
ADDED
@@ -0,0 +1,110 @@
+{
+    "dataset_reader": {
+        "type": "squad",
+        "token_indexers": {
+            "token_characters": {
+                "type": "characters",
+                "character_tokenizer": {
+                    "byte_encoding": "utf-8",
+                    "end_tokens": [
+                        260
+                    ],
+                    "start_tokens": [
+                        259
+                    ]
+                },
+                "min_padding_length": 5
+            },
+            "tokens": {
+                "type": "single_id",
+                "lowercase_tokens": true
+            }
+        }
+    },
+    "model": {
+        "type": "bidaf",
+        "dropout": 0.2,
+        "matrix_attention": {
+            "type": "linear",
+            "combination": "x,y,x*y",
+            "tensor_1_dim": 200,
+            "tensor_2_dim": 200
+        },
+        "modeling_layer": {
+            "type": "lstm",
+            "bidirectional": true,
+            "dropout": 0.2,
+            "hidden_size": 100,
+            "input_size": 800,
+            "num_layers": 2
+        },
+        "num_highway_layers": 2,
+        "phrase_layer": {
+            "type": "lstm",
+            "bidirectional": true,
+            "hidden_size": 100,
+            "input_size": 200,
+            "num_layers": 1
+        },
+        "span_end_encoder": {
+            "type": "lstm",
+            "bidirectional": true,
+            "hidden_size": 100,
+            "input_size": 1400,
+            "num_layers": 1
+        },
+        "text_field_embedder": {
+            "token_embedders": {
+                "token_characters": {
+                    "type": "character_encoding",
+                    "dropout": 0.2,
+                    "embedding": {
+                        "embedding_dim": 16,
+                        "num_embeddings": 262
+                    },
+                    "encoder": {
+                        "type": "cnn",
+                        "embedding_dim": 16,
+                        "ngram_filter_sizes": [
+                            5
+                        ],
+                        "num_filters": 100
+                    }
+                },
+                "tokens": {
+                    "type": "embedding",
+                    "embedding_dim": 100,
+                    "pretrained_file": "https://allennlp.s3.amazonaws.com/datasets/glove/glove.6B.100d.txt.gz",
+                    "trainable": false
+                }
+            }
+        }
+    },
+    "train_data_path": "https://allennlp.s3.amazonaws.com/datasets/squad/squad-train-v1.1.json",
+    "validation_data_path": "https://allennlp.s3.amazonaws.com/datasets/squad/squad-dev-v1.1.json",
+    "trainer": {
+        "grad_norm": 5,
+        "learning_rate_scheduler": {
+            "type": "reduce_on_plateau",
+            "factor": 0.5,
+            "mode": "max",
+            "patience": 2
+        },
+        "num_epochs": 20,
+        "optimizer": {
+            "type": "adam",
+            "betas": [
+                0.9,
+                0.9
+            ]
+        },
+        "patience": 10,
+        "validation_metric": "+em"
+    },
+    "data_loader": {
+        "batch_sampler": {
+            "type": "bucket",
+            "batch_size": 40
+        }
+    }
+}
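This is an AllenNLP BiDAF training config for SQuAD v1.1: 100-d frozen GloVe embeddings concatenated with a 100-filter character CNN give 200-dimensional token encodings, and the 800-dimensional modeling-layer input is the usual 4 × 200 concatenation produced by BiDAF's bidirectional attention. A config like this can be run as-is; below is a minimal sketch, assuming `allennlp` and `allennlp-models` are installed (the `squad` reader and `bidaf` model are registered by the latter) and using a hypothetical `output/` serialization directory.

```python
# Minimal training sketch for this config (assumes allennlp + allennlp-models).
import allennlp_models.rc  # noqa: F401  -- registers the "squad" reader and "bidaf" model

from allennlp.commands.train import train_model_from_file

# "output/" is a hypothetical directory; AllenNLP writes the weights,
# metrics.json, and the vocabulary/ folder into it, as in this repo.
train_model_from_file(
    parameter_filename="config.json",
    serialization_dir="output/",
)
```

The CLI equivalent is `allennlp train config.json -s output/`.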
metrics.json
ADDED
@@ -0,0 +1,27 @@
+{
+    "best_epoch": 6,
+    "peak_worker_0_memory_MB": 10198.55859375,
+    "peak_gpu_0_memory_MB": 2483.1318359375,
+    "training_duration": "1:05:21.359214",
+    "epoch": 16,
+    "training_start_acc": 0.8171212000136988,
+    "training_end_acc": 0.8648158083996392,
+    "training_span_acc": 0.7419034463863743,
+    "training_em": 0.7959451591913149,
+    "training_f1": 0.9018048409974154,
+    "training_loss": 0.9448039527761337,
+    "training_worker_0_memory_MB": 10198.55859375,
+    "training_gpu_0_memory_MB": 2474.52490234375,
+    "validation_start_acc": 0.6181646168401135,
+    "validation_end_acc": 0.6535477767265847,
+    "validation_span_acc": 0.5310312204351939,
+    "validation_em": 0.661116367076632,
+    "validation_f1": 0.7646617261058106,
+    "validation_loss": 3.421157140551873,
+    "best_validation_start_acc": 0.6307473982970672,
+    "best_validation_end_acc": 0.6674550614947966,
+    "best_validation_span_acc": 0.5439924314096499,
+    "best_validation_em": 0.6747398297067171,
+    "best_validation_f1": 0.7706741501743936,
+    "best_validation_loss": 2.50613601477641
+}
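Consistent with the trainer settings above (`patience: 10`, `validation_metric: "+em"`), training stopped at epoch 16 and kept the epoch-6 checkpoint as best, at validation EM ≈ 0.675 and F1 ≈ 0.771. A small convenience sketch for pulling out the headline numbers from this file:

```python
import json

# Read the training summary written by the AllenNLP trainer.
with open("metrics.json") as f:
    metrics = json.load(f)

# The checkpoint shipped in this repo corresponds to best_epoch.
print(f"best epoch:         {metrics['best_epoch']}")
print(f"best validation EM: {metrics['best_validation_em']:.4f}")
print(f"best validation F1: {metrics['best_validation_f1']:.4f}")
```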
model.th
ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:c6b1ef8c68f1840c7a458358782ce8e4359552e8cb358c6856a3dffd8c5b9ff2
+size 49008050
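Because of the `.gitattributes` rule above, Git stores only this LFS pointer for `model.th`; the ~49 MB weights file itself is fetched on checkout (or with `git lfs pull`). Once fetched, the weights can be loaded back into the configured model. A minimal sketch, assuming the repo root as working directory and `allennlp-models` installed:

```python
import allennlp_models.rc  # noqa: F401  -- registers "squad" and "bidaf"

from allennlp.common.params import Params
from allennlp.models import Model

# Rebuild the model from config.json and load the LFS-fetched weights;
# the vocabulary/ directory is resolved relative to serialization_dir.
model = Model.load(
    Params.from_file("config.json"),
    serialization_dir=".",
    weights_file="model.th",
    cuda_device=-1,  # CPU; set to a GPU index if one is available
)
model.eval()
```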
vocabulary/.lock
ADDED
File without changes
vocabulary/non_padded_namespaces.txt
ADDED
@@ -0,0 +1,2 @@
+*labels
+*tags
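These wildcard entries mark any vocabulary namespace ending in `labels` or `tags` as non-padded, i.e. exempt from AllenNLP's padding and OOV tokens. The serialized vocabulary directory can be reloaded directly; a minimal sketch, again assuming the repo root as working directory:

```python
from allennlp.data import Vocabulary

# Load the vocabulary exactly as it was serialized during training.
vocab = Vocabulary.from_files("vocabulary")
print(vocab.get_vocab_size("tokens"))  # size of the word-level namespace
```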
vocabulary/tokens.txt
ADDED
The diff for this file is too large to render.