dirkgr committed on
Commit
49a6ee1
1 Parent(s): bf86aa1

Update repository

Browse files
.gitattributes CHANGED
@@ -25,3 +25,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
25
  *.zip filter=lfs diff=lfs merge=lfs -text
26
  *.zstandard filter=lfs diff=lfs merge=lfs -text
27
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
25
  *.zip filter=lfs diff=lfs merge=lfs -text
26
  *.zstandard filter=lfs diff=lfs merge=lfs -text
27
  *tfevents* filter=lfs diff=lfs merge=lfs -text
28
+ *.th filter=lfs diff=lfs merge=lfs -text
README.md ADDED
@@ -0,0 +1,6 @@
 
 
 
 
 
 
 
1
+ ---
2
+ tags:
3
+ - allennlp
4
+ ---
5
+
6
+ # TODO: Fill this model card
config.json ADDED
@@ -0,0 +1,120 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "dataset_reader": {
3
+ "type": "squad",
4
+ "token_indexers": {
5
+ "elmo": {
6
+ "type": "elmo_characters"
7
+ },
8
+ "token_characters": {
9
+ "type": "characters",
10
+ "character_tokenizer": {
11
+ "byte_encoding": "utf-8",
12
+ "end_tokens": [
13
+ 260
14
+ ],
15
+ "start_tokens": [
16
+ 259
17
+ ]
18
+ },
19
+ "min_padding_length": 5
20
+ },
21
+ "tokens": {
22
+ "type": "single_id",
23
+ "lowercase_tokens": true
24
+ }
25
+ }
26
+ },
27
+ "model": {
28
+ "type": "bidaf",
29
+ "dropout": 0.2,
30
+ "matrix_attention": {
31
+ "type": "linear",
32
+ "combination": "x,y,x*y",
33
+ "tensor_1_dim": 200,
34
+ "tensor_2_dim": 200
35
+ },
36
+ "modeling_layer": {
37
+ "type": "lstm",
38
+ "bidirectional": true,
39
+ "dropout": 0.2,
40
+ "hidden_size": 100,
41
+ "input_size": 800,
42
+ "num_layers": 2
43
+ },
44
+ "num_highway_layers": 2,
45
+ "phrase_layer": {
46
+ "type": "lstm",
47
+ "bidirectional": true,
48
+ "hidden_size": 100,
49
+ "input_size": 1224,
50
+ "num_layers": 1
51
+ },
52
+ "span_end_encoder": {
53
+ "type": "lstm",
54
+ "bidirectional": true,
55
+ "hidden_size": 100,
56
+ "input_size": 1400,
57
+ "num_layers": 1
58
+ },
59
+ "text_field_embedder": {
60
+ "token_embedders": {
61
+ "elmo": {
62
+ "type": "elmo_token_embedder",
63
+ "do_layer_norm": false,
64
+ "dropout": 0,
65
+ "options_file": "https://allennlp.s3.amazonaws.com/models/elmo/2x4096_512_2048cnn_2xhighway/elmo_2x4096_512_2048cnn_2xhighway_options.json",
66
+ "weight_file": "https://allennlp.s3.amazonaws.com/models/elmo/2x4096_512_2048cnn_2xhighway/elmo_2x4096_512_2048cnn_2xhighway_weights.hdf5"
67
+ },
68
+ "token_characters": {
69
+ "type": "character_encoding",
70
+ "dropout": 0.2,
71
+ "embedding": {
72
+ "embedding_dim": 16,
73
+ "num_embeddings": 262
74
+ },
75
+ "encoder": {
76
+ "type": "cnn",
77
+ "embedding_dim": 16,
78
+ "ngram_filter_sizes": [
79
+ 5
80
+ ],
81
+ "num_filters": 100
82
+ }
83
+ },
84
+ "tokens": {
85
+ "type": "embedding",
86
+ "embedding_dim": 100,
87
+ "pretrained_file": "https://allennlp.s3.amazonaws.com/datasets/glove/glove.6B.100d.txt.gz",
88
+ "trainable": false
89
+ }
90
+ }
91
+ }
92
+ },
93
+ "train_data_path": "https://allennlp.s3.amazonaws.com/datasets/squad/squad-train-v1.1.json",
94
+ "validation_data_path": "https://allennlp.s3.amazonaws.com/datasets/squad/squad-dev-v1.1.json",
95
+ "trainer": {
96
+ "grad_norm": 5,
97
+ "learning_rate_scheduler": {
98
+ "type": "reduce_on_plateau",
99
+ "factor": 0.5,
100
+ "mode": "max",
101
+ "patience": 2
102
+ },
103
+ "num_epochs": 20,
104
+ "optimizer": {
105
+ "type": "adam",
106
+ "betas": [
107
+ 0.9,
108
+ 0.9
109
+ ]
110
+ },
111
+ "patience": 10,
112
+ "validation_metric": "+em"
113
+ },
114
+ "data_loader": {
115
+ "batch_sampler": {
116
+ "type": "bucket",
117
+ "batch_size": 40
118
+ }
119
+ }
120
+ }
metrics.json ADDED
@@ -0,0 +1,27 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_epoch": 4,
3
+ "peak_worker_0_memory_MB": 39697.6484375,
4
+ "peak_gpu_0_memory_MB": 7284.326171875,
5
+ "training_duration": "4:33:51.728517",
6
+ "epoch": 14,
7
+ "training_start_acc": 0.9632758364821516,
8
+ "training_end_acc": 0.9648968595531913,
9
+ "training_span_acc": 0.9375221178323954,
10
+ "training_em": 0.9490519298165504,
11
+ "training_f1": 0.9746247710065422,
12
+ "training_loss": 0.21539007184950457,
13
+ "training_worker_0_memory_MB": 39697.6484375,
14
+ "training_gpu_0_memory_MB": 7283.4765625,
15
+ "validation_start_acc": 0.6205298013245033,
16
+ "validation_end_acc": 0.6693472090823084,
17
+ "validation_span_acc": 0.5271523178807948,
18
+ "validation_em": 0.6779564806054872,
19
+ "validation_f1": 0.786469085303725,
20
+ "validation_loss": 4.7776187914722374,
21
+ "best_validation_start_acc": 0.6631031220435194,
22
+ "best_validation_end_acc": 0.6990539262062441,
23
+ "best_validation_span_acc": 0.5754020813623463,
24
+ "best_validation_em": 0.7165562913907285,
25
+ "best_validation_f1": 0.8039716876069539,
26
+ "best_validation_loss": 2.22837360759951
27
+ }
model.th ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:24c6ab78b861d00865e4ea3973d9be71677c2f08a7ed72607b1dfd6a2a9d827c
3
+ size 450055351
vocabulary/.lock ADDED
File without changes
vocabulary/non_padded_namespaces.txt ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ *labels
2
+ *tags
vocabulary/tokens.txt ADDED
The diff for this file is too large to render. See raw diff