LysandreJik committed on
Commit
084226a
1 Parent(s): 462ff97
.gitattributes CHANGED
@@ -14,3 +14,4 @@
14
  *.pb filter=lfs diff=lfs merge=lfs -text
15
  *.pt filter=lfs diff=lfs merge=lfs -text
16
  *.pth filter=lfs diff=lfs merge=lfs -text
 
14
  *.pb filter=lfs diff=lfs merge=lfs -text
15
  *.pt filter=lfs diff=lfs merge=lfs -text
16
  *.pth filter=lfs diff=lfs merge=lfs -text
17
+ weights.th filter=lfs diff=lfs merge=lfs -text
config.json ADDED
@@ -0,0 +1,64 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "dataset_reader": {
3
+ "type": "snli",
4
+ "token_indexers": {
5
+ "tokens": {
6
+ "type": "pretrained_transformer",
7
+ "max_length": 512,
8
+ "model_name": "roberta-large"
9
+ }
10
+ },
11
+ "tokenizer": {
12
+ "type": "pretrained_transformer",
13
+ "add_special_tokens": false,
14
+ "model_name": "roberta-large"
15
+ }
16
+ },
17
+ "model": {
18
+ "type": "basic_classifier",
19
+ "dropout": 0.1,
20
+ "feedforward": {
21
+ "activations": "tanh",
22
+ "hidden_dims": 1024,
23
+ "input_dim": 1024,
24
+ "num_layers": 1
25
+ },
26
+ "namespace": "tags",
27
+ "seq2vec_encoder": {
28
+ "type": "cls_pooler",
29
+ "embedding_dim": 1024
30
+ },
31
+ "text_field_embedder": {
32
+ "token_embedders": {
33
+ "tokens": {
34
+ "type": "pretrained_transformer",
35
+ "max_length": 512,
36
+ "model_name": "roberta-large"
37
+ }
38
+ }
39
+ }
40
+ },
41
+ "train_data_path": "https://allennlp.s3.amazonaws.com/datasets/multinli/multinli_1.0_train.jsonl",
42
+ "validation_data_path": "https://allennlp.s3.amazonaws.com/datasets/multinli/multinli_1.0_dev_matched.jsonl",
43
+ "test_data_path": "https://allennlp.s3.amazonaws.com/datasets/multinli/multinli_1.0_dev_mismatched.jsonl",
44
+ "trainer": {
45
+ "cuda_device": 0,
46
+ "learning_rate_scheduler": {
47
+ "type": "slanted_triangular",
48
+ "cut_frac": 0.06
49
+ },
50
+ "num_epochs": 3,
51
+ "optimizer": {
52
+ "type": "huggingface_adamw",
53
+ "lr": 2e-06,
54
+ "weight_decay": 0.1
55
+ },
56
+ "validation_metric": "+accuracy"
57
+ },
58
+ "data_loader": {
59
+ "batch_sampler": {
60
+ "type": "bucket",
61
+ "batch_size": 16
62
+ }
63
+ }
64
+ }
vocabulary/.lock ADDED
File without changes
vocabulary/labels.txt ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ entailment
2
+ contradiction
3
+ neutral
vocabulary/non_padded_namespaces.txt ADDED
@@ -0,0 +1,2 @@
 
 
1
+ *labels
2
+ *tags
archive.tar.gz → weights.th RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:794be8d5bd4fef827682773fe10905616ee40a748c9b1e6ac6be075fd78a4002
3
- size 1317831133
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d79919ceddea78f6c1531c3f811f9a7f242081b1cce331b2f0f00412e7ec4131
3
+ size 1425795576