silviacamplani committed on
Commit
0ec0622
1 Parent(s): 00629f0

Training in progress epoch 0

Browse files
Files changed (3) hide show
  1. README.md +4 -6
  2. config.json +58 -58
  3. tf_model.h5 +1 -1
README.md CHANGED
@@ -14,9 +14,9 @@ probably proofread and complete it, then remove this comment. -->
14
 
15
  This model is a fine-tuned version of [distilbert-base-uncased](https://huggingface.co/distilbert-base-uncased) on an unknown dataset.
16
  It achieves the following results on the evaluation set:
17
- - Train Loss: 2.5466
18
- - Validation Loss: 2.5109
19
- - Epoch: 2
20
 
21
  ## Model description
22
 
@@ -42,9 +42,7 @@ The following hyperparameters were used during training:
42
 
43
  | Train Loss | Validation Loss | Epoch |
44
  |:----------:|:---------------:|:-----:|
45
- | 3.2920 | 3.0536 | 0 |
46
- | 2.8585 | 2.6748 | 1 |
47
- | 2.5466 | 2.5109 | 2 |
48
 
49
 
50
  ### Framework versions
 
14
 
15
  This model is a fine-tuned version of [distilbert-base-uncased](https://huggingface.co/distilbert-base-uncased) on an unknown dataset.
16
  It achieves the following results on the evaluation set:
17
+ - Train Loss: 3.1628
18
+ - Validation Loss: 2.9340
19
+ - Epoch: 0
20
 
21
  ## Model description
22
 
 
42
 
43
  | Train Loss | Validation Loss | Epoch |
44
  |:----------:|:---------------:|:-----:|
45
+ | 3.1628 | 2.9340 | 0 |
 
 
46
 
47
 
48
  ### Framework versions
config.json CHANGED
@@ -9,67 +9,67 @@
9
  "dropout": 0.1,
10
  "hidden_dim": 3072,
11
  "id2label": {
12
- "0": 0,
13
- "1": 19,
14
- "2": 20,
15
- "3": 7,
16
- "4": 8,
17
- "5": 25,
18
- "6": 26,
19
- "7": 23,
20
- "8": 24,
21
- "9": 27,
22
- "10": 21,
23
- "11": 1,
24
- "12": 2,
25
- "13": 13,
26
- "14": 14,
27
- "15": 28,
28
- "16": 11,
29
- "17": 15,
30
- "18": 16,
31
- "19": 12,
32
- "20": 3,
33
- "21": 4,
34
- "22": 5,
35
- "23": 22,
36
- "24": 9,
37
- "25": 17,
38
- "26": 18,
39
- "27": 6,
40
- "28": 10
41
  },
42
  "initializer_range": 0.02,
43
  "label2id": {
44
- "0": 0,
45
- "1": 11,
46
- "2": 12,
47
- "3": 20,
48
- "4": 21,
49
- "5": 22,
50
- "6": 27,
51
- "7": 3,
52
- "8": 4,
53
- "9": 24,
54
- "10": 28,
55
- "11": 16,
56
- "12": 19,
57
- "13": 13,
58
- "14": 14,
59
- "15": 17,
60
- "16": 18,
61
- "17": 25,
62
- "18": 26,
63
- "19": 1,
64
- "20": 2,
65
- "21": 10,
66
- "22": 23,
67
- "23": 7,
68
- "24": 8,
69
- "25": 5,
70
- "26": 6,
71
- "27": 9,
72
- "28": 15
73
  },
74
  "max_position_embeddings": 512,
75
  "model_type": "distilbert",
 
9
  "dropout": 0.1,
10
  "hidden_dim": 3072,
11
  "id2label": {
12
+ "0": "O",
13
+ "1": "B-algorithm",
14
+ "2": "I-algorithm",
15
+ "3": "B-conference",
16
+ "4": "I-conference",
17
+ "5": "B-country",
18
+ "6": "I-country",
19
+ "7": "B-field",
20
+ "8": "I-field",
21
+ "9": "B-location",
22
+ "10": "I-location",
23
+ "11": "B-metrics",
24
+ "12": "I-metrics",
25
+ "13": "B-misc",
26
+ "14": "I-misc",
27
+ "15": "B-organisation",
28
+ "16": "I-organisation",
29
+ "17": "B-person",
30
+ "18": "I-person",
31
+ "19": "B-product",
32
+ "20": "I-product",
33
+ "21": "B-programlang",
34
+ "22": "I-programlang",
35
+ "23": "B-researcher",
36
+ "24": "I-researcher",
37
+ "25": "B-task",
38
+ "26": "I-task",
39
+ "27": "B-university",
40
+ "28": "I-university"
41
  },
42
  "initializer_range": 0.02,
43
  "label2id": {
44
+ "B-algorithm": 1,
45
+ "B-conference": 3,
46
+ "B-country": 5,
47
+ "B-field": 7,
48
+ "B-location": 9,
49
+ "B-metrics": 11,
50
+ "B-misc": 13,
51
+ "B-organisation": 15,
52
+ "B-person": 17,
53
+ "B-product": 19,
54
+ "B-programlang": 21,
55
+ "B-researcher": 23,
56
+ "B-task": 25,
57
+ "B-university": 27,
58
+ "I-algorithm": 2,
59
+ "I-conference": 4,
60
+ "I-country": 6,
61
+ "I-field": 8,
62
+ "I-location": 10,
63
+ "I-metrics": 12,
64
+ "I-misc": 14,
65
+ "I-organisation": 16,
66
+ "I-person": 18,
67
+ "I-product": 20,
68
+ "I-programlang": 22,
69
+ "I-researcher": 24,
70
+ "I-task": 26,
71
+ "I-university": 28,
72
+ "O": 0
73
  },
74
  "max_position_embeddings": 512,
75
  "model_type": "distilbert",
tf_model.h5 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:12e9ab80e9ae58775098043b004549492022429f3d33146fcb6ced6159423ed0
3
  size 265666912
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a16b0eac3d3c5f4ef0c67633f7f91a2f6a4c26b6490cdb5b562c7d8bb6c817e6
3
  size 265666912