justin871030 committed on
Commit
31da19d
•
1 Parent(s): 1d62521

Uploaded the first version of the fine-tuned model

Browse files
.gitattributes CHANGED
@@ -25,3 +25,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
25
  *.zip filter=lfs diff=lfs merge=lfs -text
26
  *.zstandard filter=lfs diff=lfs merge=lfs -text
27
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
25
  *.zip filter=lfs diff=lfs merge=lfs -text
26
  *.zstandard filter=lfs diff=lfs merge=lfs -text
27
  *tfevents* filter=lfs diff=lfs merge=lfs -text
28
+ pytorch_model.bin filter=lfs diff=lfs merge=lfs -text
README.md ADDED
@@ -0,0 +1,20 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ language: en
3
+ tags:
4
+ - go-emotion
5
+ - text-classification
6
+ - pytorch
7
+ datasets:
8
+ - go_emotions
9
+ metrics:
10
+ - f1
11
+ widget:
12
+ - text: "Thanks for giving advice to the people who need it! 👌🙏"
13
+ license: mit
14
+ ---
15
+
16
+ ## Model Description
17
+ 1. Based on the uncased BERT pretrained model with a linear output layer.
18
+ 2. Added several commonly-used emoji and tokens to the special token list of the tokenizer.
19
+ 3. Applied label smoothing during training.
20
+ 4. Used weighted loss and focal loss to help with the cases that the model learned poorly.
config.json ADDED
@@ -0,0 +1,86 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "bert-base-uncased",
3
+ "architectures": [
4
+ "BertForMultiLabelClassification"
5
+ ],
6
+ "attention_probs_dropout_prob": 0.1,
7
+ "classifier_dropout": null,
8
+ "finetuning_task": "goemotions",
9
+ "gradient_checkpointing": false,
10
+ "hidden_act": "gelu",
11
+ "hidden_dropout_prob": 0.1,
12
+ "hidden_size": 768,
13
+ "id2label": {
14
+ "0": "admiration",
15
+ "1": "amusement",
16
+ "10": "disapproval",
17
+ "11": "disgust",
18
+ "12": "embarrassment",
19
+ "13": "excitement",
20
+ "14": "fear",
21
+ "15": "gratitude",
22
+ "16": "grief",
23
+ "17": "joy",
24
+ "18": "love",
25
+ "19": "nervousness",
26
+ "2": "anger",
27
+ "20": "optimism",
28
+ "21": "pride",
29
+ "22": "realization",
30
+ "23": "relief",
31
+ "24": "remorse",
32
+ "25": "sadness",
33
+ "26": "surprise",
34
+ "27": "neutral",
35
+ "3": "annoyance",
36
+ "4": "approval",
37
+ "5": "caring",
38
+ "6": "confusion",
39
+ "7": "curiosity",
40
+ "8": "desire",
41
+ "9": "disappointment"
42
+ },
43
+ "initializer_range": 0.02,
44
+ "intermediate_size": 3072,
45
+ "label2id": {
46
+ "admiration": 0,
47
+ "amusement": 1,
48
+ "anger": 2,
49
+ "annoyance": 3,
50
+ "approval": 4,
51
+ "caring": 5,
52
+ "confusion": 6,
53
+ "curiosity": 7,
54
+ "desire": 8,
55
+ "disappointment": 9,
56
+ "disapproval": 10,
57
+ "disgust": 11,
58
+ "embarrassment": 12,
59
+ "excitement": 13,
60
+ "fear": 14,
61
+ "gratitude": 15,
62
+ "grief": 16,
63
+ "joy": 17,
64
+ "love": 18,
65
+ "nervousness": 19,
66
+ "neutral": 27,
67
+ "optimism": 20,
68
+ "pride": 21,
69
+ "realization": 22,
70
+ "relief": 23,
71
+ "remorse": 24,
72
+ "sadness": 25,
73
+ "surprise": 26
74
+ },
75
+ "layer_norm_eps": 1e-12,
76
+ "max_position_embeddings": 512,
77
+ "model_type": "bert",
78
+ "num_attention_heads": 12,
79
+ "num_hidden_layers": 12,
80
+ "pad_token_id": 0,
81
+ "position_embedding_type": "absolute",
82
+ "torch_dtype": "float32",
83
+ "transformers_version": "4.13.0",
84
+ "type_vocab_size": 2,
85
+ "vocab_size": 30522
86
+ }
pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4e30f069158667a5a8a0b532821065926c9a0bff4cb43d842935f68870caf113
3
+ size 438109155
special_tokens_map.json ADDED
@@ -0,0 +1 @@
 
1
+ {"unk_token": "[UNK]", "sep_token": "[SEP]", "pad_token": "[PAD]", "cls_token": "[CLS]", "mask_token": "[MASK]", "additional_special_tokens": ["[NAME]", "[RELIGION]", "๐Ÿ˜‚", "โค", "๐Ÿคฃ", "๐Ÿ˜ญ", "๐Ÿ‘", "โ™€", "๐Ÿ˜", "๐Ÿค”", "๐Ÿฆ€", "๐Ÿ‘", "๐Ÿป", "๐Ÿคท", "๐Ÿผ", "๐Ÿ™„", "๐Ÿ˜Š", "๐Ÿ”ฅ", "๐Ÿ˜ข", "๐Ÿ˜…", "๐Ÿ’œ", "๐Ÿ‘Œ", "โ™‚", "โ˜บ", "๐Ÿ˜Ž", "๐Ÿ’ฏ", "๐Ÿ’ฆ", "๐Ÿ˜", "๐Ÿ˜”", "๐Ÿคข", "๐Ÿ’•", "๐Ÿ™", "๐Ÿ˜‰", "๐Ÿ™Œ", "๐Ÿคฆ", "๐Ÿ™ƒ", "๐Ÿ˜†", "๐Ÿ˜˜", "๐ŸŽถ", "๐Ÿ˜ค", "๐Ÿ˜", "๐Ÿ˜€", "๐Ÿค—", "๐Ÿ˜", "๐Ÿฝ", "๐Ÿ’ช", "๐Ÿ˜ก", "๐ŸŽ‰", "๐Ÿ‘€", "โœ”", "๐Ÿ”ช", "๐Ÿ˜„", "๐Ÿ˜ฌ", "๐Ÿ’–", "๐Ÿ˜ฅ", "๐Ÿ˜’", "โœŒ", "๐Ÿ’ƒ", "๐Ÿ˜ฉ", "โ˜น", "๐Ÿ’…", "๐Ÿ˜ช", "๐Ÿ‘‘", "๐Ÿ˜ณ", "๐Ÿคช", "๐Ÿ˜•", "๐ŸŽ‚", "๐Ÿ˜ซ", "๐Ÿ’™", "๐Ÿคฎ", "๐Ÿšซ", "๐Ÿ˜ž", "๐Ÿ’Ž", "๐Ÿ˜ฑ", "๐Ÿ˜‘", "๐Ÿ˜–", "๐ŸŠ", "๐Ÿ™ˆ", "๐Ÿค ", "โฃ", "๐Ÿคฉ", "๐Ÿ™‚", "๐Ÿ‘Š", "๐Ÿ’›", "๐Ÿ’“", "๐Ÿ‘ฉ", "โœจ", "๐Ÿ˜ฃ", "๐Ÿ’—", "๐Ÿคž", "๐Ÿฅ€", "๐Ÿš“", "๐Ÿ˜ฐ", "๐Ÿ‘…", "๐Ÿ˜", "๐Ÿป", "๐Ÿค•", "๐Ÿ˜œ", "๐Ÿฆˆ", "๐Ÿ˜ƒ", "๐Ÿ˜ฎ", "โœŠ", "๐Ÿ’š", "๐ŸŽต", "๐Ÿ’จ", "โ˜", "๐ŸŒˆ", "๐Ÿ’„", "๐Ÿ‘ธ", "๐Ÿ’ฅ", "๐Ÿ–ค", "๐Ÿพ", "๐Ÿฉ", "๐Ÿ˜‹", "๐Ÿคฒ", "๐Ÿคค", "๐Ÿง›", "๐Ÿ˜‡", "โ„", "โ–ซ", "๐Ÿ’", "๐Ÿ˜ด", ":)", ":(", "XD", "xD", ":D", ":'("]}
tokenizer_config.json ADDED
@@ -0,0 +1 @@
 
1
+ {"do_lower_case": true, "model_max_length": 512, "unk_token": "[UNK]", "sep_token": "[SEP]", "pad_token": "[PAD]", "cls_token": "[CLS]", "mask_token": "[MASK]", "additional_special_tokens": ["[NAME]", "[RELIGION]", "๐Ÿ˜‚", "โค", "๐Ÿคฃ", "๐Ÿ˜ญ", "๐Ÿ‘", "โ™€", "๐Ÿ˜", "๐Ÿค”", "๐Ÿฆ€", "๐Ÿ‘", "๐Ÿป", "๐Ÿคท", "๐Ÿผ", "๐Ÿ™„", "๐Ÿ˜Š", "๐Ÿ”ฅ", "๐Ÿ˜ข", "๐Ÿ˜…", "๐Ÿ’œ", "๐Ÿ‘Œ", "โ™‚", "โ˜บ", "๐Ÿ˜Ž", "๐Ÿ’ฏ", "๐Ÿ’ฆ", "๐Ÿ˜", "๐Ÿ˜”", "๐Ÿคข", "๐Ÿ’•", "๐Ÿ™", "๐Ÿ˜‰", "๐Ÿ™Œ", "๐Ÿคฆ", "๐Ÿ™ƒ", "๐Ÿ˜†", "๐Ÿ˜˜", "๐ŸŽถ", "๐Ÿ˜ค", "๐Ÿ˜", "๐Ÿ˜€", "๐Ÿค—", "๐Ÿ˜", "๐Ÿฝ", "๐Ÿ’ช", "๐Ÿ˜ก", "๐ŸŽ‰", "๐Ÿ‘€", "โœ”", "๐Ÿ”ช", "๐Ÿ˜„", "๐Ÿ˜ฌ", "๐Ÿ’–", "๐Ÿ˜ฅ", "๐Ÿ˜’", "โœŒ", "๐Ÿ’ƒ", "๐Ÿ˜ฉ", "โ˜น", "๐Ÿ’…", "๐Ÿ˜ช", "๐Ÿ‘‘", "๐Ÿ˜ณ", "๐Ÿคช", "๐Ÿ˜•", "๐ŸŽ‚", "๐Ÿ˜ซ", "๐Ÿ’™", "๐Ÿคฎ", "๐Ÿšซ", "๐Ÿ˜ž", "๐Ÿ’Ž", "๐Ÿ˜ฑ", "๐Ÿ˜‘", "๐Ÿ˜–", "๐ŸŠ", "๐Ÿ™ˆ", "๐Ÿค ", "โฃ", "๐Ÿคฉ", "๐Ÿ™‚", "๐Ÿ‘Š", "๐Ÿ’›", "๐Ÿ’“", "๐Ÿ‘ฉ", "โœจ", "๐Ÿ˜ฃ", "๐Ÿ’—", "๐Ÿคž", "๐Ÿฅ€", "๐Ÿš“", "๐Ÿ˜ฐ", "๐Ÿ‘…", "๐Ÿ˜", "๐Ÿป", "๐Ÿค•", "๐Ÿ˜œ", "๐Ÿฆˆ", "๐Ÿ˜ƒ", "๐Ÿ˜ฎ", "โœŠ", "๐Ÿ’š", "๐ŸŽต", "๐Ÿ’จ", "โ˜", "๐ŸŒˆ", "๐Ÿ’„", "๐Ÿ‘ธ", "๐Ÿ’ฅ", "๐Ÿ–ค", "๐Ÿพ", "๐Ÿฉ", "๐Ÿ˜‹", "๐Ÿคฒ", "๐Ÿคค", "๐Ÿง›", "๐Ÿ˜‡", "โ„", "โ–ซ", "๐Ÿ’", "๐Ÿ˜ด", ":)", ":(", "XD", "xD", ":D", ":'("]}
training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f849f78dd0bc9d2061d3ab766fd4e60f0f64f1e0fc33eacf5828e43d59283048
3
+ size 1839
vocab.txt ADDED
The diff for this file is too large to render. See raw diff