WillHeld committed on
Commit
2ba8dc9
1 Parent(s): b7dbb5e

Training in progress, step 200

Browse files
.gitattributes CHANGED
@@ -32,3 +32,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
32
  *.zip filter=lfs diff=lfs merge=lfs -text
33
  *.zst filter=lfs diff=lfs merge=lfs -text
34
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
32
  *.zip filter=lfs diff=lfs merge=lfs -text
33
  *.zst filter=lfs diff=lfs merge=lfs -text
34
  *tfevents* filter=lfs diff=lfs merge=lfs -text
35
+ tokenizer.json filter=lfs diff=lfs merge=lfs -text
.gitignore ADDED
@@ -0,0 +1 @@
 
1
+ checkpoint-*/
added_tokens.json ADDED
@@ -0,0 +1,239 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "<pt-0>": 250173,
3
+ "<pt-10>": 250159,
4
+ "<pt-11>": 250186,
5
+ "<pt-12>": 250240,
6
+ "<pt-13>": 250131,
7
+ "<pt-14>": 250226,
8
+ "<pt-15>": 250145,
9
+ "<pt-16>": 250140,
10
+ "<pt-17>": 250133,
11
+ "<pt-18>": 250265,
12
+ "<pt-19>": 250239,
13
+ "<pt-1>": 250246,
14
+ "<pt-20>": 250146,
15
+ "<pt-21>": 250103,
16
+ "<pt-22>": 250280,
17
+ "<pt-23>": 250230,
18
+ "<pt-24>": 250305,
19
+ "<pt-25>": 250291,
20
+ "<pt-26>": 250286,
21
+ "<pt-27>": 250288,
22
+ "<pt-28>": 250302,
23
+ "<pt-29>": 250303,
24
+ "<pt-2>": 250181,
25
+ "<pt-30>": 250306,
26
+ "<pt-31>": 250301,
27
+ "<pt-32>": 250331,
28
+ "<pt-33>": 250328,
29
+ "<pt-34>": 250327,
30
+ "<pt-35>": 250330,
31
+ "<pt-36>": 250329,
32
+ "<pt-37>": 250326,
33
+ "<pt-38>": 250335,
34
+ "<pt-3>": 250199,
35
+ "<pt-40>": 250334,
36
+ "<pt-41>": 250333,
37
+ "<pt-42>": 250332,
38
+ "<pt-4>": 250148,
39
+ "<pt-5>": 250245,
40
+ "<pt-6>": 250134,
41
+ "<pt-7>": 250224,
42
+ "<pt-8>": 250234,
43
+ "<pt-9>": 250189,
44
+ "[IN:ADD_TIME_TIMER": 250101,
45
+ "[IN:ADD_TO_PLAYLIST_MUSIC": 250194,
46
+ "[IN:ANSWER_CALL": 250100,
47
+ "[IN:CANCEL_CALL": 250322,
48
+ "[IN:CANCEL_MESSAGE": 250274,
49
+ "[IN:CREATE_ALARM": 250150,
50
+ "[IN:CREATE_CALL": 250183,
51
+ "[IN:CREATE_PLAYLIST_MUSIC": 250244,
52
+ "[IN:CREATE_REMINDER": 250170,
53
+ "[IN:CREATE_TIMER": 250208,
54
+ "[IN:DELETE_ALARM": 250122,
55
+ "[IN:DELETE_PLAYLIST_MUSIC": 250287,
56
+ "[IN:DELETE_REMINDER": 250253,
57
+ "[IN:DELETE_TIMER": 250175,
58
+ "[IN:DISLIKE_MUSIC": 250295,
59
+ "[IN:DISPREFER": 250309,
60
+ "[IN:END_CALL": 250220,
61
+ "[IN:FAST_FORWARD_MUSIC": 250294,
62
+ "[IN:FOLLOW_MUSIC": 250321,
63
+ "[IN:GET_AGE": 250129,
64
+ "[IN:GET_AIRQUALITY": 250315,
65
+ "[IN:GET_ALARM": 250229,
66
+ "[IN:GET_ATTENDEE_EVENT": 250109,
67
+ "[IN:GET_AVAILABILITY": 250147,
68
+ "[IN:GET_BIRTHDAY": 250318,
69
+ "[IN:GET_CALL": 250248,
70
+ "[IN:GET_CALL_CONTACT": 250191,
71
+ "[IN:GET_CALL_TIME": 250118,
72
+ "[IN:GET_CATEGORY_EVENT": 250205,
73
+ "[IN:GET_CONTACT": 250123,
74
+ "[IN:GET_CONTACT_METHOD": 250277,
75
+ "[IN:GET_DATE_TIME_EVENT": 250285,
76
+ "[IN:GET_DETAILS_NEWS": 250283,
77
+ "[IN:GET_EDUCATION_DEGREE": 250275,
78
+ "[IN:GET_EDUCATION_TIME": 250254,
79
+ "[IN:GET_EMPLOYER": 250169,
80
+ "[IN:GET_EMPLOYMENT_TIME": 250228,
81
+ "[IN:GET_EVENT": 250252,
82
+ "[IN:GET_EVENT_ATTENDEE": 250319,
83
+ "[IN:GET_GENDER": 250323,
84
+ "[IN:GET_GROUP": 250325,
85
+ "[IN:GET_INFO_CONTACT": 250260,
86
+ "[IN:GET_INFO_RECIPES": 250231,
87
+ "[IN:GET_JOB": 250177,
88
+ "[IN:GET_LANGUAGE": 250316,
89
+ "[IN:GET_LIFE_EVENT": 250160,
90
+ "[IN:GET_LIFE_EVENT_TIME": 250299,
91
+ "[IN:GET_LOCATION": 250125,
92
+ "[IN:GET_LYRICS_MUSIC": 250314,
93
+ "[IN:GET_MAJOR": 250276,
94
+ "[IN:GET_MESSAGE": 250223,
95
+ "[IN:GET_MESSAGE_CONTACT": 250120,
96
+ "[IN:GET_MUTUAL_FRIENDS": 250126,
97
+ "[IN:GET_RECIPES": 250157,
98
+ "[IN:GET_REMINDER": 250237,
99
+ "[IN:GET_REMINDER_AMOUNT": 250174,
100
+ "[IN:GET_REMINDER_DATE_TIME": 250241,
101
+ "[IN:GET_REMINDER_LOCATION": 250137,
102
+ "[IN:GET_STORIES_NEWS": 250162,
103
+ "[IN:GET_SUNRISE": 250149,
104
+ "[IN:GET_SUNSET": 250243,
105
+ "[IN:GET_TIMER": 250151,
106
+ "[IN:GET_TODO": 250112,
107
+ "[IN:GET_TRACK_INFO_MUSIC": 250221,
108
+ "[IN:GET_UNDERGRAD": 250179,
109
+ "[IN:GET_WEATHER": 250203,
110
+ "[IN:HELP_REMINDER": 250311,
111
+ "[IN:HOLD_CALL": 250172,
112
+ "[IN:IGNORE_CALL": 250113,
113
+ "[IN:IS_TRUE_RECIPES": 250222,
114
+ "[IN:LIKE_MUSIC": 250255,
115
+ "[IN:LOOP_MUSIC": 250102,
116
+ "[IN:MERGE_CALL": 250165,
117
+ "[IN:PAUSE_MUSIC": 250242,
118
+ "[IN:PAUSE_TIMER": 250166,
119
+ "[IN:PLAY_MEDIA": 250213,
120
+ "[IN:PLAY_MUSIC": 250211,
121
+ "[IN:PREFER": 250141,
122
+ "[IN:PREVIOUS_TRACK_MUSIC": 250238,
123
+ "[IN:QUESTION_MUSIC": 250195,
124
+ "[IN:QUESTION_NEWS": 250204,
125
+ "[IN:REMOVE_FROM_PLAYLIST_MUSIC": 250154,
126
+ "[IN:REPEAT_ALL_MUSIC": 250296,
127
+ "[IN:REPEAT_ALL_OFF_MUSIC": 250307,
128
+ "[IN:REPLAY_MUSIC": 250251,
129
+ "[IN:REPLY_MESSAGE": 250310,
130
+ "[IN:RESTART_TIMER": 250192,
131
+ "[IN:RESUME_CALL": 250270,
132
+ "[IN:RESUME_MUSIC": 250290,
133
+ "[IN:RESUME_TIMER": 250259,
134
+ "[IN:REWIND_MUSIC": 250289,
135
+ "[IN:SEND_MESSAGE": 250143,
136
+ "[IN:SET_AVAILABLE": 250198,
137
+ "[IN:SET_DEFAULT_PROVIDER_CALLING": 250281,
138
+ "[IN:SET_DEFAULT_PROVIDER_MUSIC": 250136,
139
+ "[IN:SET_RSVP_INTERESTED": 250144,
140
+ "[IN:SET_RSVP_NO": 250282,
141
+ "[IN:SET_RSVP_YES": 250124,
142
+ "[IN:SET_UNAVAILABLE": 250256,
143
+ "[IN:SHARE_EVENT": 250266,
144
+ "[IN:SILENCE_ALARM": 250180,
145
+ "[IN:SKIP_TRACK_MUSIC": 250264,
146
+ "[IN:SNOOZE_ALARM": 250115,
147
+ "[IN:START_SHUFFLE_MUSIC": 250164,
148
+ "[IN:STOP_MUSIC": 250272,
149
+ "[IN:STOP_SHUFFLE_MUSIC": 250313,
150
+ "[IN:SUBTRACT_TIME_TIMER": 250188,
151
+ "[IN:SWITCH_CALL": 250201,
152
+ "[IN:UNLOOP_MUSIC": 250278,
153
+ "[IN:UPDATE_ALARM": 250184,
154
+ "[IN:UPDATE_CALL": 250193,
155
+ "[IN:UPDATE_METHOD_CALL": 250215,
156
+ "[IN:UPDATE_REMINDER": 250293,
157
+ "[IN:UPDATE_REMINDER_DATE_TIME": 250249,
158
+ "[IN:UPDATE_REMINDER_LOCATION": 250279,
159
+ "[IN:UPDATE_REMINDER_TODO": 250171,
160
+ "[IN:UPDATE_TIMER": 250190,
161
+ "[SL:AGE": 250284,
162
+ "[SL:ALARM_NAME": 250261,
163
+ "[SL:AMOUNT": 250110,
164
+ "[SL:ATTENDEE": 250185,
165
+ "[SL:ATTENDEE_EVENT": 250271,
166
+ "[SL:ATTRIBUTE_EVENT": 250168,
167
+ "[SL:CATEGORY_EVENT": 250158,
168
+ "[SL:CONTACT": 250232,
169
+ "[SL:CONTACT_ADDED": 250111,
170
+ "[SL:CONTACT_METHOD": 250269,
171
+ "[SL:CONTACT_RELATED": 250121,
172
+ "[SL:CONTACT_REMOVED": 250107,
173
+ "[SL:CONTENT_EXACT": 250202,
174
+ "[SL:DATE_TIME": 250178,
175
+ "[SL:EDUCATION_DEGREE": 250267,
176
+ "[SL:EMPLOYER": 250187,
177
+ "[SL:GENDER": 250324,
178
+ "[SL:GROUP": 250247,
179
+ "[SL:JOB": 250206,
180
+ "[SL:LIFE_EVENT": 250262,
181
+ "[SL:LOCATION": 250216,
182
+ "[SL:MAJOR": 250320,
183
+ "[SL:METHOD_MESSAGE": 250128,
184
+ "[SL:METHOD_RECIPES": 250139,
185
+ "[SL:METHOD_RETRIEVAL_REMINDER": 250235,
186
+ "[SL:METHOD_TIMER": 250161,
187
+ "[SL:MUSIC_ALBUM_MODIFIER": 250268,
188
+ "[SL:MUSIC_ALBUM_TITLE": 250135,
189
+ "[SL:MUSIC_ARTIST_NAME": 250156,
190
+ "[SL:MUSIC_GENRE": 250138,
191
+ "[SL:MUSIC_PLAYLIST_MODIFIER": 250308,
192
+ "[SL:MUSIC_PLAYLIST_TITLE": 250236,
193
+ "[SL:MUSIC_PROVIDER_NAME": 250227,
194
+ "[SL:MUSIC_RADIO_ID": 250167,
195
+ "[SL:MUSIC_REWIND_TIME": 250292,
196
+ "[SL:MUSIC_TRACK_TITLE": 250106,
197
+ "[SL:MUSIC_TYPE": 250217,
198
+ "[SL:MUTUAL_EMPLOYER": 250304,
199
+ "[SL:MUTUAL_SCHOOL": 250312,
200
+ "[SL:NAME_APP": 250218,
201
+ "[SL:NEWS_CATEGORY": 250114,
202
+ "[SL:NEWS_REFERENCE": 250152,
203
+ "[SL:NEWS_SOURCE": 250153,
204
+ "[SL:NEWS_TOPIC": 250225,
205
+ "[SL:NEWS_TYPE": 250233,
206
+ "[SL:ORDINAL": 250182,
207
+ "[SL:PERIOD": 250200,
208
+ "[SL:PERSON_REMINDED": 250209,
209
+ "[SL:PHONE_NUMBER": 250176,
210
+ "[SL:RECIPES_ATTRIBUTE": 250130,
211
+ "[SL:RECIPES_COOKING_METHOD": 250119,
212
+ "[SL:RECIPES_CUISINE": 250298,
213
+ "[SL:RECIPES_DIET": 250219,
214
+ "[SL:RECIPES_DISH": 250197,
215
+ "[SL:RECIPES_EXCLUDED_INGREDIENT": 250263,
216
+ "[SL:RECIPES_INCLUDED_INGREDIENT": 250257,
217
+ "[SL:RECIPES_MEAL": 250212,
218
+ "[SL:RECIPES_QUALIFIER_NUTRITION": 250273,
219
+ "[SL:RECIPES_RATING": 250116,
220
+ "[SL:RECIPES_SOURCE": 250300,
221
+ "[SL:RECIPES_TIME_PREPARATION": 250336,
222
+ "[SL:RECIPES_TYPE": 250117,
223
+ "[SL:RECIPES_TYPE_NUTRITION": 250207,
224
+ "[SL:RECIPES_UNIT_MEASUREMENT": 250108,
225
+ "[SL:RECIPES_UNIT_NUTRITION": 250210,
226
+ "[SL:RECIPIENT": 250105,
227
+ "[SL:SCHOOL": 250155,
228
+ "[SL:SENDER": 250127,
229
+ "[SL:SIMILARITY": 250258,
230
+ "[SL:TIMER_NAME": 250104,
231
+ "[SL:TITLE_EVENT": 250214,
232
+ "[SL:TODO": 250196,
233
+ "[SL:TYPE_CONTACT": 250317,
234
+ "[SL:TYPE_CONTENT": 250142,
235
+ "[SL:TYPE_RELATION": 250250,
236
+ "[SL:USER_ATTENDEE_EVENT": 250297,
237
+ "[SL:WEATHER_ATTRIBUTE": 250163,
238
+ "[SL:WEATHER_TEMPERATURE_UNIT": 250132
239
+ }
config.json ADDED
@@ -0,0 +1,31 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "google/mt5-small",
3
+ "architectures": [
4
+ "AlignedMT5ForConditionalGeneration"
5
+ ],
6
+ "d_ff": 1024,
7
+ "d_kv": 64,
8
+ "d_model": 512,
9
+ "decoder_start_token_id": 0,
10
+ "dense_act_fn": "gelu_new",
11
+ "dropout_rate": 0.1,
12
+ "eos_token_id": 1,
13
+ "feed_forward_proj": "gated-gelu",
14
+ "initializer_factor": 1.0,
15
+ "is_encoder_decoder": true,
16
+ "is_gated_act": true,
17
+ "layer_norm_epsilon": 1e-06,
18
+ "model_type": "mt5",
19
+ "num_decoder_layers": 8,
20
+ "num_heads": 6,
21
+ "num_layers": 8,
22
+ "pad_token_id": 0,
23
+ "relative_attention_max_distance": 128,
24
+ "relative_attention_num_buckets": 32,
25
+ "tie_word_embeddings": false,
26
+ "tokenizer_class": "T5Tokenizer",
27
+ "torch_dtype": "float32",
28
+ "transformers_version": "4.24.0",
29
+ "use_cache": true,
30
+ "vocab_size": 250337
31
+ }
pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:072ef189445ab9e4e191f2fc34e1653410caf1adb3a79229627201c11d4b9ec2
3
+ size 1202749609
special_tokens_map.json ADDED
@@ -0,0 +1,5 @@
 
 
 
 
 
1
+ {
2
+ "eos_token": "</s>",
3
+ "pad_token": "<pad>",
4
+ "unk_token": "<unk>"
5
+ }
spiece.model ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ef78f86560d809067d12bac6c09f19a462cb3af3f54d2b8acbba26e1433125d6
3
+ size 4309802
tokenizer.json ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3342e872890c61e379cad274f044f962d4ae413b682819949c22fd3f2b368238
3
+ size 16376194
tokenizer_config.json ADDED
@@ -0,0 +1,11 @@
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "additional_special_tokens": null,
3
+ "eos_token": "</s>",
4
+ "extra_ids": 0,
5
+ "name_or_path": "google/mt5-small",
6
+ "pad_token": "<pad>",
7
+ "sp_model_kwargs": {},
8
+ "special_tokens_map_file": "/nethome/wheld3/.cache/huggingface/hub/models--google--mt5-small/snapshots/f03a52d3eaa650878b6f52e443bc4d5b385e786e/special_tokens_map.json",
9
+ "tokenizer_class": "T5Tokenizer",
10
+ "unk_token": "<unk>"
11
+ }
training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3cdc79c7f71b0f1a50f6e2301636874639838dab639b4355a847c8b06bf10b8f
3
+ size 3579