add int8 embedding

Files changed (5) hide show

config.json CHANGED Viewed

@@ -1,5 +1,5 @@
 {
-  "_name_or_path": "/home2/xinhe/intel-model-mrpc/roberta-base-mrpc/",
   "architectures": [
     "RobertaForSequenceClassification"
   ],

 {
+  "_name_or_path": "Intel/roberta-base-mrpc",
   "architectures": [
     "RobertaForSequenceClassification"
   ],

pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:40946530ea1bb6a7889d32b0aed23e9f2ba0a407fe9e68f20ccaf6269a45ea19
-size 127033837

 version https://git-lfs.github.com/spec/v1
+oid sha256:b0d78079577f379740987673369c23a05dbf9425fd406e763783b2966669e99b
+size 127038057

tokenizer.json CHANGED Viewed

@@ -2,13 +2,13 @@
   "version": "1.0",
   "truncation": {
     "direction": "Right",
-    "max_length": 256,
     "strategy": "LongestFirst",
     "stride": 0
   },
   "padding": {
     "strategy": {
-      "Fixed": 256
     },
     "direction": "Right",
     "pad_to_multiple_of": null,
@@ -67,7 +67,8 @@
   "pre_tokenizer": {
     "type": "ByteLevel",
     "add_prefix_space": false,
-    "trim_offsets": true
   },
   "post_processor": {
     "type": "RobertaProcessing",
@@ -85,7 +86,8 @@
   "decoder": {
     "type": "ByteLevel",
     "add_prefix_space": true,
-    "trim_offsets": true
   },
   "model": {
     "type": "BPE",

   "version": "1.0",
   "truncation": {
     "direction": "Right",
+    "max_length": 128,
     "strategy": "LongestFirst",
     "stride": 0
   },
   "padding": {
     "strategy": {
+      "Fixed": 128
     },
     "direction": "Right",
     "pad_to_multiple_of": null,
   "pre_tokenizer": {
     "type": "ByteLevel",
     "add_prefix_space": false,
+    "trim_offsets": true,
+    "use_regex": true
   },
   "post_processor": {
     "type": "RobertaProcessing",
   "decoder": {
     "type": "ByteLevel",
     "add_prefix_space": true,
+    "trim_offsets": true,
+    "use_regex": true
   },
   "model": {
     "type": "BPE",

tokenizer_config.json CHANGED Viewed

	@@ -1 +1 @@
1	- {"errors": "replace", "bos_token": "<s>", "eos_token": "</s>", "sep_token": "</s>", "cls_token": "<s>", "unk_token": "<unk>", "pad_token": "<pad>", "mask_token": "<mask>", "add_prefix_space": false, "trim_offsets": true, "model_max_length": 512, "special_tokens_map_file": null, "name_or_path": "/home2/xinhe/intel-model-mrpc/roberta-base-mrpc/", "tokenizer_class": "RobertaTokenizer"}


1	+ {"errors": "replace", "bos_token": "<s>", "eos_token": "</s>", "sep_token": "</s>", "cls_token": "<s>", "unk_token": "<unk>", "pad_token": "<pad>", "mask_token": "<mask>", "add_prefix_space": false, "trim_offsets": true, "model_max_length": 512, "special_tokens_map_file": null, "name_or_path": "Intel/roberta-base-mrpc", "tokenizer_class": "RobertaTokenizer"}

vocab.txt ADDED Viewed

The diff for this file is too large to render. See raw diff