|
{
|
|
"added_tokens_decoder": {
|
|
"0": {
|
|
"content": "<s>",
|
|
"lstrip": false,
|
|
"normalized": false,
|
|
"rstrip": false,
|
|
"single_word": false,
|
|
"special": true
|
|
},
|
|
"1": {
|
|
"content": "<pad>",
|
|
"lstrip": false,
|
|
"normalized": false,
|
|
"rstrip": false,
|
|
"single_word": false,
|
|
"special": true
|
|
},
|
|
"2": {
|
|
"content": "</s>",
|
|
"lstrip": false,
|
|
"normalized": false,
|
|
"rstrip": false,
|
|
"single_word": false,
|
|
"special": true
|
|
},
|
|
"3": {
|
|
"content": "<unk>",
|
|
"lstrip": false,
|
|
"normalized": false,
|
|
"rstrip": false,
|
|
"single_word": false,
|
|
"special": true
|
|
},
|
|
"57521": {
|
|
"content": "<mask>",
|
|
"lstrip": true,
|
|
"normalized": true,
|
|
"rstrip": false,
|
|
"single_word": false,
|
|
"special": true
|
|
},
|
|
"57522": {
|
|
"content": "<sep/>",
|
|
"lstrip": false,
|
|
"normalized": true,
|
|
"rstrip": false,
|
|
"single_word": false,
|
|
"special": false
|
|
},
|
|
"57523": {
|
|
"content": "<s_iitcdip>",
|
|
"lstrip": false,
|
|
"normalized": false,
|
|
"rstrip": false,
|
|
"single_word": false,
|
|
"special": true
|
|
},
|
|
"57524": {
|
|
"content": "<s_synthdog>",
|
|
"lstrip": false,
|
|
"normalized": false,
|
|
"rstrip": false,
|
|
"single_word": false,
|
|
"special": true
|
|
},
|
|
"57525": {
|
|
"content": "<s_items>",
|
|
"lstrip": false,
|
|
"normalized": true,
|
|
"rstrip": false,
|
|
"single_word": false,
|
|
"special": false
|
|
},
|
|
"57526": {
|
|
"content": "</s_items>",
|
|
"lstrip": false,
|
|
"normalized": true,
|
|
"rstrip": false,
|
|
"single_word": false,
|
|
"special": false
|
|
},
|
|
"57527": {
|
|
"content": "<s_item_code>",
|
|
"lstrip": false,
|
|
"normalized": true,
|
|
"rstrip": false,
|
|
"single_word": false,
|
|
"special": false
|
|
},
|
|
"57528": {
|
|
"content": "</s_item_code>",
|
|
"lstrip": false,
|
|
"normalized": true,
|
|
"rstrip": false,
|
|
"single_word": false,
|
|
"special": false
|
|
},
|
|
"57529": {
|
|
"content": "<s_item_description>",
|
|
"lstrip": false,
|
|
"normalized": true,
|
|
"rstrip": false,
|
|
"single_word": false,
|
|
"special": false
|
|
},
|
|
"57530": {
|
|
"content": "</s_item_description>",
|
|
"lstrip": false,
|
|
"normalized": true,
|
|
"rstrip": false,
|
|
"single_word": false,
|
|
"special": false
|
|
},
|
|
"57531": {
|
|
"content": "<s_qty_supplied>",
|
|
"lstrip": false,
|
|
"normalized": true,
|
|
"rstrip": false,
|
|
"single_word": false,
|
|
"special": false
|
|
},
|
|
"57532": {
|
|
"content": "</s_qty_supplied>",
|
|
"lstrip": false,
|
|
"normalized": true,
|
|
"rstrip": false,
|
|
"single_word": false,
|
|
"special": false
|
|
},
|
|
"57533": {
|
|
"content": "<s_uom>",
|
|
"lstrip": false,
|
|
"normalized": true,
|
|
"rstrip": false,
|
|
"single_word": false,
|
|
"special": false
|
|
},
|
|
"57534": {
|
|
"content": "</s_uom>",
|
|
"lstrip": false,
|
|
"normalized": true,
|
|
"rstrip": false,
|
|
"single_word": false,
|
|
"special": false
|
|
},
|
|
"57535": {
|
|
"content": "<s_unit_price_ex_gst>",
|
|
"lstrip": false,
|
|
"normalized": true,
|
|
"rstrip": false,
|
|
"single_word": false,
|
|
"special": false
|
|
},
|
|
"57536": {
|
|
"content": "</s_unit_price_ex_gst>",
|
|
"lstrip": false,
|
|
"normalized": true,
|
|
"rstrip": false,
|
|
"single_word": false,
|
|
"special": false
|
|
},
|
|
"57537": {
|
|
"content": "<s_cord-v2>",
|
|
"lstrip": false,
|
|
"normalized": true,
|
|
"rstrip": false,
|
|
"single_word": false,
|
|
"special": false
|
|
}
|
|
},
|
|
"additional_special_tokens": [
|
|
"<s_iitcdip>",
|
|
"<s_synthdog>"
|
|
],
|
|
"bos_token": "<s>",
|
|
"clean_up_tokenization_spaces": true,
|
|
"cls_token": "<s>",
|
|
"eos_token": "</s>",
|
|
"mask_token": "<mask>",
|
|
"model_max_length": 1000000000000000019884624838656,
|
|
"pad_token": "<pad>",
|
|
"processor_class": "DonutProcessor",
|
|
"sep_token": "</s>",
|
|
"sp_model_kwargs": {},
|
|
"tokenizer_class": "XLMRobertaTokenizer",
|
|
"unk_token": "<unk>"
|
|
}
|
|
|