mychen76 committed on
Commit
abecec5
1 Parent(s): 5b3b0a0

mychen76/donut-receipt_v3

Browse files
README.md CHANGED
@@ -3,8 +3,6 @@ license: mit
3
  base_model: naver-clova-ix/donut-base
4
  tags:
5
  - generated_from_trainer
6
- datasets:
7
- - imagefolder
8
  model-index:
9
  - name: donut-receipt_v3
10
  results: []
@@ -15,9 +13,7 @@ should probably proofread and complete it, then remove this comment. -->
15
 
16
  # donut-receipt_v3
17
 
18
- This model is a fine-tuned version of [naver-clova-ix/donut-base](https://huggingface.co/naver-clova-ix/donut-base) on the imagefolder dataset.
19
- It achieves the following results on the evaluation set:
20
- - Loss: 0.3299
21
 
22
  ## Model description
23
 
@@ -37,7 +33,7 @@ More information needed
37
 
38
  The following hyperparameters were used during training:
39
  - learning_rate: 2e-05
40
- - train_batch_size: 3
41
  - eval_batch_size: 8
42
  - seed: 42
43
  - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
 
3
  base_model: naver-clova-ix/donut-base
4
  tags:
5
  - generated_from_trainer
 
 
6
  model-index:
7
  - name: donut-receipt_v3
8
  results: []
 
13
 
14
  # donut-receipt_v3
15
 
16
+ This model is a fine-tuned version of [naver-clova-ix/donut-base](https://huggingface.co/naver-clova-ix/donut-base) on an unknown dataset.
 
 
17
 
18
  ## Model description
19
 
 
33
 
34
  The following hyperparameters were used during training:
35
  - learning_rate: 2e-05
36
+ - train_batch_size: 4
37
  - eval_batch_size: 8
38
  - seed: 42
39
  - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
added_tokens.json CHANGED
@@ -1,13 +1,39 @@
1
  {
2
- "</s_address>": 57532,
3
- "</s_company>": 57530,
4
- "</s_date>": 57528,
 
 
 
 
 
 
 
 
 
 
 
 
 
5
  "</s_total>": 57526,
6
- "<s_address>": 57531,
7
- "<s_company>": 57529,
8
- "<s_date>": 57527,
9
  "<s_iitcdip>": 57523,
 
 
 
 
 
 
 
 
 
10
  "<s_synthdog>": 57524,
 
 
 
 
 
11
  "<s_total>": 57525,
12
  "<sep/>": 57522
13
  }
 
1
  {
2
+ "</s_date>": 57558,
3
+ "</s_ignore>": 57556,
4
+ "</s_item_key>": 57554,
5
+ "</s_item_name>": 57552,
6
+ "</s_item_quantity>": 57550,
7
+ "</s_item_value>": 57548,
8
+ "</s_line_items>": 57546,
9
+ "</s_others>": 57542,
10
+ "</s_store_addr>": 57540,
11
+ "</s_store_name>": 57538,
12
+ "</s_subtotal>": 57536,
13
+ "</s_tax>": 57534,
14
+ "</s_telephone>": 57532,
15
+ "</s_text>": 57544,
16
+ "</s_time>": 57530,
17
+ "</s_tips>": 57528,
18
  "</s_total>": 57526,
19
+ "<s_date>": 57557,
20
+ "<s_ignore>": 57555,
 
21
  "<s_iitcdip>": 57523,
22
+ "<s_item_key>": 57553,
23
+ "<s_item_name>": 57551,
24
+ "<s_item_quantity>": 57549,
25
+ "<s_item_value>": 57547,
26
+ "<s_line_items>": 57545,
27
+ "<s_others>": 57541,
28
+ "<s_store_addr>": 57539,
29
+ "<s_store_name>": 57537,
30
+ "<s_subtotal>": 57535,
31
  "<s_synthdog>": 57524,
32
+ "<s_tax>": 57533,
33
+ "<s_telephone>": 57531,
34
+ "<s_text>": 57543,
35
+ "<s_time>": 57529,
36
+ "<s_tips>": 57527,
37
  "<s_total>": 57525,
38
  "<sep/>": 57522
39
  }
config.json CHANGED
@@ -85,7 +85,7 @@
85
  "typical_p": 1.0,
86
  "use_bfloat16": false,
87
  "use_cache": true,
88
- "vocab_size": 57533
89
  },
90
  "decoder_start_token_id": 0,
91
  "encoder": {
@@ -124,8 +124,8 @@
124
  "1": "LABEL_1"
125
  },
126
  "image_size": [
127
- 1280,
128
- 960
129
  ],
130
  "initializer_range": 0.02,
131
  "is_decoder": false,
 
85
  "typical_p": 1.0,
86
  "use_bfloat16": false,
87
  "use_cache": true,
88
+ "vocab_size": 57559
89
  },
90
  "decoder_start_token_id": 0,
91
  "encoder": {
 
124
  "1": "LABEL_1"
125
  },
126
  "image_size": [
127
+ 960,
128
+ 720
129
  ],
130
  "initializer_range": 0.02,
131
  "is_decoder": false,
generation_config.json CHANGED
@@ -3,7 +3,7 @@
3
  "bos_token_id": 0,
4
  "eos_token_id": 2,
5
  "forced_eos_token_id": 2,
6
- "max_length": 720,
7
  "pad_token_id": 1,
8
  "transformers_version": "4.34.0.dev0"
9
  }
 
3
  "bos_token_id": 0,
4
  "eos_token_id": 2,
5
  "forced_eos_token_id": 2,
6
+ "max_length": 768,
7
  "pad_token_id": 1,
8
  "transformers_version": "4.34.0.dev0"
9
  }
preprocessor_config.json CHANGED
@@ -19,8 +19,8 @@
19
  "processor_class": "DonutProcessor",
20
  "resample": 2,
21
  "rescale_factor": 0.00392156862745098,
22
- "size": {
23
- "height": 960,
24
- "width": 720
25
- }
26
  }
 
19
  "processor_class": "DonutProcessor",
20
  "resample": 2,
21
  "rescale_factor": 0.00392156862745098,
22
+ "size": [
23
+ 960,
24
+ 720
25
+ ]
26
  }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:adac532db99dcd72e3b44c6835516ac772f1135ec7ff4cd157cab965fd4f4231
3
- size 809211673
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5b2056ff6e22914837b730a821695396ad266d95750adc030972723c1ee9c06b
3
+ size 809318169
special_tokens_map.json CHANGED
@@ -2,12 +2,38 @@
2
  "additional_special_tokens": [
3
  "<s_total>",
4
  "</s_total>",
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
5
  "<s_date>",
6
  "</s_date>",
7
- "<s_company>",
8
- "</s_company>",
9
- "<s_address>",
10
- "</s_address>",
11
  "<s>",
12
  "</s>"
13
  ],
 
2
  "additional_special_tokens": [
3
  "<s_total>",
4
  "</s_total>",
5
+ "<s_tips>",
6
+ "</s_tips>",
7
+ "<s_time>",
8
+ "</s_time>",
9
+ "<s_telephone>",
10
+ "</s_telephone>",
11
+ "<s_tax>",
12
+ "</s_tax>",
13
+ "<s_subtotal>",
14
+ "</s_subtotal>",
15
+ "<s_store_name>",
16
+ "</s_store_name>",
17
+ "<s_store_addr>",
18
+ "</s_store_addr>",
19
+ "<s_others>",
20
+ "</s_others>",
21
+ "<s_text>",
22
+ "</s_text>",
23
+ "<s_line_items>",
24
+ "</s_line_items>",
25
+ "<s_item_value>",
26
+ "</s_item_value>",
27
+ "<s_item_quantity>",
28
+ "</s_item_quantity>",
29
+ "<s_item_name>",
30
+ "</s_item_name>",
31
+ "<s_item_key>",
32
+ "</s_item_key>",
33
+ "<s_ignore>",
34
+ "</s_ignore>",
35
  "<s_date>",
36
  "</s_date>",
 
 
 
 
37
  "<s>",
38
  "</s>"
39
  ],
tokenizer.json CHANGED
The diff for this file is too large to render. See raw diff
 
tokenizer_config.json CHANGED
@@ -11,18 +11,11 @@
11
  "rstrip": false,
12
  "single_word": false
13
  },
14
- "max_length": 512,
15
  "model_max_length": 1000000000000000019884624838656,
16
- "pad_to_multiple_of": null,
17
  "pad_token": "<pad>",
18
- "pad_token_type_id": 0,
19
- "padding_side": "right",
20
  "processor_class": "DonutProcessor",
21
  "sep_token": "</s>",
22
  "sp_model_kwargs": {},
23
- "stride": 0,
24
  "tokenizer_class": "XLMRobertaTokenizer",
25
- "truncation_side": "right",
26
- "truncation_strategy": "longest_first",
27
  "unk_token": "<unk>"
28
  }
 
11
  "rstrip": false,
12
  "single_word": false
13
  },
 
14
  "model_max_length": 1000000000000000019884624838656,
 
15
  "pad_token": "<pad>",
 
 
16
  "processor_class": "DonutProcessor",
17
  "sep_token": "</s>",
18
  "sp_model_kwargs": {},
 
19
  "tokenizer_class": "XLMRobertaTokenizer",
 
 
20
  "unk_token": "<unk>"
21
  }
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:02bfc74ed50a2a9ecca5fd558a26ac3f1bebc494e403066fe8490111ee94e213
3
  size 4283
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:37c92230417edb0b83fd852b0e8071ec1b87ea49c61337458217bd243c226888
3
  size 4283