Training in progress, epoch 1
Browse files
config.json
CHANGED
@@ -1,5 +1,5 @@
|
|
1 |
{
|
2 |
-
"_name_or_path": "microsoft/trocr-large-
|
3 |
"architectures": [
|
4 |
"VisionEncoderDecoderModel"
|
5 |
],
|
@@ -15,7 +15,7 @@
|
|
15 |
"bos_token_id": 0,
|
16 |
"chunk_size_feed_forward": 0,
|
17 |
"classifier_dropout": 0.0,
|
18 |
-
"cross_attention_hidden_size":
|
19 |
"d_model": 1024,
|
20 |
"decoder_attention_heads": 16,
|
21 |
"decoder_ffn_dim": 4096,
|
@@ -26,6 +26,7 @@
|
|
26 |
"do_sample": false,
|
27 |
"dropout": 0.1,
|
28 |
"early_stopping": false,
|
|
|
29 |
"encoder_no_repeat_ngram_size": 0,
|
30 |
"eos_token_id": 2,
|
31 |
"exponential_decay_length_penalty": null,
|
@@ -172,6 +173,6 @@
|
|
172 |
"pad_token_id": 1,
|
173 |
"tie_word_embeddings": false,
|
174 |
"torch_dtype": "float32",
|
175 |
-
"transformers_version": "4.
|
176 |
"vocab_size": 50265
|
177 |
}
|
|
|
1 |
{
|
2 |
+
"_name_or_path": "microsoft/trocr-large-stage1",
|
3 |
"architectures": [
|
4 |
"VisionEncoderDecoderModel"
|
5 |
],
|
|
|
15 |
"bos_token_id": 0,
|
16 |
"chunk_size_feed_forward": 0,
|
17 |
"classifier_dropout": 0.0,
|
18 |
+
"cross_attention_hidden_size": null,
|
19 |
"d_model": 1024,
|
20 |
"decoder_attention_heads": 16,
|
21 |
"decoder_ffn_dim": 4096,
|
|
|
26 |
"do_sample": false,
|
27 |
"dropout": 0.1,
|
28 |
"early_stopping": false,
|
29 |
+
"encoder_hidden_size": 1024,
|
30 |
"encoder_no_repeat_ngram_size": 0,
|
31 |
"eos_token_id": 2,
|
32 |
"exponential_decay_length_penalty": null,
|
|
|
173 |
"pad_token_id": 1,
|
174 |
"tie_word_embeddings": false,
|
175 |
"torch_dtype": "float32",
|
176 |
+
"transformers_version": "4.37.2",
|
177 |
"vocab_size": 50265
|
178 |
}
|
model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 2436757100
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bee196663a8d7d2735603e71e8c2d6d058984dd011a8b87454d4ce4ac6483f70
|
3 |
size 2436757100
|
runs/Feb12_20-07-43_104-171-203-98/events.out.tfevents.1707768464.104-171-203-98.2525.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a9afcb2743806e6428a5eaa86e724b178e8e560f033be123a553d1a2814a6b24
|
3 |
+
size 9306
|
runs/Feb12_20-11-05_104-171-203-98/events.out.tfevents.1707768665.104-171-203-98.10676.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9aaee1b1b63a49f7de9269c360525fb1f1b99e567513df3d468ae9af9b91d3d1
|
3 |
+
size 56403
|
training_args.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:77d2f2aac669541bf81947f1f8f4dc60450ab9f1696170ab8d2eb969c2f769af
|
3 |
+
size 4475
|