shiromart committed on
Commit
801d0ef
1 Parent(s): ebaba83

Training in progress epoch 0

Browse files
Files changed (49) hide show
  1. README.md +53 -0
  2. config.json +23 -0
  3. logs/train/events.out.tfevents.1645617275.1647b03f284e.15.0.v2 +3 -0
  4. logs/train/events.out.tfevents.1645617298.1647b03f284e.profile-empty +3 -0
  5. logs/train/events.out.tfevents.1645617524.1647b03f284e.15.1.v2 +3 -0
  6. logs/train/events.out.tfevents.1645617575.1647b03f284e.15.2.v2 +3 -0
  7. logs/train/events.out.tfevents.1645617657.1647b03f284e.15.3.v2 +3 -0
  8. logs/train/events.out.tfevents.1645618747.48c7fa266c4b.15.0.v2 +3 -0
  9. logs/train/plugins/profile/2022_02_23_11_54_58/1647b03f284e.input_pipeline.pb +3 -0
  10. logs/train/plugins/profile/2022_02_23_11_54_58/1647b03f284e.kernel_stats.pb +0 -0
  11. logs/train/plugins/profile/2022_02_23_11_54_58/1647b03f284e.memory_profile.json.gz +3 -0
  12. logs/train/plugins/profile/2022_02_23_11_54_58/1647b03f284e.overview_page.pb +3 -0
  13. logs/train/plugins/profile/2022_02_23_11_54_58/1647b03f284e.tensorflow_stats.pb +3 -0
  14. logs/train/plugins/profile/2022_02_23_11_54_58/1647b03f284e.trace.json.gz +3 -0
  15. logs/train/plugins/profile/2022_02_23_11_54_58/1647b03f284e.xplane.pb +3 -0
  16. logs/train/plugins/profile/2022_02_23_11_59_05/1647b03f284e.input_pipeline.pb +3 -0
  17. logs/train/plugins/profile/2022_02_23_11_59_05/1647b03f284e.kernel_stats.pb +0 -0
  18. logs/train/plugins/profile/2022_02_23_11_59_05/1647b03f284e.memory_profile.json.gz +3 -0
  19. logs/train/plugins/profile/2022_02_23_11_59_05/1647b03f284e.overview_page.pb +3 -0
  20. logs/train/plugins/profile/2022_02_23_11_59_05/1647b03f284e.tensorflow_stats.pb +3 -0
  21. logs/train/plugins/profile/2022_02_23_11_59_05/1647b03f284e.trace.json.gz +3 -0
  22. logs/train/plugins/profile/2022_02_23_11_59_05/1647b03f284e.xplane.pb +3 -0
  23. logs/train/plugins/profile/2022_02_23_11_59_51/1647b03f284e.input_pipeline.pb +3 -0
  24. logs/train/plugins/profile/2022_02_23_11_59_51/1647b03f284e.kernel_stats.pb +0 -0
  25. logs/train/plugins/profile/2022_02_23_11_59_51/1647b03f284e.memory_profile.json.gz +3 -0
  26. logs/train/plugins/profile/2022_02_23_11_59_51/1647b03f284e.overview_page.pb +3 -0
  27. logs/train/plugins/profile/2022_02_23_11_59_51/1647b03f284e.tensorflow_stats.pb +3 -0
  28. logs/train/plugins/profile/2022_02_23_11_59_51/1647b03f284e.trace.json.gz +3 -0
  29. logs/train/plugins/profile/2022_02_23_11_59_51/1647b03f284e.xplane.pb +3 -0
  30. logs/train/plugins/profile/2022_02_23_12_01_18/1647b03f284e.input_pipeline.pb +3 -0
  31. logs/train/plugins/profile/2022_02_23_12_01_18/1647b03f284e.kernel_stats.pb +0 -0
  32. logs/train/plugins/profile/2022_02_23_12_01_18/1647b03f284e.memory_profile.json.gz +3 -0
  33. logs/train/plugins/profile/2022_02_23_12_01_18/1647b03f284e.overview_page.pb +3 -0
  34. logs/train/plugins/profile/2022_02_23_12_01_18/1647b03f284e.tensorflow_stats.pb +3 -0
  35. logs/train/plugins/profile/2022_02_23_12_01_18/1647b03f284e.trace.json.gz +3 -0
  36. logs/train/plugins/profile/2022_02_23_12_01_18/1647b03f284e.xplane.pb +3 -0
  37. logs/train/plugins/profile/2022_02_23_12_19_29/48c7fa266c4b.input_pipeline.pb +3 -0
  38. logs/train/plugins/profile/2022_02_23_12_19_29/48c7fa266c4b.kernel_stats.pb +0 -0
  39. logs/train/plugins/profile/2022_02_23_12_19_29/48c7fa266c4b.memory_profile.json.gz +3 -0
  40. logs/train/plugins/profile/2022_02_23_12_19_29/48c7fa266c4b.overview_page.pb +3 -0
  41. logs/train/plugins/profile/2022_02_23_12_19_29/48c7fa266c4b.tensorflow_stats.pb +3 -0
  42. logs/train/plugins/profile/2022_02_23_12_19_29/48c7fa266c4b.trace.json.gz +3 -0
  43. logs/train/plugins/profile/2022_02_23_12_19_29/48c7fa266c4b.xplane.pb +3 -0
  44. logs/validation/events.out.tfevents.1645662083.48c7fa266c4b.15.1.v2 +3 -0
  45. special_tokens_map.json +1 -0
  46. tf_model.h5 +3 -0
  47. tokenizer.json +0 -0
  48. tokenizer_config.json +1 -0
  49. vocab.txt +0 -0
README.md ADDED
@@ -0,0 +1,53 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ license: apache-2.0
3
+ tags:
4
+ - generated_from_keras_callback
5
+ model-index:
6
+ - name: shiromart/distilbert-base-uncased-finetuned-squad
7
+ results: []
8
+ ---
9
+
10
+ <!-- This model card has been generated automatically according to the information Keras had access to. You should
11
+ probably proofread and complete it, then remove this comment. -->
12
+
13
+ # shiromart/distilbert-base-uncased-finetuned-squad
14
+
15
+ This model is a fine-tuned version of [distilbert-base-uncased](https://huggingface.co/distilbert-base-uncased) on an unknown dataset.
16
+ It achieves the following training and validation results at the most recent epoch:
17
+ - Train Loss: 1.5135
18
+ - Validation Loss: 1.1688
19
+ - Epoch: 0
20
+
21
+ ## Model description
22
+
23
+ More information needed
24
+
25
+ ## Intended uses & limitations
26
+
27
+ More information needed
28
+
29
+ ## Training and evaluation data
30
+
31
+ More information needed
32
+
33
+ ## Training procedure
34
+
35
+ ### Training hyperparameters
36
+
37
+ The following hyperparameters were used during training:
38
+ - optimizer: {'name': 'Adam', 'learning_rate': {'class_name': 'PolynomialDecay', 'config': {'initial_learning_rate': 2e-05, 'decay_steps': 11064, 'end_learning_rate': 0.0, 'power': 1.0, 'cycle': False, 'name': None}}, 'decay': 0.0, 'beta_1': 0.9, 'beta_2': 0.999, 'epsilon': 1e-08, 'amsgrad': False}
39
+ - training_precision: float32
40
+
41
+ ### Training results
42
+
43
+ | Train Loss | Validation Loss | Epoch |
44
+ |:----------:|:---------------:|:-----:|
45
+ | 1.5135 | 1.1688 | 0 |
46
+
47
+
48
+ ### Framework versions
49
+
50
+ - Transformers 4.16.2
51
+ - TensorFlow 2.6.2
52
+ - Datasets 1.18.3
53
+ - Tokenizers 0.11.0
config.json ADDED
@@ -0,0 +1,23 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "distilbert-base-uncased",
3
+ "activation": "gelu",
4
+ "architectures": [
5
+ "DistilBertForQuestionAnswering"
6
+ ],
7
+ "attention_dropout": 0.1,
8
+ "dim": 768,
9
+ "dropout": 0.1,
10
+ "hidden_dim": 3072,
11
+ "initializer_range": 0.02,
12
+ "max_position_embeddings": 512,
13
+ "model_type": "distilbert",
14
+ "n_heads": 12,
15
+ "n_layers": 6,
16
+ "pad_token_id": 0,
17
+ "qa_dropout": 0.1,
18
+ "seq_classif_dropout": 0.2,
19
+ "sinusoidal_pos_embds": false,
20
+ "tie_weights_": true,
21
+ "transformers_version": "4.16.2",
22
+ "vocab_size": 30522
23
+ }
logs/train/events.out.tfevents.1645617275.1647b03f284e.15.0.v2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:049629a27707dbd6bfe71bb949096f4dabb97fb2b5a040c9e74d5005b551d625
3
+ size 1478727
logs/train/events.out.tfevents.1645617298.1647b03f284e.profile-empty ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5121d9a7eb7d7ad0d1d18632e35c675b5f0295e8acccc82db842bc5f9ff6fb71
3
+ size 40
logs/train/events.out.tfevents.1645617524.1647b03f284e.15.1.v2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:be42169f236332abc8ce02edf8f6f1cd4be3860346569d2dcce4e22c7d208243
3
+ size 6421262
logs/train/events.out.tfevents.1645617575.1647b03f284e.15.2.v2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e9c6f63d07dbe66e27821e9bff9ed598b04dee1c4a2f2cb010832e749d82279f
3
+ size 1478727
logs/train/events.out.tfevents.1645617657.1647b03f284e.15.3.v2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bce79a6823f777cc4fcc772e3ae3e17c88eeb9b4f51cac5be1f2f5efe8ce408f
3
+ size 6421262
logs/train/events.out.tfevents.1645618747.48c7fa266c4b.15.0.v2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:264a10c9007c91fb701c661468fb59e04a4b1a4b447f94064a148e7d5feedc82
3
+ size 1478868
logs/train/plugins/profile/2022_02_23_11_54_58/1647b03f284e.input_pipeline.pb ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a00ad978b268eef340ed64f90394e1eae42c8a2aee639cbbc7bdf509a3583c48
3
+ size 2618
logs/train/plugins/profile/2022_02_23_11_54_58/1647b03f284e.kernel_stats.pb ADDED
File without changes
logs/train/plugins/profile/2022_02_23_11_54_58/1647b03f284e.memory_profile.json.gz ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ee89330712a5dd3baf5485f7e0a89fca67ecac77e3482a2b27e1a529f3e5b5d9
3
+ size 73
logs/train/plugins/profile/2022_02_23_11_54_58/1647b03f284e.overview_page.pb ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b1af69374340cb919c53a14d6c9a5b82f0b3427719cdca89519ef04cb02968a3
3
+ size 3917
logs/train/plugins/profile/2022_02_23_11_54_58/1647b03f284e.tensorflow_stats.pb ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9189cc436257c471672df5d54806ecd8a31f11364b36bf6d85630bb5f928e005
3
+ size 189707
logs/train/plugins/profile/2022_02_23_11_54_58/1647b03f284e.trace.json.gz ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4372ca6665be1730387b481f4cbfbb9c47e4c1311e928efb0ccab044a239c2fb
3
+ size 49557
logs/train/plugins/profile/2022_02_23_11_54_58/1647b03f284e.xplane.pb ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4695e75e16150d4309b67a4899ef66c66893b985c4cea0c840fbe605fc997dcc
3
+ size 280759
logs/train/plugins/profile/2022_02_23_11_59_05/1647b03f284e.input_pipeline.pb ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ec6cb1725349360e79185a4ad600ef17fc9ef27dfb7bdb120f7c2f87a0e24f44
3
+ size 2618
logs/train/plugins/profile/2022_02_23_11_59_05/1647b03f284e.kernel_stats.pb ADDED
File without changes
logs/train/plugins/profile/2022_02_23_11_59_05/1647b03f284e.memory_profile.json.gz ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ee89330712a5dd3baf5485f7e0a89fca67ecac77e3482a2b27e1a529f3e5b5d9
3
+ size 73
logs/train/plugins/profile/2022_02_23_11_59_05/1647b03f284e.overview_page.pb ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6ff69b27553dc761d1d23d97e0a6df77079c71233779609b2f1a480169ad3491
3
+ size 3917
logs/train/plugins/profile/2022_02_23_11_59_05/1647b03f284e.tensorflow_stats.pb ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8bef40c9893a4e6e0af9c5e2a47217e615f861e3b5a6a28d65e0161294166615
3
+ size 189713
logs/train/plugins/profile/2022_02_23_11_59_05/1647b03f284e.trace.json.gz ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ba1faede53a3b3d6c3d25da31f018e92717747e83938dfafb755a2477a5c7854
3
+ size 49248
logs/train/plugins/profile/2022_02_23_11_59_05/1647b03f284e.xplane.pb ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6245389dbf3d027ffaa62c706c15242fb94ced0631d1ba5045167473b706847c
3
+ size 280643
logs/train/plugins/profile/2022_02_23_11_59_51/1647b03f284e.input_pipeline.pb ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7b45f1efb1835f21ba35663a63f9460fe80b2a6a745648d38bcf5611e78f98c9
3
+ size 2618
logs/train/plugins/profile/2022_02_23_11_59_51/1647b03f284e.kernel_stats.pb ADDED
File without changes
logs/train/plugins/profile/2022_02_23_11_59_51/1647b03f284e.memory_profile.json.gz ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ee89330712a5dd3baf5485f7e0a89fca67ecac77e3482a2b27e1a529f3e5b5d9
3
+ size 73
logs/train/plugins/profile/2022_02_23_11_59_51/1647b03f284e.overview_page.pb ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:61edb9a10181666cbcfc514fe9f9598ec0346eb242416671452faf261efa1458
3
+ size 3917
logs/train/plugins/profile/2022_02_23_11_59_51/1647b03f284e.tensorflow_stats.pb ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d1da1469d05a67857c9f7ce36f13c001f25967ba390dd3d688626b477774d365
3
+ size 189909
logs/train/plugins/profile/2022_02_23_11_59_51/1647b03f284e.trace.json.gz ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:28186cf099dbc2c68680fca1d8bb89daea1416a5e023d43ed599a13dc73d1d60
3
+ size 49547
logs/train/plugins/profile/2022_02_23_11_59_51/1647b03f284e.xplane.pb ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0ba0172d8699f672eaad7f562c4674bedd9112ba71328e7c020ff8d372eebe28
3
+ size 280809
logs/train/plugins/profile/2022_02_23_12_01_18/1647b03f284e.input_pipeline.pb ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4e337d785f89ae353af4deb13dad280929533734eec13e5b4e9c923552cc6b92
3
+ size 2618
logs/train/plugins/profile/2022_02_23_12_01_18/1647b03f284e.kernel_stats.pb ADDED
File without changes
logs/train/plugins/profile/2022_02_23_12_01_18/1647b03f284e.memory_profile.json.gz ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ee89330712a5dd3baf5485f7e0a89fca67ecac77e3482a2b27e1a529f3e5b5d9
3
+ size 73
logs/train/plugins/profile/2022_02_23_12_01_18/1647b03f284e.overview_page.pb ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fe565dc3bf01b2b9b91a1eb34ac76e28a34f25dd67e725fb8d315cb8032fe03c
3
+ size 3917
logs/train/plugins/profile/2022_02_23_12_01_18/1647b03f284e.tensorflow_stats.pb ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f6bfab3614dcdef7877af22094d343435a93160e1bba756df3b8aabc355b2863
3
+ size 189723
logs/train/plugins/profile/2022_02_23_12_01_18/1647b03f284e.trace.json.gz ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:941f524d3e12f3265cfc9e6302aee13fc909f97909ca6dc34360bf553541167a
3
+ size 49601
logs/train/plugins/profile/2022_02_23_12_01_18/1647b03f284e.xplane.pb ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3730aa93ef3da87deb1c9be0f19bc360eaf4510462a6b5d4a1648ad646e75c04
3
+ size 281020
logs/train/plugins/profile/2022_02_23_12_19_29/48c7fa266c4b.input_pipeline.pb ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e5bdf0b03e45edfc623eabf90974a7807fe2bb80e15f94aacec46feb15e22cfa
3
+ size 2618
logs/train/plugins/profile/2022_02_23_12_19_29/48c7fa266c4b.kernel_stats.pb ADDED
File without changes
logs/train/plugins/profile/2022_02_23_12_19_29/48c7fa266c4b.memory_profile.json.gz ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ee89330712a5dd3baf5485f7e0a89fca67ecac77e3482a2b27e1a529f3e5b5d9
3
+ size 73
logs/train/plugins/profile/2022_02_23_12_19_29/48c7fa266c4b.overview_page.pb ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:39c8e7d34013c1890d01aec19828a3c04878aa524f93356e0860dbf08b8ebfef
3
+ size 3999
logs/train/plugins/profile/2022_02_23_12_19_29/48c7fa266c4b.tensorflow_stats.pb ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:be0bf1176ad863ae418d57c83516bc040c5aad7b071ba247f6de36e733934273
3
+ size 189495
logs/train/plugins/profile/2022_02_23_12_19_29/48c7fa266c4b.trace.json.gz ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:96535f826830ad595f890dc999ffd211ac1c855cee836a04598316c0d405c68d
3
+ size 49343
logs/train/plugins/profile/2022_02_23_12_19_29/48c7fa266c4b.xplane.pb ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:060ba347ac702db4fa6f3e251249915dd882849822d8d9bd8eaaaf53f4e64be5
3
+ size 280715
logs/validation/events.out.tfevents.1645662083.48c7fa266c4b.15.1.v2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ab92ce6a1cf7bd3836d1371072de99620f81fac1d5eed18721cc61b6057209c7
3
+ size 194
special_tokens_map.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"unk_token": "[UNK]", "sep_token": "[SEP]", "pad_token": "[PAD]", "cls_token": "[CLS]", "mask_token": "[MASK]"}
tf_model.h5 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1d7b06806d8d3680239be4e248772701339e78723df2d2e5c8d4ca9f2c77032f
3
+ size 265583688
tokenizer.json ADDED
The diff for this file is too large to render. See raw diff
 
tokenizer_config.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"do_lower_case": true, "unk_token": "[UNK]", "sep_token": "[SEP]", "pad_token": "[PAD]", "cls_token": "[CLS]", "mask_token": "[MASK]", "tokenize_chinese_chars": true, "strip_accents": null, "model_max_length": 512, "special_tokens_map_file": null, "name_or_path": "distilbert-base-uncased", "tokenizer_class": "DistilBertTokenizer"}
vocab.txt ADDED
The diff for this file is too large to render. See raw diff