HARSHAPALNATIUNH committed on
Commit
e549e23
1 Parent(s): a2d9b19

End of training

Browse files
README.md CHANGED
@@ -1,6 +1,6 @@
1
  ---
2
  license: bigscience-bloom-rail-1.0
3
- base_model: bigscience/bloomz-560m
4
  tags:
5
  - generated_from_trainer
6
  model-index:
@@ -13,7 +13,7 @@ should probably proofread and complete it, then remove this comment. -->
13
 
14
  # BLOOM560mfinetune
15
 
16
- This model is a fine-tuned version of [bigscience/bloomz-560m](https://huggingface.co/bigscience/bloomz-560m) on an unknown dataset.
17
 
18
  ## Model description
19
 
@@ -40,10 +40,6 @@ The following hyperparameters were used during training:
40
  - lr_scheduler_type: linear
41
  - num_epochs: 2
42
 
43
- ### Training results
44
-
45
-
46
-
47
  ### Framework versions
48
 
49
  - Transformers 4.35.2
 
1
  ---
2
  license: bigscience-bloom-rail-1.0
3
+ base_model: bigscience/bloom-560m
4
  tags:
5
  - generated_from_trainer
6
  model-index:
 
13
 
14
  # BLOOM560mfinetune
15
 
16
+ This model is a fine-tuned version of [bigscience/bloom-560m](https://huggingface.co/bigscience/bloom-560m) on an unknown dataset.
17
 
18
  ## Model description
19
 
 
40
  - lr_scheduler_type: linear
41
  - num_epochs: 2
42
 
 
 
 
 
43
  ### Framework versions
44
 
45
  - Transformers 4.35.2
config.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "_name_or_path": "bigscience/bloomz-560m",
3
  "apply_residual_connection_post_layernorm": false,
4
  "architectures": [
5
  "BloomForCausalLM"
@@ -21,7 +21,6 @@
21
  "offset_alibi": 100,
22
  "pad_token_id": 3,
23
  "pretraining_tp": 1,
24
- "seq_length": 2048,
25
  "skip_bias_add": true,
26
  "skip_bias_add_qkv": false,
27
  "slow_but_exact": false,
 
1
  {
2
+ "_name_or_path": "bigscience/bloom-560m",
3
  "apply_residual_connection_post_layernorm": false,
4
  "architectures": [
5
  "BloomForCausalLM"
 
21
  "offset_alibi": 100,
22
  "pad_token_id": 3,
23
  "pretraining_tp": 1,
 
24
  "skip_bias_add": true,
25
  "skip_bias_add_qkv": false,
26
  "slow_but_exact": false,
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7e5f61fbbfd5dd09a703695971850088e7f6f4f4478493726eb2a18b447cd38e
3
  size 2236892304
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:81385b8c5f54795c2458c129b60eafaac977cb755117b3600585593c9b580656
3
  size 2236892304
runs/Dec16_19-32-11_5c865fdaac76/events.out.tfevents.1702755143.5c865fdaac76.1170.5 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b72ac9b602103e15be67f0905ec604b59bb10cb9d7e6bd8f596c71e74fad6618
3
+ size 4325
runs/Dec16_19-33-28_5c865fdaac76/events.out.tfevents.1702755210.5c865fdaac76.1170.6 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:26551c2ab968496825ee31d71e0d6d40429b46a7a9bcd8af418917f06f2eb148
3
+ size 4325
runs/Dec16_19-34-15_5c865fdaac76/events.out.tfevents.1702755258.5c865fdaac76.1170.7 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7eb93209cc424b1860d646e895dfb13a30ca9a9bf1791ff22f883f4953329692
3
+ size 4325
runs/Dec16_19-37-08_5c865fdaac76/events.out.tfevents.1702755446.5c865fdaac76.1170.8 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6bab99274221b287272e11486e9dc5e71359a1643a2d72f52c732230f39492e6
3
+ size 4325
runs/Dec16_19-37-56_5c865fdaac76/events.out.tfevents.1702755476.5c865fdaac76.1170.9 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ddc37418be28644d78ada46d7e4c72e90e6bdafc7f4e0adcbbd7af514f1d1f92
3
+ size 4325
runs/Dec16_19-37-56_5c865fdaac76/events.out.tfevents.1702755579.5c865fdaac76.1170.10 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:79d4c3342afd023f69c48c60142a0ae4b1b5740860d908dc53375445ca410e1b
3
+ size 4325
runs/Dec16_19-41-13_5c865fdaac76/events.out.tfevents.1702755674.5c865fdaac76.1170.11 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c2a65e59a69b0fc0c99593019c18c2c99acbbfcae76d08a623a21d90cc056ae4
3
+ size 4325
runs/Dec16_19-42-16_5c865fdaac76/events.out.tfevents.1702755737.5c865fdaac76.1170.12 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bb8ece7dec7082dd5b32a761ffc11ec4c1558942dcdb4ec5415127ef61e2398a
3
+ size 4325
runs/Dec16_19-50-55_5c865fdaac76/events.out.tfevents.1702756268.5c865fdaac76.1170.13 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5f9c4cc968ee9e9ced8aa8425c9c51d5ac3c97ad0e4cad053ba519a448d9964f
3
+ size 4184
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4300c248e1b3d2b373ab8874b1a2de6586588c9953bf5250665c26a7dc538bf2
3
  size 4600
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d4b72cec6a5c4334780d5d14810fa8ee88e21dcaf7cea501b11c96ea73d6786e
3
  size 4600