HARSHAPALNATIUNH
committed on
Commit
•
e549e23
1
Parent(s):
a2d9b19
End of training
Browse files
- README.md +2 -6
- config.json +1 -2
- model.safetensors +1 -1
- runs/Dec16_19-32-11_5c865fdaac76/events.out.tfevents.1702755143.5c865fdaac76.1170.5 +3 -0
- runs/Dec16_19-33-28_5c865fdaac76/events.out.tfevents.1702755210.5c865fdaac76.1170.6 +3 -0
- runs/Dec16_19-34-15_5c865fdaac76/events.out.tfevents.1702755258.5c865fdaac76.1170.7 +3 -0
- runs/Dec16_19-37-08_5c865fdaac76/events.out.tfevents.1702755446.5c865fdaac76.1170.8 +3 -0
- runs/Dec16_19-37-56_5c865fdaac76/events.out.tfevents.1702755476.5c865fdaac76.1170.9 +3 -0
- runs/Dec16_19-37-56_5c865fdaac76/events.out.tfevents.1702755579.5c865fdaac76.1170.10 +3 -0
- runs/Dec16_19-41-13_5c865fdaac76/events.out.tfevents.1702755674.5c865fdaac76.1170.11 +3 -0
- runs/Dec16_19-42-16_5c865fdaac76/events.out.tfevents.1702755737.5c865fdaac76.1170.12 +3 -0
- runs/Dec16_19-50-55_5c865fdaac76/events.out.tfevents.1702756268.5c865fdaac76.1170.13 +3 -0
- training_args.bin +1 -1
README.md
CHANGED
@@ -1,6 +1,6 @@
|
|
1 |
---
|
2 |
license: bigscience-bloom-rail-1.0
|
3 |
-
base_model: bigscience/
|
4 |
tags:
|
5 |
- generated_from_trainer
|
6 |
model-index:
|
@@ -13,7 +13,7 @@ should probably proofread and complete it, then remove this comment. -->
|
|
13 |
|
14 |
# BLOOM560mfinetune
|
15 |
|
16 |
-
This model is a fine-tuned version of [bigscience/
|
17 |
|
18 |
## Model description
|
19 |
|
@@ -40,10 +40,6 @@ The following hyperparameters were used during training:
|
|
40 |
- lr_scheduler_type: linear
|
41 |
- num_epochs: 2
|
42 |
|
43 |
-
### Training results
|
44 |
-
|
45 |
-
|
46 |
-
|
47 |
### Framework versions
|
48 |
|
49 |
- Transformers 4.35.2
|
|
|
1 |
---
|
2 |
license: bigscience-bloom-rail-1.0
|
3 |
+
base_model: bigscience/bloom-560m
|
4 |
tags:
|
5 |
- generated_from_trainer
|
6 |
model-index:
|
|
|
13 |
|
14 |
# BLOOM560mfinetune
|
15 |
|
16 |
+
This model is a fine-tuned version of [bigscience/bloom-560m](https://huggingface.co/bigscience/bloom-560m) on an unknown dataset.
|
17 |
|
18 |
## Model description
|
19 |
|
|
|
40 |
- lr_scheduler_type: linear
|
41 |
- num_epochs: 2
|
42 |
|
|
|
|
|
|
|
|
|
43 |
### Framework versions
|
44 |
|
45 |
- Transformers 4.35.2
|
config.json
CHANGED
@@ -1,5 +1,5 @@
|
|
1 |
{
|
2 |
-
"_name_or_path": "bigscience/
|
3 |
"apply_residual_connection_post_layernorm": false,
|
4 |
"architectures": [
|
5 |
"BloomForCausalLM"
|
@@ -21,7 +21,6 @@
|
|
21 |
"offset_alibi": 100,
|
22 |
"pad_token_id": 3,
|
23 |
"pretraining_tp": 1,
|
24 |
-
"seq_length": 2048,
|
25 |
"skip_bias_add": true,
|
26 |
"skip_bias_add_qkv": false,
|
27 |
"slow_but_exact": false,
|
|
|
1 |
{
|
2 |
+
"_name_or_path": "bigscience/bloom-560m",
|
3 |
"apply_residual_connection_post_layernorm": false,
|
4 |
"architectures": [
|
5 |
"BloomForCausalLM"
|
|
|
21 |
"offset_alibi": 100,
|
22 |
"pad_token_id": 3,
|
23 |
"pretraining_tp": 1,
|
|
|
24 |
"skip_bias_add": true,
|
25 |
"skip_bias_add_qkv": false,
|
26 |
"slow_but_exact": false,
|
model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 2236892304
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:81385b8c5f54795c2458c129b60eafaac977cb755117b3600585593c9b580656
|
3 |
size 2236892304
|
runs/Dec16_19-32-11_5c865fdaac76/events.out.tfevents.1702755143.5c865fdaac76.1170.5
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b72ac9b602103e15be67f0905ec604b59bb10cb9d7e6bd8f596c71e74fad6618
|
3 |
+
size 4325
|
runs/Dec16_19-33-28_5c865fdaac76/events.out.tfevents.1702755210.5c865fdaac76.1170.6
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:26551c2ab968496825ee31d71e0d6d40429b46a7a9bcd8af418917f06f2eb148
|
3 |
+
size 4325
|
runs/Dec16_19-34-15_5c865fdaac76/events.out.tfevents.1702755258.5c865fdaac76.1170.7
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7eb93209cc424b1860d646e895dfb13a30ca9a9bf1791ff22f883f4953329692
|
3 |
+
size 4325
|
runs/Dec16_19-37-08_5c865fdaac76/events.out.tfevents.1702755446.5c865fdaac76.1170.8
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6bab99274221b287272e11486e9dc5e71359a1643a2d72f52c732230f39492e6
|
3 |
+
size 4325
|
runs/Dec16_19-37-56_5c865fdaac76/events.out.tfevents.1702755476.5c865fdaac76.1170.9
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ddc37418be28644d78ada46d7e4c72e90e6bdafc7f4e0adcbbd7af514f1d1f92
|
3 |
+
size 4325
|
runs/Dec16_19-37-56_5c865fdaac76/events.out.tfevents.1702755579.5c865fdaac76.1170.10
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:79d4c3342afd023f69c48c60142a0ae4b1b5740860d908dc53375445ca410e1b
|
3 |
+
size 4325
|
runs/Dec16_19-41-13_5c865fdaac76/events.out.tfevents.1702755674.5c865fdaac76.1170.11
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c2a65e59a69b0fc0c99593019c18c2c99acbbfcae76d08a623a21d90cc056ae4
|
3 |
+
size 4325
|
runs/Dec16_19-42-16_5c865fdaac76/events.out.tfevents.1702755737.5c865fdaac76.1170.12
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bb8ece7dec7082dd5b32a761ffc11ec4c1558942dcdb4ec5415127ef61e2398a
|
3 |
+
size 4325
|
runs/Dec16_19-50-55_5c865fdaac76/events.out.tfevents.1702756268.5c865fdaac76.1170.13
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5f9c4cc968ee9e9ced8aa8425c9c51d5ac3c97ad0e4cad053ba519a448d9964f
|
3 |
+
size 4184
|
training_args.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4600
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d4b72cec6a5c4334780d5d14810fa8ee88e21dcaf7cea501b11c96ea73d6786e
|
3 |
size 4600
|