Training in progress, step 50
Browse files- config.json +51 -0
- runs/Apr22_06-37-13_bosshome/events.out.tfevents.1713767835.bosshome +3 -0
- runs/Apr22_06-41-46_bosshome/events.out.tfevents.1713768108.bosshome +3 -0
- runs/Apr22_06-43-04_bosshome/events.out.tfevents.1713768186.bosshome +3 -0
- runs/Apr22_06-44-47_bosshome/events.out.tfevents.1713768289.bosshome +3 -0
- runs/Apr22_06-54-42_bosshome/events.out.tfevents.1713768884.bosshome +3 -0
- runs/Apr22_07-00-41_bosshome/events.out.tfevents.1713769248.bosshome +3 -0
- runs/Apr22_07-02-20_bosshome/events.out.tfevents.1713769343.bosshome +3 -0
- runs/Apr22_07-08-37_bosshome/events.out.tfevents.1713769736.bosshome +3 -0
- runs/Apr22_07-19-12_bosshome/events.out.tfevents.1713770368.bosshome +3 -0
- runs/Apr22_07-31-40_bosshome/events.out.tfevents.1713771101.bosshome +3 -0
- runs/Apr22_07-34-04_bosshome/events.out.tfevents.1713771246.bosshome +3 -0
- runs/Apr22_07-36-25_bosshome/events.out.tfevents.1713771387.bosshome +3 -0
- training_args.bin +3 -0
config.json
ADDED
@@ -0,0 +1,51 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_name_or_path": "/home/bla_ckb/projects/supeai4/hack1/custom",
|
3 |
+
"architectures": [
|
4 |
+
"Blip2ForConditionalGeneration"
|
5 |
+
],
|
6 |
+
"initializer_factor": 1.0,
|
7 |
+
"initializer_range": 0.02,
|
8 |
+
"model_type": "blip-2",
|
9 |
+
"num_query_tokens": 32,
|
10 |
+
"qformer_config": {
|
11 |
+
"classifier_dropout": null,
|
12 |
+
"model_type": "blip_2_qformer"
|
13 |
+
},
|
14 |
+
"text_config": {
|
15 |
+
"_name_or_path": "sail/Sailor-1.8B",
|
16 |
+
"architectures": [
|
17 |
+
"Qwen2ForCausalLM"
|
18 |
+
],
|
19 |
+
"bos_token_id": 151643,
|
20 |
+
"eos_token_id": 151643,
|
21 |
+
"hidden_act": "silu",
|
22 |
+
"hidden_size": 2048,
|
23 |
+
"initializer_range": 0.02,
|
24 |
+
"intermediate_size": 5504,
|
25 |
+
"max_position_embeddings": 8192,
|
26 |
+
"max_window_layers": 21,
|
27 |
+
"model_type": "qwen2",
|
28 |
+
"num_attention_heads": 16,
|
29 |
+
"num_hidden_layers": 24,
|
30 |
+
"num_key_value_heads": 16,
|
31 |
+
"pad_token_id": null,
|
32 |
+
"rms_norm_eps": 1e-06,
|
33 |
+
"rope_theta": 1000000.0,
|
34 |
+
"sliding_window": 4096,
|
35 |
+
"tie_word_embeddings": false,
|
36 |
+
"torch_dtype": "bfloat16",
|
37 |
+
"use_sliding_window": false,
|
38 |
+
"vocab_size": 151936
|
39 |
+
},
|
40 |
+
"tie_word_embeddings": false,
|
41 |
+
"torch_dtype": "bfloat16",
|
42 |
+
"transformers_version": "4.40.0",
|
43 |
+
"use_decoder_only_language_model": true,
|
44 |
+
"vision_config": {
|
45 |
+
"dropout": 0.0,
|
46 |
+
"initializer_factor": 1.0,
|
47 |
+
"model_type": "blip_2_vision_model",
|
48 |
+
"num_channels": 3,
|
49 |
+
"projection_dim": 512
|
50 |
+
}
|
51 |
+
}
|
runs/Apr22_06-37-13_bosshome/events.out.tfevents.1713767835.bosshome
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:211c37e2428b094b2d4e42f054844f09d4f0d4714546264faa3094f80d5379b2
|
3 |
+
size 3942
|
runs/Apr22_06-41-46_bosshome/events.out.tfevents.1713768108.bosshome
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3c727d5232a652c729fae930f9d88be9eee0256fcc175115f8fccec1c4cde79d
|
3 |
+
size 3942
|
runs/Apr22_06-43-04_bosshome/events.out.tfevents.1713768186.bosshome
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b7251f49fb42f0218ff7e7a90f61e649f78d81744161ac6e70d162b7046476e5
|
3 |
+
size 3940
|
runs/Apr22_06-44-47_bosshome/events.out.tfevents.1713768289.bosshome
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:13272051a1069757a7adaa9b9ecbc08f30c111dbd32eafe17c436feef4182d26
|
3 |
+
size 5358
|
runs/Apr22_06-54-42_bosshome/events.out.tfevents.1713768884.bosshome
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:96d4300ff774fdde0a8aa83ade56282166f675ab188a1a74a16da0272d3441d4
|
3 |
+
size 3940
|
runs/Apr22_07-00-41_bosshome/events.out.tfevents.1713769248.bosshome
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1096c1c35e2f2799d33dda4a9fbae913ca372b584472a9c574c8f52bd5c2c1a1
|
3 |
+
size 3940
|
runs/Apr22_07-02-20_bosshome/events.out.tfevents.1713769343.bosshome
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:44e3a9f6abbb74be55ed5af85a60869925dae059200dbd6b27f48d787b595ab5
|
3 |
+
size 3940
|
runs/Apr22_07-08-37_bosshome/events.out.tfevents.1713769736.bosshome
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:db6102a4a129df540baec7c80fd2e2cf7f3a6352e522bf32a8ad3146891d4e05
|
3 |
+
size 3940
|
runs/Apr22_07-19-12_bosshome/events.out.tfevents.1713770368.bosshome
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d6ba5261d8934a81c5d0e02a4fe222ce8e2325d2fb42094d2a6c193804b6e457
|
3 |
+
size 5201
|
runs/Apr22_07-31-40_bosshome/events.out.tfevents.1713771101.bosshome
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:da682925ef75ac1b34c10e622c7d4d0cf729ca0fd7a5221c9d429a6abe74c57a
|
3 |
+
size 5358
|
runs/Apr22_07-34-04_bosshome/events.out.tfevents.1713771246.bosshome
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:40631902c732920a5c6af472fcf4d73c652076f3eacf0718e0be6de7f9602807
|
3 |
+
size 5358
|
runs/Apr22_07-36-25_bosshome/events.out.tfevents.1713771387.bosshome
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f3e0d625c5f36a339a27cf5c5d11bb808ffcecd4fa426b8873e250421dbf8667
|
3 |
+
size 6184
|
training_args.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8280953a0aed469b56d42a5a41aeaa14353e18992136719e4418691a94bd95f6
|
3 |
+
size 4984
|