DongfuJiang
committed on
Commit
•
d2e46e5
1
Parent(s):
9f51357
Training in progress, step 39
Browse files
- config.json +1 -0
- initial_model/config.json +29 -0
- initial_model/model.safetensors +3 -0
- model.safetensors +1 -1
- training_args.bin +1 -1
config.json
CHANGED
@@ -1,4 +1,5 @@
 {
+  "_name_or_path": "../../checkpoints/siglip-so400m-patch14-384/siglip-video_16384/initial_model",
   "architectures": [
     "SiglipVideoModel"
   ],
initial_model/config.json
ADDED
@@ -0,0 +1,29 @@
+{
+  "architectures": [
+    "SiglipVideoModel"
+  ],
+  "initializer_factor": 1.0,
+  "model_type": "siglip_video",
+  "perceiver_config": {
+    "_attn_implementation_autoset": true,
+    "model_type": "siglip_video_perceiver"
+  },
+  "text_config": {
+    "hidden_size": 1152,
+    "intermediate_size": 4304,
+    "model_type": "siglip_text_model",
+    "num_attention_heads": 16,
+    "num_hidden_layers": 27
+  },
+  "torch_dtype": "bfloat16",
+  "transformers_version": "4.47.1",
+  "vision_config": {
+    "hidden_size": 1152,
+    "image_size": 384,
+    "intermediate_size": 4304,
+    "model_type": "siglip_vision_model",
+    "num_attention_heads": 16,
+    "num_hidden_layers": 27,
+    "patch_size": 14
+  }
+}
initial_model/model.safetensors
ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:f3c060a01c78afa749ae65e6dafdfab404ef427e2caf8477a0b88321c9b078b9
+size 1908776156
model.safetensors
CHANGED
@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:
+oid sha256:a69d2eff5f9e67eb7cbdf96da4ddd284e8c61a9d11909a4833c5077454ad200b
 size 1908776156
training_args.bin
CHANGED
@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:
+oid sha256:2babfac6d2015857e2311adcab661baead4b4af170cff1a8f9f1498e55867941
 size 6712