RaushanTurganbay HF staff committed on
Commit
c2ef27c
1 Parent(s): 8ecee59

add video index

Browse files
added_tokens.json CHANGED
@@ -1,4 +1,5 @@
1
  {
2
  "<image>": 32001,
 
3
  "[PAD]": 32000
4
  }
 
1
  {
2
  "<image>": 32001,
3
+ "<video>": 32002,
4
  "[PAD]": 32000
5
  }
config.json CHANGED
@@ -44,6 +44,7 @@
44
  "torch_dtype": "float32",
45
  "transformers_version": "4.47.0.dev0",
46
  "use_decoder_only_language_model": true,
 
47
  "vision_config": {
48
  "_attn_implementation_autoset": true,
49
  "model_type": "instructblip_vision_model"
 
44
  "torch_dtype": "float32",
45
  "transformers_version": "4.47.0.dev0",
46
  "use_decoder_only_language_model": true,
47
+ "video_token_index": 32002,
48
  "vision_config": {
49
  "_attn_implementation_autoset": true,
50
  "model_type": "instructblip_vision_model"
qformer_tokenizer/tokenizer_config.json CHANGED
@@ -53,6 +53,7 @@
53
  "clean_up_tokenization_spaces": true,
54
  "cls_token": "[CLS]",
55
  "do_lower_case": true,
 
56
  "mask_token": "[MASK]",
57
  "model_max_length": 512,
58
  "pad_token": "[PAD]",
 
53
  "clean_up_tokenization_spaces": true,
54
  "cls_token": "[CLS]",
55
  "do_lower_case": true,
56
+ "extra_special_tokens": {},
57
  "mask_token": "[MASK]",
58
  "model_max_length": 512,
59
  "pad_token": "[PAD]",
tokenizer.json CHANGED
@@ -47,6 +47,15 @@
47
  "rstrip": false,
48
  "normalized": false,
49
  "special": true
 
 
 
 
 
 
 
 
 
50
  }
51
  ],
52
  "normalizer": {
 
47
  "rstrip": false,
48
  "normalized": false,
49
  "special": true
50
+ },
51
+ {
52
+ "id": 32002,
53
+ "content": "<video>",
54
+ "single_word": false,
55
+ "lstrip": false,
56
+ "rstrip": false,
57
+ "normalized": false,
58
+ "special": true
59
  }
60
  ],
61
  "normalizer": {
tokenizer_config.json CHANGED
@@ -42,11 +42,20 @@
42
  "rstrip": false,
43
  "single_word": false,
44
  "special": true
 
 
 
 
 
 
 
 
45
  }
46
  },
47
  "bos_token": "</s>",
48
  "clean_up_tokenization_spaces": false,
49
  "eos_token": "</s>",
 
50
  "legacy": true,
51
  "model_max_length": 2048,
52
  "pad_token": "[PAD]",
 
42
  "rstrip": false,
43
  "single_word": false,
44
  "special": true
45
+ },
46
+ "32002": {
47
+ "content": "<video>",
48
+ "lstrip": false,
49
+ "normalized": false,
50
+ "rstrip": false,
51
+ "single_word": false,
52
+ "special": true
53
  }
54
  },
55
  "bos_token": "</s>",
56
  "clean_up_tokenization_spaces": false,
57
  "eos_token": "</s>",
58
+ "extra_special_tokens": {},
59
  "legacy": true,
60
  "model_max_length": 2048,
61
  "pad_token": "[PAD]",