DevAsService committed on
Commit
5c4e6a2
·
verified ·
1 Parent(s): 7ee85b8

(Trained with Unsloth)

Browse files
Files changed (2) hide show
  1. config.json +123 -0
  2. tokenizer_config.json +3 -2
config.json ADDED
@@ -0,0 +1,123 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "architectures": [
3
+ "CsmForConditionalGeneration"
4
+ ],
5
+ "attention_bias": false,
6
+ "attention_dropout": 0.0,
7
+ "audio_eos_token_id": 128003,
8
+ "audio_token_id": 128002,
9
+ "bos_token_id": 128000,
10
+ "codebook_eos_token_id": 0,
11
+ "codebook_pad_token_id": 2050,
12
+ "codec_config": {
13
+ "_frame_rate": 12.5,
14
+ "_name_or_path": "kyutai/mimi",
15
+ "architectures": [
16
+ "MimiModel"
17
+ ],
18
+ "attention_bias": false,
19
+ "attention_dropout": 0.0,
20
+ "audio_channels": 1,
21
+ "codebook_dim": 256,
22
+ "codebook_size": 2048,
23
+ "compress": 2,
24
+ "dilation_growth_rate": 2,
25
+ "torch_dtype": "float16",
26
+ "head_dim": 64,
27
+ "hidden_act": "gelu",
28
+ "hidden_size": 512,
29
+ "initializer_range": 0.02,
30
+ "intermediate_size": 2048,
31
+ "kernel_size": 7,
32
+ "last_kernel_size": 3,
33
+ "layer_scale_initial_scale": 0.01,
34
+ "max_position_embeddings": 8000,
35
+ "model_type": "mimi",
36
+ "norm_eps": 1e-05,
37
+ "normalize": false,
38
+ "num_attention_heads": 8,
39
+ "num_filters": 64,
40
+ "num_hidden_layers": 8,
41
+ "num_key_value_heads": 8,
42
+ "num_quantizers": 32,
43
+ "num_residual_layers": 1,
44
+ "num_semantic_quantizers": 1,
45
+ "pad_mode": "constant",
46
+ "residual_kernel_size": 3,
47
+ "rope_theta": 10000.0,
48
+ "sampling_rate": 24000,
49
+ "sliding_window": 250,
50
+ "trim_right_ratio": 1.0,
51
+ "upsample_groups": 512,
52
+ "upsampling_ratios": [
53
+ 8,
54
+ 6,
55
+ 5,
56
+ 4
57
+ ],
58
+ "use_cache": false,
59
+ "use_causal_conv": true,
60
+ "use_conv_shortcut": false,
61
+ "use_streaming": false,
62
+ "vector_quantization_hidden_dimension": 256
63
+ },
64
+ "depth_decoder_config": {
65
+ "attention_bias": false,
66
+ "attention_dropout": 0.0,
67
+ "backbone_hidden_size": 2048,
68
+ "torch_dtype": "float16",
69
+ "head_dim": 128,
70
+ "hidden_act": "silu",
71
+ "hidden_size": 1024,
72
+ "initializer_range": 0.02,
73
+ "intermediate_size": 8192,
74
+ "max_position_embeddings": 33,
75
+ "mlp_bias": false,
76
+ "model_type": "csm_depth_decoder_model",
77
+ "num_attention_heads": 8,
78
+ "num_codebooks": 32,
79
+ "num_hidden_layers": 4,
80
+ "num_key_value_heads": 2,
81
+ "rms_norm_eps": 1e-05,
82
+ "rope_scaling": {
83
+ "factor": 32.0,
84
+ "high_freq_factor": 0.0078125,
85
+ "low_freq_factor": 0.001953125,
86
+ "original_max_position_embeddings": 16,
87
+ "rope_type": "llama3"
88
+ },
89
+ "rope_theta": 500000,
90
+ "use_cache": true,
91
+ "vocab_size": 2051
92
+ },
93
+ "torch_dtype": "float16",
94
+ "head_dim": 64,
95
+ "hidden_act": "silu",
96
+ "hidden_size": 2048,
97
+ "initializer_range": 0.02,
98
+ "intermediate_size": 8192,
99
+ "max_position_embeddings": 2048,
100
+ "mlp_bias": false,
101
+ "model_type": "csm",
102
+ "num_attention_heads": 32,
103
+ "num_codebooks": 32,
104
+ "num_hidden_layers": 16,
105
+ "num_key_value_heads": 8,
106
+ "pad_token_id": 128256,
107
+ "rms_norm_eps": 1e-05,
108
+ "rope_scaling": {
109
+ "factor": 32.0,
110
+ "high_freq_factor": 0.5,
111
+ "low_freq_factor": 0.125,
112
+ "original_max_position_embeddings": 1024,
113
+ "rope_type": "llama3"
114
+ },
115
+ "rope_theta": 500000,
116
+ "text_vocab_size": 128256,
117
+ "tie_codebooks_embeddings": true,
118
+ "tie_word_embeddings": false,
119
+ "transformers_version": "4.56.2",
120
+ "unsloth_version": "2025.10.3",
121
+ "use_cache": true,
122
+ "vocab_size": 2051
123
+ }
tokenizer_config.json CHANGED
@@ -2060,5 +2060,6 @@
2060
  "model_max_length": 131072,
2061
  "pad_token": "<|end_of_text|>",
2062
  "processor_class": "CsmProcessor",
2063
- "tokenizer_class": "PreTrainedTokenizerFast"
2064
- }
 
 
2060
  "model_max_length": 131072,
2061
  "pad_token": "<|end_of_text|>",
2062
  "processor_class": "CsmProcessor",
2063
+ "tokenizer_class": "PreTrainedTokenizerFast",
2064
+ "chat_template": "\n{%- for message in messages %}\n {#-- Validate role is a stringified integer --#}\n {%- if not message['role'] is string or not message['role'].isdigit() %}\n {{- raise_exception(\"The role must be an integer or a stringified integer (e.g. '0') designating the speaker id\") }}\n {%- endif %}\n\n {#-- Validate content is a list --#}\n {%- set content = message['content'] %}\n {%- if content is not iterable or content is string %}\n {{- raise_exception(\"The content must be a list\") }}\n {%- endif %}\n\n {#-- Collect content types --#}\n {%- set content_types = content | map(attribute='type') | list %}\n {%- set is_last = loop.last %}\n\n {#-- Last message validation --#}\n {%- if is_last %}\n {%- if 'text' not in content_types %}\n {{- raise_exception(\"The last message must include one item of type 'text'\") }}\n {%- elif (content_types | select('equalto', 'text') | list | length > 1) or (content_types | select('equalto', 'audio') | list | length > 1) %}\n {{- raise_exception(\"At most two items are allowed in the last message: one 'text' and one 'audio'\") }}\n {%- endif %}\n\n {#-- All other messages validation --#}\n {%- else %}\n {%- if content_types | select('equalto', 'text') | list | length != 1\n or content_types | select('equalto', 'audio') | list | length != 1 %}\n {{- raise_exception(\"Each message (except the last) must contain exactly one 'text' and one 'audio' item\") }}\n {%- elif content_types | reject('in', ['text', 'audio']) | list | length > 0 %}\n {{- raise_exception(\"Only 'text' and 'audio' types are allowed in content\") }}\n {%- endif %}\n {%- endif %}\n{%- endfor %}\n\n{%- for message in messages %}\n {{- bos_token }}\n {{- '[' + message['role'] + ']' }}\n {{- message['content'][0]['text'] }}\n {{- eos_token }}\n {%- if message['content']|length > 1 %}\n {{- '<|AUDIO|><|audio_eos|>' }}\n {%- endif %}\n{%- endfor %}\n"
2065
+ }