felixem committed on
Commit
cbe76d8
·
verified ·
1 Parent(s): 62de961

Add ONNX FP32 models

Browse files
.gitattributes CHANGED
@@ -33,3 +33,6 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ onnx/decoder_model.onnx.data filter=lfs diff=lfs merge=lfs -text
37
+ onnx/decoder_with_past_model.onnx.data filter=lfs diff=lfs merge=lfs -text
38
+ onnx/encoder_model.onnx.data filter=lfs diff=lfs merge=lfs -text
onnx/config.json ADDED
@@ -0,0 +1,73 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "attention_bias": false,
3
+ "attention_dropout": 0.0,
4
+ "bos_token_id": 1,
5
+ "decoder_start_token_id": 1,
6
+ "dtype": "float32",
7
+ "encoder_config": {
8
+ "attention_bias": false,
9
+ "attention_dropout": 0.0,
10
+ "dtype": "float32",
11
+ "frame_ms": 5.0,
12
+ "head_dim": 40,
13
+ "hidden_act": "gelu",
14
+ "hidden_size": 320,
15
+ "intermediate_size": 1280,
16
+ "max_position_embeddings": 4096,
17
+ "model_type": "moonshine_streaming_encoder",
18
+ "num_attention_heads": 8,
19
+ "num_hidden_layers": 6,
20
+ "num_key_value_heads": 8,
21
+ "sample_rate": 16000,
22
+ "sliding_windows": [
23
+ [
24
+ 16,
25
+ 4
26
+ ],
27
+ [
28
+ 16,
29
+ 4
30
+ ],
31
+ [
32
+ 16,
33
+ 0
34
+ ],
35
+ [
36
+ 16,
37
+ 0
38
+ ],
39
+ [
40
+ 16,
41
+ 4
42
+ ],
43
+ [
44
+ 16,
45
+ 4
46
+ ]
47
+ ]
48
+ },
49
+ "encoder_hidden_size": 320,
50
+ "eos_token_id": 2,
51
+ "ffn_mult": 4,
52
+ "head_dim": 40,
53
+ "hidden_act": "silu",
54
+ "hidden_size": 320,
55
+ "intermediate_size": 1280,
56
+ "is_encoder_decoder": true,
57
+ "max_position_embeddings": 4096,
58
+ "model_type": "moonshine_streaming",
59
+ "num_attention_heads": 8,
60
+ "num_hidden_layers": 6,
61
+ "num_key_value_heads": 8,
62
+ "pad_head_dim_to_multiple_of": null,
63
+ "pad_token_id": 0,
64
+ "rope_parameters": {
65
+ "partial_rotary_factor": 0.8,
66
+ "rope_theta": 10000.0,
67
+ "rope_type": "default"
68
+ },
69
+ "tie_word_embeddings": false,
70
+ "transformers_version": "5.6.2",
71
+ "use_cache": true,
72
+ "vocab_size": 32768
73
+ }
onnx/decoder_model.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:740bad720c0f5c9a85d136e8dcf663ae1e0c1983d08b02fd16c72f319cc412ed
3
+ size 1133251
onnx/decoder_model.onnx.data ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:706c2c14ea7b82968111bfa7d8aa2d80a4f37c2bb35eaa1e0bfc7cd9873207e8
3
+ size 138412032
onnx/decoder_with_past_model.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f5291822f80aa9b76a7c2511290a6edb54a256e7ca7ae4fd93e7213f63ae80ca
3
+ size 1163100
onnx/decoder_with_past_model.onnx.data ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c03f554a4180eba9171ffe0d8ba698c02cee25d727d7f04add71fdf3e14b8157
3
+ size 128253952
onnx/encoder_model.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:de20c3c602636498980194646bbc87b219c74c5d8eaa769ff8328da0929f7d05
3
+ size 699936
onnx/encoder_model.onnx.data ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b990c5914f11fe7b5a393afebdc1cc41c2f295e3aee04d3e4f6aef65b1f46dc9
3
+ size 37912576
onnx/processor_config.json ADDED
@@ -0,0 +1,13 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "feature_extractor": {
3
+ "do_normalize": false,
4
+ "feature_extractor_type": "Wav2Vec2FeatureExtractor",
5
+ "feature_size": 1,
6
+ "pad_to_multiple_of": 80,
7
+ "padding_side": "right",
8
+ "padding_value": 0.0,
9
+ "return_attention_mask": true,
10
+ "sampling_rate": 16000
11
+ },
12
+ "processor_class": "MoonshineStreamingProcessor"
13
+ }
onnx/tokenizer.json ADDED
The diff for this file is too large to render. See raw diff
 
onnx/tokenizer_config.json ADDED
@@ -0,0 +1,12 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "backend": "tokenizers",
3
+ "bos_token": "<s>",
4
+ "eos_token": "</s>",
5
+ "is_local": false,
6
+ "local_files_only": false,
7
+ "model_max_length": 4096,
8
+ "pad_token": "<unk>",
9
+ "processor_class": "MoonshineStreamingProcessor",
10
+ "tokenizer_class": "TokenizersBackend",
11
+ "unk_token": "<unk>"
12
+ }