madroid committed on
Commit
6817bfc
1 Parent(s): d27e5f8

add small int8 model

Browse files
small.en/small.en_cpu_int8.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:acdd8b5e343bf07e46c8a37e169d6f1f1691e5118ce5c7505f95a1c508646108
3
+ size 442984159
small.en/whisper_cpu_int8_cpu-cpu_metrics .json ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ {
2
+ "latency-avg": {
3
+ "value": 9164.66956,
4
+ "priority": 1,
5
+ "higher_is_better": false
6
+ }
7
+ }
small.en/whisper_cpu_int8_cpu-cpu_model.json ADDED
@@ -0,0 +1,31 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "type": "ONNXModel",
3
+ "config": {
4
+ "model_path": "/content/Olive/examples/whisper/models/conversion-transformers_optimization-onnx_dynamic_quantization-insert_beam_search-prepost/whisper_cpu_int8_cpu-cpu_model.onnx",
5
+ "onnx_file_name": null,
6
+ "inference_settings": null,
7
+ "use_ort_extensions": true,
8
+ "hf_config": {
9
+ "model_name": "openai/whisper-small.en",
10
+ "task": null,
11
+ "feature": null,
12
+ "model_class": "WhisperForConditionalGeneration",
13
+ "components": [
14
+ {
15
+ "name": "encoder_decoder_init",
16
+ "io_config": "get_encdec_io_config",
17
+ "component_func": "get_encoder_decoder_init",
18
+ "dummy_inputs_func": "encoder_decoder_init_dummy_inputs"
19
+ },
20
+ {
21
+ "name": "decoder",
22
+ "io_config": "get_dec_io_config",
23
+ "component_func": "get_decoder",
24
+ "dummy_inputs_func": "decoder_dummy_inputs"
25
+ }
26
+ ],
27
+ "dataset": null,
28
+ "model_loading_args": null
29
+ }
30
+ }
31
+ }
small/small-whisper_cpu_int8-2.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ce1b414bd1a2226d5eda170027c2b77175d0e9d52775b4a3575bafdbb1d3c661
3
+ size 443023501
small/whisper_cpu_int8_cpu-cpu_metrics.json ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ {
2
+ "latency-avg": {
3
+ "value": 9404.15679,
4
+ "priority": 1,
5
+ "higher_is_better": false
6
+ }
7
+ }
small/whisper_cpu_int8_cpu-cpu_model.json ADDED
@@ -0,0 +1,31 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "type": "ONNXModel",
3
+ "config": {
4
+ "model_path": "/content/Olive/examples/whisper/models/conversion-transformers_optimization-onnx_dynamic_quantization-insert_beam_search-prepost/whisper_cpu_int8_cpu-cpu_model.onnx",
5
+ "onnx_file_name": null,
6
+ "inference_settings": null,
7
+ "use_ort_extensions": true,
8
+ "hf_config": {
9
+ "model_name": "openai/whisper-small",
10
+ "task": null,
11
+ "feature": null,
12
+ "model_class": "WhisperForConditionalGeneration",
13
+ "components": [
14
+ {
15
+ "name": "encoder_decoder_init",
16
+ "io_config": "get_encdec_io_config",
17
+ "component_func": "get_encoder_decoder_init",
18
+ "dummy_inputs_func": "encoder_decoder_init_dummy_inputs"
19
+ },
20
+ {
21
+ "name": "decoder",
22
+ "io_config": "get_dec_io_config",
23
+ "component_func": "get_decoder",
24
+ "dummy_inputs_func": "decoder_dummy_inputs"
25
+ }
26
+ ],
27
+ "dataset": null,
28
+ "model_loading_args": null
29
+ }
30
+ }
31
+ }