Automatic Speech Recognition
NeMo
Core ML
English
speech-recognition
FastConformer
end-of-utterance
voice agent
Instructions to use aoiandroid/parakeet-realtime-eou-120m-coreml with libraries, inference providers, notebooks, and local apps. Follow these links to get started.
- Libraries
- NeMo
How to use aoiandroid/parakeet-realtime-eou-120m-coreml with NeMo:
```python
import nemo.collections.asr as nemo_asr

asr_model = nemo_asr.models.ASRModel.from_pretrained("aoiandroid/parakeet-realtime-eou-120m-coreml")
transcriptions = asr_model.transcribe(["file.wav"])
```
- Notebooks
- Google Colab
- Kaggle
```json
[
  {
    "metadataOutputVersion" : "3.0",
    "shortDescription" : "Parakeet EOU decoder (RNNT prediction network)",
    "outputSchema" : [
      {
        "hasShapeFlexibility" : "0",
        "isOptional" : "0",
        "dataType" : "Float32",
        "formattedType" : "MultiArray (Float32 1 × 640 × 1)",
        "shortDescription" : "",
        "shape" : "[1, 640, 1]",
        "name" : "decoder",
        "type" : "MultiArray"
      },
      {
        "hasShapeFlexibility" : "0",
        "isOptional" : "0",
        "dataType" : "Float32",
        "formattedType" : "MultiArray (Float32 1 × 1 × 640)",
        "shortDescription" : "",
        "shape" : "[1, 1, 640]",
        "name" : "h_out",
        "type" : "MultiArray"
      },
      {
        "hasShapeFlexibility" : "0",
        "isOptional" : "0",
        "dataType" : "Float32",
        "formattedType" : "MultiArray (Float32 1 × 1 × 640)",
        "shortDescription" : "",
        "shape" : "[1, 1, 640]",
        "name" : "c_out",
        "type" : "MultiArray"
      }
    ],
    "storagePrecision" : "Float16",
    "modelParameters" : [
    ],
    "author" : "Fluid Inference",
    "specificationVersion" : 8,
    "mlProgramOperationTypeHistogram" : {
      "Ios17.squeeze" : 2,
      "Ios17.gather" : 1,
      "Ios17.cast" : 6,
      "Ios17.lstm" : 1,
      "Ios17.transpose" : 2,
      "Identity" : 1,
      "Ios17.expandDims" : 2
    },
    "computePrecision" : "Mixed (Float16, Float32, Int16, Int32)",
    "isUpdatable" : "0",
    "stateSchema" : [
    ],
    "availability" : {
      "macOS" : "14.0",
      "tvOS" : "17.0",
      "visionOS" : "1.0",
      "watchOS" : "10.0",
      "iOS" : "17.0",
      "macCatalyst" : "17.0"
    },
    "modelType" : {
      "name" : "MLModelType_mlProgram"
    },
    "inputSchema" : [
      {
        "hasShapeFlexibility" : "0",
        "isOptional" : "0",
        "dataType" : "Int32",
        "formattedType" : "MultiArray (Int32 1 × 1)",
        "shortDescription" : "",
        "shape" : "[1, 1]",
        "name" : "targets",
        "type" : "MultiArray"
      },
      {
        "hasShapeFlexibility" : "0",
        "isOptional" : "0",
        "dataType" : "Int32",
        "formattedType" : "MultiArray (Int32 1)",
        "shortDescription" : "",
        "shape" : "[1]",
        "name" : "target_length",
        "type" : "MultiArray"
      },
      {
        "hasShapeFlexibility" : "0",
        "isOptional" : "0",
        "dataType" : "Float32",
        "formattedType" : "MultiArray (Float32 1 × 1 × 640)",
        "shortDescription" : "",
        "shape" : "[1, 1, 640]",
        "name" : "h_in",
        "type" : "MultiArray"
      },
      {
        "hasShapeFlexibility" : "0",
        "isOptional" : "0",
        "dataType" : "Float32",
        "formattedType" : "MultiArray (Float32 1 × 1 × 640)",
        "shortDescription" : "",
        "shape" : "[1, 1, 640]",
        "name" : "c_in",
        "type" : "MultiArray"
      }
    ],
    "userDefinedMetadata" : {
      "com.github.apple.coremltools.version" : "8.3.0",
      "com.github.apple.coremltools.source" : "torch==2.4.0",
      "com.github.apple.coremltools.source_dialect" : "TorchScript"
    },
    "generatedClassName" : "parakeet_eou_decoder",
    "method" : "predict"
  }
]
```