{
  "model_id": "nvidia/parakeet-ctc-0.6b-Vietnamese",
  "model_type": "ctc",
  "language": "",
  "sample_rate": 16000,
  "max_audio_seconds": 15.0,
  "max_audio_samples": 240000,
  "vocab_size": 1024,
  "blank_id": 1024,
  "checkpoint": {
    "type": "pretrained",
    "model_id": "nvidia/parakeet-ctc-0.6b-Vietnamese"
  },
  "coreml": {
    "compute_precision": "FLOAT32",
    "quantization": "none"
  },
  "components": {
    "mel_encoder": {
      "path": "parakeet_mel_encoder.mlpackage",
      "inputs": {
        "audio_signal": [
          1,
          240000
        ],
        "audio_length": [
          1
        ]
      },
      "outputs": {
        "encoder": [
          1,
          1024,
          188
        ],
        "encoder_length": [
          1
        ]
      }
    },
    "ctc_decoder": {
      "path": "parakeet_ctc_decoder.mlpackage",
      "inputs": {
        "encoder": [
          1,
          1024,
          188
        ]
      },
      "outputs": {
        "log_probs": [
          1,
          188,
          1025
        ]
      }
    }
  }
}