|
|
--- |
|
|
license: cc-by-4.0 |
|
|
thumbnail: null |
|
|
widget: |
|
|
- example_title: Librispeech sample 1 |
|
|
src: https://cdn-media.huggingface.co/speech_samples/sample1.flac |
|
|
- example_title: Librispeech sample 2 |
|
|
src: https://cdn-media.huggingface.co/speech_samples/sample2.flac |
|
|
metrics: |
|
|
- wer |
|
|
tags: |
|
|
- automatic-speech-recognition |
|
|
- speech |
|
|
- audio |
|
|
- Transducer |
|
|
- TDT |
|
|
- FastConformer |
|
|
- Conformer |
|
|
- pytorch |
|
|
- NeMo |
|
|
- hf-asr-leaderboard |
|
|
language: |
|
|
- en |
|
|
pipeline_tag: automatic-speech-recognition |
|
|
library_name: nemo |
|
|
base_model: |
|
|
- nvidia/parakeet-tdt-0.6b-v2 |
|
|
--- |
|
|
|
|
|
Parakeet TDT 0.6B V2 (En) |
|
|
|
|
|
This model is a work in progress. Follow this [repo](https://github.com/FluidInference/FluidAudio) for updates; the models will continue to change as we tune them.