# Python dependencies, one requirement specifier per line as required by
# pip's requirements-file format (`pip install -r <this file>`).
gradio>=5.0
huggingface_hub>=0.23
numpy>=1.24
soundfile>=0.12
# NOTE(review): no version constraint is given for this package, unlike the
# entries above — consider adding a lower bound once a known-good version
# is confirmed.
nemo_toolkit[asr]