# Pinned Python dependencies, one requirement specifier per line
# (pip does not accept several specifiers on a single line).
gradio==3.41.2
transformers==4.32.0
torch==2.0.1
torchvision==0.15.2
pillow==10.0.0
pydub==0.25.1
SpeechRecognition==3.9.0
sentencepiece==0.1.99