# Python dependencies, one requirement specifier per line (pip requirements format).
# Install with: pip install -r <this file>
#
# NOTE(review): huggingface_hub is pinned to an exact version while gradio,
# transformers and accelerate use ranges; each of those declares its own
# huggingface_hub requirement, so this pin may limit which releases the
# resolver can select -- confirm the set resolves before loosening or
# bumping any single entry.
gradio>=4.0.0,<5.0.0
requests>=2.30.0
tqdm>=4.66.0
torch==2.0.1
transformers>=4.30.0,<4.36.0
diffusers==0.21.4
huggingface_hub==0.16.4
accelerate>=0.24.0
einops>=0.7.0
omegaconf>=2.0.0
librosa>=0.9.0
soundfile>=0.12.0