# Python dependencies, one requirement per line (pip's requirements-file
# format does not accept several specifiers on a single line).

# diffusers is installed from the tip of the upstream repository (unpinned).
git+https://github.com/huggingface/diffusers.git

# Pinned torch stack.
torch==2.0.1
torchaudio==2.0.2
torchvision==0.15.2

# Numerics / data handling.
numpy<=1.23.5
scipy
pandas
einops

# Audio I/O and analysis.
soundfile
librosa

# Utilities.
tqdm
pyyaml

# NOTE(review): in the original single-line form these three names came after
# a `#` that also preceded an extra, commented-out `transformers` entry.
# Presumably only that first `transformers` was meant to be disabled and the
# packages below are real requirements - confirm before merging.
torchlibrosa
transformers
ftfy