| aeiou |
| alias-free-torch==0.0.6 |
| auraloss==0.4.0 |
| descript-audio-codec==1.0.0 |
| decord==0.6.0 |
| einops |
| einops_exts |
| ema-pytorch==0.2.3 |
| encodec==0.1.1 |
| gradio==4.44.1 |
| gradio_client==1.3.0 |
| huggingface_hub>=0.16.0 |
| importlib-resources==5.12.0 |
| k-diffusion==0.1.1 |
| laion-clap==1.1.6 |
| local-attention==1.8.6 |
| pandas |
| pedalboard==0.9.14 |
| prefigure==0.0.9 |
| pytorch_lightning==2.1.0 |
| PyWavelets==1.4.1 |
| safetensors |
| sentencepiece==0.1.99 |
| torch>=2.1.0 |
| torchvision>=0.16.0 |
| torchaudio>=2.1.0 |
| torchmetrics==1.5.2 |
| tqdm |
| transformers==4.30.0 |
| v-diffusion-pytorch==0.0.2 |
| vector-quantize-pytorch==1.9.14 |
| wandb |
| webdataset==0.2.48 |
| x-transformers==1.42.11 |
| numpy<=2.0.0 |
| accelerate>=0.20.3 |
| scipy>=1.10.1 |
| librosa>=0.10.0 |
| ffmpeg-python>=0.2.0 |
| ninja |
| spaces |