Spaces:

stabilityai
/

stable-audio-3

Running on Zero

multimodalart HF Staff committed 1 day ago

Commit

d82866b

verified ·

1 Parent(s): 72c410e

swap torchaudio -> soundfile (avoid libcudart.so.12 load failure)

Files changed (2) hide show

app.py CHANGED Viewed

@@ -72,8 +72,8 @@ _ensure_stable_audio_tools()
 import gradio as gr
 import torch
-import torchaudio
 from einops import rearrange
 from stable_audio_tools import get_pretrained_model
@@ -216,7 +216,8 @@ def infer(
     output = output[:, : int(duration) * lv.sample_rate]
     out_path = os.path.join(tempfile.mkdtemp(), f"sa3_{variant_key}.wav")
-    torchaudio.save(out_path, output, lv.sample_rate)
     return out_path

 import gradio as gr
+import soundfile as sf
 import torch
 from einops import rearrange
 from stable_audio_tools import get_pretrained_model
     output = output[:, : int(duration) * lv.sample_rate]
     out_path = os.path.join(tempfile.mkdtemp(), f"sa3_{variant_key}.wav")
+    # soundfile expects (samples, channels); our tensor is (channels, samples).
+    sf.write(out_path, output.numpy().T, lv.sample_rate, subtype="PCM_16")
     return out_path

requirements.txt CHANGED Viewed

@@ -3,6 +3,7 @@
 # pre-installed) — its setup.py pulls flash-attn which fails to build in pip's
 # isolated env. See app.py.
 einops
 # PyWavelets 1.7+ ships wheels built for NumPy 2.x; older versions throw a
 # dtype-size ABI error on the ZeroGPU image.
 PyWavelets>=1.7.0

 # pre-installed) — its setup.py pulls flash-attn which fails to build in pip's
 # isolated env. See app.py.
 einops
+soundfile
 # PyWavelets 1.7+ ships wheels built for NumPy 2.x; older versions throw a
 # dtype-size ABI error on the ZeroGPU image.
 PyWavelets>=1.7.0