Spaces:

techfreakworm
/

ACE-Music-Studio

Running on Zero

App Files Files Community

techfreakworm committed 3 days ago

Commit

c9f8dd1

unverified ·

1 Parent(s): aac47cf

feat(lora): add safetensors header sniff with ace-step module check

Browse files

Files changed (2) hide show

lora_stack.py +122 -0
tests/test_lora_stack.py +65 -0

lora_stack.py ADDED Viewed

	@@ -0,0 +1,122 @@

+"""LoRA stack: sniff/validate user-uploaded .safetensors files and
+manage which one is active on the ACE-Step DiT handler.
+Single-LoRA semantics
+---------------------
+The Apple-Silicon ACE-Step fork's AceStepHandler exposes a one-LoRA-
+at-a-time API (load_lora / unload_lora / set_use_lora / set_lora_scale),
+not the multi-adapter PEFT pattern the plan's Task D3 originally
+described. ``apply_stack(pipe, stack)`` therefore supports:
+- empty stack -> ``unload_lora`` + ``set_use_lora(False)``
+- single-entry stack -> ``load_lora(path)`` + ``set_lora_scale(scale)``
+  + ``set_use_lora(True)``
+- multi-entry stack -> use only the first, log a warning
+If the upstream pipeline ever exposes multi-adapter support, this
+function can be extended without changing the wrapper's call sites.
+"""
+from __future__ import annotations
+import json
+import struct
+from dataclasses import dataclass
+from pathlib import Path
+# Expected DiT module suffixes for ACE-Step 1.5 XL SFT.
+# Match against `*.to_q.lora_A.weight`, etc.
+_EXPECTED_MODULES = {"to_q", "to_k", "to_v", "to_out.0", "ff.net.0.proj", "ff.net.2"}
+_MAX_FILE_BYTES = 500 * 1024 * 1024  # 500 MB cap
+_MAX_RANK = 256
+class LoRAValidationError(ValueError):
+    """Raised when a LoRA file fails validation."""
+@dataclass
+class LoRAInfo:
+    path: Path
+    compatible: bool
+    rank: int
+    alpha: int | None
+    target_modules: set[str]
+    diagnostic: str
+    file_size: int
+def sniff(path: Path | str) -> LoRAInfo:
+    """Read the safetensors header; do not materialise tensors."""
+    path = Path(path)
+    if not path.exists():
+        raise LoRAValidationError(f"File not found: {path}")
+    file_size = path.stat().st_size
+    if file_size > _MAX_FILE_BYTES:
+        raise LoRAValidationError(
+            f"File too large ({file_size / 1e6:.0f} MB > {_MAX_FILE_BYTES / 1e6:.0f} MB cap)."
+        )
+    with open(path, "rb") as f:
+        header_len_bytes = f.read(8)
+        if len(header_len_bytes) < 8:
+            raise LoRAValidationError("Not a valid .safetensors file (truncated)")
+        header_len = struct.unpack("<Q", header_len_bytes)[0]
+        if header_len <= 0 or header_len > 10 * 1024 * 1024:
+            raise LoRAValidationError(f"Unreasonable header length: {header_len}")
+        header_bytes = f.read(header_len)
+    try:
+        header = json.loads(header_bytes)
+    except json.JSONDecodeError as e:
+        raise LoRAValidationError(f"Invalid header JSON: {e}") from e
+    target_modules: set[str] = set()
+    rank = 0
+    alpha = None
+    has_ace_prefix = False
+    for k, v in header.items():
+        if k == "__metadata__":
+            if isinstance(v, dict):
+                if "lora_alpha" in v:
+                    try:
+                        alpha = int(v["lora_alpha"])
+                    except (TypeError, ValueError):
+                        pass
+            continue
+        if not isinstance(v, dict) or "shape" not in v:
+            continue
+        # ACE-Step DiT keys start with "transformer." (the diffusers DiT prefix).
+        # SDXL UNet LoRAs start with "unet." — reject those even though the
+        # inner attention layer names overlap (`.to_q.lora_A.weight`).
+        if k.startswith("transformer.") or k.startswith("transformer_blocks."):
+            has_ace_prefix = True
+        # Extract module suffix from things like "transformer.blocks.0.attn.to_q.lora_A.weight"
+        for suffix in _EXPECTED_MODULES:
+            if f".{suffix}.lora_A.weight" in k or f".{suffix}.lora_B.weight" in k:
+                target_modules.add(suffix)
+                if "lora_A.weight" in k:
+                    rank = max(rank, int(v["shape"][0]))
+                break
+    compatible = has_ace_prefix and bool(target_modules) and (rank > 0) and (rank <= _MAX_RANK)
+    diagnostic = (
+        "OK"
+        if compatible
+        else (
+            f"Expected ACE-Step DiT modules ({sorted(_EXPECTED_MODULES)}), got modules in: "
+            f"{sorted(set(header.keys()) - {'__metadata__'})[:3]}…"
+        )
+    )
+    return LoRAInfo(
+        path=path,
+        compatible=compatible,
+        rank=rank,
+        alpha=alpha,
+        target_modules=target_modules,
+        diagnostic=diagnostic,
+        file_size=file_size,
+    )

tests/test_lora_stack.py ADDED Viewed

	@@ -0,0 +1,65 @@

+"""L1 tests for LoRA header sniffing — no torch, no pipeline."""
+from __future__ import annotations
+import json
+import struct
+from pathlib import Path
+import pytest
+import lora_stack as ls
def _write_safetensors(path: Path, key_dict: dict[str, dict]) -> None:
    """Write a minimal safetensors-shaped file for header tests.

    Layout: an 8-byte little-endian header length, the JSON-encoded
    ``key_dict``, then 8 zero bytes standing in for tensor data.
    """
    encoded_header = json.dumps(key_dict).encode("utf-8")
    length_prefix = struct.pack("<Q", len(encoded_header))
    filler = bytes(8)  # dummy tensor payload
    path.write_bytes(b"".join((length_prefix, encoded_header, filler)))
def test_sniff_accepts_ace_step_lora(tmp_path):
    """A ``transformer.``-prefixed to_q LoRA pair is reported as compatible."""
    lora_a = {"dtype": "BF16", "shape": [64, 768], "data_offsets": [0, 8]}
    lora_b = {"dtype": "BF16", "shape": [768, 64], "data_offsets": [0, 8]}
    header = {
        "transformer.blocks.0.attn.to_q.lora_A.weight": lora_a,
        "transformer.blocks.0.attn.to_q.lora_B.weight": lora_b,
    }
    lora_file = tmp_path / "psytrance.safetensors"
    _write_safetensors(lora_file, header)

    result = ls.sniff(lora_file)

    assert result.compatible is True
    # Rank is read from the leading dimension of the lora_A tensor.
    assert result.rank == 64
    assert "to_q" in result.target_modules
def test_sniff_rejects_sdxl_lora(tmp_path):
    """A ``unet.``-prefixed key is flagged incompatible despite the to_q suffix."""
    sdxl_key = "unet.down_blocks.0.attentions.0.transformer_blocks.0.attn1.to_q.lora_A.weight"
    tensor_entry = {"dtype": "F16", "shape": [16, 320], "data_offsets": [0, 8]}
    lora_file = tmp_path / "sdxl.safetensors"
    _write_safetensors(lora_file, {sdxl_key: tensor_entry})

    result = ls.sniff(lora_file)

    assert result.compatible is False
    assert "expected" in result.diagnostic.lower()
def test_sniff_rejects_oversize(tmp_path):
    """A file larger than the size cap raises ``LoRAValidationError``."""
    p = tmp_path / "huge.safetensors"
    # sniff() only looks at the reported file size for this check, so extend
    # an empty file with truncate() instead of building and writing a 600 MB
    # bytes object. On most filesystems this produces a sparse file.
    with p.open("wb") as f:
        f.truncate(600 * 1024 * 1024)
    with pytest.raises(ls.LoRAValidationError, match="too large"):
        ls.sniff(p)