Nekochu committed on
Commit
4393113
·
1 Parent(s): 6fa797e

fix: use q5_0 quantization type (q5_k_m not supported by sd.cpp)

Browse files
Files changed (2) hide show
  1. Dockerfile +2 -2
  2. app.py +1 -1
Dockerfile CHANGED
@@ -44,8 +44,8 @@ RUN curl -fL --retry 3 --retry-delay 5 -o /app/models/z-anime-distill-4step-bf16
44
  "https://huggingface.co/SeeSee21/Z-Anime/resolve/main/diffusion_models/z-anime-distill-4step-bf16.safetensors" \
45
  && /app/sd-cli -M convert \
46
  -m /app/models/z-anime-distill-4step-bf16.safetensors \
47
- -o /app/models/z-anime-distill-4step-Q5_K_M.gguf \
48
- --type q5_k_m \
49
  && rm /app/models/z-anime-distill-4step-bf16.safetensors
50
 
51
  # Download Qwen3-4B text encoder Q8_0 GGUF (~4.28GB)
 
44
  "https://huggingface.co/SeeSee21/Z-Anime/resolve/main/diffusion_models/z-anime-distill-4step-bf16.safetensors" \
45
  && /app/sd-cli -M convert \
46
  -m /app/models/z-anime-distill-4step-bf16.safetensors \
47
+ -o /app/models/z-anime-distill-4step-Q5_0.gguf \
48
+ --type q5_0 \
49
  && rm /app/models/z-anime-distill-4step-bf16.safetensors
50
 
51
  # Download Qwen3-4B text encoder Q8_0 GGUF (~4.28GB)
app.py CHANGED
@@ -7,7 +7,7 @@ import gradio as gr
7
  # ---------------------------------------------------------------------------
8
  # Model paths (downloaded at build time)
9
  # ---------------------------------------------------------------------------
10
- DIFFUSION = "/app/models/z-anime-distill-4step-Q5_K_M.gguf"
11
  LLM = "/app/models/qwen3_4b_q8_0.gguf"
12
  VAE = "/app/models/ae.safetensors"
13
 
 
7
  # ---------------------------------------------------------------------------
8
  # Model paths (downloaded at build time)
9
  # ---------------------------------------------------------------------------
10
+ DIFFUSION = "/app/models/z-anime-distill-4step-Q5_0.gguf"
11
  LLM = "/app/models/qwen3_4b_q8_0.gguf"
12
  VAE = "/app/models/ae.safetensors"
13