Text-to-Image
Diffusers
Safetensors
LensPipeline
lens
sdnq
uint4
static-quantization
ablation
model-cpu-offload
Instructions to use WaveCut/Lens-SDNQ-uint4-static with libraries, inference providers, notebooks, and local apps. Follow these links to get started.
- Libraries
- Diffusers
How to use WaveCut/Lens-SDNQ-uint4-static with Diffusers:
pip install -U diffusers transformers accelerate
import torch from diffusers import DiffusionPipeline # switch to "mps" for apple devices pipe = DiffusionPipeline.from_pretrained("WaveCut/Lens-SDNQ-uint4-static", dtype=torch.bfloat16, device_map="cuda") prompt = "Astronaut in a jungle, cold color palette, muted colors, detailed, 8k" image = pipe(prompt).images[0] - Notebooks
- Google Colab
- Kaggle
- Local Apps
- Draw Things
- DiffusionBee
Add files using upload-large-folder tool
Browse files- .gitattributes +36 -0
- README.md +206 -0
- assets/comparison/comparison_grid_1to1_q98.webp +3 -0
- benchmark_metrics.json +349 -0
- comparison_matrix.json +362 -0
- model_cpu_offload_benchmark.json +363 -0
- model_index.json +24 -0
- scheduler/scheduler_config.json +18 -0
- sdnq_quantization_summary.json +62 -0
- text_encoder/config.json +78 -0
- text_encoder/generation_config.json +11 -0
- text_encoder/model-00001-of-00003.safetensors +3 -0
- text_encoder/model-00002-of-00003.safetensors +3 -0
- text_encoder/model-00003-of-00003.safetensors +3 -0
- text_encoder/model.safetensors.index.json +467 -0
- tokenizer/chat_template.jinja +331 -0
- tokenizer/tokenizer.json +3 -0
- tokenizer/tokenizer_config.json +15 -0
- transformer/config.json +476 -0
- transformer/diffusion_pytorch_model-00001-of-00002.safetensors +3 -0
- transformer/diffusion_pytorch_model-00002-of-00002.safetensors +3 -0
- transformer/diffusion_pytorch_model.safetensors.index.json +0 -0
- transformer/quantization_config.json +449 -0
- vae/config.json +40 -0
- vae/diffusion_pytorch_model.safetensors +3 -0
.gitattributes
CHANGED
|
@@ -33,3 +33,39 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
|
| 33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
| 34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
| 35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
| 34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
| 35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
| 36 |
+
assets/gallery/000-1440x1440.png filter=lfs diff=lfs merge=lfs -text
|
| 37 |
+
assets/gallery/001-1440x1440.png filter=lfs diff=lfs merge=lfs -text
|
| 38 |
+
assets/gallery/002-1440x1440.png filter=lfs diff=lfs merge=lfs -text
|
| 39 |
+
assets/gallery/003-1248x1664.png filter=lfs diff=lfs merge=lfs -text
|
| 40 |
+
assets/gallery/004-1664x1248.png filter=lfs diff=lfs merge=lfs -text
|
| 41 |
+
assets/gallery/005-1664x1248.png filter=lfs diff=lfs merge=lfs -text
|
| 42 |
+
assets/gallery/006-1248x1664.png filter=lfs diff=lfs merge=lfs -text
|
| 43 |
+
assets/gallery/007-1440x1440.png filter=lfs diff=lfs merge=lfs -text
|
| 44 |
+
assets/gallery/008-1440x1440.png filter=lfs diff=lfs merge=lfs -text
|
| 45 |
+
assets/gallery/009-1664x1248.png filter=lfs diff=lfs merge=lfs -text
|
| 46 |
+
assets/gallery/010-1664x1248.png filter=lfs diff=lfs merge=lfs -text
|
| 47 |
+
assets/gallery/011-1664x1248.png filter=lfs diff=lfs merge=lfs -text
|
| 48 |
+
assets/gallery/012-1664x1248.png filter=lfs diff=lfs merge=lfs -text
|
| 49 |
+
assets/gallery/013-1664x1248.png filter=lfs diff=lfs merge=lfs -text
|
| 50 |
+
assets/gallery/014-1248x1664.png filter=lfs diff=lfs merge=lfs -text
|
| 51 |
+
assets/gallery/015-1248x1664.png filter=lfs diff=lfs merge=lfs -text
|
| 52 |
+
assets/gallery/016-1664x1248.png filter=lfs diff=lfs merge=lfs -text
|
| 53 |
+
assets/gallery/017-1248x1664.png filter=lfs diff=lfs merge=lfs -text
|
| 54 |
+
assets/gallery/018-1248x1664.png filter=lfs diff=lfs merge=lfs -text
|
| 55 |
+
assets/gallery/019-1664x1248.png filter=lfs diff=lfs merge=lfs -text
|
| 56 |
+
assets/gallery/020-1664x1248.png filter=lfs diff=lfs merge=lfs -text
|
| 57 |
+
assets/gallery/021-1664x1248.png filter=lfs diff=lfs merge=lfs -text
|
| 58 |
+
assets/gallery/022-1440x1440.png filter=lfs diff=lfs merge=lfs -text
|
| 59 |
+
assets/gallery/023-1248x1664.png filter=lfs diff=lfs merge=lfs -text
|
| 60 |
+
assets/gallery/024-1664x1248.png filter=lfs diff=lfs merge=lfs -text
|
| 61 |
+
assets/gallery/025-1664x1248.png filter=lfs diff=lfs merge=lfs -text
|
| 62 |
+
assets/gallery/026-1664x1248.png filter=lfs diff=lfs merge=lfs -text
|
| 63 |
+
assets/gallery/027-1664x1248.png filter=lfs diff=lfs merge=lfs -text
|
| 64 |
+
assets/gallery/028-1248x1664.png filter=lfs diff=lfs merge=lfs -text
|
| 65 |
+
assets/gallery/029-1664x1248.png filter=lfs diff=lfs merge=lfs -text
|
| 66 |
+
assets/gallery/030-1664x1248.png filter=lfs diff=lfs merge=lfs -text
|
| 67 |
+
assets/gallery/031-1664x1248.png filter=lfs diff=lfs merge=lfs -text
|
| 68 |
+
assets/teaser.webp filter=lfs diff=lfs merge=lfs -text
|
| 69 |
+
tokenizer/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 70 |
+
assets/teaser.png filter=lfs diff=lfs merge=lfs -text
|
| 71 |
+
assets/comparison/comparison_grid_1to1_q98.webp filter=lfs diff=lfs merge=lfs -text
|
README.md
ADDED
|
@@ -0,0 +1,206 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
---
|
| 2 |
+
license: mit
|
| 3 |
+
base_model: microsoft/Lens
|
| 4 |
+
pipeline_tag: text-to-image
|
| 5 |
+
tags:
|
| 6 |
+
- lens
|
| 7 |
+
- text-to-image
|
| 8 |
+
- sdnq
|
| 9 |
+
- uint4
|
| 10 |
+
- static-quantization
|
| 11 |
+
- ablation
|
| 12 |
+
- model-cpu-offload
|
| 13 |
+
---
|
| 14 |
+
|
| 15 |
+
# Lens SDNQ uint4 static
|
| 16 |
+
|
| 17 |
+
This is a corrected SDNQ static UINT4 quantized variant of [microsoft/Lens](https://huggingface.co/microsoft/Lens).
|
| 18 |
+
|
| 19 |
+
The recipe follows the Lens-Turbo ablation result: all-linear UINT4 quantization can introduce periodic grid artifacts and severe text degradation when transformer modulation linears are quantized. This checkpoint keeps `*.img_mod.*` and `*.txt_mod.*` in bfloat16 and quantizes the rest of the denoising transformer with SDNQ UINT4.
|
| 20 |
+
|
| 21 |
+
## Visual Comparison
|
| 22 |
+
|
| 23 |
+
**Full-size comparison grid:** the image below is built from native 1440x1440 samples without resampling the image cells and saved as WebP quality 98. Raw file: [assets/comparison/comparison_grid_1to1_q98.webp](https://huggingface.co/WaveCut/Lens-SDNQ-uint4-static/resolve/main/assets/comparison/comparison_grid_1to1_q98.webp).
|
| 24 |
+
|
| 25 |
+

|
| 26 |
+
|
| 27 |
+
## Quantization Recipe
|
| 28 |
+
|
| 29 |
+
| Field | Value |
|
| 30 |
+
| --- | --- |
|
| 31 |
+
| Method | SDNQ uint4 static |
|
| 32 |
+
| Source model | `microsoft/Lens` |
|
| 33 |
+
| Quantized component | Denoising transformer |
|
| 34 |
+
| Text encoder | Unchanged upstream GPT-OSS text encoder |
|
| 35 |
+
| VAE | Unchanged upstream VAE |
|
| 36 |
+
| `weights_dtype` | `uint4` |
|
| 37 |
+
| `quantized_matmul_dtype` | `int8` |
|
| 38 |
+
| `use_quantized_matmul` | `true` |
|
| 39 |
+
| `group_size` | `0` |
|
| 40 |
+
| `dequantize_fp32` | `false` |
|
| 41 |
+
| Critical skip rule | `*.img_mod.*`, `*.txt_mod.*` kept in bfloat16 |
|
| 42 |
+
|
| 43 |
+
## Usage
|
| 44 |
+
|
| 45 |
+
Run from the cloned [microsoft/Lens](https://github.com/microsoft/Lens) repo root so the custom Lens classes are registered.
|
| 46 |
+
|
| 47 |
+
```python
|
| 48 |
+
import torch
|
| 49 |
+
from huggingface_hub import snapshot_download
|
| 50 |
+
from lens import LensPipeline, LensTransformer2DModel
|
| 51 |
+
from sdnq import load_sdnq_model
|
| 52 |
+
|
| 53 |
+
model_dir = snapshot_download("WaveCut/Lens-SDNQ-uint4-static")
|
| 54 |
+
transformer = load_sdnq_model(
|
| 55 |
+
model_dir + "/transformer",
|
| 56 |
+
model_cls=LensTransformer2DModel,
|
| 57 |
+
dtype=torch.bfloat16,
|
| 58 |
+
device=torch.device("cuda"),
|
| 59 |
+
dequantize_fp32=False,
|
| 60 |
+
use_quantized_matmul=True,
|
| 61 |
+
)
|
| 62 |
+
pipe = LensPipeline.from_pretrained(
|
| 63 |
+
model_dir,
|
| 64 |
+
transformer=transformer,
|
| 65 |
+
torch_dtype=torch.bfloat16,
|
| 66 |
+
).to("cuda")
|
| 67 |
+
|
| 68 |
+
image = pipe(
|
| 69 |
+
prompt="A cat holding a sign that says hello world",
|
| 70 |
+
base_resolution=1440,
|
| 71 |
+
aspect_ratio="1:1",
|
| 72 |
+
num_inference_steps=20,
|
| 73 |
+
guidance_scale=5.0,
|
| 74 |
+
generator=torch.Generator("cuda").manual_seed(0),
|
| 75 |
+
).images[0]
|
| 76 |
+
```
|
| 77 |
+
|
| 78 |
+
## Benchmark
|
| 79 |
+
|
| 80 |
+
Hardware: RunPod NVIDIA H100 80GB HBM3 (H100 SXM), PyTorch 2.8.0 CUDA 12.8 container, local container disk only. Benchmark date: 2026-05-24. Generation settings: `base_resolution=1440`, `aspect_ratio="1:1"`, `num_inference_steps=20`, `guidance_scale=5.0`.
|
| 81 |
+
|
| 82 |
+
| Metric | Original Lens | SDNQ uint4 static |
|
| 83 |
+
| --- | ---: | ---: |
|
| 84 |
+
| Load time, seconds | 17.641 | 14.605 |
|
| 85 |
+
| Load peak allocated VRAM, GB | 22.342 | 18.446 |
|
| 86 |
+
| Load peak reserved VRAM, GB | 22.471 | 18.516 |
|
| 87 |
+
| Transformer tensor storage footprint, GB | 16.417 | 4.301 |
|
| 88 |
+
| Transformer storage reduction vs original | baseline | 73.8% smaller |
|
| 89 |
+
| Average prompt runtime, seconds | 15.357 | 17.937 |
|
| 90 |
+
| Median prompt runtime, seconds | 14.346 | 17.813 |
|
| 91 |
+
| Average generation peak allocated VRAM, GB | 27.462 | 23.533 |
|
| 92 |
+
| Max generation peak allocated VRAM, GB | 27.467 | 23.538 |
|
| 93 |
+
|
| 94 |
+
Transformer-only footprint is computed from safetensors tensor storage for the denoising transformer parameter tensors only; it excludes allocator overhead and non-transformer components. The original transformer tensors are F32; the corrected SDNQ transformer stores quantized tensors as U8 plus the excluded modulation layers as BF16.
|
| 95 |
+
|
| 96 |
+
### Model CPU Offload Benchmark
|
| 97 |
+
|
| 98 |
+
Same 10 prompts, using `pipe.enable_model_cpu_offload()`. The reported load time uses a warm local Hugging Face cache on the container disk, so model download time is excluded. Each model was measured in a fresh Python process. `Cold generation` is P01, the first generation immediately after load/offload setup; `warm generation` aggregates P02-P10.
|
| 99 |
+
|
| 100 |
+
| Metric | Original Lens | SDNQ uint4 static |
|
| 101 |
+
| --- | ---: | ---: |
|
| 102 |
+
| Offload setup/load time, seconds | 15.510 | 13.573 |
|
| 103 |
+
| Offload setup peak allocated VRAM, GB | 12.582 | 12.582 |
|
| 104 |
+
| Offload setup peak reserved VRAM, GB | 13.881 | 13.881 |
|
| 105 |
+
| Cold generation time, seconds | 26.217 | 21.473 |
|
| 106 |
+
| Cold generation peak allocated VRAM, GB | 19.274 | 15.479 |
|
| 107 |
+
| Cold generation peak reserved VRAM, GB | 19.608 | 19.126 |
|
| 108 |
+
| Warm generation average time, seconds | 18.123 | 17.650 |
|
| 109 |
+
| Warm generation median time, seconds | 17.178 | 17.519 |
|
| 110 |
+
| Warm generation average peak allocated VRAM, GB | 19.271 | 15.480 |
|
| 111 |
+
| Warm generation average peak reserved VRAM, GB | 19.630 | 18.965 |
|
| 112 |
+
| Warm generation max peak allocated VRAM, GB | 19.276 | 15.482 |
|
| 113 |
+
| Warm generation max peak reserved VRAM, GB | 19.803 | 19.210 |
|
| 114 |
+
|
| 115 |
+
Raw metrics: [`benchmark_metrics.json`](benchmark_metrics.json), [`comparison_matrix.json`](comparison_matrix.json), [`model_cpu_offload_benchmark.json`](model_cpu_offload_benchmark.json), [`sdnq_quantization_summary.json`](sdnq_quantization_summary.json).
|
| 116 |
+
|
| 117 |
+
## 10-Prompt Matrix
|
| 118 |
+
|
| 119 |
+
| ID | Scenario | Seed | Original time, s | Quant time, s | Delta | Original peak allocated VRAM, GB | Quant peak allocated VRAM, GB |
|
| 120 |
+
| --- | --- | ---: | ---: | ---: | ---: | ---: | ---: |
|
| 121 |
+
| P01 | Midnight Library Weather Station | 301 | 19.518 | 24.105 | +23.5% | 27.461 | 23.532 |
|
| 122 |
+
| P02 | Desert Observatory Treaty Room | 302 | 16.986 | 18.565 | +9.3% | 27.461 | 23.532 |
|
| 123 |
+
| P03 | Arctic Submarine Greenhouse | 303 | 13.903 | 17.882 | +28.6% | 27.461 | 23.532 |
|
| 124 |
+
| P04 | Long English Museum Labels | 304 | 14.439 | 17.848 | +23.6% | 27.461 | 23.533 |
|
| 125 |
+
| P05 | Tokyo Rooftop Repair Diner | 305 | 14.253 | 17.779 | +24.7% | 27.461 | 23.532 |
|
| 126 |
+
| P06 | Russian Provincial Print Shop | 306 | 16.744 | 18.136 | +8.3% | 27.467 | 23.538 |
|
| 127 |
+
| P07 | Ocean Cartography Bakery | 307 | 13.918 | 14.828 | +6.5% | 27.461 | 23.532 |
|
| 128 |
+
| P08 | Long English Train Notice Wall | 308 | 13.906 | 14.826 | +6.6% | 27.461 | 23.532 |
|
| 129 |
+
| P09 | Orbital Botanical Courtroom | 309 | 16.204 | 17.740 | +9.5% | 27.461 | 23.533 |
|
| 130 |
+
| P10 | Byzantine Data Center Chapel | 310 | 13.703 | 17.665 | +28.9% | 27.461 | 23.532 |
|
| 131 |
+
|
| 132 |
+
## Full Prompts
|
| 133 |
+
|
| 134 |
+
<details>
|
| 135 |
+
<summary>P01 - Midnight Library Weather Station</summary>
|
| 136 |
+
|
| 137 |
+
A vast midnight library converted into a Victorian weather station, brass barometers, hanging cloud chambers, blue lightning outside stained-glass windows, spiral ladders, rainwater collecting in crystal funnels, and readable labels everywhere. Include a large oak sign saying "ARCHIVE OF STORMS - EAST WING", a ledger title saying "BAROMETRIC ANOMALIES 1897-1903", a small drawer label saying "FOG SAMPLES / DO NOT SHAKE", a chalkboard note saying "THUNDER ARRIVES AT 02:17", and a bookmark saying "RETURN TO SHELF C-19". Extremely detailed, cinematic, natural perspective, crisp small typography.
|
| 138 |
+
|
| 139 |
+
</details>
|
| 140 |
+
|
| 141 |
+
<details>
|
| 142 |
+
<summary>P02 - Desert Observatory Treaty Room</summary>
|
| 143 |
+
|
| 144 |
+
An ancient desert observatory at golden hour, now used as a treaty room for astronomers and nomad diplomats, sandstone arches, astrolabes, folded star maps, copper tea service, wind-blown curtains, tiny dust motes, and many readable inscriptions. The central parchment must read "TREATY OF THE SEVEN MOONS". A wall plaque reads "OBSERVATORY OF QASR AL-SUHAIL". A tea label says "CARDAMOM - NO SUGAR". A blue wax seal says "WITNESSED UNDER MARS". A telescope tag says "CALIBRATE BEFORE SUNSET". Hyperreal, warm shadows, intricate surface wear.
|
| 145 |
+
|
| 146 |
+
</details>
|
| 147 |
+
|
| 148 |
+
<details>
|
| 149 |
+
<summary>P03 - Arctic Submarine Greenhouse</summary>
|
| 150 |
+
|
| 151 |
+
A transparent research submarine trapped under Arctic ice, transformed into a warm hydroponic greenhouse with orange grow lights, condensation, polar bears visible above through thick ice, scientists in wool sweaters, algae tanks, and frost patterns on glass. Include readable text on multiple objects: "POLAR BOTANY UNIT 4" on the bulkhead, "EMERGENCY SEED VAULT" on a red locker, "LIGHT CYCLE: 18 HOURS" on a tablet, "DO NOT FEED THE KELP" on a handwritten note, and "RETURN CORE SAMPLES" on a metal tray. Detailed, atmospheric, believable engineering.
|
| 152 |
+
|
| 153 |
+
</details>
|
| 154 |
+
|
| 155 |
+
<details>
|
| 156 |
+
<summary>P04 - Long English Museum Labels</summary>
|
| 157 |
+
|
| 158 |
+
A photorealistic museum exhibit room about impossible machines, with glass cases, velvet ropes, soft spotlights, and several long English placards that must be visible on different parts of the image. Placard one reads: "THE CLOCK THAT REMEMBERED WINTER: assembled from brass, bone, and borrowed tides, circa 1814." Placard two reads: "PLEASE DO NOT TOUCH THE PERPETUAL ENGINE; it becomes anxious when observed too closely." Placard three reads: "CURATOR'S NOTE: every gear was catalogued, polished, numbered, and returned before dawn." Also include ticket stubs, tiny accession numbers, fingerprints on glass, and realistic museum lighting.
|
| 159 |
+
|
| 160 |
+
</details>
|
| 161 |
+
|
| 162 |
+
<details>
|
| 163 |
+
<summary>P05 - Tokyo Rooftop Repair Diner</summary>
|
| 164 |
+
|
| 165 |
+
A rainy Tokyo rooftop diner that doubles as a robot repair shop, neon reflections, steam from ramen bowls, umbrellas, tiny servo motors, handwritten order slips, rain beads on chrome, and a skyline full of antennas. Readable signs: a pink neon sign says "MIDNIGHT RAMEN & REPAIRS", a menu board says "SPECIAL: MISO, BATTERY PACK, GREEN TEA", a repair invoice says "UNIT 7B - LEFT HAND RECALIBRATION", a sticker says "NO DRONES AFTER 2 AM", and a paper lantern says "OPEN WHEN IT RAINS". High detail, shallow depth of field, cinematic realism.
|
| 166 |
+
|
| 167 |
+
</details>
|
| 168 |
+
|
| 169 |
+
<details>
|
| 170 |
+
<summary>P06 - Russian Provincial Print Shop</summary>
|
| 171 |
+
|
| 172 |
+
Старинная провинциальная типография в России, поздний вечер, керосиновые лампы, деревянные кассы со свинцовыми литерами, мокрые афиши на веревках, самовар, иней на окне, реалистичная пыль и следы краски. На большой вывеске долж��о быть написано: "ТИПОГРАФИЯ УЕЗДНЫХ ВЕСТЕЙ". На длинной афише читаемый текст: "Завтра в городском саду: лекция о кометах, духовой оркестр, чай с баранками, начало ровно в семь часов вечера". На ящике: "ЛИТЕРЫ: А-Я, НЕ РОНЯТЬ". На записке: "Срочно отпечатать до рассвета". Очень детально, без мультяшности.
|
| 173 |
+
|
| 174 |
+
</details>
|
| 175 |
+
|
| 176 |
+
<details>
|
| 177 |
+
<summary>P07 - Ocean Cartography Bakery</summary>
|
| 178 |
+
|
| 179 |
+
A cozy bakery inside an old ocean cartography office, with croissants shaped like sea monsters, nautical charts dusted with flour, brass compasses, jars of ink, morning light, and a baker drawing coastlines in powdered sugar. Text elements: "TIDAL BREAD & MAPS" on the front sign, "SOURDOUGH CURRENT - 6:30 AM" on a chalkboard, "UNCHARTED PLUM TARTS" on a pastry label, "DO NOT EAT THE COMPASS" on a note, and "NORTH SEA BATCH 12" stamped on a paper bag. Warm, detailed, whimsical but realistic.
|
| 180 |
+
|
| 181 |
+
</details>
|
| 182 |
+
|
| 183 |
+
<details>
|
| 184 |
+
<summary>P08 - Long English Train Notice Wall</summary>
|
| 185 |
+
|
| 186 |
+
A foggy Edwardian railway platform at dawn with a wall of overlapping long English notices, brass lamps, wet cobblestones, porters, suitcases, pigeons, steam, and reflections. The largest notice must read: "IMPORTANT SERVICE CHANGE: The 6:42 express to Northbridge will depart from Platform Three after the moonlit freight has cleared the signal box." A second poster reads: "LOST PROPERTY: one violin case, two blue gloves, a silver compass, and a letter never posted." A timetable says "WINTER ROUTE - DELAYS EXPECTED NEAR THE MARSH". Ultra detailed, cinematic, legible signs, natural perspective.
|
| 187 |
+
|
| 188 |
+
</details>
|
| 189 |
+
|
| 190 |
+
<details>
|
| 191 |
+
<summary>P09 - Orbital Botanical Courtroom</summary>
|
| 192 |
+
|
| 193 |
+
A surreal but photorealistic courtroom inside an orbital botanical garden, judges in dark robes, enormous ferns, floating pollen, Earth visible through a curved window, holographic evidence screens, and a tiny robot stenographer. Required readable text: "CASE 44-B: THE PEOPLE VS. THE SUNFLOWER" on the main screen, "EVIDENCE: THREE PETALS AND A BROKEN VASE" on a side display, "SILENCE IN THE GREENHOUSE COURT" on a sign, "WITNESS: DR. LYSANDER MOSS" on a nameplate, and "OXYGEN TAX RECEIPT" on a paper slip. Sharp, high-detail, dramatic lighting.
|
| 194 |
+
|
| 195 |
+
</details>
|
| 196 |
+
|
| 197 |
+
<details>
|
| 198 |
+
<summary>P10 - Byzantine Data Center Chapel</summary>
|
| 199 |
+
|
| 200 |
+
A Byzantine chapel converted into a quiet data center, gold mosaics reflecting server LEDs, incense smoke, marble floors, monks maintaining fiber cables, illuminated manuscripts next to diagnostic terminals, and beautiful cable management. Text must appear in multiple places: "SANCTUM SERVER ROOM - AUTHORIZED MONKS ONLY" on a bronze door, "BACKUP PSALMS COMPLETED AT 03:12" on a terminal, "DO NOT UNPLUG THE RELIQUARY" on a warning label, "LATENCY PRAYER REQUESTS" on a clipboard, and "ARCHIVE NODE IX" etched on a server rack. Rich texture, controlled highlights, realistic scale.
|
| 201 |
+
|
| 202 |
+
</details>
|
| 203 |
+
|
| 204 |
+
## Notes
|
| 205 |
+
|
| 206 |
+
This checkpoint is intended for research and evaluation. It inherits the upstream Lens limitations and responsible AI considerations from the source model. Text rendering remains challenging; the corrected recipe is designed to avoid the obvious grid/printed texture failure seen when transformer modulation linears are quantized.
|
assets/comparison/comparison_grid_1to1_q98.webp
ADDED
|
Git LFS Details
|
benchmark_metrics.json
ADDED
|
@@ -0,0 +1,349 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"hardware": "RunPod NVIDIA H100 80GB HBM3 (H100 SXM)",
|
| 3 |
+
"mode": "full GPU, pipe.to('cuda')",
|
| 4 |
+
"base_resolution": 1440,
|
| 5 |
+
"aspect_ratio": "1:1",
|
| 6 |
+
"num_inference_steps": 20,
|
| 7 |
+
"guidance_scale": 5.0,
|
| 8 |
+
"dtype": "torch.bfloat16",
|
| 9 |
+
"models": {
|
| 10 |
+
"base": {
|
| 11 |
+
"load": {
|
| 12 |
+
"load_time_s": 17.641,
|
| 13 |
+
"peak_allocated_gb": 22.342,
|
| 14 |
+
"peak_reserved_gb": 22.471,
|
| 15 |
+
"end_allocated_gb": 22.342,
|
| 16 |
+
"end_reserved_gb": 22.471
|
| 17 |
+
},
|
| 18 |
+
"summary": {
|
| 19 |
+
"avg_time_s": 15.357,
|
| 20 |
+
"median_time_s": 14.346,
|
| 21 |
+
"avg_peak_allocated_gb": 27.462,
|
| 22 |
+
"avg_peak_reserved_gb": 31.756,
|
| 23 |
+
"max_peak_allocated_gb": 27.467,
|
| 24 |
+
"max_peak_reserved_gb": 31.965
|
| 25 |
+
},
|
| 26 |
+
"prompts": [
|
| 27 |
+
{
|
| 28 |
+
"id": "P01",
|
| 29 |
+
"title": "Midnight Library Weather Station",
|
| 30 |
+
"seed": 301,
|
| 31 |
+
"time_s": 19.518,
|
| 32 |
+
"image_size": [
|
| 33 |
+
1440,
|
| 34 |
+
1440
|
| 35 |
+
],
|
| 36 |
+
"peak_allocated_gb": 27.461,
|
| 37 |
+
"peak_reserved_gb": 31.74,
|
| 38 |
+
"end_allocated_gb": 22.377,
|
| 39 |
+
"end_reserved_gb": 31.74,
|
| 40 |
+
"image": "/workspace/lens_sdnq_work/generated/base/p01_base.png"
|
| 41 |
+
},
|
| 42 |
+
{
|
| 43 |
+
"id": "P02",
|
| 44 |
+
"title": "Desert Observatory Treaty Room",
|
| 45 |
+
"seed": 302,
|
| 46 |
+
"time_s": 16.986,
|
| 47 |
+
"image_size": [
|
| 48 |
+
1440,
|
| 49 |
+
1440
|
| 50 |
+
],
|
| 51 |
+
"peak_allocated_gb": 27.461,
|
| 52 |
+
"peak_reserved_gb": 31.74,
|
| 53 |
+
"end_allocated_gb": 22.377,
|
| 54 |
+
"end_reserved_gb": 31.74,
|
| 55 |
+
"image": "/workspace/lens_sdnq_work/generated/base/p02_base.png"
|
| 56 |
+
},
|
| 57 |
+
{
|
| 58 |
+
"id": "P03",
|
| 59 |
+
"title": "Arctic Submarine Greenhouse",
|
| 60 |
+
"seed": 303,
|
| 61 |
+
"time_s": 13.903,
|
| 62 |
+
"image_size": [
|
| 63 |
+
1440,
|
| 64 |
+
1440
|
| 65 |
+
],
|
| 66 |
+
"peak_allocated_gb": 27.461,
|
| 67 |
+
"peak_reserved_gb": 31.719,
|
| 68 |
+
"end_allocated_gb": 22.377,
|
| 69 |
+
"end_reserved_gb": 31.719,
|
| 70 |
+
"image": "/workspace/lens_sdnq_work/generated/base/p03_base.png"
|
| 71 |
+
},
|
| 72 |
+
{
|
| 73 |
+
"id": "P04",
|
| 74 |
+
"title": "Long English Museum Labels",
|
| 75 |
+
"seed": 304,
|
| 76 |
+
"time_s": 14.439,
|
| 77 |
+
"image_size": [
|
| 78 |
+
1440,
|
| 79 |
+
1440
|
| 80 |
+
],
|
| 81 |
+
"peak_allocated_gb": 27.461,
|
| 82 |
+
"peak_reserved_gb": 31.719,
|
| 83 |
+
"end_allocated_gb": 22.377,
|
| 84 |
+
"end_reserved_gb": 31.719,
|
| 85 |
+
"image": "/workspace/lens_sdnq_work/generated/base/p04_base.png"
|
| 86 |
+
},
|
| 87 |
+
{
|
| 88 |
+
"id": "P05",
|
| 89 |
+
"title": "Tokyo Rooftop Repair Diner",
|
| 90 |
+
"seed": 305,
|
| 91 |
+
"time_s": 14.253,
|
| 92 |
+
"image_size": [
|
| 93 |
+
1440,
|
| 94 |
+
1440
|
| 95 |
+
],
|
| 96 |
+
"peak_allocated_gb": 27.461,
|
| 97 |
+
"peak_reserved_gb": 31.74,
|
| 98 |
+
"end_allocated_gb": 22.377,
|
| 99 |
+
"end_reserved_gb": 31.74,
|
| 100 |
+
"image": "/workspace/lens_sdnq_work/generated/base/p05_base.png"
|
| 101 |
+
},
|
| 102 |
+
{
|
| 103 |
+
"id": "P06",
|
| 104 |
+
"title": "Russian Provincial Print Shop",
|
| 105 |
+
"seed": 306,
|
| 106 |
+
"time_s": 16.744,
|
| 107 |
+
"image_size": [
|
| 108 |
+
1440,
|
| 109 |
+
1440
|
| 110 |
+
],
|
| 111 |
+
"peak_allocated_gb": 27.467,
|
| 112 |
+
"peak_reserved_gb": 31.965,
|
| 113 |
+
"end_allocated_gb": 22.377,
|
| 114 |
+
"end_reserved_gb": 31.965,
|
| 115 |
+
"image": "/workspace/lens_sdnq_work/generated/base/p06_base.png"
|
| 116 |
+
},
|
| 117 |
+
{
|
| 118 |
+
"id": "P07",
|
| 119 |
+
"title": "Ocean Cartography Bakery",
|
| 120 |
+
"seed": 307,
|
| 121 |
+
"time_s": 13.918,
|
| 122 |
+
"image_size": [
|
| 123 |
+
1440,
|
| 124 |
+
1440
|
| 125 |
+
],
|
| 126 |
+
"peak_allocated_gb": 27.461,
|
| 127 |
+
"peak_reserved_gb": 31.74,
|
| 128 |
+
"end_allocated_gb": 22.377,
|
| 129 |
+
"end_reserved_gb": 31.74,
|
| 130 |
+
"image": "/workspace/lens_sdnq_work/generated/base/p07_base.png"
|
| 131 |
+
},
|
| 132 |
+
{
|
| 133 |
+
"id": "P08",
|
| 134 |
+
"title": "Long English Train Notice Wall",
|
| 135 |
+
"seed": 308,
|
| 136 |
+
"time_s": 13.906,
|
| 137 |
+
"image_size": [
|
| 138 |
+
1440,
|
| 139 |
+
1440
|
| 140 |
+
],
|
| 141 |
+
"peak_allocated_gb": 27.461,
|
| 142 |
+
"peak_reserved_gb": 31.74,
|
| 143 |
+
"end_allocated_gb": 22.377,
|
| 144 |
+
"end_reserved_gb": 31.74,
|
| 145 |
+
"image": "/workspace/lens_sdnq_work/generated/base/p08_base.png"
|
| 146 |
+
},
|
| 147 |
+
{
|
| 148 |
+
"id": "P09",
|
| 149 |
+
"title": "Orbital Botanical Courtroom",
|
| 150 |
+
"seed": 309,
|
| 151 |
+
"time_s": 16.204,
|
| 152 |
+
"image_size": [
|
| 153 |
+
1440,
|
| 154 |
+
1440
|
| 155 |
+
],
|
| 156 |
+
"peak_allocated_gb": 27.461,
|
| 157 |
+
"peak_reserved_gb": 31.719,
|
| 158 |
+
"end_allocated_gb": 22.377,
|
| 159 |
+
"end_reserved_gb": 31.719,
|
| 160 |
+
"image": "/workspace/lens_sdnq_work/generated/base/p09_base.png"
|
| 161 |
+
},
|
| 162 |
+
{
|
| 163 |
+
"id": "P10",
|
| 164 |
+
"title": "Byzantine Data Center Chapel",
|
| 165 |
+
"seed": 310,
|
| 166 |
+
"time_s": 13.703,
|
| 167 |
+
"image_size": [
|
| 168 |
+
1440,
|
| 169 |
+
1440
|
| 170 |
+
],
|
| 171 |
+
"peak_allocated_gb": 27.461,
|
| 172 |
+
"peak_reserved_gb": 31.74,
|
| 173 |
+
"end_allocated_gb": 22.377,
|
| 174 |
+
"end_reserved_gb": 31.74,
|
| 175 |
+
"image": "/workspace/lens_sdnq_work/generated/base/p10_base.png"
|
| 176 |
+
}
|
| 177 |
+
]
|
| 178 |
+
},
|
| 179 |
+
"quant": {
|
| 180 |
+
"load": {
|
| 181 |
+
"load_time_s": 14.605,
|
| 182 |
+
"peak_allocated_gb": 18.446,
|
| 183 |
+
"peak_reserved_gb": 18.516,
|
| 184 |
+
"end_allocated_gb": 18.446,
|
| 185 |
+
"end_reserved_gb": 18.516
|
| 186 |
+
},
|
| 187 |
+
"summary": {
|
| 188 |
+
"avg_time_s": 17.937,
|
| 189 |
+
"median_time_s": 17.813,
|
| 190 |
+
"avg_peak_allocated_gb": 23.533,
|
| 191 |
+
"avg_peak_reserved_gb": 27.699,
|
| 192 |
+
"max_peak_allocated_gb": 23.538,
|
| 193 |
+
"max_peak_reserved_gb": 27.712
|
| 194 |
+
},
|
| 195 |
+
"prompts": [
|
| 196 |
+
{
|
| 197 |
+
"id": "P01",
|
| 198 |
+
"title": "Midnight Library Weather Station",
|
| 199 |
+
"seed": 301,
|
| 200 |
+
"time_s": 24.105,
|
| 201 |
+
"image_size": [
|
| 202 |
+
1440,
|
| 203 |
+
1440
|
| 204 |
+
],
|
| 205 |
+
"peak_allocated_gb": 23.532,
|
| 206 |
+
"peak_reserved_gb": 27.682,
|
| 207 |
+
"end_allocated_gb": 18.448,
|
| 208 |
+
"end_reserved_gb": 27.682,
|
| 209 |
+
"image": "/workspace/lens_sdnq_work/generated/quant/p01_quant.png"
|
| 210 |
+
},
|
| 211 |
+
{
|
| 212 |
+
"id": "P02",
|
| 213 |
+
"title": "Desert Observatory Treaty Room",
|
| 214 |
+
"seed": 302,
|
| 215 |
+
"time_s": 18.565,
|
| 216 |
+
"image_size": [
|
| 217 |
+
1440,
|
| 218 |
+
1440
|
| 219 |
+
],
|
| 220 |
+
"peak_allocated_gb": 23.532,
|
| 221 |
+
"peak_reserved_gb": 27.712,
|
| 222 |
+
"end_allocated_gb": 18.448,
|
| 223 |
+
"end_reserved_gb": 27.712,
|
| 224 |
+
"image": "/workspace/lens_sdnq_work/generated/quant/p02_quant.png"
|
| 225 |
+
},
|
| 226 |
+
{
|
| 227 |
+
"id": "P03",
|
| 228 |
+
"title": "Arctic Submarine Greenhouse",
|
| 229 |
+
"seed": 303,
|
| 230 |
+
"time_s": 17.882,
|
| 231 |
+
"image_size": [
|
| 232 |
+
1440,
|
| 233 |
+
1440
|
| 234 |
+
],
|
| 235 |
+
"peak_allocated_gb": 23.532,
|
| 236 |
+
"peak_reserved_gb": 27.712,
|
| 237 |
+
"end_allocated_gb": 18.448,
|
| 238 |
+
"end_reserved_gb": 27.712,
|
| 239 |
+
"image": "/workspace/lens_sdnq_work/generated/quant/p03_quant.png"
|
| 240 |
+
},
|
| 241 |
+
{
|
| 242 |
+
"id": "P04",
|
| 243 |
+
"title": "Long English Museum Labels",
|
| 244 |
+
"seed": 304,
|
| 245 |
+
"time_s": 17.848,
|
| 246 |
+
"image_size": [
|
| 247 |
+
1440,
|
| 248 |
+
1440
|
| 249 |
+
],
|
| 250 |
+
"peak_allocated_gb": 23.533,
|
| 251 |
+
"peak_reserved_gb": 27.712,
|
| 252 |
+
"end_allocated_gb": 18.448,
|
| 253 |
+
"end_reserved_gb": 27.712,
|
| 254 |
+
"image": "/workspace/lens_sdnq_work/generated/quant/p04_quant.png"
|
| 255 |
+
},
|
| 256 |
+
{
|
| 257 |
+
"id": "P05",
|
| 258 |
+
"title": "Tokyo Rooftop Repair Diner",
|
| 259 |
+
"seed": 305,
|
| 260 |
+
"time_s": 17.779,
|
| 261 |
+
"image_size": [
|
| 262 |
+
1440,
|
| 263 |
+
1440
|
| 264 |
+
],
|
| 265 |
+
"peak_allocated_gb": 23.532,
|
| 266 |
+
"peak_reserved_gb": 27.712,
|
| 267 |
+
"end_allocated_gb": 18.448,
|
| 268 |
+
"end_reserved_gb": 27.712,
|
| 269 |
+
"image": "/workspace/lens_sdnq_work/generated/quant/p05_quant.png"
|
| 270 |
+
},
|
| 271 |
+
{
|
| 272 |
+
"id": "P06",
|
| 273 |
+
"title": "Russian Provincial Print Shop",
|
| 274 |
+
"seed": 306,
|
| 275 |
+
"time_s": 18.136,
|
| 276 |
+
"image_size": [
|
| 277 |
+
1440,
|
| 278 |
+
1440
|
| 279 |
+
],
|
| 280 |
+
"peak_allocated_gb": 23.538,
|
| 281 |
+
"peak_reserved_gb": 27.615,
|
| 282 |
+
"end_allocated_gb": 18.448,
|
| 283 |
+
"end_reserved_gb": 27.615,
|
| 284 |
+
"image": "/workspace/lens_sdnq_work/generated/quant/p06_quant.png"
|
| 285 |
+
},
|
| 286 |
+
{
|
| 287 |
+
"id": "P07",
|
| 288 |
+
"title": "Ocean Cartography Bakery",
|
| 289 |
+
"seed": 307,
|
| 290 |
+
"time_s": 14.828,
|
| 291 |
+
"image_size": [
|
| 292 |
+
1440,
|
| 293 |
+
1440
|
| 294 |
+
],
|
| 295 |
+
"peak_allocated_gb": 23.532,
|
| 296 |
+
"peak_reserved_gb": 27.712,
|
| 297 |
+
"end_allocated_gb": 18.448,
|
| 298 |
+
"end_reserved_gb": 27.712,
|
| 299 |
+
"image": "/workspace/lens_sdnq_work/generated/quant/p07_quant.png"
|
| 300 |
+
},
|
| 301 |
+
{
|
| 302 |
+
"id": "P08",
|
| 303 |
+
"title": "Long English Train Notice Wall",
|
| 304 |
+
"seed": 308,
|
| 305 |
+
"time_s": 14.826,
|
| 306 |
+
"image_size": [
|
| 307 |
+
1440,
|
| 308 |
+
1440
|
| 309 |
+
],
|
| 310 |
+
"peak_allocated_gb": 23.532,
|
| 311 |
+
"peak_reserved_gb": 27.712,
|
| 312 |
+
"end_allocated_gb": 18.448,
|
| 313 |
+
"end_reserved_gb": 27.712,
|
| 314 |
+
"image": "/workspace/lens_sdnq_work/generated/quant/p08_quant.png"
|
| 315 |
+
},
|
| 316 |
+
{
|
| 317 |
+
"id": "P09",
|
| 318 |
+
"title": "Orbital Botanical Courtroom",
|
| 319 |
+
"seed": 309,
|
| 320 |
+
"time_s": 17.74,
|
| 321 |
+
"image_size": [
|
| 322 |
+
1440,
|
| 323 |
+
1440
|
| 324 |
+
],
|
| 325 |
+
"peak_allocated_gb": 23.533,
|
| 326 |
+
"peak_reserved_gb": 27.712,
|
| 327 |
+
"end_allocated_gb": 18.448,
|
| 328 |
+
"end_reserved_gb": 27.712,
|
| 329 |
+
"image": "/workspace/lens_sdnq_work/generated/quant/p09_quant.png"
|
| 330 |
+
},
|
| 331 |
+
{
|
| 332 |
+
"id": "P10",
|
| 333 |
+
"title": "Byzantine Data Center Chapel",
|
| 334 |
+
"seed": 310,
|
| 335 |
+
"time_s": 17.665,
|
| 336 |
+
"image_size": [
|
| 337 |
+
1440,
|
| 338 |
+
1440
|
| 339 |
+
],
|
| 340 |
+
"peak_allocated_gb": 23.532,
|
| 341 |
+
"peak_reserved_gb": 27.712,
|
| 342 |
+
"end_allocated_gb": 18.448,
|
| 343 |
+
"end_reserved_gb": 27.712,
|
| 344 |
+
"image": "/workspace/lens_sdnq_work/generated/quant/p10_quant.png"
|
| 345 |
+
}
|
| 346 |
+
]
|
| 347 |
+
}
|
| 348 |
+
}
|
| 349 |
+
}
|
comparison_matrix.json
ADDED
|
@@ -0,0 +1,362 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
[
|
| 2 |
+
{
|
| 3 |
+
"id": "P01",
|
| 4 |
+
"title": "Midnight Library Weather Station",
|
| 5 |
+
"seed": 301,
|
| 6 |
+
"prompt": "A vast midnight library converted into a Victorian weather station, brass barometers, hanging cloud chambers, blue lightning outside stained-glass windows, spiral ladders, rainwater collecting in crystal funnels, and readable labels everywhere. Include a large oak sign saying \"ARCHIVE OF STORMS - EAST WING\", a ledger title saying \"BAROMETRIC ANOMALIES 1897-1903\", a small drawer label saying \"FOG SAMPLES / DO NOT SHAKE\", a chalkboard note saying \"THUNDER ARRIVES AT 02:17\", and a bookmark saying \"RETURN TO SHELF C-19\". Extremely detailed, cinematic, natural perspective, crisp small typography.",
|
| 7 |
+
"base": {
|
| 8 |
+
"id": "P01",
|
| 9 |
+
"title": "Midnight Library Weather Station",
|
| 10 |
+
"seed": 301,
|
| 11 |
+
"time_s": 19.518,
|
| 12 |
+
"image_size": [
|
| 13 |
+
1440,
|
| 14 |
+
1440
|
| 15 |
+
],
|
| 16 |
+
"peak_allocated_gb": 27.461,
|
| 17 |
+
"peak_reserved_gb": 31.74,
|
| 18 |
+
"end_allocated_gb": 22.377,
|
| 19 |
+
"end_reserved_gb": 31.74,
|
| 20 |
+
"image": "/workspace/lens_sdnq_work/generated/base/p01_base.png"
|
| 21 |
+
},
|
| 22 |
+
"quant": {
|
| 23 |
+
"id": "P01",
|
| 24 |
+
"title": "Midnight Library Weather Station",
|
| 25 |
+
"seed": 301,
|
| 26 |
+
"time_s": 24.105,
|
| 27 |
+
"image_size": [
|
| 28 |
+
1440,
|
| 29 |
+
1440
|
| 30 |
+
],
|
| 31 |
+
"peak_allocated_gb": 23.532,
|
| 32 |
+
"peak_reserved_gb": 27.682,
|
| 33 |
+
"end_allocated_gb": 18.448,
|
| 34 |
+
"end_reserved_gb": 27.682,
|
| 35 |
+
"image": "/workspace/lens_sdnq_work/generated/quant/p01_quant.png"
|
| 36 |
+
}
|
| 37 |
+
},
|
| 38 |
+
{
|
| 39 |
+
"id": "P02",
|
| 40 |
+
"title": "Desert Observatory Treaty Room",
|
| 41 |
+
"seed": 302,
|
| 42 |
+
"prompt": "An ancient desert observatory at golden hour, now used as a treaty room for astronomers and nomad diplomats, sandstone arches, astrolabes, folded star maps, copper tea service, wind-blown curtains, tiny dust motes, and many readable inscriptions. The central parchment must read \"TREATY OF THE SEVEN MOONS\". A wall plaque reads \"OBSERVATORY OF QASR AL-SUHAIL\". A tea label says \"CARDAMOM - NO SUGAR\". A blue wax seal says \"WITNESSED UNDER MARS\". A telescope tag says \"CALIBRATE BEFORE SUNSET\". Hyperreal, warm shadows, intricate surface wear.",
|
| 43 |
+
"base": {
|
| 44 |
+
"id": "P02",
|
| 45 |
+
"title": "Desert Observatory Treaty Room",
|
| 46 |
+
"seed": 302,
|
| 47 |
+
"time_s": 16.986,
|
| 48 |
+
"image_size": [
|
| 49 |
+
1440,
|
| 50 |
+
1440
|
| 51 |
+
],
|
| 52 |
+
"peak_allocated_gb": 27.461,
|
| 53 |
+
"peak_reserved_gb": 31.74,
|
| 54 |
+
"end_allocated_gb": 22.377,
|
| 55 |
+
"end_reserved_gb": 31.74,
|
| 56 |
+
"image": "/workspace/lens_sdnq_work/generated/base/p02_base.png"
|
| 57 |
+
},
|
| 58 |
+
"quant": {
|
| 59 |
+
"id": "P02",
|
| 60 |
+
"title": "Desert Observatory Treaty Room",
|
| 61 |
+
"seed": 302,
|
| 62 |
+
"time_s": 18.565,
|
| 63 |
+
"image_size": [
|
| 64 |
+
1440,
|
| 65 |
+
1440
|
| 66 |
+
],
|
| 67 |
+
"peak_allocated_gb": 23.532,
|
| 68 |
+
"peak_reserved_gb": 27.712,
|
| 69 |
+
"end_allocated_gb": 18.448,
|
| 70 |
+
"end_reserved_gb": 27.712,
|
| 71 |
+
"image": "/workspace/lens_sdnq_work/generated/quant/p02_quant.png"
|
| 72 |
+
}
|
| 73 |
+
},
|
| 74 |
+
{
|
| 75 |
+
"id": "P03",
|
| 76 |
+
"title": "Arctic Submarine Greenhouse",
|
| 77 |
+
"seed": 303,
|
| 78 |
+
"prompt": "A transparent research submarine trapped under Arctic ice, transformed into a warm hydroponic greenhouse with orange grow lights, condensation, polar bears visible above through thick ice, scientists in wool sweaters, algae tanks, and frost patterns on glass. Include readable text on multiple objects: \"POLAR BOTANY UNIT 4\" on the bulkhead, \"EMERGENCY SEED VAULT\" on a red locker, \"LIGHT CYCLE: 18 HOURS\" on a tablet, \"DO NOT FEED THE KELP\" on a handwritten note, and \"RETURN CORE SAMPLES\" on a metal tray. Detailed, atmospheric, believable engineering.",
|
| 79 |
+
"base": {
|
| 80 |
+
"id": "P03",
|
| 81 |
+
"title": "Arctic Submarine Greenhouse",
|
| 82 |
+
"seed": 303,
|
| 83 |
+
"time_s": 13.903,
|
| 84 |
+
"image_size": [
|
| 85 |
+
1440,
|
| 86 |
+
1440
|
| 87 |
+
],
|
| 88 |
+
"peak_allocated_gb": 27.461,
|
| 89 |
+
"peak_reserved_gb": 31.719,
|
| 90 |
+
"end_allocated_gb": 22.377,
|
| 91 |
+
"end_reserved_gb": 31.719,
|
| 92 |
+
"image": "/workspace/lens_sdnq_work/generated/base/p03_base.png"
|
| 93 |
+
},
|
| 94 |
+
"quant": {
|
| 95 |
+
"id": "P03",
|
| 96 |
+
"title": "Arctic Submarine Greenhouse",
|
| 97 |
+
"seed": 303,
|
| 98 |
+
"time_s": 17.882,
|
| 99 |
+
"image_size": [
|
| 100 |
+
1440,
|
| 101 |
+
1440
|
| 102 |
+
],
|
| 103 |
+
"peak_allocated_gb": 23.532,
|
| 104 |
+
"peak_reserved_gb": 27.712,
|
| 105 |
+
"end_allocated_gb": 18.448,
|
| 106 |
+
"end_reserved_gb": 27.712,
|
| 107 |
+
"image": "/workspace/lens_sdnq_work/generated/quant/p03_quant.png"
|
| 108 |
+
}
|
| 109 |
+
},
|
| 110 |
+
{
|
| 111 |
+
"id": "P04",
|
| 112 |
+
"title": "Long English Museum Labels",
|
| 113 |
+
"seed": 304,
|
| 114 |
+
"prompt": "A photorealistic museum exhibit room about impossible machines, with glass cases, velvet ropes, soft spotlights, and several long English placards that must be visible on different parts of the image. Placard one reads: \"THE CLOCK THAT REMEMBERED WINTER: assembled from brass, bone, and borrowed tides, circa 1814.\" Placard two reads: \"PLEASE DO NOT TOUCH THE PERPETUAL ENGINE; it becomes anxious when observed too closely.\" Placard three reads: \"CURATOR'S NOTE: every gear was catalogued, polished, numbered, and returned before dawn.\" Also include ticket stubs, tiny accession numbers, fingerprints on glass, and realistic museum lighting.",
|
| 115 |
+
"base": {
|
| 116 |
+
"id": "P04",
|
| 117 |
+
"title": "Long English Museum Labels",
|
| 118 |
+
"seed": 304,
|
| 119 |
+
"time_s": 14.439,
|
| 120 |
+
"image_size": [
|
| 121 |
+
1440,
|
| 122 |
+
1440
|
| 123 |
+
],
|
| 124 |
+
"peak_allocated_gb": 27.461,
|
| 125 |
+
"peak_reserved_gb": 31.719,
|
| 126 |
+
"end_allocated_gb": 22.377,
|
| 127 |
+
"end_reserved_gb": 31.719,
|
| 128 |
+
"image": "/workspace/lens_sdnq_work/generated/base/p04_base.png"
|
| 129 |
+
},
|
| 130 |
+
"quant": {
|
| 131 |
+
"id": "P04",
|
| 132 |
+
"title": "Long English Museum Labels",
|
| 133 |
+
"seed": 304,
|
| 134 |
+
"time_s": 17.848,
|
| 135 |
+
"image_size": [
|
| 136 |
+
1440,
|
| 137 |
+
1440
|
| 138 |
+
],
|
| 139 |
+
"peak_allocated_gb": 23.533,
|
| 140 |
+
"peak_reserved_gb": 27.712,
|
| 141 |
+
"end_allocated_gb": 18.448,
|
| 142 |
+
"end_reserved_gb": 27.712,
|
| 143 |
+
"image": "/workspace/lens_sdnq_work/generated/quant/p04_quant.png"
|
| 144 |
+
}
|
| 145 |
+
},
|
| 146 |
+
{
|
| 147 |
+
"id": "P05",
|
| 148 |
+
"title": "Tokyo Rooftop Repair Diner",
|
| 149 |
+
"seed": 305,
|
| 150 |
+
"prompt": "A rainy Tokyo rooftop diner that doubles as a robot repair shop, neon reflections, steam from ramen bowls, umbrellas, tiny servo motors, handwritten order slips, rain beads on chrome, and a skyline full of antennas. Readable signs: a pink neon sign says \"MIDNIGHT RAMEN & REPAIRS\", a menu board says \"SPECIAL: MISO, BATTERY PACK, GREEN TEA\", a repair invoice says \"UNIT 7B - LEFT HAND RECALIBRATION\", a sticker says \"NO DRONES AFTER 2 AM\", and a paper lantern says \"OPEN WHEN IT RAINS\". High detail, shallow depth of field, cinematic realism.",
|
| 151 |
+
"base": {
|
| 152 |
+
"id": "P05",
|
| 153 |
+
"title": "Tokyo Rooftop Repair Diner",
|
| 154 |
+
"seed": 305,
|
| 155 |
+
"time_s": 14.253,
|
| 156 |
+
"image_size": [
|
| 157 |
+
1440,
|
| 158 |
+
1440
|
| 159 |
+
],
|
| 160 |
+
"peak_allocated_gb": 27.461,
|
| 161 |
+
"peak_reserved_gb": 31.74,
|
| 162 |
+
"end_allocated_gb": 22.377,
|
| 163 |
+
"end_reserved_gb": 31.74,
|
| 164 |
+
"image": "/workspace/lens_sdnq_work/generated/base/p05_base.png"
|
| 165 |
+
},
|
| 166 |
+
"quant": {
|
| 167 |
+
"id": "P05",
|
| 168 |
+
"title": "Tokyo Rooftop Repair Diner",
|
| 169 |
+
"seed": 305,
|
| 170 |
+
"time_s": 17.779,
|
| 171 |
+
"image_size": [
|
| 172 |
+
1440,
|
| 173 |
+
1440
|
| 174 |
+
],
|
| 175 |
+
"peak_allocated_gb": 23.532,
|
| 176 |
+
"peak_reserved_gb": 27.712,
|
| 177 |
+
"end_allocated_gb": 18.448,
|
| 178 |
+
"end_reserved_gb": 27.712,
|
| 179 |
+
"image": "/workspace/lens_sdnq_work/generated/quant/p05_quant.png"
|
| 180 |
+
}
|
| 181 |
+
},
|
| 182 |
+
{
|
| 183 |
+
"id": "P06",
|
| 184 |
+
"title": "Russian Provincial Print Shop",
|
| 185 |
+
"seed": 306,
|
| 186 |
+
"prompt": "\u0421\u0442\u0430\u0440\u0438\u043d\u043d\u0430\u044f \u043f\u0440\u043e\u0432\u0438\u043d\u0446\u0438\u0430\u043b\u044c\u043d\u0430\u044f \u0442\u0438\u043f\u043e\u0433\u0440\u0430\u0444\u0438\u044f \u0432 \u0420\u043e\u0441\u0441\u0438\u0438, \u043f\u043e\u0437\u0434\u043d\u0438\u0439 \u0432\u0435\u0447\u0435\u0440, \u043a\u0435\u0440\u043e\u0441\u0438\u043d\u043e\u0432\u044b\u0435 \u043b\u0430\u043c\u043f\u044b, \u0434\u0435\u0440\u0435\u0432\u044f\u043d\u043d\u044b\u0435 \u043a\u0430\u0441\u0441\u044b \u0441\u043e \u0441\u0432\u0438\u043d\u0446\u043e\u0432\u044b\u043c\u0438 \u043b\u0438\u0442\u0435\u0440\u0430\u043c\u0438, \u043c\u043e\u043a\u0440\u044b\u0435 \u0430\u0444\u0438\u0448\u0438 \u043d\u0430 \u0432\u0435\u0440\u0435\u0432\u043a\u0430\u0445, \u0441\u0430\u043c\u043e\u0432\u0430\u0440, \u0438\u043d\u0435\u0439 \u043d\u0430 \u043e\u043a\u043d\u0435, \u0440\u0435\u0430\u043b\u0438\u0441\u0442\u0438\u0447\u043d\u0430\u044f \u043f\u044b\u043b\u044c \u0438 \u0441\u043b\u0435\u0434\u044b \u043a\u0440\u0430\u0441\u043a\u0438. \u041d\u0430 \u0431\u043e\u043b\u044c\u0448\u043e\u0439 \u0432\u044b\u0432\u0435\u0441\u043a\u0435 \u0434\u043e\u043b\u0436\u043d\u043e \u0431\u044b\u0442\u044c \u043d\u0430\u043f\u0438\u0441\u0430\u043d\u043e: \"\u0422\u0418\u041f\u041e\u0413\u0420\u0410\u0424\u0418\u042f \u0423\u0415\u0417\u0414\u041d\u042b\u0425 \u0412\u0415\u0421\u0422\u0415\u0419\". \u041d\u0430 \u0434\u043b\u0438\u043d\u043d\u043e\u0439 \u0430\u0444\u0438\u0448\u0435 \u0447\u0438\u0442\u0430\u0435\u043c\u044b\u0439 \u0442\u0435\u043a\u0441\u0442: \"\u0417\u0430\u0432\u0442\u0440\u0430 \u0432 \u0433\u043e\u0440\u043e\u0434\u0441\u043a\u043e\u043c \u0441\u0430\u0434\u0443: \u043b\u0435\u043a\u0446\u0438\u044f \u043e \u043a\u043e\u043c\u0435\u0442\u0430\u0445, \u0434\u0443\u0445\u043e\u0432\u043e\u0439 \u043e\u0440\u043a\u0435\u0441\u0442\u0440, \u0447\u0430\u0439 \u0441 \u0431\u0430\u0440\u0430\u043d\u043a\u0430\u043c\u0438, \u043d\u0430\u0447\u0430\u043b\u043e \u0440\u043e\u0432\u043d\u043e \u0432 \u0441\u0435\u043c\u044c \u0447\u0430\u0441\u043e\u0432 \u0432\u0435\u0447\u0435\u0440\u0430\". \u041d\u0430 \u044f\u0449\u0438\u043a\u0435: \"\u041b\u0418\u0422\u0415\u0420\u042b: \u0410-\u042f, \u041d\u0415 \u0420\u041e\u041d\u042f\u0422\u042c\". \u041d\u0430 \u0437\u0430\u043f\u0438\u0441\u043a\u0435: \"\u0421\u0440\u043e\u0447\u043d\u043e \u043e\u0442\u043f\u0435\u0447\u0430\u0442\u0430\u0442\u044c \u0434\u043e \u0440\u0430\u0441\u0441\u0432\u0435\u0442\u0430\". \u041e\u0447\u0435\u043d\u044c \u0434\u0435\u0442\u0430\u043b\u044c\u043d\u043e, \u0431\u0435\u0437 \u043c\u0443\u043b\u044c\u0442\u044f\u0448\u043d\u043e\u0441\u0442\u0438.",
|
| 187 |
+
"base": {
|
| 188 |
+
"id": "P06",
|
| 189 |
+
"title": "Russian Provincial Print Shop",
|
| 190 |
+
"seed": 306,
|
| 191 |
+
"time_s": 16.744,
|
| 192 |
+
"image_size": [
|
| 193 |
+
1440,
|
| 194 |
+
1440
|
| 195 |
+
],
|
| 196 |
+
"peak_allocated_gb": 27.467,
|
| 197 |
+
"peak_reserved_gb": 31.965,
|
| 198 |
+
"end_allocated_gb": 22.377,
|
| 199 |
+
"end_reserved_gb": 31.965,
|
| 200 |
+
"image": "/workspace/lens_sdnq_work/generated/base/p06_base.png"
|
| 201 |
+
},
|
| 202 |
+
"quant": {
|
| 203 |
+
"id": "P06",
|
| 204 |
+
"title": "Russian Provincial Print Shop",
|
| 205 |
+
"seed": 306,
|
| 206 |
+
"time_s": 18.136,
|
| 207 |
+
"image_size": [
|
| 208 |
+
1440,
|
| 209 |
+
1440
|
| 210 |
+
],
|
| 211 |
+
"peak_allocated_gb": 23.538,
|
| 212 |
+
"peak_reserved_gb": 27.615,
|
| 213 |
+
"end_allocated_gb": 18.448,
|
| 214 |
+
"end_reserved_gb": 27.615,
|
| 215 |
+
"image": "/workspace/lens_sdnq_work/generated/quant/p06_quant.png"
|
| 216 |
+
}
|
| 217 |
+
},
|
| 218 |
+
{
|
| 219 |
+
"id": "P07",
|
| 220 |
+
"title": "Ocean Cartography Bakery",
|
| 221 |
+
"seed": 307,
|
| 222 |
+
"prompt": "A cozy bakery inside an old ocean cartography office, with croissants shaped like sea monsters, nautical charts dusted with flour, brass compasses, jars of ink, morning light, and a baker drawing coastlines in powdered sugar. Text elements: \"TIDAL BREAD & MAPS\" on the front sign, \"SOURDOUGH CURRENT - 6:30 AM\" on a chalkboard, \"UNCHARTED PLUM TARTS\" on a pastry label, \"DO NOT EAT THE COMPASS\" on a note, and \"NORTH SEA BATCH 12\" stamped on a paper bag. Warm, detailed, whimsical but realistic.",
|
| 223 |
+
"base": {
|
| 224 |
+
"id": "P07",
|
| 225 |
+
"title": "Ocean Cartography Bakery",
|
| 226 |
+
"seed": 307,
|
| 227 |
+
"time_s": 13.918,
|
| 228 |
+
"image_size": [
|
| 229 |
+
1440,
|
| 230 |
+
1440
|
| 231 |
+
],
|
| 232 |
+
"peak_allocated_gb": 27.461,
|
| 233 |
+
"peak_reserved_gb": 31.74,
|
| 234 |
+
"end_allocated_gb": 22.377,
|
| 235 |
+
"end_reserved_gb": 31.74,
|
| 236 |
+
"image": "/workspace/lens_sdnq_work/generated/base/p07_base.png"
|
| 237 |
+
},
|
| 238 |
+
"quant": {
|
| 239 |
+
"id": "P07",
|
| 240 |
+
"title": "Ocean Cartography Bakery",
|
| 241 |
+
"seed": 307,
|
| 242 |
+
"time_s": 14.828,
|
| 243 |
+
"image_size": [
|
| 244 |
+
1440,
|
| 245 |
+
1440
|
| 246 |
+
],
|
| 247 |
+
"peak_allocated_gb": 23.532,
|
| 248 |
+
"peak_reserved_gb": 27.712,
|
| 249 |
+
"end_allocated_gb": 18.448,
|
| 250 |
+
"end_reserved_gb": 27.712,
|
| 251 |
+
"image": "/workspace/lens_sdnq_work/generated/quant/p07_quant.png"
|
| 252 |
+
}
|
| 253 |
+
},
|
| 254 |
+
{
|
| 255 |
+
"id": "P08",
|
| 256 |
+
"title": "Long English Train Notice Wall",
|
| 257 |
+
"seed": 308,
|
| 258 |
+
"prompt": "A foggy Edwardian railway platform at dawn with a wall of overlapping long English notices, brass lamps, wet cobblestones, porters, suitcases, pigeons, steam, and reflections. The largest notice must read: \"IMPORTANT SERVICE CHANGE: The 6:42 express to Northbridge will depart from Platform Three after the moonlit freight has cleared the signal box.\" A second poster reads: \"LOST PROPERTY: one violin case, two blue gloves, a silver compass, and a letter never posted.\" A timetable says \"WINTER ROUTE - DELAYS EXPECTED NEAR THE MARSH\". Ultra detailed, cinematic, legible signs, natural perspective.",
|
| 259 |
+
"base": {
|
| 260 |
+
"id": "P08",
|
| 261 |
+
"title": "Long English Train Notice Wall",
|
| 262 |
+
"seed": 308,
|
| 263 |
+
"time_s": 13.906,
|
| 264 |
+
"image_size": [
|
| 265 |
+
1440,
|
| 266 |
+
1440
|
| 267 |
+
],
|
| 268 |
+
"peak_allocated_gb": 27.461,
|
| 269 |
+
"peak_reserved_gb": 31.74,
|
| 270 |
+
"end_allocated_gb": 22.377,
|
| 271 |
+
"end_reserved_gb": 31.74,
|
| 272 |
+
"image": "/workspace/lens_sdnq_work/generated/base/p08_base.png"
|
| 273 |
+
},
|
| 274 |
+
"quant": {
|
| 275 |
+
"id": "P08",
|
| 276 |
+
"title": "Long English Train Notice Wall",
|
| 277 |
+
"seed": 308,
|
| 278 |
+
"time_s": 14.826,
|
| 279 |
+
"image_size": [
|
| 280 |
+
1440,
|
| 281 |
+
1440
|
| 282 |
+
],
|
| 283 |
+
"peak_allocated_gb": 23.532,
|
| 284 |
+
"peak_reserved_gb": 27.712,
|
| 285 |
+
"end_allocated_gb": 18.448,
|
| 286 |
+
"end_reserved_gb": 27.712,
|
| 287 |
+
"image": "/workspace/lens_sdnq_work/generated/quant/p08_quant.png"
|
| 288 |
+
}
|
| 289 |
+
},
|
| 290 |
+
{
|
| 291 |
+
"id": "P09",
|
| 292 |
+
"title": "Orbital Botanical Courtroom",
|
| 293 |
+
"seed": 309,
|
| 294 |
+
"prompt": "A surreal but photorealistic courtroom inside an orbital botanical garden, judges in dark robes, enormous ferns, floating pollen, Earth visible through a curved window, holographic evidence screens, and a tiny robot stenographer. Required readable text: \"CASE 44-B: THE PEOPLE VS. THE SUNFLOWER\" on the main screen, \"EVIDENCE: THREE PETALS AND A BROKEN VASE\" on a side display, \"SILENCE IN THE GREENHOUSE COURT\" on a sign, \"WITNESS: DR. LYSANDER MOSS\" on a nameplate, and \"OXYGEN TAX RECEIPT\" on a paper slip. Sharp, high-detail, dramatic lighting.",
|
| 295 |
+
"base": {
|
| 296 |
+
"id": "P09",
|
| 297 |
+
"title": "Orbital Botanical Courtroom",
|
| 298 |
+
"seed": 309,
|
| 299 |
+
"time_s": 16.204,
|
| 300 |
+
"image_size": [
|
| 301 |
+
1440,
|
| 302 |
+
1440
|
| 303 |
+
],
|
| 304 |
+
"peak_allocated_gb": 27.461,
|
| 305 |
+
"peak_reserved_gb": 31.719,
|
| 306 |
+
"end_allocated_gb": 22.377,
|
| 307 |
+
"end_reserved_gb": 31.719,
|
| 308 |
+
"image": "/workspace/lens_sdnq_work/generated/base/p09_base.png"
|
| 309 |
+
},
|
| 310 |
+
"quant": {
|
| 311 |
+
"id": "P09",
|
| 312 |
+
"title": "Orbital Botanical Courtroom",
|
| 313 |
+
"seed": 309,
|
| 314 |
+
"time_s": 17.74,
|
| 315 |
+
"image_size": [
|
| 316 |
+
1440,
|
| 317 |
+
1440
|
| 318 |
+
],
|
| 319 |
+
"peak_allocated_gb": 23.533,
|
| 320 |
+
"peak_reserved_gb": 27.712,
|
| 321 |
+
"end_allocated_gb": 18.448,
|
| 322 |
+
"end_reserved_gb": 27.712,
|
| 323 |
+
"image": "/workspace/lens_sdnq_work/generated/quant/p09_quant.png"
|
| 324 |
+
}
|
| 325 |
+
},
|
| 326 |
+
{
|
| 327 |
+
"id": "P10",
|
| 328 |
+
"title": "Byzantine Data Center Chapel",
|
| 329 |
+
"seed": 310,
|
| 330 |
+
"prompt": "A Byzantine chapel converted into a quiet data center, gold mosaics reflecting server LEDs, incense smoke, marble floors, monks maintaining fiber cables, illuminated manuscripts next to diagnostic terminals, and beautiful cable management. Text must appear in multiple places: \"SANCTUM SERVER ROOM - AUTHORIZED MONKS ONLY\" on a bronze door, \"BACKUP PSALMS COMPLETED AT 03:12\" on a terminal, \"DO NOT UNPLUG THE RELIQUARY\" on a warning label, \"LATENCY PRAYER REQUESTS\" on a clipboard, and \"ARCHIVE NODE IX\" etched on a server rack. Rich texture, controlled highlights, realistic scale.",
|
| 331 |
+
"base": {
|
| 332 |
+
"id": "P10",
|
| 333 |
+
"title": "Byzantine Data Center Chapel",
|
| 334 |
+
"seed": 310,
|
| 335 |
+
"time_s": 13.703,
|
| 336 |
+
"image_size": [
|
| 337 |
+
1440,
|
| 338 |
+
1440
|
| 339 |
+
],
|
| 340 |
+
"peak_allocated_gb": 27.461,
|
| 341 |
+
"peak_reserved_gb": 31.74,
|
| 342 |
+
"end_allocated_gb": 22.377,
|
| 343 |
+
"end_reserved_gb": 31.74,
|
| 344 |
+
"image": "/workspace/lens_sdnq_work/generated/base/p10_base.png"
|
| 345 |
+
},
|
| 346 |
+
"quant": {
|
| 347 |
+
"id": "P10",
|
| 348 |
+
"title": "Byzantine Data Center Chapel",
|
| 349 |
+
"seed": 310,
|
| 350 |
+
"time_s": 17.665,
|
| 351 |
+
"image_size": [
|
| 352 |
+
1440,
|
| 353 |
+
1440
|
| 354 |
+
],
|
| 355 |
+
"peak_allocated_gb": 23.532,
|
| 356 |
+
"peak_reserved_gb": 27.712,
|
| 357 |
+
"end_allocated_gb": 18.448,
|
| 358 |
+
"end_reserved_gb": 27.712,
|
| 359 |
+
"image": "/workspace/lens_sdnq_work/generated/quant/p10_quant.png"
|
| 360 |
+
}
|
| 361 |
+
}
|
| 362 |
+
]
|
model_cpu_offload_benchmark.json
ADDED
|
@@ -0,0 +1,363 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"benchmark": "model_cpu_offload_cold_warm",
|
| 3 |
+
"hardware": "RunPod NVIDIA H100 80GB HBM3 (H100 SXM)",
|
| 4 |
+
"mode": "Diffusers enable_model_cpu_offload()",
|
| 5 |
+
"cache_state": "warm local HF cache; no download time included",
|
| 6 |
+
"process_isolation": "single model per fresh Python process",
|
| 7 |
+
"base_resolution": 1440,
|
| 8 |
+
"aspect_ratio": "1:1",
|
| 9 |
+
"num_inference_steps": 20,
|
| 10 |
+
"guidance_scale": 5.0,
|
| 11 |
+
"dtype": "torch.bfloat16",
|
| 12 |
+
"definitions": {
|
| 13 |
+
"load_time_s": "Pipeline load plus enable_model_cpu_offload setup from warm local HF cache; download time excluded.",
|
| 14 |
+
"cold_generation": "P01, first generation immediately after fresh process load/offload setup.",
|
| 15 |
+
"warm_generation": "P02-P10 after the cold P01 generation."
|
| 16 |
+
},
|
| 17 |
+
"models": {
|
| 18 |
+
"base": {
|
| 19 |
+
"hardware": "RunPod NVIDIA H100 80GB HBM3 (H100 SXM)",
|
| 20 |
+
"mode": "Diffusers enable_model_cpu_offload()",
|
| 21 |
+
"cache_state": "warm local HF cache; no download time included",
|
| 22 |
+
"process_isolation": "single model per fresh Python process",
|
| 23 |
+
"base_resolution": 1440,
|
| 24 |
+
"aspect_ratio": "1:1",
|
| 25 |
+
"num_inference_steps": 20,
|
| 26 |
+
"guidance_scale": 5.0,
|
| 27 |
+
"dtype": "torch.bfloat16",
|
| 28 |
+
"kind": "base",
|
| 29 |
+
"load": {
|
| 30 |
+
"load_time_s": 15.51,
|
| 31 |
+
"peak_allocated_gb": 12.582,
|
| 32 |
+
"peak_reserved_gb": 13.881,
|
| 33 |
+
"end_allocated_gb": 10.185,
|
| 34 |
+
"end_reserved_gb": 10.679
|
| 35 |
+
},
|
| 36 |
+
"summary": {
|
| 37 |
+
"cold_time_s": 26.217,
|
| 38 |
+
"cold_peak_allocated_gb": 19.274,
|
| 39 |
+
"cold_peak_reserved_gb": 19.608,
|
| 40 |
+
"warm_avg_time_s": 18.123,
|
| 41 |
+
"warm_median_time_s": 17.178,
|
| 42 |
+
"warm_avg_peak_allocated_gb": 19.271,
|
| 43 |
+
"warm_avg_peak_reserved_gb": 19.63,
|
| 44 |
+
"warm_max_peak_allocated_gb": 19.276,
|
| 45 |
+
"warm_max_peak_reserved_gb": 19.803
|
| 46 |
+
},
|
| 47 |
+
"prompts": [
|
| 48 |
+
{
|
| 49 |
+
"id": "P01",
|
| 50 |
+
"title": "Midnight Library Weather Station",
|
| 51 |
+
"seed": 301,
|
| 52 |
+
"time_s": 26.217,
|
| 53 |
+
"image_size": [
|
| 54 |
+
1440,
|
| 55 |
+
1440
|
| 56 |
+
],
|
| 57 |
+
"peak_allocated_gb": 19.274,
|
| 58 |
+
"peak_reserved_gb": 19.608,
|
| 59 |
+
"end_allocated_gb": 10.221,
|
| 60 |
+
"end_reserved_gb": 10.884
|
| 61 |
+
},
|
| 62 |
+
{
|
| 63 |
+
"id": "P02",
|
| 64 |
+
"title": "Desert Observatory Treaty Room",
|
| 65 |
+
"seed": 302,
|
| 66 |
+
"time_s": 21.285,
|
| 67 |
+
"image_size": [
|
| 68 |
+
1440,
|
| 69 |
+
1440
|
| 70 |
+
],
|
| 71 |
+
"peak_allocated_gb": 19.274,
|
| 72 |
+
"peak_reserved_gb": 19.608,
|
| 73 |
+
"end_allocated_gb": 10.221,
|
| 74 |
+
"end_reserved_gb": 10.884
|
| 75 |
+
},
|
| 76 |
+
{
|
| 77 |
+
"id": "P03",
|
| 78 |
+
"title": "Arctic Submarine Greenhouse",
|
| 79 |
+
"seed": 303,
|
| 80 |
+
"time_s": 17.271,
|
| 81 |
+
"image_size": [
|
| 82 |
+
1440,
|
| 83 |
+
1440
|
| 84 |
+
],
|
| 85 |
+
"peak_allocated_gb": 19.275,
|
| 86 |
+
"peak_reserved_gb": 19.608,
|
| 87 |
+
"end_allocated_gb": 10.221,
|
| 88 |
+
"end_reserved_gb": 10.809
|
| 89 |
+
},
|
| 90 |
+
{
|
| 91 |
+
"id": "P04",
|
| 92 |
+
"title": "Long English Museum Labels",
|
| 93 |
+
"seed": 304,
|
| 94 |
+
"time_s": 17.178,
|
| 95 |
+
"image_size": [
|
| 96 |
+
1440,
|
| 97 |
+
1440
|
| 98 |
+
],
|
| 99 |
+
"peak_allocated_gb": 19.275,
|
| 100 |
+
"peak_reserved_gb": 19.608,
|
| 101 |
+
"end_allocated_gb": 10.221,
|
| 102 |
+
"end_reserved_gb": 10.884
|
| 103 |
+
},
|
| 104 |
+
{
|
| 105 |
+
"id": "P05",
|
| 106 |
+
"title": "Tokyo Rooftop Repair Diner",
|
| 107 |
+
"seed": 305,
|
| 108 |
+
"time_s": 17.058,
|
| 109 |
+
"image_size": [
|
| 110 |
+
1440,
|
| 111 |
+
1440
|
| 112 |
+
],
|
| 113 |
+
"peak_allocated_gb": 19.275,
|
| 114 |
+
"peak_reserved_gb": 19.608,
|
| 115 |
+
"end_allocated_gb": 10.221,
|
| 116 |
+
"end_reserved_gb": 10.813
|
| 117 |
+
},
|
| 118 |
+
{
|
| 119 |
+
"id": "P06",
|
| 120 |
+
"title": "Russian Provincial Print Shop",
|
| 121 |
+
"seed": 306,
|
| 122 |
+
"time_s": 20.163,
|
| 123 |
+
"image_size": [
|
| 124 |
+
1440,
|
| 125 |
+
1440
|
| 126 |
+
],
|
| 127 |
+
"peak_allocated_gb": 19.242,
|
| 128 |
+
"peak_reserved_gb": 19.803,
|
| 129 |
+
"end_allocated_gb": 10.221,
|
| 130 |
+
"end_reserved_gb": 13.16
|
| 131 |
+
},
|
| 132 |
+
{
|
| 133 |
+
"id": "P07",
|
| 134 |
+
"title": "Ocean Cartography Bakery",
|
| 135 |
+
"seed": 307,
|
| 136 |
+
"time_s": 16.903,
|
| 137 |
+
"image_size": [
|
| 138 |
+
1440,
|
| 139 |
+
1440
|
| 140 |
+
],
|
| 141 |
+
"peak_allocated_gb": 19.274,
|
| 142 |
+
"peak_reserved_gb": 19.608,
|
| 143 |
+
"end_allocated_gb": 10.221,
|
| 144 |
+
"end_reserved_gb": 10.884
|
| 145 |
+
},
|
| 146 |
+
{
|
| 147 |
+
"id": "P08",
|
| 148 |
+
"title": "Long English Train Notice Wall",
|
| 149 |
+
"seed": 308,
|
| 150 |
+
"time_s": 16.857,
|
| 151 |
+
"image_size": [
|
| 152 |
+
1440,
|
| 153 |
+
1440
|
| 154 |
+
],
|
| 155 |
+
"peak_allocated_gb": 19.274,
|
| 156 |
+
"peak_reserved_gb": 19.608,
|
| 157 |
+
"end_allocated_gb": 10.221,
|
| 158 |
+
"end_reserved_gb": 10.884
|
| 159 |
+
},
|
| 160 |
+
{
|
| 161 |
+
"id": "P09",
|
| 162 |
+
"title": "Orbital Botanical Courtroom",
|
| 163 |
+
"seed": 309,
|
| 164 |
+
"time_s": 19.664,
|
| 165 |
+
"image_size": [
|
| 166 |
+
1440,
|
| 167 |
+
1440
|
| 168 |
+
],
|
| 169 |
+
"peak_allocated_gb": 19.276,
|
| 170 |
+
"peak_reserved_gb": 19.61,
|
| 171 |
+
"end_allocated_gb": 10.221,
|
| 172 |
+
"end_reserved_gb": 10.909
|
| 173 |
+
},
|
| 174 |
+
{
|
| 175 |
+
"id": "P10",
|
| 176 |
+
"title": "Byzantine Data Center Chapel",
|
| 177 |
+
"seed": 310,
|
| 178 |
+
"time_s": 16.731,
|
| 179 |
+
"image_size": [
|
| 180 |
+
1440,
|
| 181 |
+
1440
|
| 182 |
+
],
|
| 183 |
+
"peak_allocated_gb": 19.276,
|
| 184 |
+
"peak_reserved_gb": 19.608,
|
| 185 |
+
"end_allocated_gb": 10.221,
|
| 186 |
+
"end_reserved_gb": 10.813
|
| 187 |
+
}
|
| 188 |
+
]
|
| 189 |
+
},
|
| 190 |
+
"quant": {
|
| 191 |
+
"hardware": "RunPod NVIDIA H100 80GB HBM3 (H100 SXM)",
|
| 192 |
+
"mode": "Diffusers enable_model_cpu_offload()",
|
| 193 |
+
"cache_state": "warm local HF cache; no download time included",
|
| 194 |
+
"process_isolation": "single model per fresh Python process",
|
| 195 |
+
"base_resolution": 1440,
|
| 196 |
+
"aspect_ratio": "1:1",
|
| 197 |
+
"num_inference_steps": 20,
|
| 198 |
+
"guidance_scale": 5.0,
|
| 199 |
+
"dtype": "torch.bfloat16",
|
| 200 |
+
"kind": "quant",
|
| 201 |
+
"load": {
|
| 202 |
+
"load_time_s": 13.573,
|
| 203 |
+
"peak_allocated_gb": 12.582,
|
| 204 |
+
"peak_reserved_gb": 13.881,
|
| 205 |
+
"end_allocated_gb": 10.185,
|
| 206 |
+
"end_reserved_gb": 10.679
|
| 207 |
+
},
|
| 208 |
+
"summary": {
|
| 209 |
+
"cold_time_s": 21.473,
|
| 210 |
+
"cold_peak_allocated_gb": 15.479,
|
| 211 |
+
"cold_peak_reserved_gb": 19.126,
|
| 212 |
+
"warm_avg_time_s": 17.65,
|
| 213 |
+
"warm_median_time_s": 17.519,
|
| 214 |
+
"warm_avg_peak_allocated_gb": 15.48,
|
| 215 |
+
"warm_avg_peak_reserved_gb": 18.965,
|
| 216 |
+
"warm_max_peak_allocated_gb": 15.482,
|
| 217 |
+
"warm_max_peak_reserved_gb": 19.21
|
| 218 |
+
},
|
| 219 |
+
"prompts": [
|
| 220 |
+
{
|
| 221 |
+
"id": "P01",
|
| 222 |
+
"title": "Midnight Library Weather Station",
|
| 223 |
+
"seed": 301,
|
| 224 |
+
"time_s": 21.473,
|
| 225 |
+
"image_size": [
|
| 226 |
+
1440,
|
| 227 |
+
1440
|
| 228 |
+
],
|
| 229 |
+
"peak_allocated_gb": 15.479,
|
| 230 |
+
"peak_reserved_gb": 19.126,
|
| 231 |
+
"end_allocated_gb": 10.221,
|
| 232 |
+
"end_reserved_gb": 10.865
|
| 233 |
+
},
|
| 234 |
+
{
|
| 235 |
+
"id": "P02",
|
| 236 |
+
"title": "Desert Observatory Treaty Room",
|
| 237 |
+
"seed": 302,
|
| 238 |
+
"time_s": 19.047,
|
| 239 |
+
"image_size": [
|
| 240 |
+
1440,
|
| 241 |
+
1440
|
| 242 |
+
],
|
| 243 |
+
"peak_allocated_gb": 15.479,
|
| 244 |
+
"peak_reserved_gb": 19.126,
|
| 245 |
+
"end_allocated_gb": 10.221,
|
| 246 |
+
"end_reserved_gb": 10.865
|
| 247 |
+
},
|
| 248 |
+
{
|
| 249 |
+
"id": "P03",
|
| 250 |
+
"title": "Arctic Submarine Greenhouse",
|
| 251 |
+
"seed": 303,
|
| 252 |
+
"time_s": 17.133,
|
| 253 |
+
"image_size": [
|
| 254 |
+
1440,
|
| 255 |
+
1440
|
| 256 |
+
],
|
| 257 |
+
"peak_allocated_gb": 15.479,
|
| 258 |
+
"peak_reserved_gb": 19.185,
|
| 259 |
+
"end_allocated_gb": 10.221,
|
| 260 |
+
"end_reserved_gb": 10.792
|
| 261 |
+
},
|
| 262 |
+
{
|
| 263 |
+
"id": "P04",
|
| 264 |
+
"title": "Long English Museum Labels",
|
| 265 |
+
"seed": 304,
|
| 266 |
+
"time_s": 17.73,
|
| 267 |
+
"image_size": [
|
| 268 |
+
1440,
|
| 269 |
+
1440
|
| 270 |
+
],
|
| 271 |
+
"peak_allocated_gb": 15.479,
|
| 272 |
+
"peak_reserved_gb": 19.126,
|
| 273 |
+
"end_allocated_gb": 10.221,
|
| 274 |
+
"end_reserved_gb": 10.863
|
| 275 |
+
},
|
| 276 |
+
{
|
| 277 |
+
"id": "P05",
|
| 278 |
+
"title": "Tokyo Rooftop Repair Diner",
|
| 279 |
+
"seed": 305,
|
| 280 |
+
"time_s": 17.332,
|
| 281 |
+
"image_size": [
|
| 282 |
+
1440,
|
| 283 |
+
1440
|
| 284 |
+
],
|
| 285 |
+
"peak_allocated_gb": 15.479,
|
| 286 |
+
"peak_reserved_gb": 19.21,
|
| 287 |
+
"end_allocated_gb": 10.221,
|
| 288 |
+
"end_reserved_gb": 10.815
|
| 289 |
+
},
|
| 290 |
+
{
|
| 291 |
+
"id": "P06",
|
| 292 |
+
"title": "Russian Provincial Print Shop",
|
| 293 |
+
"seed": 306,
|
| 294 |
+
"time_s": 17.519,
|
| 295 |
+
"image_size": [
|
| 296 |
+
1440,
|
| 297 |
+
1440
|
| 298 |
+
],
|
| 299 |
+
"peak_allocated_gb": 15.482,
|
| 300 |
+
"peak_reserved_gb": 17.404,
|
| 301 |
+
"end_allocated_gb": 10.221,
|
| 302 |
+
"end_reserved_gb": 13.141
|
| 303 |
+
},
|
| 304 |
+
{
|
| 305 |
+
"id": "P07",
|
| 306 |
+
"title": "Ocean Cartography Bakery",
|
| 307 |
+
"seed": 307,
|
| 308 |
+
"time_s": 17.614,
|
| 309 |
+
"image_size": [
|
| 310 |
+
1440,
|
| 311 |
+
1440
|
| 312 |
+
],
|
| 313 |
+
"peak_allocated_gb": 15.479,
|
| 314 |
+
"peak_reserved_gb": 19.126,
|
| 315 |
+
"end_allocated_gb": 10.221,
|
| 316 |
+
"end_reserved_gb": 10.865
|
| 317 |
+
},
|
| 318 |
+
{
|
| 319 |
+
"id": "P08",
|
| 320 |
+
"title": "Long English Train Notice Wall",
|
| 321 |
+
"seed": 308,
|
| 322 |
+
"time_s": 17.498,
|
| 323 |
+
"image_size": [
|
| 324 |
+
1440,
|
| 325 |
+
1440
|
| 326 |
+
],
|
| 327 |
+
"peak_allocated_gb": 15.479,
|
| 328 |
+
"peak_reserved_gb": 19.126,
|
| 329 |
+
"end_allocated_gb": 10.221,
|
| 330 |
+
"end_reserved_gb": 10.865
|
| 331 |
+
},
|
| 332 |
+
{
|
| 333 |
+
"id": "P09",
|
| 334 |
+
"title": "Orbital Botanical Courtroom",
|
| 335 |
+
"seed": 309,
|
| 336 |
+
"time_s": 17.546,
|
| 337 |
+
"image_size": [
|
| 338 |
+
1440,
|
| 339 |
+
1440
|
| 340 |
+
],
|
| 341 |
+
"peak_allocated_gb": 15.481,
|
| 342 |
+
"peak_reserved_gb": 19.172,
|
| 343 |
+
"end_allocated_gb": 10.221,
|
| 344 |
+
"end_reserved_gb": 10.888
|
| 345 |
+
},
|
| 346 |
+
{
|
| 347 |
+
"id": "P10",
|
| 348 |
+
"title": "Byzantine Data Center Chapel",
|
| 349 |
+
"seed": 310,
|
| 350 |
+
"time_s": 17.434,
|
| 351 |
+
"image_size": [
|
| 352 |
+
1440,
|
| 353 |
+
1440
|
| 354 |
+
],
|
| 355 |
+
"peak_allocated_gb": 15.479,
|
| 356 |
+
"peak_reserved_gb": 19.21,
|
| 357 |
+
"end_allocated_gb": 10.221,
|
| 358 |
+
"end_reserved_gb": 10.813
|
| 359 |
+
}
|
| 360 |
+
]
|
| 361 |
+
}
|
| 362 |
+
}
|
| 363 |
+
}
|
model_index.json
ADDED
|
@@ -0,0 +1,24 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"_class_name": "LensPipeline",
|
| 3 |
+
"_diffusers_version": "0.37.1",
|
| 4 |
+
"scheduler": [
|
| 5 |
+
"diffusers",
|
| 6 |
+
"FlowMatchEulerDiscreteScheduler"
|
| 7 |
+
],
|
| 8 |
+
"vae": [
|
| 9 |
+
"diffusers",
|
| 10 |
+
"AutoencoderKLFlux2"
|
| 11 |
+
],
|
| 12 |
+
"text_encoder": [
|
| 13 |
+
"transformers",
|
| 14 |
+
"LensGptOssEncoder"
|
| 15 |
+
],
|
| 16 |
+
"tokenizer": [
|
| 17 |
+
"transformers",
|
| 18 |
+
"PreTrainedTokenizerFast"
|
| 19 |
+
],
|
| 20 |
+
"transformer": [
|
| 21 |
+
"diffusers",
|
| 22 |
+
"LensTransformer2DModel"
|
| 23 |
+
]
|
| 24 |
+
}
|
scheduler/scheduler_config.json
ADDED
|
@@ -0,0 +1,18 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"_class_name": "FlowMatchEulerDiscreteScheduler",
|
| 3 |
+
"_diffusers_version": "0.37.1",
|
| 4 |
+
"base_image_seq_len": 256,
|
| 5 |
+
"base_shift": 0.5,
|
| 6 |
+
"invert_sigmas": false,
|
| 7 |
+
"max_image_seq_len": 4096,
|
| 8 |
+
"max_shift": 1.15,
|
| 9 |
+
"num_train_timesteps": 1000,
|
| 10 |
+
"shift": 3.0,
|
| 11 |
+
"shift_terminal": null,
|
| 12 |
+
"stochastic_sampling": false,
|
| 13 |
+
"time_shift_type": "exponential",
|
| 14 |
+
"use_beta_sigmas": false,
|
| 15 |
+
"use_dynamic_shifting": true,
|
| 16 |
+
"use_exponential_sigmas": false,
|
| 17 |
+
"use_karras_sigmas": false
|
| 18 |
+
}
|
sdnq_quantization_summary.json
ADDED
|
@@ -0,0 +1,62 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"source_model": "microsoft/Lens",
|
| 3 |
+
"target_model": "WaveCut/Lens-SDNQ-uint4-static",
|
| 4 |
+
"method": "SDNQ uint4 static",
|
| 5 |
+
"corrected_recipe": true,
|
| 6 |
+
"weights_dtype": "uint4",
|
| 7 |
+
"quantized_matmul_dtype": "int8",
|
| 8 |
+
"group_size": 0,
|
| 9 |
+
"use_quantized_matmul": true,
|
| 10 |
+
"dequantize_fp32": false,
|
| 11 |
+
"modules_to_not_convert_user": [
|
| 12 |
+
".final_layer",
|
| 13 |
+
"pos_embed",
|
| 14 |
+
".norm_out",
|
| 15 |
+
".y_embedder",
|
| 16 |
+
".context_embedder",
|
| 17 |
+
".condition_embedder",
|
| 18 |
+
".x_embedder",
|
| 19 |
+
".vid_out",
|
| 20 |
+
".emb_out",
|
| 21 |
+
".img_in",
|
| 22 |
+
"patch_embed",
|
| 23 |
+
".time_embed",
|
| 24 |
+
".t_embedder",
|
| 25 |
+
"multi_modal_projector",
|
| 26 |
+
"patch_emb",
|
| 27 |
+
"norm",
|
| 28 |
+
".img_out",
|
| 29 |
+
"patch_embedding",
|
| 30 |
+
"lm_head",
|
| 31 |
+
".proj_out",
|
| 32 |
+
".vid_in",
|
| 33 |
+
".txt_in",
|
| 34 |
+
"wte",
|
| 35 |
+
"time_text_embed",
|
| 36 |
+
".txt_out",
|
| 37 |
+
".emb_in",
|
| 38 |
+
"*.img_mod.*",
|
| 39 |
+
"*.txt_mod.*"
|
| 40 |
+
],
|
| 41 |
+
"root_cause_from_turbo_ablation": "Do not quantize transformer modulation linears (*.img_mod.* and *.txt_mod.*); all-linear UINT4 caused periodic grid artifacts and text degradation on Lens-Turbo.",
|
| 42 |
+
"transformer_load_time_s": 3.677,
|
| 43 |
+
"transformer_load_peak_allocated_gb": 8.359,
|
| 44 |
+
"transformer_load_peak_reserved_gb": 8.424,
|
| 45 |
+
"quantization_time_s": 0.313,
|
| 46 |
+
"quantization_peak_allocated_gb": 8.425,
|
| 47 |
+
"quantization_peak_reserved_gb": 8.485,
|
| 48 |
+
"base_transformer_tensor_storage_gb": 16.417,
|
| 49 |
+
"quant_transformer_tensor_storage_gb": 4.301,
|
| 50 |
+
"transformer_storage_reduction_percent": 73.8,
|
| 51 |
+
"base_transformer_repo_files_gb": 16.417,
|
| 52 |
+
"quant_transformer_repo_files_gb": 4.302,
|
| 53 |
+
"base_transformer_dtypes": {
|
| 54 |
+
"FLOAT32": 16416900608
|
| 55 |
+
},
|
| 56 |
+
"quant_transformer_dtypes": {
|
| 57 |
+
"BFLOAT16": 2942501632,
|
| 58 |
+
"UINT8": 1358954496
|
| 59 |
+
},
|
| 60 |
+
"base_transformer_tensors": 1264,
|
| 61 |
+
"quant_transformer_tensors": 2224
|
| 62 |
+
}
|
text_encoder/config.json
ADDED
|
@@ -0,0 +1,78 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"architectures": [
|
| 3 |
+
"GptOssForCausalLM"
|
| 4 |
+
],
|
| 5 |
+
"attention_bias": true,
|
| 6 |
+
"attention_dropout": 0.0,
|
| 7 |
+
"bos_token_id": null,
|
| 8 |
+
"dtype": "bfloat16",
|
| 9 |
+
"eos_token_id": 200002,
|
| 10 |
+
"experts_per_token": 4,
|
| 11 |
+
"head_dim": 64,
|
| 12 |
+
"hidden_act": "silu",
|
| 13 |
+
"hidden_size": 2880,
|
| 14 |
+
"initial_context_length": 4096,
|
| 15 |
+
"initializer_range": 0.02,
|
| 16 |
+
"intermediate_size": 2880,
|
| 17 |
+
"layer_types": [
|
| 18 |
+
"sliding_attention",
|
| 19 |
+
"full_attention",
|
| 20 |
+
"sliding_attention",
|
| 21 |
+
"full_attention",
|
| 22 |
+
"sliding_attention",
|
| 23 |
+
"full_attention",
|
| 24 |
+
"sliding_attention",
|
| 25 |
+
"full_attention",
|
| 26 |
+
"sliding_attention",
|
| 27 |
+
"full_attention",
|
| 28 |
+
"sliding_attention",
|
| 29 |
+
"full_attention",
|
| 30 |
+
"sliding_attention",
|
| 31 |
+
"full_attention",
|
| 32 |
+
"sliding_attention",
|
| 33 |
+
"full_attention",
|
| 34 |
+
"sliding_attention",
|
| 35 |
+
"full_attention",
|
| 36 |
+
"sliding_attention",
|
| 37 |
+
"full_attention",
|
| 38 |
+
"sliding_attention",
|
| 39 |
+
"full_attention",
|
| 40 |
+
"sliding_attention",
|
| 41 |
+
"full_attention"
|
| 42 |
+
],
|
| 43 |
+
"max_position_embeddings": 131072,
|
| 44 |
+
"model_type": "gpt_oss",
|
| 45 |
+
"num_attention_heads": 64,
|
| 46 |
+
"num_experts_per_tok": 4,
|
| 47 |
+
"num_hidden_layers": 24,
|
| 48 |
+
"num_key_value_heads": 8,
|
| 49 |
+
"num_local_experts": 32,
|
| 50 |
+
"output_router_logits": false,
|
| 51 |
+
"pad_token_id": 199999,
|
| 52 |
+
"quantization_config": {
|
| 53 |
+
"modules_to_not_convert": [
|
| 54 |
+
"model.layers.*.self_attn",
|
| 55 |
+
"model.layers.*.mlp.router",
|
| 56 |
+
"model.embed_tokens",
|
| 57 |
+
"lm_head"
|
| 58 |
+
],
|
| 59 |
+
"quant_method": "mxfp4"
|
| 60 |
+
},
|
| 61 |
+
"rms_norm_eps": 1e-05,
|
| 62 |
+
"rope_parameters": {
|
| 63 |
+
"beta_fast": 32.0,
|
| 64 |
+
"beta_slow": 1.0,
|
| 65 |
+
"factor": 32.0,
|
| 66 |
+
"original_max_position_embeddings": 4096,
|
| 67 |
+
"rope_theta": 150000,
|
| 68 |
+
"rope_type": "yarn",
|
| 69 |
+
"truncate": false
|
| 70 |
+
},
|
| 71 |
+
"router_aux_loss_coef": 0.9,
|
| 72 |
+
"sliding_window": 128,
|
| 73 |
+
"swiglu_limit": 7.0,
|
| 74 |
+
"tie_word_embeddings": false,
|
| 75 |
+
"transformers_version": "5.8.0",
|
| 76 |
+
"use_cache": true,
|
| 77 |
+
"vocab_size": 201088
|
| 78 |
+
}
|
text_encoder/generation_config.json
ADDED
|
@@ -0,0 +1,11 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"bos_token_id": 199998,
|
| 3 |
+
"do_sample": true,
|
| 4 |
+
"eos_token_id": [
|
| 5 |
+
200002,
|
| 6 |
+
199999,
|
| 7 |
+
200012
|
| 8 |
+
],
|
| 9 |
+
"pad_token_id": 199999,
|
| 10 |
+
"transformers_version": "5.8.0"
|
| 11 |
+
}
|
text_encoder/model-00001-of-00003.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ec5a256b3cdeea38db22f0988f9f156554fc9753f95857f5ecaea56048f43bd7
|
| 3 |
+
size 4845744456
|
text_encoder/model-00002-of-00003.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:914d5c38cd798a3393e348942e29c38497851b38c09df529ee162f4bd1f13b64
|
| 3 |
+
size 4774186632
|
text_encoder/model-00003-of-00003.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:931a994c03fc5554d6e343d95a991ae162502459eae6035cd9cc5ea773b598e3
|
| 3 |
+
size 4154656824
|
text_encoder/model.safetensors.index.json
ADDED
|
@@ -0,0 +1,467 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"metadata": {
|
| 3 |
+
"total_parameters": 1804459584,
|
| 4 |
+
"total_size": 13774535808
|
| 5 |
+
},
|
| 6 |
+
"weight_map": {
|
| 7 |
+
"lm_head.weight": "model-00001-of-00003.safetensors",
|
| 8 |
+
"model.embed_tokens.weight": "model-00001-of-00003.safetensors",
|
| 9 |
+
"model.layers.0.input_layernorm.weight": "model-00001-of-00003.safetensors",
|
| 10 |
+
"model.layers.0.mlp.experts.down_proj_bias": "model-00001-of-00003.safetensors",
|
| 11 |
+
"model.layers.0.mlp.experts.down_proj_blocks": "model-00001-of-00003.safetensors",
|
| 12 |
+
"model.layers.0.mlp.experts.down_proj_scales": "model-00001-of-00003.safetensors",
|
| 13 |
+
"model.layers.0.mlp.experts.gate_up_proj_bias": "model-00001-of-00003.safetensors",
|
| 14 |
+
"model.layers.0.mlp.experts.gate_up_proj_blocks": "model-00001-of-00003.safetensors",
|
| 15 |
+
"model.layers.0.mlp.experts.gate_up_proj_scales": "model-00001-of-00003.safetensors",
|
| 16 |
+
"model.layers.0.mlp.router.bias": "model-00001-of-00003.safetensors",
|
| 17 |
+
"model.layers.0.mlp.router.weight": "model-00001-of-00003.safetensors",
|
| 18 |
+
"model.layers.0.post_attention_layernorm.weight": "model-00001-of-00003.safetensors",
|
| 19 |
+
"model.layers.0.self_attn.k_proj.bias": "model-00001-of-00003.safetensors",
|
| 20 |
+
"model.layers.0.self_attn.k_proj.weight": "model-00001-of-00003.safetensors",
|
| 21 |
+
"model.layers.0.self_attn.o_proj.bias": "model-00001-of-00003.safetensors",
|
| 22 |
+
"model.layers.0.self_attn.o_proj.weight": "model-00001-of-00003.safetensors",
|
| 23 |
+
"model.layers.0.self_attn.q_proj.bias": "model-00001-of-00003.safetensors",
|
| 24 |
+
"model.layers.0.self_attn.q_proj.weight": "model-00001-of-00003.safetensors",
|
| 25 |
+
"model.layers.0.self_attn.sinks": "model-00001-of-00003.safetensors",
|
| 26 |
+
"model.layers.0.self_attn.v_proj.bias": "model-00001-of-00003.safetensors",
|
| 27 |
+
"model.layers.0.self_attn.v_proj.weight": "model-00001-of-00003.safetensors",
|
| 28 |
+
"model.layers.1.input_layernorm.weight": "model-00001-of-00003.safetensors",
|
| 29 |
+
"model.layers.1.mlp.experts.down_proj_bias": "model-00001-of-00003.safetensors",
|
| 30 |
+
"model.layers.1.mlp.experts.down_proj_blocks": "model-00001-of-00003.safetensors",
|
| 31 |
+
"model.layers.1.mlp.experts.down_proj_scales": "model-00001-of-00003.safetensors",
|
| 32 |
+
"model.layers.1.mlp.experts.gate_up_proj_bias": "model-00001-of-00003.safetensors",
|
| 33 |
+
"model.layers.1.mlp.experts.gate_up_proj_blocks": "model-00001-of-00003.safetensors",
|
| 34 |
+
"model.layers.1.mlp.experts.gate_up_proj_scales": "model-00001-of-00003.safetensors",
|
| 35 |
+
"model.layers.1.mlp.router.bias": "model-00001-of-00003.safetensors",
|
| 36 |
+
"model.layers.1.mlp.router.weight": "model-00001-of-00003.safetensors",
|
| 37 |
+
"model.layers.1.post_attention_layernorm.weight": "model-00001-of-00003.safetensors",
|
| 38 |
+
"model.layers.1.self_attn.k_proj.bias": "model-00001-of-00003.safetensors",
|
| 39 |
+
"model.layers.1.self_attn.k_proj.weight": "model-00001-of-00003.safetensors",
|
| 40 |
+
"model.layers.1.self_attn.o_proj.bias": "model-00001-of-00003.safetensors",
|
| 41 |
+
"model.layers.1.self_attn.o_proj.weight": "model-00001-of-00003.safetensors",
|
| 42 |
+
"model.layers.1.self_attn.q_proj.bias": "model-00001-of-00003.safetensors",
|
| 43 |
+
"model.layers.1.self_attn.q_proj.weight": "model-00001-of-00003.safetensors",
|
| 44 |
+
"model.layers.1.self_attn.sinks": "model-00001-of-00003.safetensors",
|
| 45 |
+
"model.layers.1.self_attn.v_proj.bias": "model-00001-of-00003.safetensors",
|
| 46 |
+
"model.layers.1.self_attn.v_proj.weight": "model-00001-of-00003.safetensors",
|
| 47 |
+
"model.layers.10.input_layernorm.weight": "model-00002-of-00003.safetensors",
|
| 48 |
+
"model.layers.10.mlp.experts.down_proj_bias": "model-00002-of-00003.safetensors",
|
| 49 |
+
"model.layers.10.mlp.experts.down_proj_blocks": "model-00002-of-00003.safetensors",
|
| 50 |
+
"model.layers.10.mlp.experts.down_proj_scales": "model-00002-of-00003.safetensors",
|
| 51 |
+
"model.layers.10.mlp.experts.gate_up_proj_bias": "model-00002-of-00003.safetensors",
|
| 52 |
+
"model.layers.10.mlp.experts.gate_up_proj_blocks": "model-00002-of-00003.safetensors",
|
| 53 |
+
"model.layers.10.mlp.experts.gate_up_proj_scales": "model-00002-of-00003.safetensors",
|
| 54 |
+
"model.layers.10.mlp.router.bias": "model-00002-of-00003.safetensors",
|
| 55 |
+
"model.layers.10.mlp.router.weight": "model-00002-of-00003.safetensors",
|
| 56 |
+
"model.layers.10.post_attention_layernorm.weight": "model-00002-of-00003.safetensors",
|
| 57 |
+
"model.layers.10.self_attn.k_proj.bias": "model-00002-of-00003.safetensors",
|
| 58 |
+
"model.layers.10.self_attn.k_proj.weight": "model-00002-of-00003.safetensors",
|
| 59 |
+
"model.layers.10.self_attn.o_proj.bias": "model-00002-of-00003.safetensors",
|
| 60 |
+
"model.layers.10.self_attn.o_proj.weight": "model-00002-of-00003.safetensors",
|
| 61 |
+
"model.layers.10.self_attn.q_proj.bias": "model-00002-of-00003.safetensors",
|
| 62 |
+
"model.layers.10.self_attn.q_proj.weight": "model-00002-of-00003.safetensors",
|
| 63 |
+
"model.layers.10.self_attn.sinks": "model-00002-of-00003.safetensors",
|
| 64 |
+
"model.layers.10.self_attn.v_proj.bias": "model-00002-of-00003.safetensors",
|
| 65 |
+
"model.layers.10.self_attn.v_proj.weight": "model-00002-of-00003.safetensors",
|
| 66 |
+
"model.layers.11.input_layernorm.weight": "model-00002-of-00003.safetensors",
|
| 67 |
+
"model.layers.11.mlp.experts.down_proj_bias": "model-00002-of-00003.safetensors",
|
| 68 |
+
"model.layers.11.mlp.experts.down_proj_blocks": "model-00002-of-00003.safetensors",
|
| 69 |
+
"model.layers.11.mlp.experts.down_proj_scales": "model-00002-of-00003.safetensors",
|
| 70 |
+
"model.layers.11.mlp.experts.gate_up_proj_bias": "model-00002-of-00003.safetensors",
|
| 71 |
+
"model.layers.11.mlp.experts.gate_up_proj_blocks": "model-00002-of-00003.safetensors",
|
| 72 |
+
"model.layers.11.mlp.experts.gate_up_proj_scales": "model-00002-of-00003.safetensors",
|
| 73 |
+
"model.layers.11.mlp.router.bias": "model-00002-of-00003.safetensors",
|
| 74 |
+
"model.layers.11.mlp.router.weight": "model-00002-of-00003.safetensors",
|
| 75 |
+
"model.layers.11.post_attention_layernorm.weight": "model-00002-of-00003.safetensors",
|
| 76 |
+
"model.layers.11.self_attn.k_proj.bias": "model-00002-of-00003.safetensors",
|
| 77 |
+
"model.layers.11.self_attn.k_proj.weight": "model-00002-of-00003.safetensors",
|
| 78 |
+
"model.layers.11.self_attn.o_proj.bias": "model-00002-of-00003.safetensors",
|
| 79 |
+
"model.layers.11.self_attn.o_proj.weight": "model-00002-of-00003.safetensors",
|
| 80 |
+
"model.layers.11.self_attn.q_proj.bias": "model-00002-of-00003.safetensors",
|
| 81 |
+
"model.layers.11.self_attn.q_proj.weight": "model-00002-of-00003.safetensors",
|
| 82 |
+
"model.layers.11.self_attn.sinks": "model-00002-of-00003.safetensors",
|
| 83 |
+
"model.layers.11.self_attn.v_proj.bias": "model-00002-of-00003.safetensors",
|
| 84 |
+
"model.layers.11.self_attn.v_proj.weight": "model-00002-of-00003.safetensors",
|
| 85 |
+
"model.layers.12.input_layernorm.weight": "model-00002-of-00003.safetensors",
|
| 86 |
+
"model.layers.12.mlp.experts.down_proj_bias": "model-00002-of-00003.safetensors",
|
| 87 |
+
"model.layers.12.mlp.experts.down_proj_blocks": "model-00002-of-00003.safetensors",
|
| 88 |
+
"model.layers.12.mlp.experts.down_proj_scales": "model-00002-of-00003.safetensors",
|
| 89 |
+
"model.layers.12.mlp.experts.gate_up_proj_bias": "model-00002-of-00003.safetensors",
|
| 90 |
+
"model.layers.12.mlp.experts.gate_up_proj_blocks": "model-00002-of-00003.safetensors",
|
| 91 |
+
"model.layers.12.mlp.experts.gate_up_proj_scales": "model-00002-of-00003.safetensors",
|
| 92 |
+
"model.layers.12.mlp.router.bias": "model-00002-of-00003.safetensors",
|
| 93 |
+
"model.layers.12.mlp.router.weight": "model-00002-of-00003.safetensors",
|
| 94 |
+
"model.layers.12.post_attention_layernorm.weight": "model-00002-of-00003.safetensors",
|
| 95 |
+
"model.layers.12.self_attn.k_proj.bias": "model-00002-of-00003.safetensors",
|
| 96 |
+
"model.layers.12.self_attn.k_proj.weight": "model-00002-of-00003.safetensors",
|
| 97 |
+
"model.layers.12.self_attn.o_proj.bias": "model-00002-of-00003.safetensors",
|
| 98 |
+
"model.layers.12.self_attn.o_proj.weight": "model-00002-of-00003.safetensors",
|
| 99 |
+
"model.layers.12.self_attn.q_proj.bias": "model-00002-of-00003.safetensors",
|
| 100 |
+
"model.layers.12.self_attn.q_proj.weight": "model-00002-of-00003.safetensors",
|
| 101 |
+
"model.layers.12.self_attn.sinks": "model-00002-of-00003.safetensors",
|
| 102 |
+
"model.layers.12.self_attn.v_proj.bias": "model-00002-of-00003.safetensors",
|
| 103 |
+
"model.layers.12.self_attn.v_proj.weight": "model-00002-of-00003.safetensors",
|
| 104 |
+
"model.layers.13.input_layernorm.weight": "model-00002-of-00003.safetensors",
|
| 105 |
+
"model.layers.13.mlp.experts.down_proj_bias": "model-00002-of-00003.safetensors",
|
| 106 |
+
"model.layers.13.mlp.experts.down_proj_blocks": "model-00002-of-00003.safetensors",
|
| 107 |
+
"model.layers.13.mlp.experts.down_proj_scales": "model-00002-of-00003.safetensors",
|
| 108 |
+
"model.layers.13.mlp.experts.gate_up_proj_bias": "model-00002-of-00003.safetensors",
|
| 109 |
+
"model.layers.13.mlp.experts.gate_up_proj_blocks": "model-00002-of-00003.safetensors",
|
| 110 |
+
"model.layers.13.mlp.experts.gate_up_proj_scales": "model-00002-of-00003.safetensors",
|
| 111 |
+
"model.layers.13.mlp.router.bias": "model-00002-of-00003.safetensors",
|
| 112 |
+
"model.layers.13.mlp.router.weight": "model-00002-of-00003.safetensors",
|
| 113 |
+
"model.layers.13.post_attention_layernorm.weight": "model-00002-of-00003.safetensors",
|
| 114 |
+
"model.layers.13.self_attn.k_proj.bias": "model-00002-of-00003.safetensors",
|
| 115 |
+
"model.layers.13.self_attn.k_proj.weight": "model-00002-of-00003.safetensors",
|
| 116 |
+
"model.layers.13.self_attn.o_proj.bias": "model-00002-of-00003.safetensors",
|
| 117 |
+
"model.layers.13.self_attn.o_proj.weight": "model-00002-of-00003.safetensors",
|
| 118 |
+
"model.layers.13.self_attn.q_proj.bias": "model-00002-of-00003.safetensors",
|
| 119 |
+
"model.layers.13.self_attn.q_proj.weight": "model-00002-of-00003.safetensors",
|
| 120 |
+
"model.layers.13.self_attn.sinks": "model-00002-of-00003.safetensors",
|
| 121 |
+
"model.layers.13.self_attn.v_proj.bias": "model-00002-of-00003.safetensors",
|
| 122 |
+
"model.layers.13.self_attn.v_proj.weight": "model-00002-of-00003.safetensors",
|
| 123 |
+
"model.layers.14.input_layernorm.weight": "model-00002-of-00003.safetensors",
|
| 124 |
+
"model.layers.14.mlp.experts.down_proj_bias": "model-00002-of-00003.safetensors",
|
| 125 |
+
"model.layers.14.mlp.experts.down_proj_blocks": "model-00002-of-00003.safetensors",
|
| 126 |
+
"model.layers.14.mlp.experts.down_proj_scales": "model-00002-of-00003.safetensors",
|
| 127 |
+
"model.layers.14.mlp.experts.gate_up_proj_bias": "model-00002-of-00003.safetensors",
|
| 128 |
+
"model.layers.14.mlp.experts.gate_up_proj_blocks": "model-00002-of-00003.safetensors",
|
| 129 |
+
"model.layers.14.mlp.experts.gate_up_proj_scales": "model-00002-of-00003.safetensors",
|
| 130 |
+
"model.layers.14.mlp.router.bias": "model-00002-of-00003.safetensors",
|
| 131 |
+
"model.layers.14.mlp.router.weight": "model-00002-of-00003.safetensors",
|
| 132 |
+
"model.layers.14.post_attention_layernorm.weight": "model-00002-of-00003.safetensors",
|
| 133 |
+
"model.layers.14.self_attn.k_proj.bias": "model-00002-of-00003.safetensors",
|
| 134 |
+
"model.layers.14.self_attn.k_proj.weight": "model-00002-of-00003.safetensors",
|
| 135 |
+
"model.layers.14.self_attn.o_proj.bias": "model-00002-of-00003.safetensors",
|
| 136 |
+
"model.layers.14.self_attn.o_proj.weight": "model-00002-of-00003.safetensors",
|
| 137 |
+
"model.layers.14.self_attn.q_proj.bias": "model-00002-of-00003.safetensors",
|
| 138 |
+
"model.layers.14.self_attn.q_proj.weight": "model-00002-of-00003.safetensors",
|
| 139 |
+
"model.layers.14.self_attn.sinks": "model-00002-of-00003.safetensors",
|
| 140 |
+
"model.layers.14.self_attn.v_proj.bias": "model-00002-of-00003.safetensors",
|
| 141 |
+
"model.layers.14.self_attn.v_proj.weight": "model-00002-of-00003.safetensors",
|
| 142 |
+
"model.layers.15.input_layernorm.weight": "model-00002-of-00003.safetensors",
|
| 143 |
+
"model.layers.15.mlp.experts.down_proj_bias": "model-00002-of-00003.safetensors",
|
| 144 |
+
"model.layers.15.mlp.experts.down_proj_blocks": "model-00002-of-00003.safetensors",
|
| 145 |
+
"model.layers.15.mlp.experts.down_proj_scales": "model-00002-of-00003.safetensors",
|
| 146 |
+
"model.layers.15.mlp.experts.gate_up_proj_bias": "model-00002-of-00003.safetensors",
|
| 147 |
+
"model.layers.15.mlp.experts.gate_up_proj_blocks": "model-00003-of-00003.safetensors",
|
| 148 |
+
"model.layers.15.mlp.experts.gate_up_proj_scales": "model-00003-of-00003.safetensors",
|
| 149 |
+
"model.layers.15.mlp.router.bias": "model-00003-of-00003.safetensors",
|
| 150 |
+
"model.layers.15.mlp.router.weight": "model-00003-of-00003.safetensors",
|
| 151 |
+
"model.layers.15.post_attention_layernorm.weight": "model-00003-of-00003.safetensors",
|
| 152 |
+
"model.layers.15.self_attn.k_proj.bias": "model-00003-of-00003.safetensors",
|
| 153 |
+
"model.layers.15.self_attn.k_proj.weight": "model-00003-of-00003.safetensors",
|
| 154 |
+
"model.layers.15.self_attn.o_proj.bias": "model-00003-of-00003.safetensors",
|
| 155 |
+
"model.layers.15.self_attn.o_proj.weight": "model-00003-of-00003.safetensors",
|
| 156 |
+
"model.layers.15.self_attn.q_proj.bias": "model-00003-of-00003.safetensors",
|
| 157 |
+
"model.layers.15.self_attn.q_proj.weight": "model-00003-of-00003.safetensors",
|
| 158 |
+
"model.layers.15.self_attn.sinks": "model-00003-of-00003.safetensors",
|
| 159 |
+
"model.layers.15.self_attn.v_proj.bias": "model-00003-of-00003.safetensors",
|
| 160 |
+
"model.layers.15.self_attn.v_proj.weight": "model-00003-of-00003.safetensors",
|
| 161 |
+
"model.layers.16.input_layernorm.weight": "model-00003-of-00003.safetensors",
|
| 162 |
+
"model.layers.16.mlp.experts.down_proj_bias": "model-00003-of-00003.safetensors",
|
| 163 |
+
"model.layers.16.mlp.experts.down_proj_blocks": "model-00003-of-00003.safetensors",
|
| 164 |
+
"model.layers.16.mlp.experts.down_proj_scales": "model-00003-of-00003.safetensors",
|
| 165 |
+
"model.layers.16.mlp.experts.gate_up_proj_bias": "model-00003-of-00003.safetensors",
|
| 166 |
+
"model.layers.16.mlp.experts.gate_up_proj_blocks": "model-00003-of-00003.safetensors",
|
| 167 |
+
"model.layers.16.mlp.experts.gate_up_proj_scales": "model-00003-of-00003.safetensors",
|
| 168 |
+
"model.layers.16.mlp.router.bias": "model-00003-of-00003.safetensors",
|
| 169 |
+
"model.layers.16.mlp.router.weight": "model-00003-of-00003.safetensors",
|
| 170 |
+
"model.layers.16.post_attention_layernorm.weight": "model-00003-of-00003.safetensors",
|
| 171 |
+
"model.layers.16.self_attn.k_proj.bias": "model-00003-of-00003.safetensors",
|
| 172 |
+
"model.layers.16.self_attn.k_proj.weight": "model-00003-of-00003.safetensors",
|
| 173 |
+
"model.layers.16.self_attn.o_proj.bias": "model-00003-of-00003.safetensors",
|
| 174 |
+
"model.layers.16.self_attn.o_proj.weight": "model-00003-of-00003.safetensors",
|
| 175 |
+
"model.layers.16.self_attn.q_proj.bias": "model-00003-of-00003.safetensors",
|
| 176 |
+
"model.layers.16.self_attn.q_proj.weight": "model-00003-of-00003.safetensors",
|
| 177 |
+
"model.layers.16.self_attn.sinks": "model-00003-of-00003.safetensors",
|
| 178 |
+
"model.layers.16.self_attn.v_proj.bias": "model-00003-of-00003.safetensors",
|
| 179 |
+
"model.layers.16.self_attn.v_proj.weight": "model-00003-of-00003.safetensors",
|
| 180 |
+
"model.layers.17.input_layernorm.weight": "model-00003-of-00003.safetensors",
|
| 181 |
+
"model.layers.17.mlp.experts.down_proj_bias": "model-00003-of-00003.safetensors",
|
| 182 |
+
"model.layers.17.mlp.experts.down_proj_blocks": "model-00003-of-00003.safetensors",
|
| 183 |
+
"model.layers.17.mlp.experts.down_proj_scales": "model-00003-of-00003.safetensors",
|
| 184 |
+
"model.layers.17.mlp.experts.gate_up_proj_bias": "model-00003-of-00003.safetensors",
|
| 185 |
+
"model.layers.17.mlp.experts.gate_up_proj_blocks": "model-00003-of-00003.safetensors",
|
| 186 |
+
"model.layers.17.mlp.experts.gate_up_proj_scales": "model-00003-of-00003.safetensors",
|
| 187 |
+
"model.layers.17.mlp.router.bias": "model-00003-of-00003.safetensors",
|
| 188 |
+
"model.layers.17.mlp.router.weight": "model-00003-of-00003.safetensors",
|
| 189 |
+
"model.layers.17.post_attention_layernorm.weight": "model-00003-of-00003.safetensors",
|
| 190 |
+
"model.layers.17.self_attn.k_proj.bias": "model-00003-of-00003.safetensors",
|
| 191 |
+
"model.layers.17.self_attn.k_proj.weight": "model-00003-of-00003.safetensors",
|
| 192 |
+
"model.layers.17.self_attn.o_proj.bias": "model-00003-of-00003.safetensors",
|
| 193 |
+
"model.layers.17.self_attn.o_proj.weight": "model-00003-of-00003.safetensors",
|
| 194 |
+
"model.layers.17.self_attn.q_proj.bias": "model-00003-of-00003.safetensors",
|
| 195 |
+
"model.layers.17.self_attn.q_proj.weight": "model-00003-of-00003.safetensors",
|
| 196 |
+
"model.layers.17.self_attn.sinks": "model-00003-of-00003.safetensors",
|
| 197 |
+
"model.layers.17.self_attn.v_proj.bias": "model-00003-of-00003.safetensors",
|
| 198 |
+
"model.layers.17.self_attn.v_proj.weight": "model-00003-of-00003.safetensors",
|
| 199 |
+
"model.layers.18.input_layernorm.weight": "model-00003-of-00003.safetensors",
|
| 200 |
+
"model.layers.18.mlp.experts.down_proj_bias": "model-00003-of-00003.safetensors",
|
| 201 |
+
"model.layers.18.mlp.experts.down_proj_blocks": "model-00003-of-00003.safetensors",
|
| 202 |
+
"model.layers.18.mlp.experts.down_proj_scales": "model-00003-of-00003.safetensors",
|
| 203 |
+
"model.layers.18.mlp.experts.gate_up_proj_bias": "model-00003-of-00003.safetensors",
|
| 204 |
+
"model.layers.18.mlp.experts.gate_up_proj_blocks": "model-00003-of-00003.safetensors",
|
| 205 |
+
"model.layers.18.mlp.experts.gate_up_proj_scales": "model-00003-of-00003.safetensors",
|
| 206 |
+
"model.layers.18.mlp.router.bias": "model-00003-of-00003.safetensors",
|
| 207 |
+
"model.layers.18.mlp.router.weight": "model-00003-of-00003.safetensors",
|
| 208 |
+
"model.layers.18.post_attention_layernorm.weight": "model-00003-of-00003.safetensors",
|
| 209 |
+
"model.layers.18.self_attn.k_proj.bias": "model-00003-of-00003.safetensors",
|
| 210 |
+
"model.layers.18.self_attn.k_proj.weight": "model-00003-of-00003.safetensors",
|
| 211 |
+
"model.layers.18.self_attn.o_proj.bias": "model-00003-of-00003.safetensors",
|
| 212 |
+
"model.layers.18.self_attn.o_proj.weight": "model-00003-of-00003.safetensors",
|
| 213 |
+
"model.layers.18.self_attn.q_proj.bias": "model-00003-of-00003.safetensors",
|
| 214 |
+
"model.layers.18.self_attn.q_proj.weight": "model-00003-of-00003.safetensors",
|
| 215 |
+
"model.layers.18.self_attn.sinks": "model-00003-of-00003.safetensors",
|
| 216 |
+
"model.layers.18.self_attn.v_proj.bias": "model-00003-of-00003.safetensors",
|
| 217 |
+
"model.layers.18.self_attn.v_proj.weight": "model-00003-of-00003.safetensors",
|
| 218 |
+
"model.layers.19.input_layernorm.weight": "model-00003-of-00003.safetensors",
|
| 219 |
+
"model.layers.19.mlp.experts.down_proj_bias": "model-00003-of-00003.safetensors",
|
| 220 |
+
"model.layers.19.mlp.experts.down_proj_blocks": "model-00003-of-00003.safetensors",
|
| 221 |
+
"model.layers.19.mlp.experts.down_proj_scales": "model-00003-of-00003.safetensors",
|
| 222 |
+
"model.layers.19.mlp.experts.gate_up_proj_bias": "model-00003-of-00003.safetensors",
|
| 223 |
+
"model.layers.19.mlp.experts.gate_up_proj_blocks": "model-00003-of-00003.safetensors",
|
| 224 |
+
"model.layers.19.mlp.experts.gate_up_proj_scales": "model-00003-of-00003.safetensors",
|
| 225 |
+
"model.layers.19.mlp.router.bias": "model-00003-of-00003.safetensors",
|
| 226 |
+
"model.layers.19.mlp.router.weight": "model-00003-of-00003.safetensors",
|
| 227 |
+
"model.layers.19.post_attention_layernorm.weight": "model-00003-of-00003.safetensors",
|
| 228 |
+
"model.layers.19.self_attn.k_proj.bias": "model-00003-of-00003.safetensors",
|
| 229 |
+
"model.layers.19.self_attn.k_proj.weight": "model-00003-of-00003.safetensors",
|
| 230 |
+
"model.layers.19.self_attn.o_proj.bias": "model-00003-of-00003.safetensors",
|
| 231 |
+
"model.layers.19.self_attn.o_proj.weight": "model-00003-of-00003.safetensors",
|
| 232 |
+
"model.layers.19.self_attn.q_proj.bias": "model-00003-of-00003.safetensors",
|
| 233 |
+
"model.layers.19.self_attn.q_proj.weight": "model-00003-of-00003.safetensors",
|
| 234 |
+
"model.layers.19.self_attn.sinks": "model-00003-of-00003.safetensors",
|
| 235 |
+
"model.layers.19.self_attn.v_proj.bias": "model-00003-of-00003.safetensors",
|
| 236 |
+
"model.layers.19.self_attn.v_proj.weight": "model-00003-of-00003.safetensors",
|
| 237 |
+
"model.layers.2.input_layernorm.weight": "model-00001-of-00003.safetensors",
|
| 238 |
+
"model.layers.2.mlp.experts.down_proj_bias": "model-00001-of-00003.safetensors",
|
| 239 |
+
"model.layers.2.mlp.experts.down_proj_blocks": "model-00001-of-00003.safetensors",
|
| 240 |
+
"model.layers.2.mlp.experts.down_proj_scales": "model-00001-of-00003.safetensors",
|
| 241 |
+
"model.layers.2.mlp.experts.gate_up_proj_bias": "model-00001-of-00003.safetensors",
|
| 242 |
+
"model.layers.2.mlp.experts.gate_up_proj_blocks": "model-00001-of-00003.safetensors",
|
| 243 |
+
"model.layers.2.mlp.experts.gate_up_proj_scales": "model-00001-of-00003.safetensors",
|
| 244 |
+
"model.layers.2.mlp.router.bias": "model-00001-of-00003.safetensors",
|
| 245 |
+
"model.layers.2.mlp.router.weight": "model-00001-of-00003.safetensors",
|
| 246 |
+
"model.layers.2.post_attention_layernorm.weight": "model-00001-of-00003.safetensors",
|
| 247 |
+
"model.layers.2.self_attn.k_proj.bias": "model-00001-of-00003.safetensors",
|
| 248 |
+
"model.layers.2.self_attn.k_proj.weight": "model-00001-of-00003.safetensors",
|
| 249 |
+
"model.layers.2.self_attn.o_proj.bias": "model-00001-of-00003.safetensors",
|
| 250 |
+
"model.layers.2.self_attn.o_proj.weight": "model-00001-of-00003.safetensors",
|
| 251 |
+
"model.layers.2.self_attn.q_proj.bias": "model-00001-of-00003.safetensors",
|
| 252 |
+
"model.layers.2.self_attn.q_proj.weight": "model-00001-of-00003.safetensors",
|
| 253 |
+
"model.layers.2.self_attn.sinks": "model-00001-of-00003.safetensors",
|
| 254 |
+
"model.layers.2.self_attn.v_proj.bias": "model-00001-of-00003.safetensors",
|
| 255 |
+
"model.layers.2.self_attn.v_proj.weight": "model-00001-of-00003.safetensors",
|
| 256 |
+
"model.layers.20.input_layernorm.weight": "model-00003-of-00003.safetensors",
|
| 257 |
+
"model.layers.20.mlp.experts.down_proj_bias": "model-00003-of-00003.safetensors",
|
| 258 |
+
"model.layers.20.mlp.experts.down_proj_blocks": "model-00003-of-00003.safetensors",
|
| 259 |
+
"model.layers.20.mlp.experts.down_proj_scales": "model-00003-of-00003.safetensors",
|
| 260 |
+
"model.layers.20.mlp.experts.gate_up_proj_bias": "model-00003-of-00003.safetensors",
|
| 261 |
+
"model.layers.20.mlp.experts.gate_up_proj_blocks": "model-00003-of-00003.safetensors",
|
| 262 |
+
"model.layers.20.mlp.experts.gate_up_proj_scales": "model-00003-of-00003.safetensors",
|
| 263 |
+
"model.layers.20.mlp.router.bias": "model-00003-of-00003.safetensors",
|
| 264 |
+
"model.layers.20.mlp.router.weight": "model-00003-of-00003.safetensors",
|
| 265 |
+
"model.layers.20.post_attention_layernorm.weight": "model-00003-of-00003.safetensors",
|
| 266 |
+
"model.layers.20.self_attn.k_proj.bias": "model-00003-of-00003.safetensors",
|
| 267 |
+
"model.layers.20.self_attn.k_proj.weight": "model-00003-of-00003.safetensors",
|
| 268 |
+
"model.layers.20.self_attn.o_proj.bias": "model-00003-of-00003.safetensors",
|
| 269 |
+
"model.layers.20.self_attn.o_proj.weight": "model-00003-of-00003.safetensors",
|
| 270 |
+
"model.layers.20.self_attn.q_proj.bias": "model-00003-of-00003.safetensors",
|
| 271 |
+
"model.layers.20.self_attn.q_proj.weight": "model-00003-of-00003.safetensors",
|
| 272 |
+
"model.layers.20.self_attn.sinks": "model-00003-of-00003.safetensors",
|
| 273 |
+
"model.layers.20.self_attn.v_proj.bias": "model-00003-of-00003.safetensors",
|
| 274 |
+
"model.layers.20.self_attn.v_proj.weight": "model-00003-of-00003.safetensors",
|
| 275 |
+
"model.layers.21.input_layernorm.weight": "model-00003-of-00003.safetensors",
|
| 276 |
+
"model.layers.21.mlp.experts.down_proj_bias": "model-00003-of-00003.safetensors",
|
| 277 |
+
"model.layers.21.mlp.experts.down_proj_blocks": "model-00003-of-00003.safetensors",
|
| 278 |
+
"model.layers.21.mlp.experts.down_proj_scales": "model-00003-of-00003.safetensors",
|
| 279 |
+
"model.layers.21.mlp.experts.gate_up_proj_bias": "model-00003-of-00003.safetensors",
|
| 280 |
+
"model.layers.21.mlp.experts.gate_up_proj_blocks": "model-00003-of-00003.safetensors",
|
| 281 |
+
"model.layers.21.mlp.experts.gate_up_proj_scales": "model-00003-of-00003.safetensors",
|
| 282 |
+
"model.layers.21.mlp.router.bias": "model-00003-of-00003.safetensors",
|
| 283 |
+
"model.layers.21.mlp.router.weight": "model-00003-of-00003.safetensors",
|
| 284 |
+
"model.layers.21.post_attention_layernorm.weight": "model-00003-of-00003.safetensors",
|
| 285 |
+
"model.layers.21.self_attn.k_proj.bias": "model-00003-of-00003.safetensors",
|
| 286 |
+
"model.layers.21.self_attn.k_proj.weight": "model-00003-of-00003.safetensors",
|
| 287 |
+
"model.layers.21.self_attn.o_proj.bias": "model-00003-of-00003.safetensors",
|
| 288 |
+
"model.layers.21.self_attn.o_proj.weight": "model-00003-of-00003.safetensors",
|
| 289 |
+
"model.layers.21.self_attn.q_proj.bias": "model-00003-of-00003.safetensors",
|
| 290 |
+
"model.layers.21.self_attn.q_proj.weight": "model-00003-of-00003.safetensors",
|
| 291 |
+
"model.layers.21.self_attn.sinks": "model-00003-of-00003.safetensors",
|
| 292 |
+
"model.layers.21.self_attn.v_proj.bias": "model-00003-of-00003.safetensors",
|
| 293 |
+
"model.layers.21.self_attn.v_proj.weight": "model-00003-of-00003.safetensors",
|
| 294 |
+
"model.layers.22.input_layernorm.weight": "model-00003-of-00003.safetensors",
|
| 295 |
+
"model.layers.22.mlp.experts.down_proj_bias": "model-00003-of-00003.safetensors",
|
| 296 |
+
"model.layers.22.mlp.experts.down_proj_blocks": "model-00003-of-00003.safetensors",
|
| 297 |
+
"model.layers.22.mlp.experts.down_proj_scales": "model-00003-of-00003.safetensors",
|
| 298 |
+
"model.layers.22.mlp.experts.gate_up_proj_bias": "model-00003-of-00003.safetensors",
|
| 299 |
+
"model.layers.22.mlp.experts.gate_up_proj_blocks": "model-00003-of-00003.safetensors",
|
| 300 |
+
"model.layers.22.mlp.experts.gate_up_proj_scales": "model-00003-of-00003.safetensors",
|
| 301 |
+
"model.layers.22.mlp.router.bias": "model-00003-of-00003.safetensors",
|
| 302 |
+
"model.layers.22.mlp.router.weight": "model-00003-of-00003.safetensors",
|
| 303 |
+
"model.layers.22.post_attention_layernorm.weight": "model-00003-of-00003.safetensors",
|
| 304 |
+
"model.layers.22.self_attn.k_proj.bias": "model-00003-of-00003.safetensors",
|
| 305 |
+
"model.layers.22.self_attn.k_proj.weight": "model-00003-of-00003.safetensors",
|
| 306 |
+
"model.layers.22.self_attn.o_proj.bias": "model-00003-of-00003.safetensors",
|
| 307 |
+
"model.layers.22.self_attn.o_proj.weight": "model-00003-of-00003.safetensors",
|
| 308 |
+
"model.layers.22.self_attn.q_proj.bias": "model-00003-of-00003.safetensors",
|
| 309 |
+
"model.layers.22.self_attn.q_proj.weight": "model-00003-of-00003.safetensors",
|
| 310 |
+
"model.layers.22.self_attn.sinks": "model-00003-of-00003.safetensors",
|
| 311 |
+
"model.layers.22.self_attn.v_proj.bias": "model-00003-of-00003.safetensors",
|
| 312 |
+
"model.layers.22.self_attn.v_proj.weight": "model-00003-of-00003.safetensors",
|
| 313 |
+
"model.layers.23.input_layernorm.weight": "model-00003-of-00003.safetensors",
|
| 314 |
+
"model.layers.23.mlp.experts.down_proj_bias": "model-00003-of-00003.safetensors",
|
| 315 |
+
"model.layers.23.mlp.experts.down_proj_blocks": "model-00003-of-00003.safetensors",
|
| 316 |
+
"model.layers.23.mlp.experts.down_proj_scales": "model-00003-of-00003.safetensors",
|
| 317 |
+
"model.layers.23.mlp.experts.gate_up_proj_bias": "model-00003-of-00003.safetensors",
|
| 318 |
+
"model.layers.23.mlp.experts.gate_up_proj_blocks": "model-00003-of-00003.safetensors",
|
| 319 |
+
"model.layers.23.mlp.experts.gate_up_proj_scales": "model-00003-of-00003.safetensors",
|
| 320 |
+
"model.layers.23.mlp.router.bias": "model-00003-of-00003.safetensors",
|
| 321 |
+
"model.layers.23.mlp.router.weight": "model-00003-of-00003.safetensors",
|
| 322 |
+
"model.layers.23.post_attention_layernorm.weight": "model-00003-of-00003.safetensors",
|
| 323 |
+
"model.layers.23.self_attn.k_proj.bias": "model-00003-of-00003.safetensors",
|
| 324 |
+
"model.layers.23.self_attn.k_proj.weight": "model-00003-of-00003.safetensors",
|
| 325 |
+
"model.layers.23.self_attn.o_proj.bias": "model-00003-of-00003.safetensors",
|
| 326 |
+
"model.layers.23.self_attn.o_proj.weight": "model-00003-of-00003.safetensors",
|
| 327 |
+
"model.layers.23.self_attn.q_proj.bias": "model-00003-of-00003.safetensors",
|
| 328 |
+
"model.layers.23.self_attn.q_proj.weight": "model-00003-of-00003.safetensors",
|
| 329 |
+
"model.layers.23.self_attn.sinks": "model-00003-of-00003.safetensors",
|
| 330 |
+
"model.layers.23.self_attn.v_proj.bias": "model-00003-of-00003.safetensors",
|
| 331 |
+
"model.layers.23.self_attn.v_proj.weight": "model-00003-of-00003.safetensors",
|
| 332 |
+
"model.layers.3.input_layernorm.weight": "model-00001-of-00003.safetensors",
|
| 333 |
+
"model.layers.3.mlp.experts.down_proj_bias": "model-00001-of-00003.safetensors",
|
| 334 |
+
"model.layers.3.mlp.experts.down_proj_blocks": "model-00001-of-00003.safetensors",
|
| 335 |
+
"model.layers.3.mlp.experts.down_proj_scales": "model-00001-of-00003.safetensors",
|
| 336 |
+
"model.layers.3.mlp.experts.gate_up_proj_bias": "model-00001-of-00003.safetensors",
|
| 337 |
+
"model.layers.3.mlp.experts.gate_up_proj_blocks": "model-00001-of-00003.safetensors",
|
| 338 |
+
"model.layers.3.mlp.experts.gate_up_proj_scales": "model-00001-of-00003.safetensors",
|
| 339 |
+
"model.layers.3.mlp.router.bias": "model-00001-of-00003.safetensors",
|
| 340 |
+
"model.layers.3.mlp.router.weight": "model-00001-of-00003.safetensors",
|
| 341 |
+
"model.layers.3.post_attention_layernorm.weight": "model-00001-of-00003.safetensors",
|
| 342 |
+
"model.layers.3.self_attn.k_proj.bias": "model-00001-of-00003.safetensors",
|
| 343 |
+
"model.layers.3.self_attn.k_proj.weight": "model-00001-of-00003.safetensors",
|
| 344 |
+
"model.layers.3.self_attn.o_proj.bias": "model-00001-of-00003.safetensors",
|
| 345 |
+
"model.layers.3.self_attn.o_proj.weight": "model-00001-of-00003.safetensors",
|
| 346 |
+
"model.layers.3.self_attn.q_proj.bias": "model-00001-of-00003.safetensors",
|
| 347 |
+
"model.layers.3.self_attn.q_proj.weight": "model-00001-of-00003.safetensors",
|
| 348 |
+
"model.layers.3.self_attn.sinks": "model-00001-of-00003.safetensors",
|
| 349 |
+
"model.layers.3.self_attn.v_proj.bias": "model-00001-of-00003.safetensors",
|
| 350 |
+
"model.layers.3.self_attn.v_proj.weight": "model-00001-of-00003.safetensors",
|
| 351 |
+
"model.layers.4.input_layernorm.weight": "model-00001-of-00003.safetensors",
|
| 352 |
+
"model.layers.4.mlp.experts.down_proj_bias": "model-00001-of-00003.safetensors",
|
| 353 |
+
"model.layers.4.mlp.experts.down_proj_blocks": "model-00001-of-00003.safetensors",
|
| 354 |
+
"model.layers.4.mlp.experts.down_proj_scales": "model-00001-of-00003.safetensors",
|
| 355 |
+
"model.layers.4.mlp.experts.gate_up_proj_bias": "model-00001-of-00003.safetensors",
|
| 356 |
+
"model.layers.4.mlp.experts.gate_up_proj_blocks": "model-00001-of-00003.safetensors",
|
| 357 |
+
"model.layers.4.mlp.experts.gate_up_proj_scales": "model-00001-of-00003.safetensors",
|
| 358 |
+
"model.layers.4.mlp.router.bias": "model-00001-of-00003.safetensors",
|
| 359 |
+
"model.layers.4.mlp.router.weight": "model-00001-of-00003.safetensors",
|
| 360 |
+
"model.layers.4.post_attention_layernorm.weight": "model-00001-of-00003.safetensors",
|
| 361 |
+
"model.layers.4.self_attn.k_proj.bias": "model-00001-of-00003.safetensors",
|
| 362 |
+
"model.layers.4.self_attn.k_proj.weight": "model-00001-of-00003.safetensors",
|
| 363 |
+
"model.layers.4.self_attn.o_proj.bias": "model-00001-of-00003.safetensors",
|
| 364 |
+
"model.layers.4.self_attn.o_proj.weight": "model-00001-of-00003.safetensors",
|
| 365 |
+
"model.layers.4.self_attn.q_proj.bias": "model-00001-of-00003.safetensors",
|
| 366 |
+
"model.layers.4.self_attn.q_proj.weight": "model-00001-of-00003.safetensors",
|
| 367 |
+
"model.layers.4.self_attn.sinks": "model-00001-of-00003.safetensors",
|
| 368 |
+
"model.layers.4.self_attn.v_proj.bias": "model-00001-of-00003.safetensors",
|
| 369 |
+
"model.layers.4.self_attn.v_proj.weight": "model-00001-of-00003.safetensors",
|
| 370 |
+
"model.layers.5.input_layernorm.weight": "model-00001-of-00003.safetensors",
|
| 371 |
+
"model.layers.5.mlp.experts.down_proj_bias": "model-00001-of-00003.safetensors",
|
| 372 |
+
"model.layers.5.mlp.experts.down_proj_blocks": "model-00001-of-00003.safetensors",
|
| 373 |
+
"model.layers.5.mlp.experts.down_proj_scales": "model-00001-of-00003.safetensors",
|
| 374 |
+
"model.layers.5.mlp.experts.gate_up_proj_bias": "model-00001-of-00003.safetensors",
|
| 375 |
+
"model.layers.5.mlp.experts.gate_up_proj_blocks": "model-00002-of-00003.safetensors",
|
| 376 |
+
"model.layers.5.mlp.experts.gate_up_proj_scales": "model-00002-of-00003.safetensors",
|
| 377 |
+
"model.layers.5.mlp.router.bias": "model-00002-of-00003.safetensors",
|
| 378 |
+
"model.layers.5.mlp.router.weight": "model-00002-of-00003.safetensors",
|
| 379 |
+
"model.layers.5.post_attention_layernorm.weight": "model-00002-of-00003.safetensors",
|
| 380 |
+
"model.layers.5.self_attn.k_proj.bias": "model-00002-of-00003.safetensors",
|
| 381 |
+
"model.layers.5.self_attn.k_proj.weight": "model-00002-of-00003.safetensors",
|
| 382 |
+
"model.layers.5.self_attn.o_proj.bias": "model-00002-of-00003.safetensors",
|
| 383 |
+
"model.layers.5.self_attn.o_proj.weight": "model-00002-of-00003.safetensors",
|
| 384 |
+
"model.layers.5.self_attn.q_proj.bias": "model-00002-of-00003.safetensors",
|
| 385 |
+
"model.layers.5.self_attn.q_proj.weight": "model-00002-of-00003.safetensors",
|
| 386 |
+
"model.layers.5.self_attn.sinks": "model-00002-of-00003.safetensors",
|
| 387 |
+
"model.layers.5.self_attn.v_proj.bias": "model-00002-of-00003.safetensors",
|
| 388 |
+
"model.layers.5.self_attn.v_proj.weight": "model-00002-of-00003.safetensors",
|
| 389 |
+
"model.layers.6.input_layernorm.weight": "model-00002-of-00003.safetensors",
|
| 390 |
+
"model.layers.6.mlp.experts.down_proj_bias": "model-00002-of-00003.safetensors",
|
| 391 |
+
"model.layers.6.mlp.experts.down_proj_blocks": "model-00002-of-00003.safetensors",
|
| 392 |
+
"model.layers.6.mlp.experts.down_proj_scales": "model-00002-of-00003.safetensors",
|
| 393 |
+
"model.layers.6.mlp.experts.gate_up_proj_bias": "model-00002-of-00003.safetensors",
|
| 394 |
+
"model.layers.6.mlp.experts.gate_up_proj_blocks": "model-00002-of-00003.safetensors",
|
| 395 |
+
"model.layers.6.mlp.experts.gate_up_proj_scales": "model-00002-of-00003.safetensors",
|
| 396 |
+
"model.layers.6.mlp.router.bias": "model-00002-of-00003.safetensors",
|
| 397 |
+
"model.layers.6.mlp.router.weight": "model-00002-of-00003.safetensors",
|
| 398 |
+
"model.layers.6.post_attention_layernorm.weight": "model-00002-of-00003.safetensors",
|
| 399 |
+
"model.layers.6.self_attn.k_proj.bias": "model-00002-of-00003.safetensors",
|
| 400 |
+
"model.layers.6.self_attn.k_proj.weight": "model-00002-of-00003.safetensors",
|
| 401 |
+
"model.layers.6.self_attn.o_proj.bias": "model-00002-of-00003.safetensors",
|
| 402 |
+
"model.layers.6.self_attn.o_proj.weight": "model-00002-of-00003.safetensors",
|
| 403 |
+
"model.layers.6.self_attn.q_proj.bias": "model-00002-of-00003.safetensors",
|
| 404 |
+
"model.layers.6.self_attn.q_proj.weight": "model-00002-of-00003.safetensors",
|
| 405 |
+
"model.layers.6.self_attn.sinks": "model-00002-of-00003.safetensors",
|
| 406 |
+
"model.layers.6.self_attn.v_proj.bias": "model-00002-of-00003.safetensors",
|
| 407 |
+
"model.layers.6.self_attn.v_proj.weight": "model-00002-of-00003.safetensors",
|
| 408 |
+
"model.layers.7.input_layernorm.weight": "model-00002-of-00003.safetensors",
|
| 409 |
+
"model.layers.7.mlp.experts.down_proj_bias": "model-00002-of-00003.safetensors",
|
| 410 |
+
"model.layers.7.mlp.experts.down_proj_blocks": "model-00002-of-00003.safetensors",
|
| 411 |
+
"model.layers.7.mlp.experts.down_proj_scales": "model-00002-of-00003.safetensors",
|
| 412 |
+
"model.layers.7.mlp.experts.gate_up_proj_bias": "model-00002-of-00003.safetensors",
|
| 413 |
+
"model.layers.7.mlp.experts.gate_up_proj_blocks": "model-00002-of-00003.safetensors",
|
| 414 |
+
"model.layers.7.mlp.experts.gate_up_proj_scales": "model-00002-of-00003.safetensors",
|
| 415 |
+
"model.layers.7.mlp.router.bias": "model-00002-of-00003.safetensors",
|
| 416 |
+
"model.layers.7.mlp.router.weight": "model-00002-of-00003.safetensors",
|
| 417 |
+
"model.layers.7.post_attention_layernorm.weight": "model-00002-of-00003.safetensors",
|
| 418 |
+
"model.layers.7.self_attn.k_proj.bias": "model-00002-of-00003.safetensors",
|
| 419 |
+
"model.layers.7.self_attn.k_proj.weight": "model-00002-of-00003.safetensors",
|
| 420 |
+
"model.layers.7.self_attn.o_proj.bias": "model-00002-of-00003.safetensors",
|
| 421 |
+
"model.layers.7.self_attn.o_proj.weight": "model-00002-of-00003.safetensors",
|
| 422 |
+
"model.layers.7.self_attn.q_proj.bias": "model-00002-of-00003.safetensors",
|
| 423 |
+
"model.layers.7.self_attn.q_proj.weight": "model-00002-of-00003.safetensors",
|
| 424 |
+
"model.layers.7.self_attn.sinks": "model-00002-of-00003.safetensors",
|
| 425 |
+
"model.layers.7.self_attn.v_proj.bias": "model-00002-of-00003.safetensors",
|
| 426 |
+
"model.layers.7.self_attn.v_proj.weight": "model-00002-of-00003.safetensors",
|
| 427 |
+
"model.layers.8.input_layernorm.weight": "model-00002-of-00003.safetensors",
|
| 428 |
+
"model.layers.8.mlp.experts.down_proj_bias": "model-00002-of-00003.safetensors",
|
| 429 |
+
"model.layers.8.mlp.experts.down_proj_blocks": "model-00002-of-00003.safetensors",
|
| 430 |
+
"model.layers.8.mlp.experts.down_proj_scales": "model-00002-of-00003.safetensors",
|
| 431 |
+
"model.layers.8.mlp.experts.gate_up_proj_bias": "model-00002-of-00003.safetensors",
|
| 432 |
+
"model.layers.8.mlp.experts.gate_up_proj_blocks": "model-00002-of-00003.safetensors",
|
| 433 |
+
"model.layers.8.mlp.experts.gate_up_proj_scales": "model-00002-of-00003.safetensors",
|
| 434 |
+
"model.layers.8.mlp.router.bias": "model-00002-of-00003.safetensors",
|
| 435 |
+
"model.layers.8.mlp.router.weight": "model-00002-of-00003.safetensors",
|
| 436 |
+
"model.layers.8.post_attention_layernorm.weight": "model-00002-of-00003.safetensors",
|
| 437 |
+
"model.layers.8.self_attn.k_proj.bias": "model-00002-of-00003.safetensors",
|
| 438 |
+
"model.layers.8.self_attn.k_proj.weight": "model-00002-of-00003.safetensors",
|
| 439 |
+
"model.layers.8.self_attn.o_proj.bias": "model-00002-of-00003.safetensors",
|
| 440 |
+
"model.layers.8.self_attn.o_proj.weight": "model-00002-of-00003.safetensors",
|
| 441 |
+
"model.layers.8.self_attn.q_proj.bias": "model-00002-of-00003.safetensors",
|
| 442 |
+
"model.layers.8.self_attn.q_proj.weight": "model-00002-of-00003.safetensors",
|
| 443 |
+
"model.layers.8.self_attn.sinks": "model-00002-of-00003.safetensors",
|
| 444 |
+
"model.layers.8.self_attn.v_proj.bias": "model-00002-of-00003.safetensors",
|
| 445 |
+
"model.layers.8.self_attn.v_proj.weight": "model-00002-of-00003.safetensors",
|
| 446 |
+
"model.layers.9.input_layernorm.weight": "model-00002-of-00003.safetensors",
|
| 447 |
+
"model.layers.9.mlp.experts.down_proj_bias": "model-00002-of-00003.safetensors",
|
| 448 |
+
"model.layers.9.mlp.experts.down_proj_blocks": "model-00002-of-00003.safetensors",
|
| 449 |
+
"model.layers.9.mlp.experts.down_proj_scales": "model-00002-of-00003.safetensors",
|
| 450 |
+
"model.layers.9.mlp.experts.gate_up_proj_bias": "model-00002-of-00003.safetensors",
|
| 451 |
+
"model.layers.9.mlp.experts.gate_up_proj_blocks": "model-00002-of-00003.safetensors",
|
| 452 |
+
"model.layers.9.mlp.experts.gate_up_proj_scales": "model-00002-of-00003.safetensors",
|
| 453 |
+
"model.layers.9.mlp.router.bias": "model-00002-of-00003.safetensors",
|
| 454 |
+
"model.layers.9.mlp.router.weight": "model-00002-of-00003.safetensors",
|
| 455 |
+
"model.layers.9.post_attention_layernorm.weight": "model-00002-of-00003.safetensors",
|
| 456 |
+
"model.layers.9.self_attn.k_proj.bias": "model-00002-of-00003.safetensors",
|
| 457 |
+
"model.layers.9.self_attn.k_proj.weight": "model-00002-of-00003.safetensors",
|
| 458 |
+
"model.layers.9.self_attn.o_proj.bias": "model-00002-of-00003.safetensors",
|
| 459 |
+
"model.layers.9.self_attn.o_proj.weight": "model-00002-of-00003.safetensors",
|
| 460 |
+
"model.layers.9.self_attn.q_proj.bias": "model-00002-of-00003.safetensors",
|
| 461 |
+
"model.layers.9.self_attn.q_proj.weight": "model-00002-of-00003.safetensors",
|
| 462 |
+
"model.layers.9.self_attn.sinks": "model-00002-of-00003.safetensors",
|
| 463 |
+
"model.layers.9.self_attn.v_proj.bias": "model-00002-of-00003.safetensors",
|
| 464 |
+
"model.layers.9.self_attn.v_proj.weight": "model-00002-of-00003.safetensors",
|
| 465 |
+
"model.norm.weight": "model-00003-of-00003.safetensors"
|
| 466 |
+
}
|
| 467 |
+
}
|
tokenizer/chat_template.jinja
ADDED
|
@@ -0,0 +1,331 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{#-
|
| 2 |
+
In addition to the normal inputs of `messages` and `tools`, this template also accepts the
|
| 3 |
+
following kwargs:
|
| 4 |
+
- "builtin_tools": A list, can contain "browser" and/or "python".
|
| 5 |
+
- "model_identity": A string that optionally describes the model identity.
|
| 6 |
+
- "reasoning_effort": A string that describes the reasoning effort, defaults to "medium".
|
| 7 |
+
#}
|
| 8 |
+
|
| 9 |
+
{#- Tool Definition Rendering ============================================== #}
|
| 10 |
+
{%- macro render_typescript_type(param_spec, required_params, is_nullable=false) -%}
|
| 11 |
+
{%- if param_spec.type == "array" -%}
|
| 12 |
+
{%- if param_spec['items'] -%}
|
| 13 |
+
{%- if param_spec['items']['type'] == "string" -%}
|
| 14 |
+
{{- "string[]" }}
|
| 15 |
+
{%- elif param_spec['items']['type'] == "number" -%}
|
| 16 |
+
{{- "number[]" }}
|
| 17 |
+
{%- elif param_spec['items']['type'] == "integer" -%}
|
| 18 |
+
{{- "number[]" }}
|
| 19 |
+
{%- elif param_spec['items']['type'] == "boolean" -%}
|
| 20 |
+
{{- "boolean[]" }}
|
| 21 |
+
{%- else -%}
|
| 22 |
+
{%- set inner_type = render_typescript_type(param_spec['items'], required_params) -%}
|
| 23 |
+
{%- if inner_type == "object | object" or inner_type|length > 50 -%}
|
| 24 |
+
{{- "any[]" }}
|
| 25 |
+
{%- else -%}
|
| 26 |
+
{{- inner_type + "[]" }}
|
| 27 |
+
{%- endif -%}
|
| 28 |
+
{%- endif -%}
|
| 29 |
+
{%- if param_spec.nullable -%}
|
| 30 |
+
{{- " | null" }}
|
| 31 |
+
{%- endif -%}
|
| 32 |
+
{%- else -%}
|
| 33 |
+
{{- "any[]" }}
|
| 34 |
+
{%- if param_spec.nullable -%}
|
| 35 |
+
{{- " | null" }}
|
| 36 |
+
{%- endif -%}
|
| 37 |
+
{%- endif -%}
|
| 38 |
+
{%- elif param_spec.type is defined and param_spec.type is iterable and param_spec.type is not string and param_spec.type is not mapping and param_spec.type[0] is defined -%}
|
| 39 |
+
{#- Handle array of types like ["object", "object"] from Union[dict, list] #}
|
| 40 |
+
{%- if param_spec.type | length > 1 -%}
|
| 41 |
+
{{- param_spec.type | join(" | ") }}
|
| 42 |
+
{%- else -%}
|
| 43 |
+
{{- param_spec.type[0] }}
|
| 44 |
+
{%- endif -%}
|
| 45 |
+
{%- elif param_spec.oneOf -%}
|
| 46 |
+
{#- Handle oneOf schemas - check for complex unions and fallback to any #}
|
| 47 |
+
{%- set has_object_variants = false -%}
|
| 48 |
+
{%- for variant in param_spec.oneOf -%}
|
| 49 |
+
{%- if variant.type == "object" -%}
|
| 50 |
+
{%- set has_object_variants = true -%}
|
| 51 |
+
{%- endif -%}
|
| 52 |
+
{%- endfor -%}
|
| 53 |
+
{%- if has_object_variants and param_spec.oneOf|length > 1 -%}
|
| 54 |
+
{{- "any" }}
|
| 55 |
+
{%- else -%}
|
| 56 |
+
{%- for variant in param_spec.oneOf -%}
|
| 57 |
+
{{- render_typescript_type(variant, required_params) -}}
|
| 58 |
+
{%- if variant.description %}
|
| 59 |
+
{{- "// " + variant.description }}
|
| 60 |
+
{%- endif -%}
|
| 61 |
+
{%- if variant.default is defined %}
|
| 62 |
+
{{ "// default: " + variant.default|tojson }}
|
| 63 |
+
{%- endif -%}
|
| 64 |
+
{%- if not loop.last %}
|
| 65 |
+
{{- " | " }}
|
| 66 |
+
{% endif -%}
|
| 67 |
+
{%- endfor -%}
|
| 68 |
+
{%- endif -%}
|
| 69 |
+
{%- elif param_spec.type == "string" -%}
|
| 70 |
+
{%- if param_spec.enum -%}
|
| 71 |
+
{{- '"' + param_spec.enum|join('" | "') + '"' -}}
|
| 72 |
+
{%- else -%}
|
| 73 |
+
{{- "string" }}
|
| 74 |
+
{%- if param_spec.nullable %}
|
| 75 |
+
{{- " | null" }}
|
| 76 |
+
{%- endif -%}
|
| 77 |
+
{%- endif -%}
|
| 78 |
+
{%- elif param_spec.type == "number" -%}
|
| 79 |
+
{{- "number" }}
|
| 80 |
+
{%- elif param_spec.type == "integer" -%}
|
| 81 |
+
{{- "number" }}
|
| 82 |
+
{%- elif param_spec.type == "boolean" -%}
|
| 83 |
+
{{- "boolean" }}
|
| 84 |
+
|
| 85 |
+
{%- elif param_spec.type == "object" -%}
|
| 86 |
+
{%- if param_spec.properties -%}
|
| 87 |
+
{{- "{\n" }}
|
| 88 |
+
{%- for prop_name, prop_spec in param_spec.properties.items() -%}
|
| 89 |
+
{{- prop_name -}}
|
| 90 |
+
{%- if prop_name not in (param_spec.required or []) -%}
|
| 91 |
+
{{- "?" }}
|
| 92 |
+
{%- endif -%}
|
| 93 |
+
{{- ": " }}
|
| 94 |
+
{{ render_typescript_type(prop_spec, param_spec.required or []) }}
|
| 95 |
+
{%- if not loop.last -%}
|
| 96 |
+
{{-", " }}
|
| 97 |
+
{%- endif -%}
|
| 98 |
+
{%- endfor -%}
|
| 99 |
+
{{- "}" }}
|
| 100 |
+
{%- else -%}
|
| 101 |
+
{{- "object" }}
|
| 102 |
+
{%- endif -%}
|
| 103 |
+
{%- else -%}
|
| 104 |
+
{{- "any" }}
|
| 105 |
+
{%- endif -%}
|
| 106 |
+
{%- endmacro -%}
|
| 107 |
+
|
| 108 |
+
{%- macro render_tool_namespace(namespace_name, tools) -%}
|
| 109 |
+
{{- "## " + namespace_name + "\n\n" }}
|
| 110 |
+
{{- "namespace " + namespace_name + " {\n\n" }}
|
| 111 |
+
{%- for tool in tools %}
|
| 112 |
+
{%- set tool = tool.function %}
|
| 113 |
+
{{- "// " + tool.description + "\n" }}
|
| 114 |
+
{{- "type "+ tool.name + " = " }}
|
| 115 |
+
{%- if tool.parameters and tool.parameters.properties %}
|
| 116 |
+
{{- "(_: {\n" }}
|
| 117 |
+
{%- for param_name, param_spec in tool.parameters.properties.items() %}
|
| 118 |
+
{%- if param_spec.description %}
|
| 119 |
+
{{- "// " + param_spec.description + "\n" }}
|
| 120 |
+
{%- endif %}
|
| 121 |
+
{{- param_name }}
|
| 122 |
+
{%- if param_name not in (tool.parameters.required or []) -%}
|
| 123 |
+
{{- "?" }}
|
| 124 |
+
{%- endif -%}
|
| 125 |
+
{{- ": " }}
|
| 126 |
+
{{- render_typescript_type(param_spec, tool.parameters.required or []) }}
|
| 127 |
+
{%- if param_spec.default is defined -%}
|
| 128 |
+
{%- if param_spec.enum %}
|
| 129 |
+
{{- ", // default: " + param_spec.default }}
|
| 130 |
+
{%- elif param_spec.oneOf %}
|
| 131 |
+
{{- "// default: " + param_spec.default }}
|
| 132 |
+
{%- else %}
|
| 133 |
+
{{- ", // default: " + param_spec.default|tojson }}
|
| 134 |
+
{%- endif -%}
|
| 135 |
+
{%- endif -%}
|
| 136 |
+
{%- if not loop.last %}
|
| 137 |
+
{{- ",\n" }}
|
| 138 |
+
{%- else %}
|
| 139 |
+
{{- ",\n" }}
|
| 140 |
+
{%- endif -%}
|
| 141 |
+
{%- endfor %}
|
| 142 |
+
{{- "}) => any;\n\n" }}
|
| 143 |
+
{%- else -%}
|
| 144 |
+
{{- "() => any;\n\n" }}
|
| 145 |
+
{%- endif -%}
|
| 146 |
+
{%- endfor %}
|
| 147 |
+
{{- "} // namespace " + namespace_name }}
|
| 148 |
+
{%- endmacro -%}
|
| 149 |
+
|
| 150 |
+
{%- macro render_builtin_tools(browser_tool, python_tool) -%}
|
| 151 |
+
{%- if browser_tool %}
|
| 152 |
+
{{- "## browser\n\n" }}
|
| 153 |
+
{{- "// Tool for browsing.\n" }}
|
| 154 |
+
{{- "// The `cursor` appears in brackets before each browsing display: `[{cursor}]`.\n" }}
|
| 155 |
+
{{- "// Cite information from the tool using the following format:\n" }}
|
| 156 |
+
{{- "// `【{cursor}†L{line_start}(-L{line_end})?】`, for example: `【6†L9-L11】` or `【8†L3】`.\n" }}
|
| 157 |
+
{{- "// Do not quote more than 10 words directly from the tool output.\n" }}
|
| 158 |
+
{{- "// sources=web (default: web)\n" }}
|
| 159 |
+
{{- "namespace browser {\n\n" }}
|
| 160 |
+
{{- "// Searches for information related to `query` and displays `topn` results.\n" }}
|
| 161 |
+
{{- "type search = (_: {\n" }}
|
| 162 |
+
{{- "query: string,\n" }}
|
| 163 |
+
{{- "topn?: number, // default: 10\n" }}
|
| 164 |
+
{{- "source?: string,\n" }}
|
| 165 |
+
{{- "}) => any;\n\n" }}
|
| 166 |
+
{{- "// Opens the link `id` from the page indicated by `cursor` starting at line number `loc`, showing `num_lines` lines.\n" }}
|
| 167 |
+
{{- "// Valid link ids are displayed with the formatting: `【{id}†.*】`.\n" }}
|
| 168 |
+
{{- "// If `cursor` is not provided, the most recent page is implied.\n" }}
|
| 169 |
+
{{- "// If `id` is a string, it is treated as a fully qualified URL associated with `source`.\n" }}
|
| 170 |
+
{{- "// If `loc` is not provided, the viewport will be positioned at the beginning of the document or centered on the most relevant passage, if available.\n" }}
|
| 171 |
+
{{- "// Use this function without `id` to scroll to a new location of an opened page.\n" }}
|
| 172 |
+
{{- "type open = (_: {\n" }}
|
| 173 |
+
{{- "id?: number | string, // default: -1\n" }}
|
| 174 |
+
{{- "cursor?: number, // default: -1\n" }}
|
| 175 |
+
{{- "loc?: number, // default: -1\n" }}
|
| 176 |
+
{{- "num_lines?: number, // default: -1\n" }}
|
| 177 |
+
{{- "view_source?: boolean, // default: false\n" }}
|
| 178 |
+
{{- "source?: string,\n" }}
|
| 179 |
+
{{- "}) => any;\n\n" }}
|
| 180 |
+
{{- "// Finds exact matches of `pattern` in the current page, or the page given by `cursor`.\n" }}
|
| 181 |
+
{{- "type find = (_: {\n" }}
|
| 182 |
+
{{- "pattern: string,\n" }}
|
| 183 |
+
{{- "cursor?: number, // default: -1\n" }}
|
| 184 |
+
{{- "}) => any;\n\n" }}
|
| 185 |
+
{{- "} // namespace browser\n\n" }}
|
| 186 |
+
{%- endif -%}
|
| 187 |
+
|
| 188 |
+
{%- if python_tool %}
|
| 189 |
+
{{- "## python\n\n" }}
|
| 190 |
+
{{- "Use this tool to execute Python code in your chain of thought. The code will not be shown to the user. This tool should be used for internal reasoning, but not for code that is intended to be visible to the user (e.g. when creating plots, tables, or files).\n\n" }}
|
| 191 |
+
{{- "When you send a message containing Python code to python, it will be executed in a stateful Jupyter notebook environment. python will respond with the output of the execution or time out after 120.0 seconds. The drive at '/mnt/data' can be used to save and persist user files. Internet access for this session is UNKNOWN. Depends on the cluster.\n\n" }}
|
| 192 |
+
{%- endif -%}
|
| 193 |
+
{%- endmacro -%}
|
| 194 |
+
|
| 195 |
+
{#- System Message Construction ============================================ #}
|
| 196 |
+
{%- macro build_system_message() -%}
|
| 197 |
+
{%- if model_identity is not defined %}
|
| 198 |
+
{%- set model_identity = "You are ChatGPT, a large language model trained by OpenAI." %}
|
| 199 |
+
{%- endif %}
|
| 200 |
+
{{- model_identity + "\n" }}
|
| 201 |
+
{{- "Knowledge cutoff: 2024-06\n" }}
|
| 202 |
+
{{- "Current date: " + strftime_now("%Y-%m-%d") + "\n\n" }}
|
| 203 |
+
{%- if reasoning_effort is not defined %}
|
| 204 |
+
{%- set reasoning_effort = "medium" %}
|
| 205 |
+
{%- endif %}
|
| 206 |
+
{{- "Reasoning: " + reasoning_effort + "\n\n" }}
|
| 207 |
+
{%- if builtin_tools %}
|
| 208 |
+
{{- "# Tools\n\n" }}
|
| 209 |
+
{%- set available_builtin_tools = namespace(browser=false, python=false) %}
|
| 210 |
+
{%- for tool in builtin_tools %}
|
| 211 |
+
{%- if tool == "browser" %}
|
| 212 |
+
{%- set available_builtin_tools.browser = true %}
|
| 213 |
+
{%- elif tool == "python" %}
|
| 214 |
+
{%- set available_builtin_tools.python = true %}
|
| 215 |
+
{%- endif %}
|
| 216 |
+
{%- endfor %}
|
| 217 |
+
{{- render_builtin_tools(available_builtin_tools.browser, available_builtin_tools.python) }}
|
| 218 |
+
{%- endif -%}
|
| 219 |
+
{{- "# Valid channels: analysis, commentary, final. Channel must be included for every message." }}
|
| 220 |
+
{%- if tools -%}
|
| 221 |
+
{{- "\nCalls to these tools must go to the commentary channel: 'functions'." }}
|
| 222 |
+
{%- endif -%}
|
| 223 |
+
{%- endmacro -%}
|
| 224 |
+
|
| 225 |
+
{#- Main Template Logic ================================================= #}
|
| 226 |
+
{#- Set defaults #}
|
| 227 |
+
|
| 228 |
+
{#- Render system message #}
|
| 229 |
+
{{- "<|start|>system<|message|>" }}
|
| 230 |
+
{{- build_system_message() }}
|
| 231 |
+
{{- "<|end|>" }}
|
| 232 |
+
|
| 233 |
+
{#- Extract developer message #}
|
| 234 |
+
{%- if messages[0].role == "developer" or messages[0].role == "system" %}
|
| 235 |
+
{%- set developer_message = messages[0].content %}
|
| 236 |
+
{%- set loop_messages = messages[1:] %}
|
| 237 |
+
{%- else %}
|
| 238 |
+
{%- set developer_message = "" %}
|
| 239 |
+
{%- set loop_messages = messages %}
|
| 240 |
+
{%- endif %}
|
| 241 |
+
|
| 242 |
+
{#- Render developer message #}
|
| 243 |
+
{%- if developer_message or tools %}
|
| 244 |
+
{{- "<|start|>developer<|message|>" }}
|
| 245 |
+
{%- if developer_message %}
|
| 246 |
+
{{- "# Instructions\n\n" }}
|
| 247 |
+
{{- developer_message }}
|
| 248 |
+
{{- "\n\n" }}
|
| 249 |
+
{%- endif %}
|
| 250 |
+
{%- if tools -%}
|
| 251 |
+
{{- "# Tools\n\n" }}
|
| 252 |
+
{{- render_tool_namespace("functions", tools) }}
|
| 253 |
+
{%- endif -%}
|
| 254 |
+
{{- "<|end|>" }}
|
| 255 |
+
{%- endif %}
|
| 256 |
+
|
| 257 |
+
{#- Render messages #}
|
| 258 |
+
{%- set last_tool_call = namespace(name=none) %}
|
| 259 |
+
{%- for message in loop_messages -%}
|
| 260 |
+
{#- At this point only assistant/user/tool messages should remain #}
|
| 261 |
+
{%- if message.role == 'assistant' -%}
|
| 262 |
+
{#- Checks to ensure the messages are being passed in the format we expect #}
|
| 263 |
+
{%- if "content" in message %}
|
| 264 |
+
{%- if "<|channel|>analysis<|message|>" in message.content or "<|channel|>final<|message|>" in message.content %}
|
| 265 |
+
{{- raise_exception("You have passed a message containing <|channel|> tags in the content field. Instead of doing this, you should pass analysis messages (the string between '<|message|>' and '<|end|>') in the 'thinking' field, and final messages (the string between '<|message|>' and '<|end|>') in the 'content' field.") }}
|
| 266 |
+
{%- endif %}
|
| 267 |
+
{%- endif %}
|
| 268 |
+
{%- if "thinking" in message %}
|
| 269 |
+
{%- if "<|channel|>analysis<|message|>" in message.thinking or "<|channel|>final<|message|>" in message.thinking %}
|
| 270 |
+
{{- raise_exception("You have passed a message containing <|channel|> tags in the thinking field. Instead of doing this, you should pass analysis messages (the string between '<|message|>' and '<|end|>') in the 'thinking' field, and final messages (the string between '<|message|>' and '<|end|>') in the 'content' field.") }}
|
| 271 |
+
{%- endif %}
|
| 272 |
+
{%- endif %}
|
| 273 |
+
{%- if "tool_calls" in message %}
|
| 274 |
+
{#- We need very careful handling here - we want to drop the tool call analysis message if the model #}
|
| 275 |
+
{#- has output a later <|final|> message, but otherwise we want to retain it. This is the only case #}
|
| 276 |
+
{#- when we render CoT/analysis messages in inference. #}
|
| 277 |
+
{%- set future_final_message = namespace(found=false) %}
|
| 278 |
+
{%- for future_message in loop_messages[loop.index:] %}
|
| 279 |
+
{%- if future_message.role == 'assistant' and "tool_calls" not in future_message %}
|
| 280 |
+
{%- set future_final_message.found = true %}
|
| 281 |
+
{%- endif %}
|
| 282 |
+
{%- endfor %}
|
| 283 |
+
{#- We assume max 1 tool call per message, and so we infer the tool call name #}
|
| 284 |
+
{#- in "tool" messages from the most recent assistant tool call name #}
|
| 285 |
+
{%- set tool_call = message.tool_calls[0] %}
|
| 286 |
+
{%- if tool_call.function %}
|
| 287 |
+
{%- set tool_call = tool_call.function %}
|
| 288 |
+
{%- endif %}
|
| 289 |
+
{%- if message.content and message.thinking %}
|
| 290 |
+
{{- raise_exception("Cannot pass both content and thinking in an assistant message with tool calls! Put the analysis message in one or the other, but not both.") }}
|
| 291 |
+
{%- elif message.content and not future_final_message.found %}
|
| 292 |
+
{{- "<|start|>assistant<|channel|>analysis<|message|>" + message.content + "<|end|>" }}
|
| 293 |
+
{%- elif message.thinking and not future_final_message.found %}
|
| 294 |
+
{{- "<|start|>assistant<|channel|>analysis<|message|>" + message.thinking + "<|end|>" }}
|
| 295 |
+
{%- endif %}
|
| 296 |
+
{{- "<|start|>assistant to=" }}
|
| 297 |
+
{{- "functions." + tool_call.name + "<|channel|>commentary " }}
|
| 298 |
+
{{- (tool_call.content_type if tool_call.content_type is defined else "json") + "<|message|>" }}
|
| 299 |
+
{{- tool_call.arguments|tojson }}
|
| 300 |
+
{{- "<|call|>" }}
|
| 301 |
+
{%- set last_tool_call.name = tool_call.name %}
|
| 302 |
+
{%- elif loop.last and not add_generation_prompt %}
|
| 303 |
+
{#- Only render the CoT if the final turn is an assistant turn and add_generation_prompt is false #}
|
| 304 |
+
{#- This is a situation that should only occur in training, never in inference. #}
|
| 305 |
+
{%- if "thinking" in message %}
|
| 306 |
+
{{- "<|start|>assistant<|channel|>analysis<|message|>" + message.thinking + "<|end|>" }}
|
| 307 |
+
{%- endif %}
|
| 308 |
+
{#- <|return|> indicates the end of generation, but <|end|> does not #}
|
| 309 |
+
{#- <|return|> should never be an input to the model, but we include it as the final token #}
|
| 310 |
+
{#- when training, so the model learns to emit it. #}
|
| 311 |
+
{{- "<|start|>assistant<|channel|>final<|message|>" + message.content + "<|return|>" }}
|
| 312 |
+
{%- else %}
|
| 313 |
+
{#- CoT is dropped during all previous turns, so we never render it for inference #}
|
| 314 |
+
{{- "<|start|>assistant<|channel|>final<|message|>" + message.content + "<|end|>" }}
|
| 315 |
+
{%- set last_tool_call.name = none %}
|
| 316 |
+
{%- endif %}
|
| 317 |
+
{%- elif message.role == 'tool' -%}
|
| 318 |
+
{%- if last_tool_call.name is none %}
|
| 319 |
+
{{- raise_exception("Message has tool role, but there was no previous assistant message with a tool call!") }}
|
| 320 |
+
{%- endif %}
|
| 321 |
+
{{- "<|start|>functions." + last_tool_call.name }}
|
| 322 |
+
{{- " to=assistant<|channel|>commentary<|message|>" + message.content|tojson + "<|end|>" }}
|
| 323 |
+
{%- elif message.role == 'user' -%}
|
| 324 |
+
{{- "<|start|>user<|message|>" + message.content + "<|end|>" }}
|
| 325 |
+
{%- endif -%}
|
| 326 |
+
{%- endfor -%}
|
| 327 |
+
|
| 328 |
+
{#- Generation prompt #}
|
| 329 |
+
{%- if add_generation_prompt -%}
|
| 330 |
+
<|start|>assistant
|
| 331 |
+
{%- endif -%}
|
tokenizer/tokenizer.json
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0614fe83cadab421296e664e1f48f4261fa8fef6e03e63bb75c20f38e37d07d3
|
| 3 |
+
size 27868174
|
tokenizer/tokenizer_config.json
ADDED
|
@@ -0,0 +1,15 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"backend": "tokenizers",
|
| 3 |
+
"bos_token": "<|startoftext|>",
|
| 4 |
+
"clean_up_tokenization_spaces": false,
|
| 5 |
+
"eos_token": "<|return|>",
|
| 6 |
+
"is_local": false,
|
| 7 |
+
"local_files_only": false,
|
| 8 |
+
"model_input_names": [
|
| 9 |
+
"input_ids",
|
| 10 |
+
"attention_mask"
|
| 11 |
+
],
|
| 12 |
+
"model_max_length": 1000000000000000019884624838656,
|
| 13 |
+
"pad_token": "<|endoftext|>",
|
| 14 |
+
"tokenizer_class": "TokenizersBackend"
|
| 15 |
+
}
|
transformer/config.json
ADDED
|
@@ -0,0 +1,476 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"_class_name": "LensTransformer2DModel",
|
| 3 |
+
"_diffusers_version": "0.38.0",
|
| 4 |
+
"_name_or_path": "microsoft/Lens",
|
| 5 |
+
"attention_head_dim": 64,
|
| 6 |
+
"axes_dims_rope": [
|
| 7 |
+
8,
|
| 8 |
+
28,
|
| 9 |
+
28
|
| 10 |
+
],
|
| 11 |
+
"enc_hidden_dim": 2880,
|
| 12 |
+
"gate_mlp": true,
|
| 13 |
+
"in_channels": 128,
|
| 14 |
+
"inner_dim": 1536,
|
| 15 |
+
"multi_layer_encoder_feature": true,
|
| 16 |
+
"num_attention_heads": 24,
|
| 17 |
+
"num_layers": 48,
|
| 18 |
+
"out_channels": 32,
|
| 19 |
+
"patch_size": 2,
|
| 20 |
+
"quantization_config": {
|
| 21 |
+
"add_skip_keys": false,
|
| 22 |
+
"dequantize_fp32": false,
|
| 23 |
+
"dynamic_loss_threshold": null,
|
| 24 |
+
"group_size": 0,
|
| 25 |
+
"hadamard_group_size": 128,
|
| 26 |
+
"is_integer": true,
|
| 27 |
+
"is_training": false,
|
| 28 |
+
"modules_dtype_dict": {},
|
| 29 |
+
"modules_quant_config": {},
|
| 30 |
+
"modules_to_not_convert": [
|
| 31 |
+
".emb_in",
|
| 32 |
+
".emb_out",
|
| 33 |
+
"norm",
|
| 34 |
+
".y_embedder",
|
| 35 |
+
"patch_emb",
|
| 36 |
+
"lm_head",
|
| 37 |
+
".condition_embedder",
|
| 38 |
+
".norm_out",
|
| 39 |
+
".t_embedder",
|
| 40 |
+
"patch_embedding",
|
| 41 |
+
".vid_in",
|
| 42 |
+
".txt_in",
|
| 43 |
+
".txt_out",
|
| 44 |
+
".time_embed",
|
| 45 |
+
"*.img_mod.*",
|
| 46 |
+
".proj_out",
|
| 47 |
+
".img_out",
|
| 48 |
+
"*.txt_mod.*",
|
| 49 |
+
".context_embedder",
|
| 50 |
+
".vid_out",
|
| 51 |
+
"time_text_embed",
|
| 52 |
+
"patch_embed",
|
| 53 |
+
"wte",
|
| 54 |
+
".img_in",
|
| 55 |
+
".final_layer",
|
| 56 |
+
".x_embedder",
|
| 57 |
+
"multi_modal_projector",
|
| 58 |
+
"pos_embed",
|
| 59 |
+
"txt_norm.0.weight",
|
| 60 |
+
"txt_norm.1.weight",
|
| 61 |
+
"txt_norm.2.weight",
|
| 62 |
+
"txt_norm.3.weight",
|
| 63 |
+
"transformer_blocks.0.attn.norm_q.weight",
|
| 64 |
+
"transformer_blocks.0.attn.norm_k.weight",
|
| 65 |
+
"transformer_blocks.0.attn.norm_added_q.weight",
|
| 66 |
+
"transformer_blocks.0.attn.norm_added_k.weight",
|
| 67 |
+
"transformer_blocks.0.img_norm1.weight",
|
| 68 |
+
"transformer_blocks.0.img_norm2.weight",
|
| 69 |
+
"transformer_blocks.0.txt_norm1.weight",
|
| 70 |
+
"transformer_blocks.0.txt_norm2.weight",
|
| 71 |
+
"transformer_blocks.1.attn.norm_q.weight",
|
| 72 |
+
"transformer_blocks.1.attn.norm_k.weight",
|
| 73 |
+
"transformer_blocks.1.attn.norm_added_q.weight",
|
| 74 |
+
"transformer_blocks.1.attn.norm_added_k.weight",
|
| 75 |
+
"transformer_blocks.1.img_norm1.weight",
|
| 76 |
+
"transformer_blocks.1.img_norm2.weight",
|
| 77 |
+
"transformer_blocks.1.txt_norm1.weight",
|
| 78 |
+
"transformer_blocks.1.txt_norm2.weight",
|
| 79 |
+
"transformer_blocks.2.attn.norm_q.weight",
|
| 80 |
+
"transformer_blocks.2.attn.norm_k.weight",
|
| 81 |
+
"transformer_blocks.2.attn.norm_added_q.weight",
|
| 82 |
+
"transformer_blocks.2.attn.norm_added_k.weight",
|
| 83 |
+
"transformer_blocks.2.img_norm1.weight",
|
| 84 |
+
"transformer_blocks.2.img_norm2.weight",
|
| 85 |
+
"transformer_blocks.2.txt_norm1.weight",
|
| 86 |
+
"transformer_blocks.2.txt_norm2.weight",
|
| 87 |
+
"transformer_blocks.3.attn.norm_q.weight",
|
| 88 |
+
"transformer_blocks.3.attn.norm_k.weight",
|
| 89 |
+
"transformer_blocks.3.attn.norm_added_q.weight",
|
| 90 |
+
"transformer_blocks.3.attn.norm_added_k.weight",
|
| 91 |
+
"transformer_blocks.3.img_norm1.weight",
|
| 92 |
+
"transformer_blocks.3.img_norm2.weight",
|
| 93 |
+
"transformer_blocks.3.txt_norm1.weight",
|
| 94 |
+
"transformer_blocks.3.txt_norm2.weight",
|
| 95 |
+
"transformer_blocks.4.attn.norm_q.weight",
|
| 96 |
+
"transformer_blocks.4.attn.norm_k.weight",
|
| 97 |
+
"transformer_blocks.4.attn.norm_added_q.weight",
|
| 98 |
+
"transformer_blocks.4.attn.norm_added_k.weight",
|
| 99 |
+
"transformer_blocks.4.img_norm1.weight",
|
| 100 |
+
"transformer_blocks.4.img_norm2.weight",
|
| 101 |
+
"transformer_blocks.4.txt_norm1.weight",
|
| 102 |
+
"transformer_blocks.4.txt_norm2.weight",
|
| 103 |
+
"transformer_blocks.5.attn.norm_q.weight",
|
| 104 |
+
"transformer_blocks.5.attn.norm_k.weight",
|
| 105 |
+
"transformer_blocks.5.attn.norm_added_q.weight",
|
| 106 |
+
"transformer_blocks.5.attn.norm_added_k.weight",
|
| 107 |
+
"transformer_blocks.5.img_norm1.weight",
|
| 108 |
+
"transformer_blocks.5.img_norm2.weight",
|
| 109 |
+
"transformer_blocks.5.txt_norm1.weight",
|
| 110 |
+
"transformer_blocks.5.txt_norm2.weight",
|
| 111 |
+
"transformer_blocks.6.attn.norm_q.weight",
|
| 112 |
+
"transformer_blocks.6.attn.norm_k.weight",
|
| 113 |
+
"transformer_blocks.6.attn.norm_added_q.weight",
|
| 114 |
+
"transformer_blocks.6.attn.norm_added_k.weight",
|
| 115 |
+
"transformer_blocks.6.img_norm1.weight",
|
| 116 |
+
"transformer_blocks.6.img_norm2.weight",
|
| 117 |
+
"transformer_blocks.6.txt_norm1.weight",
|
| 118 |
+
"transformer_blocks.6.txt_norm2.weight",
|
| 119 |
+
"transformer_blocks.7.attn.norm_q.weight",
|
| 120 |
+
"transformer_blocks.7.attn.norm_k.weight",
|
| 121 |
+
"transformer_blocks.7.attn.norm_added_q.weight",
|
| 122 |
+
"transformer_blocks.7.attn.norm_added_k.weight",
|
| 123 |
+
"transformer_blocks.7.img_norm1.weight",
|
| 124 |
+
"transformer_blocks.7.img_norm2.weight",
|
| 125 |
+
"transformer_blocks.7.txt_norm1.weight",
|
| 126 |
+
"transformer_blocks.7.txt_norm2.weight",
|
| 127 |
+
"transformer_blocks.8.attn.norm_q.weight",
|
| 128 |
+
"transformer_blocks.8.attn.norm_k.weight",
|
| 129 |
+
"transformer_blocks.8.attn.norm_added_q.weight",
|
| 130 |
+
"transformer_blocks.8.attn.norm_added_k.weight",
|
| 131 |
+
"transformer_blocks.8.img_norm1.weight",
|
| 132 |
+
"transformer_blocks.8.img_norm2.weight",
|
| 133 |
+
"transformer_blocks.8.txt_norm1.weight",
|
| 134 |
+
"transformer_blocks.8.txt_norm2.weight",
|
| 135 |
+
"transformer_blocks.9.attn.norm_q.weight",
|
| 136 |
+
"transformer_blocks.9.attn.norm_k.weight",
|
| 137 |
+
"transformer_blocks.9.attn.norm_added_q.weight",
|
| 138 |
+
"transformer_blocks.9.attn.norm_added_k.weight",
|
| 139 |
+
"transformer_blocks.9.img_norm1.weight",
|
| 140 |
+
"transformer_blocks.9.img_norm2.weight",
|
| 141 |
+
"transformer_blocks.9.txt_norm1.weight",
|
| 142 |
+
"transformer_blocks.9.txt_norm2.weight",
|
| 143 |
+
"transformer_blocks.10.attn.norm_q.weight",
|
| 144 |
+
"transformer_blocks.10.attn.norm_k.weight",
|
| 145 |
+
"transformer_blocks.10.attn.norm_added_q.weight",
|
| 146 |
+
"transformer_blocks.10.attn.norm_added_k.weight",
|
| 147 |
+
"transformer_blocks.10.img_norm1.weight",
|
| 148 |
+
"transformer_blocks.10.img_norm2.weight",
|
| 149 |
+
"transformer_blocks.10.txt_norm1.weight",
|
| 150 |
+
"transformer_blocks.10.txt_norm2.weight",
|
| 151 |
+
"transformer_blocks.11.attn.norm_q.weight",
|
| 152 |
+
"transformer_blocks.11.attn.norm_k.weight",
|
| 153 |
+
"transformer_blocks.11.attn.norm_added_q.weight",
|
| 154 |
+
"transformer_blocks.11.attn.norm_added_k.weight",
|
| 155 |
+
"transformer_blocks.11.img_norm1.weight",
|
| 156 |
+
"transformer_blocks.11.img_norm2.weight",
|
| 157 |
+
"transformer_blocks.11.txt_norm1.weight",
|
| 158 |
+
"transformer_blocks.11.txt_norm2.weight",
|
| 159 |
+
"transformer_blocks.12.attn.norm_q.weight",
|
| 160 |
+
"transformer_blocks.12.attn.norm_k.weight",
|
| 161 |
+
"transformer_blocks.12.attn.norm_added_q.weight",
|
| 162 |
+
"transformer_blocks.12.attn.norm_added_k.weight",
|
| 163 |
+
"transformer_blocks.12.img_norm1.weight",
|
| 164 |
+
"transformer_blocks.12.img_norm2.weight",
|
| 165 |
+
"transformer_blocks.12.txt_norm1.weight",
|
| 166 |
+
"transformer_blocks.12.txt_norm2.weight",
|
| 167 |
+
"transformer_blocks.13.attn.norm_q.weight",
|
| 168 |
+
"transformer_blocks.13.attn.norm_k.weight",
|
| 169 |
+
"transformer_blocks.13.attn.norm_added_q.weight",
|
| 170 |
+
"transformer_blocks.13.attn.norm_added_k.weight",
|
| 171 |
+
"transformer_blocks.13.img_norm1.weight",
|
| 172 |
+
"transformer_blocks.13.img_norm2.weight",
|
| 173 |
+
"transformer_blocks.13.txt_norm1.weight",
|
| 174 |
+
"transformer_blocks.13.txt_norm2.weight",
|
| 175 |
+
"transformer_blocks.14.attn.norm_q.weight",
|
| 176 |
+
"transformer_blocks.14.attn.norm_k.weight",
|
| 177 |
+
"transformer_blocks.14.attn.norm_added_q.weight",
|
| 178 |
+
"transformer_blocks.14.attn.norm_added_k.weight",
|
| 179 |
+
"transformer_blocks.14.img_norm1.weight",
|
| 180 |
+
"transformer_blocks.14.img_norm2.weight",
|
| 181 |
+
"transformer_blocks.14.txt_norm1.weight",
|
| 182 |
+
"transformer_blocks.14.txt_norm2.weight",
|
| 183 |
+
"transformer_blocks.15.attn.norm_q.weight",
|
| 184 |
+
"transformer_blocks.15.attn.norm_k.weight",
|
| 185 |
+
"transformer_blocks.15.attn.norm_added_q.weight",
|
| 186 |
+
"transformer_blocks.15.attn.norm_added_k.weight",
|
| 187 |
+
"transformer_blocks.15.img_norm1.weight",
|
| 188 |
+
"transformer_blocks.15.img_norm2.weight",
|
| 189 |
+
"transformer_blocks.15.txt_norm1.weight",
|
| 190 |
+
"transformer_blocks.15.txt_norm2.weight",
|
| 191 |
+
"transformer_blocks.16.attn.norm_q.weight",
|
| 192 |
+
"transformer_blocks.16.attn.norm_k.weight",
|
| 193 |
+
"transformer_blocks.16.attn.norm_added_q.weight",
|
| 194 |
+
"transformer_blocks.16.attn.norm_added_k.weight",
|
| 195 |
+
"transformer_blocks.16.img_norm1.weight",
|
| 196 |
+
"transformer_blocks.16.img_norm2.weight",
|
| 197 |
+
"transformer_blocks.16.txt_norm1.weight",
|
| 198 |
+
"transformer_blocks.16.txt_norm2.weight",
|
| 199 |
+
"transformer_blocks.17.attn.norm_q.weight",
|
| 200 |
+
"transformer_blocks.17.attn.norm_k.weight",
|
| 201 |
+
"transformer_blocks.17.attn.norm_added_q.weight",
|
| 202 |
+
"transformer_blocks.17.attn.norm_added_k.weight",
|
| 203 |
+
"transformer_blocks.17.img_norm1.weight",
|
| 204 |
+
"transformer_blocks.17.img_norm2.weight",
|
| 205 |
+
"transformer_blocks.17.txt_norm1.weight",
|
| 206 |
+
"transformer_blocks.17.txt_norm2.weight",
|
| 207 |
+
"transformer_blocks.18.attn.norm_q.weight",
|
| 208 |
+
"transformer_blocks.18.attn.norm_k.weight",
|
| 209 |
+
"transformer_blocks.18.attn.norm_added_q.weight",
|
| 210 |
+
"transformer_blocks.18.attn.norm_added_k.weight",
|
| 211 |
+
"transformer_blocks.18.img_norm1.weight",
|
| 212 |
+
"transformer_blocks.18.img_norm2.weight",
|
| 213 |
+
"transformer_blocks.18.txt_norm1.weight",
|
| 214 |
+
"transformer_blocks.18.txt_norm2.weight",
|
| 215 |
+
"transformer_blocks.19.attn.norm_q.weight",
|
| 216 |
+
"transformer_blocks.19.attn.norm_k.weight",
|
| 217 |
+
"transformer_blocks.19.attn.norm_added_q.weight",
|
| 218 |
+
"transformer_blocks.19.attn.norm_added_k.weight",
|
| 219 |
+
"transformer_blocks.19.img_norm1.weight",
|
| 220 |
+
"transformer_blocks.19.img_norm2.weight",
|
| 221 |
+
"transformer_blocks.19.txt_norm1.weight",
|
| 222 |
+
"transformer_blocks.19.txt_norm2.weight",
|
| 223 |
+
"transformer_blocks.20.attn.norm_q.weight",
|
| 224 |
+
"transformer_blocks.20.attn.norm_k.weight",
|
| 225 |
+
"transformer_blocks.20.attn.norm_added_q.weight",
|
| 226 |
+
"transformer_blocks.20.attn.norm_added_k.weight",
|
| 227 |
+
"transformer_blocks.20.img_norm1.weight",
|
| 228 |
+
"transformer_blocks.20.img_norm2.weight",
|
| 229 |
+
"transformer_blocks.20.txt_norm1.weight",
|
| 230 |
+
"transformer_blocks.20.txt_norm2.weight",
|
| 231 |
+
"transformer_blocks.21.attn.norm_q.weight",
|
| 232 |
+
"transformer_blocks.21.attn.norm_k.weight",
|
| 233 |
+
"transformer_blocks.21.attn.norm_added_q.weight",
|
| 234 |
+
"transformer_blocks.21.attn.norm_added_k.weight",
|
| 235 |
+
"transformer_blocks.21.img_norm1.weight",
|
| 236 |
+
"transformer_blocks.21.img_norm2.weight",
|
| 237 |
+
"transformer_blocks.21.txt_norm1.weight",
|
| 238 |
+
"transformer_blocks.21.txt_norm2.weight",
|
| 239 |
+
"transformer_blocks.22.attn.norm_q.weight",
|
| 240 |
+
"transformer_blocks.22.attn.norm_k.weight",
|
| 241 |
+
"transformer_blocks.22.attn.norm_added_q.weight",
|
| 242 |
+
"transformer_blocks.22.attn.norm_added_k.weight",
|
| 243 |
+
"transformer_blocks.22.img_norm1.weight",
|
| 244 |
+
"transformer_blocks.22.img_norm2.weight",
|
| 245 |
+
"transformer_blocks.22.txt_norm1.weight",
|
| 246 |
+
"transformer_blocks.22.txt_norm2.weight",
|
| 247 |
+
"transformer_blocks.23.attn.norm_q.weight",
|
| 248 |
+
"transformer_blocks.23.attn.norm_k.weight",
|
| 249 |
+
"transformer_blocks.23.attn.norm_added_q.weight",
|
| 250 |
+
"transformer_blocks.23.attn.norm_added_k.weight",
|
| 251 |
+
"transformer_blocks.23.img_norm1.weight",
|
| 252 |
+
"transformer_blocks.23.img_norm2.weight",
|
| 253 |
+
"transformer_blocks.23.txt_norm1.weight",
|
| 254 |
+
"transformer_blocks.23.txt_norm2.weight",
|
| 255 |
+
"transformer_blocks.24.attn.norm_q.weight",
|
| 256 |
+
"transformer_blocks.24.attn.norm_k.weight",
|
| 257 |
+
"transformer_blocks.24.attn.norm_added_q.weight",
|
| 258 |
+
"transformer_blocks.24.attn.norm_added_k.weight",
|
| 259 |
+
"transformer_blocks.24.img_norm1.weight",
|
| 260 |
+
"transformer_blocks.24.img_norm2.weight",
|
| 261 |
+
"transformer_blocks.24.txt_norm1.weight",
|
| 262 |
+
"transformer_blocks.24.txt_norm2.weight",
|
| 263 |
+
"transformer_blocks.25.attn.norm_q.weight",
|
| 264 |
+
"transformer_blocks.25.attn.norm_k.weight",
|
| 265 |
+
"transformer_blocks.25.attn.norm_added_q.weight",
|
| 266 |
+
"transformer_blocks.25.attn.norm_added_k.weight",
|
| 267 |
+
"transformer_blocks.25.img_norm1.weight",
|
| 268 |
+
"transformer_blocks.25.img_norm2.weight",
|
| 269 |
+
"transformer_blocks.25.txt_norm1.weight",
|
| 270 |
+
"transformer_blocks.25.txt_norm2.weight",
|
| 271 |
+
"transformer_blocks.26.attn.norm_q.weight",
|
| 272 |
+
"transformer_blocks.26.attn.norm_k.weight",
|
| 273 |
+
"transformer_blocks.26.attn.norm_added_q.weight",
|
| 274 |
+
"transformer_blocks.26.attn.norm_added_k.weight",
|
| 275 |
+
"transformer_blocks.26.img_norm1.weight",
|
| 276 |
+
"transformer_blocks.26.img_norm2.weight",
|
| 277 |
+
"transformer_blocks.26.txt_norm1.weight",
|
| 278 |
+
"transformer_blocks.26.txt_norm2.weight",
|
| 279 |
+
"transformer_blocks.27.attn.norm_q.weight",
|
| 280 |
+
"transformer_blocks.27.attn.norm_k.weight",
|
| 281 |
+
"transformer_blocks.27.attn.norm_added_q.weight",
|
| 282 |
+
"transformer_blocks.27.attn.norm_added_k.weight",
|
| 283 |
+
"transformer_blocks.27.img_norm1.weight",
|
| 284 |
+
"transformer_blocks.27.img_norm2.weight",
|
| 285 |
+
"transformer_blocks.27.txt_norm1.weight",
|
| 286 |
+
"transformer_blocks.27.txt_norm2.weight",
|
| 287 |
+
"transformer_blocks.28.attn.norm_q.weight",
|
| 288 |
+
"transformer_blocks.28.attn.norm_k.weight",
|
| 289 |
+
"transformer_blocks.28.attn.norm_added_q.weight",
|
| 290 |
+
"transformer_blocks.28.attn.norm_added_k.weight",
|
| 291 |
+
"transformer_blocks.28.img_norm1.weight",
|
| 292 |
+
"transformer_blocks.28.img_norm2.weight",
|
| 293 |
+
"transformer_blocks.28.txt_norm1.weight",
|
| 294 |
+
"transformer_blocks.28.txt_norm2.weight",
|
| 295 |
+
"transformer_blocks.29.attn.norm_q.weight",
|
| 296 |
+
"transformer_blocks.29.attn.norm_k.weight",
|
| 297 |
+
"transformer_blocks.29.attn.norm_added_q.weight",
|
| 298 |
+
"transformer_blocks.29.attn.norm_added_k.weight",
|
| 299 |
+
"transformer_blocks.29.img_norm1.weight",
|
| 300 |
+
"transformer_blocks.29.img_norm2.weight",
|
| 301 |
+
"transformer_blocks.29.txt_norm1.weight",
|
| 302 |
+
"transformer_blocks.29.txt_norm2.weight",
|
| 303 |
+
"transformer_blocks.30.attn.norm_q.weight",
|
| 304 |
+
"transformer_blocks.30.attn.norm_k.weight",
|
| 305 |
+
"transformer_blocks.30.attn.norm_added_q.weight",
|
| 306 |
+
"transformer_blocks.30.attn.norm_added_k.weight",
|
| 307 |
+
"transformer_blocks.30.img_norm1.weight",
|
| 308 |
+
"transformer_blocks.30.img_norm2.weight",
|
| 309 |
+
"transformer_blocks.30.txt_norm1.weight",
|
| 310 |
+
"transformer_blocks.30.txt_norm2.weight",
|
| 311 |
+
"transformer_blocks.31.attn.norm_q.weight",
|
| 312 |
+
"transformer_blocks.31.attn.norm_k.weight",
|
| 313 |
+
"transformer_blocks.31.attn.norm_added_q.weight",
|
| 314 |
+
"transformer_blocks.31.attn.norm_added_k.weight",
|
| 315 |
+
"transformer_blocks.31.img_norm1.weight",
|
| 316 |
+
"transformer_blocks.31.img_norm2.weight",
|
| 317 |
+
"transformer_blocks.31.txt_norm1.weight",
|
| 318 |
+
"transformer_blocks.31.txt_norm2.weight",
|
| 319 |
+
"transformer_blocks.32.attn.norm_q.weight",
|
| 320 |
+
"transformer_blocks.32.attn.norm_k.weight",
|
| 321 |
+
"transformer_blocks.32.attn.norm_added_q.weight",
|
| 322 |
+
"transformer_blocks.32.attn.norm_added_k.weight",
|
| 323 |
+
"transformer_blocks.32.img_norm1.weight",
|
| 324 |
+
"transformer_blocks.32.img_norm2.weight",
|
| 325 |
+
"transformer_blocks.32.txt_norm1.weight",
|
| 326 |
+
"transformer_blocks.32.txt_norm2.weight",
|
| 327 |
+
"transformer_blocks.33.attn.norm_q.weight",
|
| 328 |
+
"transformer_blocks.33.attn.norm_k.weight",
|
| 329 |
+
"transformer_blocks.33.attn.norm_added_q.weight",
|
| 330 |
+
"transformer_blocks.33.attn.norm_added_k.weight",
|
| 331 |
+
"transformer_blocks.33.img_norm1.weight",
|
| 332 |
+
"transformer_blocks.33.img_norm2.weight",
|
| 333 |
+
"transformer_blocks.33.txt_norm1.weight",
|
| 334 |
+
"transformer_blocks.33.txt_norm2.weight",
|
| 335 |
+
"transformer_blocks.34.attn.norm_q.weight",
|
| 336 |
+
"transformer_blocks.34.attn.norm_k.weight",
|
| 337 |
+
"transformer_blocks.34.attn.norm_added_q.weight",
|
| 338 |
+
"transformer_blocks.34.attn.norm_added_k.weight",
|
| 339 |
+
"transformer_blocks.34.img_norm1.weight",
|
| 340 |
+
"transformer_blocks.34.img_norm2.weight",
|
| 341 |
+
"transformer_blocks.34.txt_norm1.weight",
|
| 342 |
+
"transformer_blocks.34.txt_norm2.weight",
|
| 343 |
+
"transformer_blocks.35.attn.norm_q.weight",
|
| 344 |
+
"transformer_blocks.35.attn.norm_k.weight",
|
| 345 |
+
"transformer_blocks.35.attn.norm_added_q.weight",
|
| 346 |
+
"transformer_blocks.35.attn.norm_added_k.weight",
|
| 347 |
+
"transformer_blocks.35.img_norm1.weight",
|
| 348 |
+
"transformer_blocks.35.img_norm2.weight",
|
| 349 |
+
"transformer_blocks.35.txt_norm1.weight",
|
| 350 |
+
"transformer_blocks.35.txt_norm2.weight",
|
| 351 |
+
"transformer_blocks.36.attn.norm_q.weight",
|
| 352 |
+
"transformer_blocks.36.attn.norm_k.weight",
|
| 353 |
+
"transformer_blocks.36.attn.norm_added_q.weight",
|
| 354 |
+
"transformer_blocks.36.attn.norm_added_k.weight",
|
| 355 |
+
"transformer_blocks.36.img_norm1.weight",
|
| 356 |
+
"transformer_blocks.36.img_norm2.weight",
|
| 357 |
+
"transformer_blocks.36.txt_norm1.weight",
|
| 358 |
+
"transformer_blocks.36.txt_norm2.weight",
|
| 359 |
+
"transformer_blocks.37.attn.norm_q.weight",
|
| 360 |
+
"transformer_blocks.37.attn.norm_k.weight",
|
| 361 |
+
"transformer_blocks.37.attn.norm_added_q.weight",
|
| 362 |
+
"transformer_blocks.37.attn.norm_added_k.weight",
|
| 363 |
+
"transformer_blocks.37.img_norm1.weight",
|
| 364 |
+
"transformer_blocks.37.img_norm2.weight",
|
| 365 |
+
"transformer_blocks.37.txt_norm1.weight",
|
| 366 |
+
"transformer_blocks.37.txt_norm2.weight",
|
| 367 |
+
"transformer_blocks.38.attn.norm_q.weight",
|
| 368 |
+
"transformer_blocks.38.attn.norm_k.weight",
|
| 369 |
+
"transformer_blocks.38.attn.norm_added_q.weight",
|
| 370 |
+
"transformer_blocks.38.attn.norm_added_k.weight",
|
| 371 |
+
"transformer_blocks.38.img_norm1.weight",
|
| 372 |
+
"transformer_blocks.38.img_norm2.weight",
|
| 373 |
+
"transformer_blocks.38.txt_norm1.weight",
|
| 374 |
+
"transformer_blocks.38.txt_norm2.weight",
|
| 375 |
+
"transformer_blocks.39.attn.norm_q.weight",
|
| 376 |
+
"transformer_blocks.39.attn.norm_k.weight",
|
| 377 |
+
"transformer_blocks.39.attn.norm_added_q.weight",
|
| 378 |
+
"transformer_blocks.39.attn.norm_added_k.weight",
|
| 379 |
+
"transformer_blocks.39.img_norm1.weight",
|
| 380 |
+
"transformer_blocks.39.img_norm2.weight",
|
| 381 |
+
"transformer_blocks.39.txt_norm1.weight",
|
| 382 |
+
"transformer_blocks.39.txt_norm2.weight",
|
| 383 |
+
"transformer_blocks.40.attn.norm_q.weight",
|
| 384 |
+
"transformer_blocks.40.attn.norm_k.weight",
|
| 385 |
+
"transformer_blocks.40.attn.norm_added_q.weight",
|
| 386 |
+
"transformer_blocks.40.attn.norm_added_k.weight",
|
| 387 |
+
"transformer_blocks.40.img_norm1.weight",
|
| 388 |
+
"transformer_blocks.40.img_norm2.weight",
|
| 389 |
+
"transformer_blocks.40.txt_norm1.weight",
|
| 390 |
+
"transformer_blocks.40.txt_norm2.weight",
|
| 391 |
+
"transformer_blocks.41.attn.norm_q.weight",
|
| 392 |
+
"transformer_blocks.41.attn.norm_k.weight",
|
| 393 |
+
"transformer_blocks.41.attn.norm_added_q.weight",
|
| 394 |
+
"transformer_blocks.41.attn.norm_added_k.weight",
|
| 395 |
+
"transformer_blocks.41.img_norm1.weight",
|
| 396 |
+
"transformer_blocks.41.img_norm2.weight",
|
| 397 |
+
"transformer_blocks.41.txt_norm1.weight",
|
| 398 |
+
"transformer_blocks.41.txt_norm2.weight",
|
| 399 |
+
"transformer_blocks.42.attn.norm_q.weight",
|
| 400 |
+
"transformer_blocks.42.attn.norm_k.weight",
|
| 401 |
+
"transformer_blocks.42.attn.norm_added_q.weight",
|
| 402 |
+
"transformer_blocks.42.attn.norm_added_k.weight",
|
| 403 |
+
"transformer_blocks.42.img_norm1.weight",
|
| 404 |
+
"transformer_blocks.42.img_norm2.weight",
|
| 405 |
+
"transformer_blocks.42.txt_norm1.weight",
|
| 406 |
+
"transformer_blocks.42.txt_norm2.weight",
|
| 407 |
+
"transformer_blocks.43.attn.norm_q.weight",
|
| 408 |
+
"transformer_blocks.43.attn.norm_k.weight",
|
| 409 |
+
"transformer_blocks.43.attn.norm_added_q.weight",
|
| 410 |
+
"transformer_blocks.43.attn.norm_added_k.weight",
|
| 411 |
+
"transformer_blocks.43.img_norm1.weight",
|
| 412 |
+
"transformer_blocks.43.img_norm2.weight",
|
| 413 |
+
"transformer_blocks.43.txt_norm1.weight",
|
| 414 |
+
"transformer_blocks.43.txt_norm2.weight",
|
| 415 |
+
"transformer_blocks.44.attn.norm_q.weight",
|
| 416 |
+
"transformer_blocks.44.attn.norm_k.weight",
|
| 417 |
+
"transformer_blocks.44.attn.norm_added_q.weight",
|
| 418 |
+
"transformer_blocks.44.attn.norm_added_k.weight",
|
| 419 |
+
"transformer_blocks.44.img_norm1.weight",
|
| 420 |
+
"transformer_blocks.44.img_norm2.weight",
|
| 421 |
+
"transformer_blocks.44.txt_norm1.weight",
|
| 422 |
+
"transformer_blocks.44.txt_norm2.weight",
|
| 423 |
+
"transformer_blocks.45.attn.norm_q.weight",
|
| 424 |
+
"transformer_blocks.45.attn.norm_k.weight",
|
| 425 |
+
"transformer_blocks.45.attn.norm_added_q.weight",
|
| 426 |
+
"transformer_blocks.45.attn.norm_added_k.weight",
|
| 427 |
+
"transformer_blocks.45.img_norm1.weight",
|
| 428 |
+
"transformer_blocks.45.img_norm2.weight",
|
| 429 |
+
"transformer_blocks.45.txt_norm1.weight",
|
| 430 |
+
"transformer_blocks.45.txt_norm2.weight",
|
| 431 |
+
"transformer_blocks.46.attn.norm_q.weight",
|
| 432 |
+
"transformer_blocks.46.attn.norm_k.weight",
|
| 433 |
+
"transformer_blocks.46.attn.norm_added_q.weight",
|
| 434 |
+
"transformer_blocks.46.attn.norm_added_k.weight",
|
| 435 |
+
"transformer_blocks.46.img_norm1.weight",
|
| 436 |
+
"transformer_blocks.46.img_norm2.weight",
|
| 437 |
+
"transformer_blocks.46.txt_norm1.weight",
|
| 438 |
+
"transformer_blocks.46.txt_norm2.weight",
|
| 439 |
+
"transformer_blocks.47.attn.norm_q.weight",
|
| 440 |
+
"transformer_blocks.47.attn.norm_k.weight",
|
| 441 |
+
"transformer_blocks.47.attn.norm_added_q.weight",
|
| 442 |
+
"transformer_blocks.47.attn.norm_added_k.weight",
|
| 443 |
+
"transformer_blocks.47.img_norm1.weight",
|
| 444 |
+
"transformer_blocks.47.img_norm2.weight",
|
| 445 |
+
"transformer_blocks.47.txt_norm1.weight",
|
| 446 |
+
"transformer_blocks.47.txt_norm2.weight"
|
| 447 |
+
],
|
| 448 |
+
"modules_to_not_use_matmul": [],
|
| 449 |
+
"non_blocking": false,
|
| 450 |
+
"quant_conv": false,
|
| 451 |
+
"quant_embedding": false,
|
| 452 |
+
"quant_method": "sdnq",
|
| 453 |
+
"quantization_device": null,
|
| 454 |
+
"quantized_matmul_dtype": "int8",
|
| 455 |
+
"return_device": null,
|
| 456 |
+
"sdnq_version": "0.2.0",
|
| 457 |
+
"svd_rank": 32,
|
| 458 |
+
"svd_steps": 8,
|
| 459 |
+
"use_dynamic_quantization": false,
|
| 460 |
+
"use_grad_ckpt": true,
|
| 461 |
+
"use_hadamard": false,
|
| 462 |
+
"use_quantized_matmul": true,
|
| 463 |
+
"use_quantized_matmul_conv": false,
|
| 464 |
+
"use_static_quantization": true,
|
| 465 |
+
"use_stochastic_rounding": false,
|
| 466 |
+
"use_svd": false,
|
| 467 |
+
"weights_dtype": "uint4"
|
| 468 |
+
},
|
| 469 |
+
"rms_norm": true,
|
| 470 |
+
"selected_layer_index": [
|
| 471 |
+
5,
|
| 472 |
+
11,
|
| 473 |
+
17,
|
| 474 |
+
23
|
| 475 |
+
]
|
| 476 |
+
}
|
transformer/diffusion_pytorch_model-00001-of-00002.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:abd3791d4c163f82fb8e95f7f53bd7af38043e24b19bc5bcab600e2c2633ec87
|
| 3 |
+
size 3987262976
|
transformer/diffusion_pytorch_model-00002-of-00002.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1065a7a189f5d7dbe23820538667563f615c92685e566e2c8b7d8777ea350c5e
|
| 3 |
+
size 314450920
|
transformer/diffusion_pytorch_model.safetensors.index.json
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
transformer/quantization_config.json
ADDED
|
@@ -0,0 +1,449 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"add_skip_keys": false,
|
| 3 |
+
"dequantize_fp32": false,
|
| 4 |
+
"dynamic_loss_threshold": null,
|
| 5 |
+
"group_size": 0,
|
| 6 |
+
"hadamard_group_size": 128,
|
| 7 |
+
"is_integer": true,
|
| 8 |
+
"is_training": false,
|
| 9 |
+
"modules_dtype_dict": {},
|
| 10 |
+
"modules_quant_config": {},
|
| 11 |
+
"modules_to_not_convert": [
|
| 12 |
+
".emb_in",
|
| 13 |
+
".emb_out",
|
| 14 |
+
"norm",
|
| 15 |
+
".y_embedder",
|
| 16 |
+
"patch_emb",
|
| 17 |
+
"lm_head",
|
| 18 |
+
".condition_embedder",
|
| 19 |
+
".norm_out",
|
| 20 |
+
".t_embedder",
|
| 21 |
+
"patch_embedding",
|
| 22 |
+
".vid_in",
|
| 23 |
+
".txt_in",
|
| 24 |
+
".txt_out",
|
| 25 |
+
".time_embed",
|
| 26 |
+
"*.img_mod.*",
|
| 27 |
+
".proj_out",
|
| 28 |
+
".img_out",
|
| 29 |
+
"*.txt_mod.*",
|
| 30 |
+
".context_embedder",
|
| 31 |
+
".vid_out",
|
| 32 |
+
"time_text_embed",
|
| 33 |
+
"patch_embed",
|
| 34 |
+
"wte",
|
| 35 |
+
".img_in",
|
| 36 |
+
".final_layer",
|
| 37 |
+
".x_embedder",
|
| 38 |
+
"multi_modal_projector",
|
| 39 |
+
"pos_embed",
|
| 40 |
+
"txt_norm.0.weight",
|
| 41 |
+
"txt_norm.1.weight",
|
| 42 |
+
"txt_norm.2.weight",
|
| 43 |
+
"txt_norm.3.weight",
|
| 44 |
+
"transformer_blocks.0.attn.norm_q.weight",
|
| 45 |
+
"transformer_blocks.0.attn.norm_k.weight",
|
| 46 |
+
"transformer_blocks.0.attn.norm_added_q.weight",
|
| 47 |
+
"transformer_blocks.0.attn.norm_added_k.weight",
|
| 48 |
+
"transformer_blocks.0.img_norm1.weight",
|
| 49 |
+
"transformer_blocks.0.img_norm2.weight",
|
| 50 |
+
"transformer_blocks.0.txt_norm1.weight",
|
| 51 |
+
"transformer_blocks.0.txt_norm2.weight",
|
| 52 |
+
"transformer_blocks.1.attn.norm_q.weight",
|
| 53 |
+
"transformer_blocks.1.attn.norm_k.weight",
|
| 54 |
+
"transformer_blocks.1.attn.norm_added_q.weight",
|
| 55 |
+
"transformer_blocks.1.attn.norm_added_k.weight",
|
| 56 |
+
"transformer_blocks.1.img_norm1.weight",
|
| 57 |
+
"transformer_blocks.1.img_norm2.weight",
|
| 58 |
+
"transformer_blocks.1.txt_norm1.weight",
|
| 59 |
+
"transformer_blocks.1.txt_norm2.weight",
|
| 60 |
+
"transformer_blocks.2.attn.norm_q.weight",
|
| 61 |
+
"transformer_blocks.2.attn.norm_k.weight",
|
| 62 |
+
"transformer_blocks.2.attn.norm_added_q.weight",
|
| 63 |
+
"transformer_blocks.2.attn.norm_added_k.weight",
|
| 64 |
+
"transformer_blocks.2.img_norm1.weight",
|
| 65 |
+
"transformer_blocks.2.img_norm2.weight",
|
| 66 |
+
"transformer_blocks.2.txt_norm1.weight",
|
| 67 |
+
"transformer_blocks.2.txt_norm2.weight",
|
| 68 |
+
"transformer_blocks.3.attn.norm_q.weight",
|
| 69 |
+
"transformer_blocks.3.attn.norm_k.weight",
|
| 70 |
+
"transformer_blocks.3.attn.norm_added_q.weight",
|
| 71 |
+
"transformer_blocks.3.attn.norm_added_k.weight",
|
| 72 |
+
"transformer_blocks.3.img_norm1.weight",
|
| 73 |
+
"transformer_blocks.3.img_norm2.weight",
|
| 74 |
+
"transformer_blocks.3.txt_norm1.weight",
|
| 75 |
+
"transformer_blocks.3.txt_norm2.weight",
|
| 76 |
+
"transformer_blocks.4.attn.norm_q.weight",
|
| 77 |
+
"transformer_blocks.4.attn.norm_k.weight",
|
| 78 |
+
"transformer_blocks.4.attn.norm_added_q.weight",
|
| 79 |
+
"transformer_blocks.4.attn.norm_added_k.weight",
|
| 80 |
+
"transformer_blocks.4.img_norm1.weight",
|
| 81 |
+
"transformer_blocks.4.img_norm2.weight",
|
| 82 |
+
"transformer_blocks.4.txt_norm1.weight",
|
| 83 |
+
"transformer_blocks.4.txt_norm2.weight",
|
| 84 |
+
"transformer_blocks.5.attn.norm_q.weight",
|
| 85 |
+
"transformer_blocks.5.attn.norm_k.weight",
|
| 86 |
+
"transformer_blocks.5.attn.norm_added_q.weight",
|
| 87 |
+
"transformer_blocks.5.attn.norm_added_k.weight",
|
| 88 |
+
"transformer_blocks.5.img_norm1.weight",
|
| 89 |
+
"transformer_blocks.5.img_norm2.weight",
|
| 90 |
+
"transformer_blocks.5.txt_norm1.weight",
|
| 91 |
+
"transformer_blocks.5.txt_norm2.weight",
|
| 92 |
+
"transformer_blocks.6.attn.norm_q.weight",
|
| 93 |
+
"transformer_blocks.6.attn.norm_k.weight",
|
| 94 |
+
"transformer_blocks.6.attn.norm_added_q.weight",
|
| 95 |
+
"transformer_blocks.6.attn.norm_added_k.weight",
|
| 96 |
+
"transformer_blocks.6.img_norm1.weight",
|
| 97 |
+
"transformer_blocks.6.img_norm2.weight",
|
| 98 |
+
"transformer_blocks.6.txt_norm1.weight",
|
| 99 |
+
"transformer_blocks.6.txt_norm2.weight",
|
| 100 |
+
"transformer_blocks.7.attn.norm_q.weight",
|
| 101 |
+
"transformer_blocks.7.attn.norm_k.weight",
|
| 102 |
+
"transformer_blocks.7.attn.norm_added_q.weight",
|
| 103 |
+
"transformer_blocks.7.attn.norm_added_k.weight",
|
| 104 |
+
"transformer_blocks.7.img_norm1.weight",
|
| 105 |
+
"transformer_blocks.7.img_norm2.weight",
|
| 106 |
+
"transformer_blocks.7.txt_norm1.weight",
|
| 107 |
+
"transformer_blocks.7.txt_norm2.weight",
|
| 108 |
+
"transformer_blocks.8.attn.norm_q.weight",
|
| 109 |
+
"transformer_blocks.8.attn.norm_k.weight",
|
| 110 |
+
"transformer_blocks.8.attn.norm_added_q.weight",
|
| 111 |
+
"transformer_blocks.8.attn.norm_added_k.weight",
|
| 112 |
+
"transformer_blocks.8.img_norm1.weight",
|
| 113 |
+
"transformer_blocks.8.img_norm2.weight",
|
| 114 |
+
"transformer_blocks.8.txt_norm1.weight",
|
| 115 |
+
"transformer_blocks.8.txt_norm2.weight",
|
| 116 |
+
"transformer_blocks.9.attn.norm_q.weight",
|
| 117 |
+
"transformer_blocks.9.attn.norm_k.weight",
|
| 118 |
+
"transformer_blocks.9.attn.norm_added_q.weight",
|
| 119 |
+
"transformer_blocks.9.attn.norm_added_k.weight",
|
| 120 |
+
"transformer_blocks.9.img_norm1.weight",
|
| 121 |
+
"transformer_blocks.9.img_norm2.weight",
|
| 122 |
+
"transformer_blocks.9.txt_norm1.weight",
|
| 123 |
+
"transformer_blocks.9.txt_norm2.weight",
|
| 124 |
+
"transformer_blocks.10.attn.norm_q.weight",
|
| 125 |
+
"transformer_blocks.10.attn.norm_k.weight",
|
| 126 |
+
"transformer_blocks.10.attn.norm_added_q.weight",
|
| 127 |
+
"transformer_blocks.10.attn.norm_added_k.weight",
|
| 128 |
+
"transformer_blocks.10.img_norm1.weight",
|
| 129 |
+
"transformer_blocks.10.img_norm2.weight",
|
| 130 |
+
"transformer_blocks.10.txt_norm1.weight",
|
| 131 |
+
"transformer_blocks.10.txt_norm2.weight",
|
| 132 |
+
"transformer_blocks.11.attn.norm_q.weight",
|
| 133 |
+
"transformer_blocks.11.attn.norm_k.weight",
|
| 134 |
+
"transformer_blocks.11.attn.norm_added_q.weight",
|
| 135 |
+
"transformer_blocks.11.attn.norm_added_k.weight",
|
| 136 |
+
"transformer_blocks.11.img_norm1.weight",
|
| 137 |
+
"transformer_blocks.11.img_norm2.weight",
|
| 138 |
+
"transformer_blocks.11.txt_norm1.weight",
|
| 139 |
+
"transformer_blocks.11.txt_norm2.weight",
|
| 140 |
+
"transformer_blocks.12.attn.norm_q.weight",
|
| 141 |
+
"transformer_blocks.12.attn.norm_k.weight",
|
| 142 |
+
"transformer_blocks.12.attn.norm_added_q.weight",
|
| 143 |
+
"transformer_blocks.12.attn.norm_added_k.weight",
|
| 144 |
+
"transformer_blocks.12.img_norm1.weight",
|
| 145 |
+
"transformer_blocks.12.img_norm2.weight",
|
| 146 |
+
"transformer_blocks.12.txt_norm1.weight",
|
| 147 |
+
"transformer_blocks.12.txt_norm2.weight",
|
| 148 |
+
"transformer_blocks.13.attn.norm_q.weight",
|
| 149 |
+
"transformer_blocks.13.attn.norm_k.weight",
|
| 150 |
+
"transformer_blocks.13.attn.norm_added_q.weight",
|
| 151 |
+
"transformer_blocks.13.attn.norm_added_k.weight",
|
| 152 |
+
"transformer_blocks.13.img_norm1.weight",
|
| 153 |
+
"transformer_blocks.13.img_norm2.weight",
|
| 154 |
+
"transformer_blocks.13.txt_norm1.weight",
|
| 155 |
+
"transformer_blocks.13.txt_norm2.weight",
|
| 156 |
+
"transformer_blocks.14.attn.norm_q.weight",
|
| 157 |
+
"transformer_blocks.14.attn.norm_k.weight",
|
| 158 |
+
"transformer_blocks.14.attn.norm_added_q.weight",
|
| 159 |
+
"transformer_blocks.14.attn.norm_added_k.weight",
|
| 160 |
+
"transformer_blocks.14.img_norm1.weight",
|
| 161 |
+
"transformer_blocks.14.img_norm2.weight",
|
| 162 |
+
"transformer_blocks.14.txt_norm1.weight",
|
| 163 |
+
"transformer_blocks.14.txt_norm2.weight",
|
| 164 |
+
"transformer_blocks.15.attn.norm_q.weight",
|
| 165 |
+
"transformer_blocks.15.attn.norm_k.weight",
|
| 166 |
+
"transformer_blocks.15.attn.norm_added_q.weight",
|
| 167 |
+
"transformer_blocks.15.attn.norm_added_k.weight",
|
| 168 |
+
"transformer_blocks.15.img_norm1.weight",
|
| 169 |
+
"transformer_blocks.15.img_norm2.weight",
|
| 170 |
+
"transformer_blocks.15.txt_norm1.weight",
|
| 171 |
+
"transformer_blocks.15.txt_norm2.weight",
|
| 172 |
+
"transformer_blocks.16.attn.norm_q.weight",
|
| 173 |
+
"transformer_blocks.16.attn.norm_k.weight",
|
| 174 |
+
"transformer_blocks.16.attn.norm_added_q.weight",
|
| 175 |
+
"transformer_blocks.16.attn.norm_added_k.weight",
|
| 176 |
+
"transformer_blocks.16.img_norm1.weight",
|
| 177 |
+
"transformer_blocks.16.img_norm2.weight",
|
| 178 |
+
"transformer_blocks.16.txt_norm1.weight",
|
| 179 |
+
"transformer_blocks.16.txt_norm2.weight",
|
| 180 |
+
"transformer_blocks.17.attn.norm_q.weight",
|
| 181 |
+
"transformer_blocks.17.attn.norm_k.weight",
|
| 182 |
+
"transformer_blocks.17.attn.norm_added_q.weight",
|
| 183 |
+
"transformer_blocks.17.attn.norm_added_k.weight",
|
| 184 |
+
"transformer_blocks.17.img_norm1.weight",
|
| 185 |
+
"transformer_blocks.17.img_norm2.weight",
|
| 186 |
+
"transformer_blocks.17.txt_norm1.weight",
|
| 187 |
+
"transformer_blocks.17.txt_norm2.weight",
|
| 188 |
+
"transformer_blocks.18.attn.norm_q.weight",
|
| 189 |
+
"transformer_blocks.18.attn.norm_k.weight",
|
| 190 |
+
"transformer_blocks.18.attn.norm_added_q.weight",
|
| 191 |
+
"transformer_blocks.18.attn.norm_added_k.weight",
|
| 192 |
+
"transformer_blocks.18.img_norm1.weight",
|
| 193 |
+
"transformer_blocks.18.img_norm2.weight",
|
| 194 |
+
"transformer_blocks.18.txt_norm1.weight",
|
| 195 |
+
"transformer_blocks.18.txt_norm2.weight",
|
| 196 |
+
"transformer_blocks.19.attn.norm_q.weight",
|
| 197 |
+
"transformer_blocks.19.attn.norm_k.weight",
|
| 198 |
+
"transformer_blocks.19.attn.norm_added_q.weight",
|
| 199 |
+
"transformer_blocks.19.attn.norm_added_k.weight",
|
| 200 |
+
"transformer_blocks.19.img_norm1.weight",
|
| 201 |
+
"transformer_blocks.19.img_norm2.weight",
|
| 202 |
+
"transformer_blocks.19.txt_norm1.weight",
|
| 203 |
+
"transformer_blocks.19.txt_norm2.weight",
|
| 204 |
+
"transformer_blocks.20.attn.norm_q.weight",
|
| 205 |
+
"transformer_blocks.20.attn.norm_k.weight",
|
| 206 |
+
"transformer_blocks.20.attn.norm_added_q.weight",
|
| 207 |
+
"transformer_blocks.20.attn.norm_added_k.weight",
|
| 208 |
+
"transformer_blocks.20.img_norm1.weight",
|
| 209 |
+
"transformer_blocks.20.img_norm2.weight",
|
| 210 |
+
"transformer_blocks.20.txt_norm1.weight",
|
| 211 |
+
"transformer_blocks.20.txt_norm2.weight",
|
| 212 |
+
"transformer_blocks.21.attn.norm_q.weight",
|
| 213 |
+
"transformer_blocks.21.attn.norm_k.weight",
|
| 214 |
+
"transformer_blocks.21.attn.norm_added_q.weight",
|
| 215 |
+
"transformer_blocks.21.attn.norm_added_k.weight",
|
| 216 |
+
"transformer_blocks.21.img_norm1.weight",
|
| 217 |
+
"transformer_blocks.21.img_norm2.weight",
|
| 218 |
+
"transformer_blocks.21.txt_norm1.weight",
|
| 219 |
+
"transformer_blocks.21.txt_norm2.weight",
|
| 220 |
+
"transformer_blocks.22.attn.norm_q.weight",
|
| 221 |
+
"transformer_blocks.22.attn.norm_k.weight",
|
| 222 |
+
"transformer_blocks.22.attn.norm_added_q.weight",
|
| 223 |
+
"transformer_blocks.22.attn.norm_added_k.weight",
|
| 224 |
+
"transformer_blocks.22.img_norm1.weight",
|
| 225 |
+
"transformer_blocks.22.img_norm2.weight",
|
| 226 |
+
"transformer_blocks.22.txt_norm1.weight",
|
| 227 |
+
"transformer_blocks.22.txt_norm2.weight",
|
| 228 |
+
"transformer_blocks.23.attn.norm_q.weight",
|
| 229 |
+
"transformer_blocks.23.attn.norm_k.weight",
|
| 230 |
+
"transformer_blocks.23.attn.norm_added_q.weight",
|
| 231 |
+
"transformer_blocks.23.attn.norm_added_k.weight",
|
| 232 |
+
"transformer_blocks.23.img_norm1.weight",
|
| 233 |
+
"transformer_blocks.23.img_norm2.weight",
|
| 234 |
+
"transformer_blocks.23.txt_norm1.weight",
|
| 235 |
+
"transformer_blocks.23.txt_norm2.weight",
|
| 236 |
+
"transformer_blocks.24.attn.norm_q.weight",
|
| 237 |
+
"transformer_blocks.24.attn.norm_k.weight",
|
| 238 |
+
"transformer_blocks.24.attn.norm_added_q.weight",
|
| 239 |
+
"transformer_blocks.24.attn.norm_added_k.weight",
|
| 240 |
+
"transformer_blocks.24.img_norm1.weight",
|
| 241 |
+
"transformer_blocks.24.img_norm2.weight",
|
| 242 |
+
"transformer_blocks.24.txt_norm1.weight",
|
| 243 |
+
"transformer_blocks.24.txt_norm2.weight",
|
| 244 |
+
"transformer_blocks.25.attn.norm_q.weight",
|
| 245 |
+
"transformer_blocks.25.attn.norm_k.weight",
|
| 246 |
+
"transformer_blocks.25.attn.norm_added_q.weight",
|
| 247 |
+
"transformer_blocks.25.attn.norm_added_k.weight",
|
| 248 |
+
"transformer_blocks.25.img_norm1.weight",
|
| 249 |
+
"transformer_blocks.25.img_norm2.weight",
|
| 250 |
+
"transformer_blocks.25.txt_norm1.weight",
|
| 251 |
+
"transformer_blocks.25.txt_norm2.weight",
|
| 252 |
+
"transformer_blocks.26.attn.norm_q.weight",
|
| 253 |
+
"transformer_blocks.26.attn.norm_k.weight",
|
| 254 |
+
"transformer_blocks.26.attn.norm_added_q.weight",
|
| 255 |
+
"transformer_blocks.26.attn.norm_added_k.weight",
|
| 256 |
+
"transformer_blocks.26.img_norm1.weight",
|
| 257 |
+
"transformer_blocks.26.img_norm2.weight",
|
| 258 |
+
"transformer_blocks.26.txt_norm1.weight",
|
| 259 |
+
"transformer_blocks.26.txt_norm2.weight",
|
| 260 |
+
"transformer_blocks.27.attn.norm_q.weight",
|
| 261 |
+
"transformer_blocks.27.attn.norm_k.weight",
|
| 262 |
+
"transformer_blocks.27.attn.norm_added_q.weight",
|
| 263 |
+
"transformer_blocks.27.attn.norm_added_k.weight",
|
| 264 |
+
"transformer_blocks.27.img_norm1.weight",
|
| 265 |
+
"transformer_blocks.27.img_norm2.weight",
|
| 266 |
+
"transformer_blocks.27.txt_norm1.weight",
|
| 267 |
+
"transformer_blocks.27.txt_norm2.weight",
|
| 268 |
+
"transformer_blocks.28.attn.norm_q.weight",
|
| 269 |
+
"transformer_blocks.28.attn.norm_k.weight",
|
| 270 |
+
"transformer_blocks.28.attn.norm_added_q.weight",
|
| 271 |
+
"transformer_blocks.28.attn.norm_added_k.weight",
|
| 272 |
+
"transformer_blocks.28.img_norm1.weight",
|
| 273 |
+
"transformer_blocks.28.img_norm2.weight",
|
| 274 |
+
"transformer_blocks.28.txt_norm1.weight",
|
| 275 |
+
"transformer_blocks.28.txt_norm2.weight",
|
| 276 |
+
"transformer_blocks.29.attn.norm_q.weight",
|
| 277 |
+
"transformer_blocks.29.attn.norm_k.weight",
|
| 278 |
+
"transformer_blocks.29.attn.norm_added_q.weight",
|
| 279 |
+
"transformer_blocks.29.attn.norm_added_k.weight",
|
| 280 |
+
"transformer_blocks.29.img_norm1.weight",
|
| 281 |
+
"transformer_blocks.29.img_norm2.weight",
|
| 282 |
+
"transformer_blocks.29.txt_norm1.weight",
|
| 283 |
+
"transformer_blocks.29.txt_norm2.weight",
|
| 284 |
+
"transformer_blocks.30.attn.norm_q.weight",
|
| 285 |
+
"transformer_blocks.30.attn.norm_k.weight",
|
| 286 |
+
"transformer_blocks.30.attn.norm_added_q.weight",
|
| 287 |
+
"transformer_blocks.30.attn.norm_added_k.weight",
|
| 288 |
+
"transformer_blocks.30.img_norm1.weight",
|
| 289 |
+
"transformer_blocks.30.img_norm2.weight",
|
| 290 |
+
"transformer_blocks.30.txt_norm1.weight",
|
| 291 |
+
"transformer_blocks.30.txt_norm2.weight",
|
| 292 |
+
"transformer_blocks.31.attn.norm_q.weight",
|
| 293 |
+
"transformer_blocks.31.attn.norm_k.weight",
|
| 294 |
+
"transformer_blocks.31.attn.norm_added_q.weight",
|
| 295 |
+
"transformer_blocks.31.attn.norm_added_k.weight",
|
| 296 |
+
"transformer_blocks.31.img_norm1.weight",
|
| 297 |
+
"transformer_blocks.31.img_norm2.weight",
|
| 298 |
+
"transformer_blocks.31.txt_norm1.weight",
|
| 299 |
+
"transformer_blocks.31.txt_norm2.weight",
|
| 300 |
+
"transformer_blocks.32.attn.norm_q.weight",
|
| 301 |
+
"transformer_blocks.32.attn.norm_k.weight",
|
| 302 |
+
"transformer_blocks.32.attn.norm_added_q.weight",
|
| 303 |
+
"transformer_blocks.32.attn.norm_added_k.weight",
|
| 304 |
+
"transformer_blocks.32.img_norm1.weight",
|
| 305 |
+
"transformer_blocks.32.img_norm2.weight",
|
| 306 |
+
"transformer_blocks.32.txt_norm1.weight",
|
| 307 |
+
"transformer_blocks.32.txt_norm2.weight",
|
| 308 |
+
"transformer_blocks.33.attn.norm_q.weight",
|
| 309 |
+
"transformer_blocks.33.attn.norm_k.weight",
|
| 310 |
+
"transformer_blocks.33.attn.norm_added_q.weight",
|
| 311 |
+
"transformer_blocks.33.attn.norm_added_k.weight",
|
| 312 |
+
"transformer_blocks.33.img_norm1.weight",
|
| 313 |
+
"transformer_blocks.33.img_norm2.weight",
|
| 314 |
+
"transformer_blocks.33.txt_norm1.weight",
|
| 315 |
+
"transformer_blocks.33.txt_norm2.weight",
|
| 316 |
+
"transformer_blocks.34.attn.norm_q.weight",
|
| 317 |
+
"transformer_blocks.34.attn.norm_k.weight",
|
| 318 |
+
"transformer_blocks.34.attn.norm_added_q.weight",
|
| 319 |
+
"transformer_blocks.34.attn.norm_added_k.weight",
|
| 320 |
+
"transformer_blocks.34.img_norm1.weight",
|
| 321 |
+
"transformer_blocks.34.img_norm2.weight",
|
| 322 |
+
"transformer_blocks.34.txt_norm1.weight",
|
| 323 |
+
"transformer_blocks.34.txt_norm2.weight",
|
| 324 |
+
"transformer_blocks.35.attn.norm_q.weight",
|
| 325 |
+
"transformer_blocks.35.attn.norm_k.weight",
|
| 326 |
+
"transformer_blocks.35.attn.norm_added_q.weight",
|
| 327 |
+
"transformer_blocks.35.attn.norm_added_k.weight",
|
| 328 |
+
"transformer_blocks.35.img_norm1.weight",
|
| 329 |
+
"transformer_blocks.35.img_norm2.weight",
|
| 330 |
+
"transformer_blocks.35.txt_norm1.weight",
|
| 331 |
+
"transformer_blocks.35.txt_norm2.weight",
|
| 332 |
+
"transformer_blocks.36.attn.norm_q.weight",
|
| 333 |
+
"transformer_blocks.36.attn.norm_k.weight",
|
| 334 |
+
"transformer_blocks.36.attn.norm_added_q.weight",
|
| 335 |
+
"transformer_blocks.36.attn.norm_added_k.weight",
|
| 336 |
+
"transformer_blocks.36.img_norm1.weight",
|
| 337 |
+
"transformer_blocks.36.img_norm2.weight",
|
| 338 |
+
"transformer_blocks.36.txt_norm1.weight",
|
| 339 |
+
"transformer_blocks.36.txt_norm2.weight",
|
| 340 |
+
"transformer_blocks.37.attn.norm_q.weight",
|
| 341 |
+
"transformer_blocks.37.attn.norm_k.weight",
|
| 342 |
+
"transformer_blocks.37.attn.norm_added_q.weight",
|
| 343 |
+
"transformer_blocks.37.attn.norm_added_k.weight",
|
| 344 |
+
"transformer_blocks.37.img_norm1.weight",
|
| 345 |
+
"transformer_blocks.37.img_norm2.weight",
|
| 346 |
+
"transformer_blocks.37.txt_norm1.weight",
|
| 347 |
+
"transformer_blocks.37.txt_norm2.weight",
|
| 348 |
+
"transformer_blocks.38.attn.norm_q.weight",
|
| 349 |
+
"transformer_blocks.38.attn.norm_k.weight",
|
| 350 |
+
"transformer_blocks.38.attn.norm_added_q.weight",
|
| 351 |
+
"transformer_blocks.38.attn.norm_added_k.weight",
|
| 352 |
+
"transformer_blocks.38.img_norm1.weight",
|
| 353 |
+
"transformer_blocks.38.img_norm2.weight",
|
| 354 |
+
"transformer_blocks.38.txt_norm1.weight",
|
| 355 |
+
"transformer_blocks.38.txt_norm2.weight",
|
| 356 |
+
"transformer_blocks.39.attn.norm_q.weight",
|
| 357 |
+
"transformer_blocks.39.attn.norm_k.weight",
|
| 358 |
+
"transformer_blocks.39.attn.norm_added_q.weight",
|
| 359 |
+
"transformer_blocks.39.attn.norm_added_k.weight",
|
| 360 |
+
"transformer_blocks.39.img_norm1.weight",
|
| 361 |
+
"transformer_blocks.39.img_norm2.weight",
|
| 362 |
+
"transformer_blocks.39.txt_norm1.weight",
|
| 363 |
+
"transformer_blocks.39.txt_norm2.weight",
|
| 364 |
+
"transformer_blocks.40.attn.norm_q.weight",
|
| 365 |
+
"transformer_blocks.40.attn.norm_k.weight",
|
| 366 |
+
"transformer_blocks.40.attn.norm_added_q.weight",
|
| 367 |
+
"transformer_blocks.40.attn.norm_added_k.weight",
|
| 368 |
+
"transformer_blocks.40.img_norm1.weight",
|
| 369 |
+
"transformer_blocks.40.img_norm2.weight",
|
| 370 |
+
"transformer_blocks.40.txt_norm1.weight",
|
| 371 |
+
"transformer_blocks.40.txt_norm2.weight",
|
| 372 |
+
"transformer_blocks.41.attn.norm_q.weight",
|
| 373 |
+
"transformer_blocks.41.attn.norm_k.weight",
|
| 374 |
+
"transformer_blocks.41.attn.norm_added_q.weight",
|
| 375 |
+
"transformer_blocks.41.attn.norm_added_k.weight",
|
| 376 |
+
"transformer_blocks.41.img_norm1.weight",
|
| 377 |
+
"transformer_blocks.41.img_norm2.weight",
|
| 378 |
+
"transformer_blocks.41.txt_norm1.weight",
|
| 379 |
+
"transformer_blocks.41.txt_norm2.weight",
|
| 380 |
+
"transformer_blocks.42.attn.norm_q.weight",
|
| 381 |
+
"transformer_blocks.42.attn.norm_k.weight",
|
| 382 |
+
"transformer_blocks.42.attn.norm_added_q.weight",
|
| 383 |
+
"transformer_blocks.42.attn.norm_added_k.weight",
|
| 384 |
+
"transformer_blocks.42.img_norm1.weight",
|
| 385 |
+
"transformer_blocks.42.img_norm2.weight",
|
| 386 |
+
"transformer_blocks.42.txt_norm1.weight",
|
| 387 |
+
"transformer_blocks.42.txt_norm2.weight",
|
| 388 |
+
"transformer_blocks.43.attn.norm_q.weight",
|
| 389 |
+
"transformer_blocks.43.attn.norm_k.weight",
|
| 390 |
+
"transformer_blocks.43.attn.norm_added_q.weight",
|
| 391 |
+
"transformer_blocks.43.attn.norm_added_k.weight",
|
| 392 |
+
"transformer_blocks.43.img_norm1.weight",
|
| 393 |
+
"transformer_blocks.43.img_norm2.weight",
|
| 394 |
+
"transformer_blocks.43.txt_norm1.weight",
|
| 395 |
+
"transformer_blocks.43.txt_norm2.weight",
|
| 396 |
+
"transformer_blocks.44.attn.norm_q.weight",
|
| 397 |
+
"transformer_blocks.44.attn.norm_k.weight",
|
| 398 |
+
"transformer_blocks.44.attn.norm_added_q.weight",
|
| 399 |
+
"transformer_blocks.44.attn.norm_added_k.weight",
|
| 400 |
+
"transformer_blocks.44.img_norm1.weight",
|
| 401 |
+
"transformer_blocks.44.img_norm2.weight",
|
| 402 |
+
"transformer_blocks.44.txt_norm1.weight",
|
| 403 |
+
"transformer_blocks.44.txt_norm2.weight",
|
| 404 |
+
"transformer_blocks.45.attn.norm_q.weight",
|
| 405 |
+
"transformer_blocks.45.attn.norm_k.weight",
|
| 406 |
+
"transformer_blocks.45.attn.norm_added_q.weight",
|
| 407 |
+
"transformer_blocks.45.attn.norm_added_k.weight",
|
| 408 |
+
"transformer_blocks.45.img_norm1.weight",
|
| 409 |
+
"transformer_blocks.45.img_norm2.weight",
|
| 410 |
+
"transformer_blocks.45.txt_norm1.weight",
|
| 411 |
+
"transformer_blocks.45.txt_norm2.weight",
|
| 412 |
+
"transformer_blocks.46.attn.norm_q.weight",
|
| 413 |
+
"transformer_blocks.46.attn.norm_k.weight",
|
| 414 |
+
"transformer_blocks.46.attn.norm_added_q.weight",
|
| 415 |
+
"transformer_blocks.46.attn.norm_added_k.weight",
|
| 416 |
+
"transformer_blocks.46.img_norm1.weight",
|
| 417 |
+
"transformer_blocks.46.img_norm2.weight",
|
| 418 |
+
"transformer_blocks.46.txt_norm1.weight",
|
| 419 |
+
"transformer_blocks.46.txt_norm2.weight",
|
| 420 |
+
"transformer_blocks.47.attn.norm_q.weight",
|
| 421 |
+
"transformer_blocks.47.attn.norm_k.weight",
|
| 422 |
+
"transformer_blocks.47.attn.norm_added_q.weight",
|
| 423 |
+
"transformer_blocks.47.attn.norm_added_k.weight",
|
| 424 |
+
"transformer_blocks.47.img_norm1.weight",
|
| 425 |
+
"transformer_blocks.47.img_norm2.weight",
|
| 426 |
+
"transformer_blocks.47.txt_norm1.weight",
|
| 427 |
+
"transformer_blocks.47.txt_norm2.weight"
|
| 428 |
+
],
|
| 429 |
+
"modules_to_not_use_matmul": [],
|
| 430 |
+
"non_blocking": false,
|
| 431 |
+
"quant_conv": false,
|
| 432 |
+
"quant_embedding": false,
|
| 433 |
+
"quant_method": "sdnq",
|
| 434 |
+
"quantization_device": null,
|
| 435 |
+
"quantized_matmul_dtype": "int8",
|
| 436 |
+
"return_device": null,
|
| 437 |
+
"sdnq_version": "0.2.0",
|
| 438 |
+
"svd_rank": 32,
|
| 439 |
+
"svd_steps": 8,
|
| 440 |
+
"use_dynamic_quantization": false,
|
| 441 |
+
"use_grad_ckpt": true,
|
| 442 |
+
"use_hadamard": false,
|
| 443 |
+
"use_quantized_matmul": true,
|
| 444 |
+
"use_quantized_matmul_conv": false,
|
| 445 |
+
"use_static_quantization": true,
|
| 446 |
+
"use_stochastic_rounding": false,
|
| 447 |
+
"use_svd": false,
|
| 448 |
+
"weights_dtype": "uint4"
|
| 449 |
+
}
|
vae/config.json
ADDED
|
@@ -0,0 +1,40 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"_class_name": "AutoencoderKLFlux2",
|
| 3 |
+
"_diffusers_version": "0.37.1",
|
| 4 |
+
"_name_or_path": "black-forest-labs/FLUX.2-dev",
|
| 5 |
+
"act_fn": "silu",
|
| 6 |
+
"batch_norm_eps": 0.0001,
|
| 7 |
+
"batch_norm_momentum": 0.1,
|
| 8 |
+
"block_out_channels": [
|
| 9 |
+
128,
|
| 10 |
+
256,
|
| 11 |
+
512,
|
| 12 |
+
512
|
| 13 |
+
],
|
| 14 |
+
"down_block_types": [
|
| 15 |
+
"DownEncoderBlock2D",
|
| 16 |
+
"DownEncoderBlock2D",
|
| 17 |
+
"DownEncoderBlock2D",
|
| 18 |
+
"DownEncoderBlock2D"
|
| 19 |
+
],
|
| 20 |
+
"force_upcast": true,
|
| 21 |
+
"in_channels": 3,
|
| 22 |
+
"latent_channels": 32,
|
| 23 |
+
"layers_per_block": 2,
|
| 24 |
+
"mid_block_add_attention": true,
|
| 25 |
+
"norm_num_groups": 32,
|
| 26 |
+
"out_channels": 3,
|
| 27 |
+
"patch_size": [
|
| 28 |
+
2,
|
| 29 |
+
2
|
| 30 |
+
],
|
| 31 |
+
"sample_size": 1024,
|
| 32 |
+
"up_block_types": [
|
| 33 |
+
"UpDecoderBlock2D",
|
| 34 |
+
"UpDecoderBlock2D",
|
| 35 |
+
"UpDecoderBlock2D",
|
| 36 |
+
"UpDecoderBlock2D"
|
| 37 |
+
],
|
| 38 |
+
"use_post_quant_conv": true,
|
| 39 |
+
"use_quant_conv": true
|
| 40 |
+
}
|
vae/diffusion_pytorch_model.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d64f3a68e1cc4f9f4e29b6e0da38a0204fe9a49f2d4053f0ec1fa1ca02f9c4b5
|
| 3 |
+
size 336213556
|