WaveCut commited on
Commit
9a16379
·
verified ·
1 Parent(s): ebed6ee

Add files using upload-large-folder tool

Browse files
.gitattributes CHANGED
@@ -33,3 +33,39 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ assets/gallery/000-1440x1440.png filter=lfs diff=lfs merge=lfs -text
37
+ assets/gallery/001-1440x1440.png filter=lfs diff=lfs merge=lfs -text
38
+ assets/gallery/002-1440x1440.png filter=lfs diff=lfs merge=lfs -text
39
+ assets/gallery/003-1248x1664.png filter=lfs diff=lfs merge=lfs -text
40
+ assets/gallery/004-1664x1248.png filter=lfs diff=lfs merge=lfs -text
41
+ assets/gallery/005-1664x1248.png filter=lfs diff=lfs merge=lfs -text
42
+ assets/gallery/006-1248x1664.png filter=lfs diff=lfs merge=lfs -text
43
+ assets/gallery/007-1440x1440.png filter=lfs diff=lfs merge=lfs -text
44
+ assets/gallery/008-1440x1440.png filter=lfs diff=lfs merge=lfs -text
45
+ assets/gallery/009-1664x1248.png filter=lfs diff=lfs merge=lfs -text
46
+ assets/gallery/010-1664x1248.png filter=lfs diff=lfs merge=lfs -text
47
+ assets/gallery/011-1664x1248.png filter=lfs diff=lfs merge=lfs -text
48
+ assets/gallery/012-1664x1248.png filter=lfs diff=lfs merge=lfs -text
49
+ assets/gallery/013-1664x1248.png filter=lfs diff=lfs merge=lfs -text
50
+ assets/gallery/014-1248x1664.png filter=lfs diff=lfs merge=lfs -text
51
+ assets/gallery/015-1248x1664.png filter=lfs diff=lfs merge=lfs -text
52
+ assets/gallery/016-1664x1248.png filter=lfs diff=lfs merge=lfs -text
53
+ assets/gallery/017-1248x1664.png filter=lfs diff=lfs merge=lfs -text
54
+ assets/gallery/018-1248x1664.png filter=lfs diff=lfs merge=lfs -text
55
+ assets/gallery/019-1664x1248.png filter=lfs diff=lfs merge=lfs -text
56
+ assets/gallery/020-1664x1248.png filter=lfs diff=lfs merge=lfs -text
57
+ assets/gallery/021-1664x1248.png filter=lfs diff=lfs merge=lfs -text
58
+ assets/gallery/022-1440x1440.png filter=lfs diff=lfs merge=lfs -text
59
+ assets/gallery/023-1248x1664.png filter=lfs diff=lfs merge=lfs -text
60
+ assets/gallery/024-1664x1248.png filter=lfs diff=lfs merge=lfs -text
61
+ assets/gallery/025-1664x1248.png filter=lfs diff=lfs merge=lfs -text
62
+ assets/gallery/026-1664x1248.png filter=lfs diff=lfs merge=lfs -text
63
+ assets/gallery/027-1664x1248.png filter=lfs diff=lfs merge=lfs -text
64
+ assets/gallery/028-1248x1664.png filter=lfs diff=lfs merge=lfs -text
65
+ assets/gallery/029-1664x1248.png filter=lfs diff=lfs merge=lfs -text
66
+ assets/gallery/030-1664x1248.png filter=lfs diff=lfs merge=lfs -text
67
+ assets/gallery/031-1664x1248.png filter=lfs diff=lfs merge=lfs -text
68
+ assets/teaser.webp filter=lfs diff=lfs merge=lfs -text
69
+ tokenizer/tokenizer.json filter=lfs diff=lfs merge=lfs -text
70
+ assets/teaser.png filter=lfs diff=lfs merge=lfs -text
71
+ assets/comparison/comparison_grid_1to1_q98.webp filter=lfs diff=lfs merge=lfs -text
README.md ADDED
@@ -0,0 +1,206 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ license: mit
3
+ base_model: microsoft/Lens
4
+ pipeline_tag: text-to-image
5
+ tags:
6
+ - lens
7
+ - text-to-image
8
+ - sdnq
9
+ - uint4
10
+ - static-quantization
11
+ - ablation
12
+ - model-cpu-offload
13
+ ---
14
+
15
+ # Lens SDNQ uint4 static
16
+
17
+ This is a corrected SDNQ static UINT4 quantized variant of [microsoft/Lens](https://huggingface.co/microsoft/Lens).
18
+
19
+ The recipe follows the Lens-Turbo ablation result: all-linear UINT4 quantization can introduce periodic grid artifacts and severe text degradation when transformer modulation linears are quantized. This checkpoint keeps `*.img_mod.*` and `*.txt_mod.*` in bfloat16 and quantizes the rest of the denoising transformer with SDNQ UINT4.
20
+
21
+ ## Visual Comparison
22
+
23
+ **Full-size comparison grid:** the image below is built from native 1440x1440 samples without resampling the image cells and saved as WebP quality 98. Raw file: [assets/comparison/comparison_grid_1to1_q98.webp](https://huggingface.co/WaveCut/Lens-SDNQ-uint4-static/resolve/main/assets/comparison/comparison_grid_1to1_q98.webp).
24
+
25
+ ![Original vs SDNQ comparison grid](assets/comparison/comparison_grid_1to1_q98.webp)
26
+
27
+ ## Quantization Recipe
28
+
29
+ | Field | Value |
30
+ | --- | --- |
31
+ | Method | SDNQ uint4 static |
32
+ | Source model | `microsoft/Lens` |
33
+ | Quantized component | Denoising transformer |
34
+ | Text encoder | Unchanged upstream GPT-OSS text encoder |
35
+ | VAE | Unchanged upstream VAE |
36
+ | `weights_dtype` | `uint4` |
37
+ | `quantized_matmul_dtype` | `int8` |
38
+ | `use_quantized_matmul` | `true` |
39
+ | `group_size` | `0` |
40
+ | `dequantize_fp32` | `false` |
41
+ | Critical skip rule | `*.img_mod.*`, `*.txt_mod.*` kept in bfloat16 |
42
+
43
+ ## Usage
44
+
45
+ Run from the cloned [microsoft/Lens](https://github.com/microsoft/Lens) repo root so the custom Lens classes are registered.
46
+
47
+ ```python
48
+ import torch
49
+ from huggingface_hub import snapshot_download
50
+ from lens import LensPipeline, LensTransformer2DModel
51
+ from sdnq import load_sdnq_model
52
+
53
+ model_dir = snapshot_download("WaveCut/Lens-SDNQ-uint4-static")
54
+ transformer = load_sdnq_model(
55
+ model_dir + "/transformer",
56
+ model_cls=LensTransformer2DModel,
57
+ dtype=torch.bfloat16,
58
+ device=torch.device("cuda"),
59
+ dequantize_fp32=False,
60
+ use_quantized_matmul=True,
61
+ )
62
+ pipe = LensPipeline.from_pretrained(
63
+ model_dir,
64
+ transformer=transformer,
65
+ torch_dtype=torch.bfloat16,
66
+ ).to("cuda")
67
+
68
+ image = pipe(
69
+ prompt="A cat holding a sign that says hello world",
70
+ base_resolution=1440,
71
+ aspect_ratio="1:1",
72
+ num_inference_steps=20,
73
+ guidance_scale=5.0,
74
+ generator=torch.Generator("cuda").manual_seed(0),
75
+ ).images[0]
76
+ ```
77
+
78
+ ## Benchmark
79
+
80
+ Hardware: RunPod NVIDIA H100 80GB HBM3 (H100 SXM), PyTorch 2.8.0 CUDA 12.8 container, local container disk only. Benchmark date: 2026-05-24. Generation settings: `base_resolution=1440`, `aspect_ratio="1:1"`, `num_inference_steps=20`, `guidance_scale=5.0`.
81
+
82
+ | Metric | Original Lens | SDNQ uint4 static |
83
+ | --- | ---: | ---: |
84
+ | Load time, seconds | 17.641 | 14.605 |
85
+ | Load peak allocated VRAM, GB | 22.342 | 18.446 |
86
+ | Load peak reserved VRAM, GB | 22.471 | 18.516 |
87
+ | Transformer tensor storage footprint, GB | 16.417 | 4.301 |
88
+ | Transformer storage reduction vs original | baseline | 73.8% smaller |
89
+ | Average prompt runtime, seconds | 15.357 | 17.937 |
90
+ | Median prompt runtime, seconds | 14.346 | 17.813 |
91
+ | Average generation peak allocated VRAM, GB | 27.462 | 23.533 |
92
+ | Max generation peak allocated VRAM, GB | 27.467 | 23.538 |
93
+
94
+ Transformer-only footprint is computed from safetensors tensor storage for the denoising transformer parameter tensors only; it excludes allocator overhead and non-transformer components. The original transformer tensors are F32; the corrected SDNQ transformer stores quantized tensors as U8 plus the excluded modulation layers as BF16.
95
+
96
+ ### Model CPU Offload Benchmark
97
+
98
+ Same 10 prompts, using `pipe.enable_model_cpu_offload()`. The reported load time uses a warm local Hugging Face cache on the container disk, so model download time is excluded. Each model was measured in a fresh Python process. `Cold generation` is P01, the first generation immediately after load/offload setup; `warm generation` aggregates P02-P10.
99
+
100
+ | Metric | Original Lens | SDNQ uint4 static |
101
+ | --- | ---: | ---: |
102
+ | Offload setup/load time, seconds | 15.510 | 13.573 |
103
+ | Offload setup peak allocated VRAM, GB | 12.582 | 12.582 |
104
+ | Offload setup peak reserved VRAM, GB | 13.881 | 13.881 |
105
+ | Cold generation time, seconds | 26.217 | 21.473 |
106
+ | Cold generation peak allocated VRAM, GB | 19.274 | 15.479 |
107
+ | Cold generation peak reserved VRAM, GB | 19.608 | 19.126 |
108
+ | Warm generation average time, seconds | 18.123 | 17.650 |
109
+ | Warm generation median time, seconds | 17.178 | 17.519 |
110
+ | Warm generation average peak allocated VRAM, GB | 19.271 | 15.480 |
111
+ | Warm generation average peak reserved VRAM, GB | 19.630 | 18.965 |
112
+ | Warm generation max peak allocated VRAM, GB | 19.276 | 15.482 |
113
+ | Warm generation max peak reserved VRAM, GB | 19.803 | 19.210 |
114
+
115
+ Raw metrics: [`benchmark_metrics.json`](benchmark_metrics.json), [`comparison_matrix.json`](comparison_matrix.json), [`model_cpu_offload_benchmark.json`](model_cpu_offload_benchmark.json), [`sdnq_quantization_summary.json`](sdnq_quantization_summary.json).
116
+
117
+ ## 10-Prompt Matrix
118
+
119
+ | ID | Scenario | Seed | Original time, s | Quant time, s | Delta | Original peak allocated VRAM, GB | Quant peak allocated VRAM, GB |
120
+ | --- | --- | ---: | ---: | ---: | ---: | ---: | ---: |
121
+ | P01 | Midnight Library Weather Station | 301 | 19.518 | 24.105 | +23.5% | 27.461 | 23.532 |
122
+ | P02 | Desert Observatory Treaty Room | 302 | 16.986 | 18.565 | +9.3% | 27.461 | 23.532 |
123
+ | P03 | Arctic Submarine Greenhouse | 303 | 13.903 | 17.882 | +28.6% | 27.461 | 23.532 |
124
+ | P04 | Long English Museum Labels | 304 | 14.439 | 17.848 | +23.6% | 27.461 | 23.533 |
125
+ | P05 | Tokyo Rooftop Repair Diner | 305 | 14.253 | 17.779 | +24.7% | 27.461 | 23.532 |
126
+ | P06 | Russian Provincial Print Shop | 306 | 16.744 | 18.136 | +8.3% | 27.467 | 23.538 |
127
+ | P07 | Ocean Cartography Bakery | 307 | 13.918 | 14.828 | +6.5% | 27.461 | 23.532 |
128
+ | P08 | Long English Train Notice Wall | 308 | 13.906 | 14.826 | +6.6% | 27.461 | 23.532 |
129
+ | P09 | Orbital Botanical Courtroom | 309 | 16.204 | 17.740 | +9.5% | 27.461 | 23.533 |
130
+ | P10 | Byzantine Data Center Chapel | 310 | 13.703 | 17.665 | +28.9% | 27.461 | 23.532 |
131
+
132
+ ## Full Prompts
133
+
134
+ <details>
135
+ <summary>P01 - Midnight Library Weather Station</summary>
136
+
137
+ A vast midnight library converted into a Victorian weather station, brass barometers, hanging cloud chambers, blue lightning outside stained-glass windows, spiral ladders, rainwater collecting in crystal funnels, and readable labels everywhere. Include a large oak sign saying "ARCHIVE OF STORMS - EAST WING", a ledger title saying "BAROMETRIC ANOMALIES 1897-1903", a small drawer label saying "FOG SAMPLES / DO NOT SHAKE", a chalkboard note saying "THUNDER ARRIVES AT 02:17", and a bookmark saying "RETURN TO SHELF C-19". Extremely detailed, cinematic, natural perspective, crisp small typography.
138
+
139
+ </details>
140
+
141
+ <details>
142
+ <summary>P02 - Desert Observatory Treaty Room</summary>
143
+
144
+ An ancient desert observatory at golden hour, now used as a treaty room for astronomers and nomad diplomats, sandstone arches, astrolabes, folded star maps, copper tea service, wind-blown curtains, tiny dust motes, and many readable inscriptions. The central parchment must read "TREATY OF THE SEVEN MOONS". A wall plaque reads "OBSERVATORY OF QASR AL-SUHAIL". A tea label says "CARDAMOM - NO SUGAR". A blue wax seal says "WITNESSED UNDER MARS". A telescope tag says "CALIBRATE BEFORE SUNSET". Hyperreal, warm shadows, intricate surface wear.
145
+
146
+ </details>
147
+
148
+ <details>
149
+ <summary>P03 - Arctic Submarine Greenhouse</summary>
150
+
151
+ A transparent research submarine trapped under Arctic ice, transformed into a warm hydroponic greenhouse with orange grow lights, condensation, polar bears visible above through thick ice, scientists in wool sweaters, algae tanks, and frost patterns on glass. Include readable text on multiple objects: "POLAR BOTANY UNIT 4" on the bulkhead, "EMERGENCY SEED VAULT" on a red locker, "LIGHT CYCLE: 18 HOURS" on a tablet, "DO NOT FEED THE KELP" on a handwritten note, and "RETURN CORE SAMPLES" on a metal tray. Detailed, atmospheric, believable engineering.
152
+
153
+ </details>
154
+
155
+ <details>
156
+ <summary>P04 - Long English Museum Labels</summary>
157
+
158
+ A photorealistic museum exhibit room about impossible machines, with glass cases, velvet ropes, soft spotlights, and several long English placards that must be visible on different parts of the image. Placard one reads: "THE CLOCK THAT REMEMBERED WINTER: assembled from brass, bone, and borrowed tides, circa 1814." Placard two reads: "PLEASE DO NOT TOUCH THE PERPETUAL ENGINE; it becomes anxious when observed too closely." Placard three reads: "CURATOR'S NOTE: every gear was catalogued, polished, numbered, and returned before dawn." Also include ticket stubs, tiny accession numbers, fingerprints on glass, and realistic museum lighting.
159
+
160
+ </details>
161
+
162
+ <details>
163
+ <summary>P05 - Tokyo Rooftop Repair Diner</summary>
164
+
165
+ A rainy Tokyo rooftop diner that doubles as a robot repair shop, neon reflections, steam from ramen bowls, umbrellas, tiny servo motors, handwritten order slips, rain beads on chrome, and a skyline full of antennas. Readable signs: a pink neon sign says "MIDNIGHT RAMEN & REPAIRS", a menu board says "SPECIAL: MISO, BATTERY PACK, GREEN TEA", a repair invoice says "UNIT 7B - LEFT HAND RECALIBRATION", a sticker says "NO DRONES AFTER 2 AM", and a paper lantern says "OPEN WHEN IT RAINS". High detail, shallow depth of field, cinematic realism.
166
+
167
+ </details>
168
+
169
+ <details>
170
+ <summary>P06 - Russian Provincial Print Shop</summary>
171
+
172
+ Старинная провинциальная типография в России, поздний вечер, керосиновые лампы, деревянные кассы со свинцовыми литерами, мокрые афиши на веревках, самовар, иней на окне, реалистичная пыль и следы краски. На большой вывеске долж��о быть написано: "ТИПОГРАФИЯ УЕЗДНЫХ ВЕСТЕЙ". На длинной афише читаемый текст: "Завтра в городском саду: лекция о кометах, духовой оркестр, чай с баранками, начало ровно в семь часов вечера". На ящике: "ЛИТЕРЫ: А-Я, НЕ РОНЯТЬ". На записке: "Срочно отпечатать до рассвета". Очень детально, без мультяшности.
173
+
174
+ </details>
175
+
176
+ <details>
177
+ <summary>P07 - Ocean Cartography Bakery</summary>
178
+
179
+ A cozy bakery inside an old ocean cartography office, with croissants shaped like sea monsters, nautical charts dusted with flour, brass compasses, jars of ink, morning light, and a baker drawing coastlines in powdered sugar. Text elements: "TIDAL BREAD & MAPS" on the front sign, "SOURDOUGH CURRENT - 6:30 AM" on a chalkboard, "UNCHARTED PLUM TARTS" on a pastry label, "DO NOT EAT THE COMPASS" on a note, and "NORTH SEA BATCH 12" stamped on a paper bag. Warm, detailed, whimsical but realistic.
180
+
181
+ </details>
182
+
183
+ <details>
184
+ <summary>P08 - Long English Train Notice Wall</summary>
185
+
186
+ A foggy Edwardian railway platform at dawn with a wall of overlapping long English notices, brass lamps, wet cobblestones, porters, suitcases, pigeons, steam, and reflections. The largest notice must read: "IMPORTANT SERVICE CHANGE: The 6:42 express to Northbridge will depart from Platform Three after the moonlit freight has cleared the signal box." A second poster reads: "LOST PROPERTY: one violin case, two blue gloves, a silver compass, and a letter never posted." A timetable says "WINTER ROUTE - DELAYS EXPECTED NEAR THE MARSH". Ultra detailed, cinematic, legible signs, natural perspective.
187
+
188
+ </details>
189
+
190
+ <details>
191
+ <summary>P09 - Orbital Botanical Courtroom</summary>
192
+
193
+ A surreal but photorealistic courtroom inside an orbital botanical garden, judges in dark robes, enormous ferns, floating pollen, Earth visible through a curved window, holographic evidence screens, and a tiny robot stenographer. Required readable text: "CASE 44-B: THE PEOPLE VS. THE SUNFLOWER" on the main screen, "EVIDENCE: THREE PETALS AND A BROKEN VASE" on a side display, "SILENCE IN THE GREENHOUSE COURT" on a sign, "WITNESS: DR. LYSANDER MOSS" on a nameplate, and "OXYGEN TAX RECEIPT" on a paper slip. Sharp, high-detail, dramatic lighting.
194
+
195
+ </details>
196
+
197
+ <details>
198
+ <summary>P10 - Byzantine Data Center Chapel</summary>
199
+
200
+ A Byzantine chapel converted into a quiet data center, gold mosaics reflecting server LEDs, incense smoke, marble floors, monks maintaining fiber cables, illuminated manuscripts next to diagnostic terminals, and beautiful cable management. Text must appear in multiple places: "SANCTUM SERVER ROOM - AUTHORIZED MONKS ONLY" on a bronze door, "BACKUP PSALMS COMPLETED AT 03:12" on a terminal, "DO NOT UNPLUG THE RELIQUARY" on a warning label, "LATENCY PRAYER REQUESTS" on a clipboard, and "ARCHIVE NODE IX" etched on a server rack. Rich texture, controlled highlights, realistic scale.
201
+
202
+ </details>
203
+
204
+ ## Notes
205
+
206
+ This checkpoint is intended for research and evaluation. It inherits the upstream Lens limitations and responsible AI considerations from the source model. Text rendering remains challenging; the corrected recipe is designed to avoid the obvious grid/printed texture failure seen when transformer modulation linears are quantized.
assets/comparison/comparison_grid_1to1_q98.webp ADDED

Git LFS Details

  • SHA256: 16ff57dc58c48f438e786bd41502a2f5aa36646f55763cdc3b3e6d957cf46dc5
  • Pointer size: 133 Bytes
  • Size of remote file: 16.1 MB
benchmark_metrics.json ADDED
@@ -0,0 +1,349 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "hardware": "RunPod NVIDIA H100 80GB HBM3 (H100 SXM)",
3
+ "mode": "full GPU, pipe.to('cuda')",
4
+ "base_resolution": 1440,
5
+ "aspect_ratio": "1:1",
6
+ "num_inference_steps": 20,
7
+ "guidance_scale": 5.0,
8
+ "dtype": "torch.bfloat16",
9
+ "models": {
10
+ "base": {
11
+ "load": {
12
+ "load_time_s": 17.641,
13
+ "peak_allocated_gb": 22.342,
14
+ "peak_reserved_gb": 22.471,
15
+ "end_allocated_gb": 22.342,
16
+ "end_reserved_gb": 22.471
17
+ },
18
+ "summary": {
19
+ "avg_time_s": 15.357,
20
+ "median_time_s": 14.346,
21
+ "avg_peak_allocated_gb": 27.462,
22
+ "avg_peak_reserved_gb": 31.756,
23
+ "max_peak_allocated_gb": 27.467,
24
+ "max_peak_reserved_gb": 31.965
25
+ },
26
+ "prompts": [
27
+ {
28
+ "id": "P01",
29
+ "title": "Midnight Library Weather Station",
30
+ "seed": 301,
31
+ "time_s": 19.518,
32
+ "image_size": [
33
+ 1440,
34
+ 1440
35
+ ],
36
+ "peak_allocated_gb": 27.461,
37
+ "peak_reserved_gb": 31.74,
38
+ "end_allocated_gb": 22.377,
39
+ "end_reserved_gb": 31.74,
40
+ "image": "/workspace/lens_sdnq_work/generated/base/p01_base.png"
41
+ },
42
+ {
43
+ "id": "P02",
44
+ "title": "Desert Observatory Treaty Room",
45
+ "seed": 302,
46
+ "time_s": 16.986,
47
+ "image_size": [
48
+ 1440,
49
+ 1440
50
+ ],
51
+ "peak_allocated_gb": 27.461,
52
+ "peak_reserved_gb": 31.74,
53
+ "end_allocated_gb": 22.377,
54
+ "end_reserved_gb": 31.74,
55
+ "image": "/workspace/lens_sdnq_work/generated/base/p02_base.png"
56
+ },
57
+ {
58
+ "id": "P03",
59
+ "title": "Arctic Submarine Greenhouse",
60
+ "seed": 303,
61
+ "time_s": 13.903,
62
+ "image_size": [
63
+ 1440,
64
+ 1440
65
+ ],
66
+ "peak_allocated_gb": 27.461,
67
+ "peak_reserved_gb": 31.719,
68
+ "end_allocated_gb": 22.377,
69
+ "end_reserved_gb": 31.719,
70
+ "image": "/workspace/lens_sdnq_work/generated/base/p03_base.png"
71
+ },
72
+ {
73
+ "id": "P04",
74
+ "title": "Long English Museum Labels",
75
+ "seed": 304,
76
+ "time_s": 14.439,
77
+ "image_size": [
78
+ 1440,
79
+ 1440
80
+ ],
81
+ "peak_allocated_gb": 27.461,
82
+ "peak_reserved_gb": 31.719,
83
+ "end_allocated_gb": 22.377,
84
+ "end_reserved_gb": 31.719,
85
+ "image": "/workspace/lens_sdnq_work/generated/base/p04_base.png"
86
+ },
87
+ {
88
+ "id": "P05",
89
+ "title": "Tokyo Rooftop Repair Diner",
90
+ "seed": 305,
91
+ "time_s": 14.253,
92
+ "image_size": [
93
+ 1440,
94
+ 1440
95
+ ],
96
+ "peak_allocated_gb": 27.461,
97
+ "peak_reserved_gb": 31.74,
98
+ "end_allocated_gb": 22.377,
99
+ "end_reserved_gb": 31.74,
100
+ "image": "/workspace/lens_sdnq_work/generated/base/p05_base.png"
101
+ },
102
+ {
103
+ "id": "P06",
104
+ "title": "Russian Provincial Print Shop",
105
+ "seed": 306,
106
+ "time_s": 16.744,
107
+ "image_size": [
108
+ 1440,
109
+ 1440
110
+ ],
111
+ "peak_allocated_gb": 27.467,
112
+ "peak_reserved_gb": 31.965,
113
+ "end_allocated_gb": 22.377,
114
+ "end_reserved_gb": 31.965,
115
+ "image": "/workspace/lens_sdnq_work/generated/base/p06_base.png"
116
+ },
117
+ {
118
+ "id": "P07",
119
+ "title": "Ocean Cartography Bakery",
120
+ "seed": 307,
121
+ "time_s": 13.918,
122
+ "image_size": [
123
+ 1440,
124
+ 1440
125
+ ],
126
+ "peak_allocated_gb": 27.461,
127
+ "peak_reserved_gb": 31.74,
128
+ "end_allocated_gb": 22.377,
129
+ "end_reserved_gb": 31.74,
130
+ "image": "/workspace/lens_sdnq_work/generated/base/p07_base.png"
131
+ },
132
+ {
133
+ "id": "P08",
134
+ "title": "Long English Train Notice Wall",
135
+ "seed": 308,
136
+ "time_s": 13.906,
137
+ "image_size": [
138
+ 1440,
139
+ 1440
140
+ ],
141
+ "peak_allocated_gb": 27.461,
142
+ "peak_reserved_gb": 31.74,
143
+ "end_allocated_gb": 22.377,
144
+ "end_reserved_gb": 31.74,
145
+ "image": "/workspace/lens_sdnq_work/generated/base/p08_base.png"
146
+ },
147
+ {
148
+ "id": "P09",
149
+ "title": "Orbital Botanical Courtroom",
150
+ "seed": 309,
151
+ "time_s": 16.204,
152
+ "image_size": [
153
+ 1440,
154
+ 1440
155
+ ],
156
+ "peak_allocated_gb": 27.461,
157
+ "peak_reserved_gb": 31.719,
158
+ "end_allocated_gb": 22.377,
159
+ "end_reserved_gb": 31.719,
160
+ "image": "/workspace/lens_sdnq_work/generated/base/p09_base.png"
161
+ },
162
+ {
163
+ "id": "P10",
164
+ "title": "Byzantine Data Center Chapel",
165
+ "seed": 310,
166
+ "time_s": 13.703,
167
+ "image_size": [
168
+ 1440,
169
+ 1440
170
+ ],
171
+ "peak_allocated_gb": 27.461,
172
+ "peak_reserved_gb": 31.74,
173
+ "end_allocated_gb": 22.377,
174
+ "end_reserved_gb": 31.74,
175
+ "image": "/workspace/lens_sdnq_work/generated/base/p10_base.png"
176
+ }
177
+ ]
178
+ },
179
+ "quant": {
180
+ "load": {
181
+ "load_time_s": 14.605,
182
+ "peak_allocated_gb": 18.446,
183
+ "peak_reserved_gb": 18.516,
184
+ "end_allocated_gb": 18.446,
185
+ "end_reserved_gb": 18.516
186
+ },
187
+ "summary": {
188
+ "avg_time_s": 17.937,
189
+ "median_time_s": 17.813,
190
+ "avg_peak_allocated_gb": 23.533,
191
+ "avg_peak_reserved_gb": 27.699,
192
+ "max_peak_allocated_gb": 23.538,
193
+ "max_peak_reserved_gb": 27.712
194
+ },
195
+ "prompts": [
196
+ {
197
+ "id": "P01",
198
+ "title": "Midnight Library Weather Station",
199
+ "seed": 301,
200
+ "time_s": 24.105,
201
+ "image_size": [
202
+ 1440,
203
+ 1440
204
+ ],
205
+ "peak_allocated_gb": 23.532,
206
+ "peak_reserved_gb": 27.682,
207
+ "end_allocated_gb": 18.448,
208
+ "end_reserved_gb": 27.682,
209
+ "image": "/workspace/lens_sdnq_work/generated/quant/p01_quant.png"
210
+ },
211
+ {
212
+ "id": "P02",
213
+ "title": "Desert Observatory Treaty Room",
214
+ "seed": 302,
215
+ "time_s": 18.565,
216
+ "image_size": [
217
+ 1440,
218
+ 1440
219
+ ],
220
+ "peak_allocated_gb": 23.532,
221
+ "peak_reserved_gb": 27.712,
222
+ "end_allocated_gb": 18.448,
223
+ "end_reserved_gb": 27.712,
224
+ "image": "/workspace/lens_sdnq_work/generated/quant/p02_quant.png"
225
+ },
226
+ {
227
+ "id": "P03",
228
+ "title": "Arctic Submarine Greenhouse",
229
+ "seed": 303,
230
+ "time_s": 17.882,
231
+ "image_size": [
232
+ 1440,
233
+ 1440
234
+ ],
235
+ "peak_allocated_gb": 23.532,
236
+ "peak_reserved_gb": 27.712,
237
+ "end_allocated_gb": 18.448,
238
+ "end_reserved_gb": 27.712,
239
+ "image": "/workspace/lens_sdnq_work/generated/quant/p03_quant.png"
240
+ },
241
+ {
242
+ "id": "P04",
243
+ "title": "Long English Museum Labels",
244
+ "seed": 304,
245
+ "time_s": 17.848,
246
+ "image_size": [
247
+ 1440,
248
+ 1440
249
+ ],
250
+ "peak_allocated_gb": 23.533,
251
+ "peak_reserved_gb": 27.712,
252
+ "end_allocated_gb": 18.448,
253
+ "end_reserved_gb": 27.712,
254
+ "image": "/workspace/lens_sdnq_work/generated/quant/p04_quant.png"
255
+ },
256
+ {
257
+ "id": "P05",
258
+ "title": "Tokyo Rooftop Repair Diner",
259
+ "seed": 305,
260
+ "time_s": 17.779,
261
+ "image_size": [
262
+ 1440,
263
+ 1440
264
+ ],
265
+ "peak_allocated_gb": 23.532,
266
+ "peak_reserved_gb": 27.712,
267
+ "end_allocated_gb": 18.448,
268
+ "end_reserved_gb": 27.712,
269
+ "image": "/workspace/lens_sdnq_work/generated/quant/p05_quant.png"
270
+ },
271
+ {
272
+ "id": "P06",
273
+ "title": "Russian Provincial Print Shop",
274
+ "seed": 306,
275
+ "time_s": 18.136,
276
+ "image_size": [
277
+ 1440,
278
+ 1440
279
+ ],
280
+ "peak_allocated_gb": 23.538,
281
+ "peak_reserved_gb": 27.615,
282
+ "end_allocated_gb": 18.448,
283
+ "end_reserved_gb": 27.615,
284
+ "image": "/workspace/lens_sdnq_work/generated/quant/p06_quant.png"
285
+ },
286
+ {
287
+ "id": "P07",
288
+ "title": "Ocean Cartography Bakery",
289
+ "seed": 307,
290
+ "time_s": 14.828,
291
+ "image_size": [
292
+ 1440,
293
+ 1440
294
+ ],
295
+ "peak_allocated_gb": 23.532,
296
+ "peak_reserved_gb": 27.712,
297
+ "end_allocated_gb": 18.448,
298
+ "end_reserved_gb": 27.712,
299
+ "image": "/workspace/lens_sdnq_work/generated/quant/p07_quant.png"
300
+ },
301
+ {
302
+ "id": "P08",
303
+ "title": "Long English Train Notice Wall",
304
+ "seed": 308,
305
+ "time_s": 14.826,
306
+ "image_size": [
307
+ 1440,
308
+ 1440
309
+ ],
310
+ "peak_allocated_gb": 23.532,
311
+ "peak_reserved_gb": 27.712,
312
+ "end_allocated_gb": 18.448,
313
+ "end_reserved_gb": 27.712,
314
+ "image": "/workspace/lens_sdnq_work/generated/quant/p08_quant.png"
315
+ },
316
+ {
317
+ "id": "P09",
318
+ "title": "Orbital Botanical Courtroom",
319
+ "seed": 309,
320
+ "time_s": 17.74,
321
+ "image_size": [
322
+ 1440,
323
+ 1440
324
+ ],
325
+ "peak_allocated_gb": 23.533,
326
+ "peak_reserved_gb": 27.712,
327
+ "end_allocated_gb": 18.448,
328
+ "end_reserved_gb": 27.712,
329
+ "image": "/workspace/lens_sdnq_work/generated/quant/p09_quant.png"
330
+ },
331
+ {
332
+ "id": "P10",
333
+ "title": "Byzantine Data Center Chapel",
334
+ "seed": 310,
335
+ "time_s": 17.665,
336
+ "image_size": [
337
+ 1440,
338
+ 1440
339
+ ],
340
+ "peak_allocated_gb": 23.532,
341
+ "peak_reserved_gb": 27.712,
342
+ "end_allocated_gb": 18.448,
343
+ "end_reserved_gb": 27.712,
344
+ "image": "/workspace/lens_sdnq_work/generated/quant/p10_quant.png"
345
+ }
346
+ ]
347
+ }
348
+ }
349
+ }
comparison_matrix.json ADDED
@@ -0,0 +1,362 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ [
2
+ {
3
+ "id": "P01",
4
+ "title": "Midnight Library Weather Station",
5
+ "seed": 301,
6
+ "prompt": "A vast midnight library converted into a Victorian weather station, brass barometers, hanging cloud chambers, blue lightning outside stained-glass windows, spiral ladders, rainwater collecting in crystal funnels, and readable labels everywhere. Include a large oak sign saying \"ARCHIVE OF STORMS - EAST WING\", a ledger title saying \"BAROMETRIC ANOMALIES 1897-1903\", a small drawer label saying \"FOG SAMPLES / DO NOT SHAKE\", a chalkboard note saying \"THUNDER ARRIVES AT 02:17\", and a bookmark saying \"RETURN TO SHELF C-19\". Extremely detailed, cinematic, natural perspective, crisp small typography.",
7
+ "base": {
8
+ "id": "P01",
9
+ "title": "Midnight Library Weather Station",
10
+ "seed": 301,
11
+ "time_s": 19.518,
12
+ "image_size": [
13
+ 1440,
14
+ 1440
15
+ ],
16
+ "peak_allocated_gb": 27.461,
17
+ "peak_reserved_gb": 31.74,
18
+ "end_allocated_gb": 22.377,
19
+ "end_reserved_gb": 31.74,
20
+ "image": "/workspace/lens_sdnq_work/generated/base/p01_base.png"
21
+ },
22
+ "quant": {
23
+ "id": "P01",
24
+ "title": "Midnight Library Weather Station",
25
+ "seed": 301,
26
+ "time_s": 24.105,
27
+ "image_size": [
28
+ 1440,
29
+ 1440
30
+ ],
31
+ "peak_allocated_gb": 23.532,
32
+ "peak_reserved_gb": 27.682,
33
+ "end_allocated_gb": 18.448,
34
+ "end_reserved_gb": 27.682,
35
+ "image": "/workspace/lens_sdnq_work/generated/quant/p01_quant.png"
36
+ }
37
+ },
38
+ {
39
+ "id": "P02",
40
+ "title": "Desert Observatory Treaty Room",
41
+ "seed": 302,
42
+ "prompt": "An ancient desert observatory at golden hour, now used as a treaty room for astronomers and nomad diplomats, sandstone arches, astrolabes, folded star maps, copper tea service, wind-blown curtains, tiny dust motes, and many readable inscriptions. The central parchment must read \"TREATY OF THE SEVEN MOONS\". A wall plaque reads \"OBSERVATORY OF QASR AL-SUHAIL\". A tea label says \"CARDAMOM - NO SUGAR\". A blue wax seal says \"WITNESSED UNDER MARS\". A telescope tag says \"CALIBRATE BEFORE SUNSET\". Hyperreal, warm shadows, intricate surface wear.",
43
+ "base": {
44
+ "id": "P02",
45
+ "title": "Desert Observatory Treaty Room",
46
+ "seed": 302,
47
+ "time_s": 16.986,
48
+ "image_size": [
49
+ 1440,
50
+ 1440
51
+ ],
52
+ "peak_allocated_gb": 27.461,
53
+ "peak_reserved_gb": 31.74,
54
+ "end_allocated_gb": 22.377,
55
+ "end_reserved_gb": 31.74,
56
+ "image": "/workspace/lens_sdnq_work/generated/base/p02_base.png"
57
+ },
58
+ "quant": {
59
+ "id": "P02",
60
+ "title": "Desert Observatory Treaty Room",
61
+ "seed": 302,
62
+ "time_s": 18.565,
63
+ "image_size": [
64
+ 1440,
65
+ 1440
66
+ ],
67
+ "peak_allocated_gb": 23.532,
68
+ "peak_reserved_gb": 27.712,
69
+ "end_allocated_gb": 18.448,
70
+ "end_reserved_gb": 27.712,
71
+ "image": "/workspace/lens_sdnq_work/generated/quant/p02_quant.png"
72
+ }
73
+ },
74
+ {
75
+ "id": "P03",
76
+ "title": "Arctic Submarine Greenhouse",
77
+ "seed": 303,
78
+ "prompt": "A transparent research submarine trapped under Arctic ice, transformed into a warm hydroponic greenhouse with orange grow lights, condensation, polar bears visible above through thick ice, scientists in wool sweaters, algae tanks, and frost patterns on glass. Include readable text on multiple objects: \"POLAR BOTANY UNIT 4\" on the bulkhead, \"EMERGENCY SEED VAULT\" on a red locker, \"LIGHT CYCLE: 18 HOURS\" on a tablet, \"DO NOT FEED THE KELP\" on a handwritten note, and \"RETURN CORE SAMPLES\" on a metal tray. Detailed, atmospheric, believable engineering.",
79
+ "base": {
80
+ "id": "P03",
81
+ "title": "Arctic Submarine Greenhouse",
82
+ "seed": 303,
83
+ "time_s": 13.903,
84
+ "image_size": [
85
+ 1440,
86
+ 1440
87
+ ],
88
+ "peak_allocated_gb": 27.461,
89
+ "peak_reserved_gb": 31.719,
90
+ "end_allocated_gb": 22.377,
91
+ "end_reserved_gb": 31.719,
92
+ "image": "/workspace/lens_sdnq_work/generated/base/p03_base.png"
93
+ },
94
+ "quant": {
95
+ "id": "P03",
96
+ "title": "Arctic Submarine Greenhouse",
97
+ "seed": 303,
98
+ "time_s": 17.882,
99
+ "image_size": [
100
+ 1440,
101
+ 1440
102
+ ],
103
+ "peak_allocated_gb": 23.532,
104
+ "peak_reserved_gb": 27.712,
105
+ "end_allocated_gb": 18.448,
106
+ "end_reserved_gb": 27.712,
107
+ "image": "/workspace/lens_sdnq_work/generated/quant/p03_quant.png"
108
+ }
109
+ },
110
+ {
111
+ "id": "P04",
112
+ "title": "Long English Museum Labels",
113
+ "seed": 304,
114
+ "prompt": "A photorealistic museum exhibit room about impossible machines, with glass cases, velvet ropes, soft spotlights, and several long English placards that must be visible on different parts of the image. Placard one reads: \"THE CLOCK THAT REMEMBERED WINTER: assembled from brass, bone, and borrowed tides, circa 1814.\" Placard two reads: \"PLEASE DO NOT TOUCH THE PERPETUAL ENGINE; it becomes anxious when observed too closely.\" Placard three reads: \"CURATOR'S NOTE: every gear was catalogued, polished, numbered, and returned before dawn.\" Also include ticket stubs, tiny accession numbers, fingerprints on glass, and realistic museum lighting.",
115
+ "base": {
116
+ "id": "P04",
117
+ "title": "Long English Museum Labels",
118
+ "seed": 304,
119
+ "time_s": 14.439,
120
+ "image_size": [
121
+ 1440,
122
+ 1440
123
+ ],
124
+ "peak_allocated_gb": 27.461,
125
+ "peak_reserved_gb": 31.719,
126
+ "end_allocated_gb": 22.377,
127
+ "end_reserved_gb": 31.719,
128
+ "image": "/workspace/lens_sdnq_work/generated/base/p04_base.png"
129
+ },
130
+ "quant": {
131
+ "id": "P04",
132
+ "title": "Long English Museum Labels",
133
+ "seed": 304,
134
+ "time_s": 17.848,
135
+ "image_size": [
136
+ 1440,
137
+ 1440
138
+ ],
139
+ "peak_allocated_gb": 23.533,
140
+ "peak_reserved_gb": 27.712,
141
+ "end_allocated_gb": 18.448,
142
+ "end_reserved_gb": 27.712,
143
+ "image": "/workspace/lens_sdnq_work/generated/quant/p04_quant.png"
144
+ }
145
+ },
146
+ {
147
+ "id": "P05",
148
+ "title": "Tokyo Rooftop Repair Diner",
149
+ "seed": 305,
150
+ "prompt": "A rainy Tokyo rooftop diner that doubles as a robot repair shop, neon reflections, steam from ramen bowls, umbrellas, tiny servo motors, handwritten order slips, rain beads on chrome, and a skyline full of antennas. Readable signs: a pink neon sign says \"MIDNIGHT RAMEN & REPAIRS\", a menu board says \"SPECIAL: MISO, BATTERY PACK, GREEN TEA\", a repair invoice says \"UNIT 7B - LEFT HAND RECALIBRATION\", a sticker says \"NO DRONES AFTER 2 AM\", and a paper lantern says \"OPEN WHEN IT RAINS\". High detail, shallow depth of field, cinematic realism.",
151
+ "base": {
152
+ "id": "P05",
153
+ "title": "Tokyo Rooftop Repair Diner",
154
+ "seed": 305,
155
+ "time_s": 14.253,
156
+ "image_size": [
157
+ 1440,
158
+ 1440
159
+ ],
160
+ "peak_allocated_gb": 27.461,
161
+ "peak_reserved_gb": 31.74,
162
+ "end_allocated_gb": 22.377,
163
+ "end_reserved_gb": 31.74,
164
+ "image": "/workspace/lens_sdnq_work/generated/base/p05_base.png"
165
+ },
166
+ "quant": {
167
+ "id": "P05",
168
+ "title": "Tokyo Rooftop Repair Diner",
169
+ "seed": 305,
170
+ "time_s": 17.779,
171
+ "image_size": [
172
+ 1440,
173
+ 1440
174
+ ],
175
+ "peak_allocated_gb": 23.532,
176
+ "peak_reserved_gb": 27.712,
177
+ "end_allocated_gb": 18.448,
178
+ "end_reserved_gb": 27.712,
179
+ "image": "/workspace/lens_sdnq_work/generated/quant/p05_quant.png"
180
+ }
181
+ },
182
+ {
183
+ "id": "P06",
184
+ "title": "Russian Provincial Print Shop",
185
+ "seed": 306,
186
+ "prompt": "\u0421\u0442\u0430\u0440\u0438\u043d\u043d\u0430\u044f \u043f\u0440\u043e\u0432\u0438\u043d\u0446\u0438\u0430\u043b\u044c\u043d\u0430\u044f \u0442\u0438\u043f\u043e\u0433\u0440\u0430\u0444\u0438\u044f \u0432 \u0420\u043e\u0441\u0441\u0438\u0438, \u043f\u043e\u0437\u0434\u043d\u0438\u0439 \u0432\u0435\u0447\u0435\u0440, \u043a\u0435\u0440\u043e\u0441\u0438\u043d\u043e\u0432\u044b\u0435 \u043b\u0430\u043c\u043f\u044b, \u0434\u0435\u0440\u0435\u0432\u044f\u043d\u043d\u044b\u0435 \u043a\u0430\u0441\u0441\u044b \u0441\u043e \u0441\u0432\u0438\u043d\u0446\u043e\u0432\u044b\u043c\u0438 \u043b\u0438\u0442\u0435\u0440\u0430\u043c\u0438, \u043c\u043e\u043a\u0440\u044b\u0435 \u0430\u0444\u0438\u0448\u0438 \u043d\u0430 \u0432\u0435\u0440\u0435\u0432\u043a\u0430\u0445, \u0441\u0430\u043c\u043e\u0432\u0430\u0440, \u0438\u043d\u0435\u0439 \u043d\u0430 \u043e\u043a\u043d\u0435, \u0440\u0435\u0430\u043b\u0438\u0441\u0442\u0438\u0447\u043d\u0430\u044f \u043f\u044b\u043b\u044c \u0438 \u0441\u043b\u0435\u0434\u044b \u043a\u0440\u0430\u0441\u043a\u0438. \u041d\u0430 \u0431\u043e\u043b\u044c\u0448\u043e\u0439 \u0432\u044b\u0432\u0435\u0441\u043a\u0435 \u0434\u043e\u043b\u0436\u043d\u043e \u0431\u044b\u0442\u044c \u043d\u0430\u043f\u0438\u0441\u0430\u043d\u043e: \"\u0422\u0418\u041f\u041e\u0413\u0420\u0410\u0424\u0418\u042f \u0423\u0415\u0417\u0414\u041d\u042b\u0425 \u0412\u0415\u0421\u0422\u0415\u0419\". \u041d\u0430 \u0434\u043b\u0438\u043d\u043d\u043e\u0439 \u0430\u0444\u0438\u0448\u0435 \u0447\u0438\u0442\u0430\u0435\u043c\u044b\u0439 \u0442\u0435\u043a\u0441\u0442: \"\u0417\u0430\u0432\u0442\u0440\u0430 \u0432 \u0433\u043e\u0440\u043e\u0434\u0441\u043a\u043e\u043c \u0441\u0430\u0434\u0443: \u043b\u0435\u043a\u0446\u0438\u044f \u043e \u043a\u043e\u043c\u0435\u0442\u0430\u0445, \u0434\u0443\u0445\u043e\u0432\u043e\u0439 \u043e\u0440\u043a\u0435\u0441\u0442\u0440, \u0447\u0430\u0439 \u0441 \u0431\u0430\u0440\u0430\u043d\u043a\u0430\u043c\u0438, \u043d\u0430\u0447\u0430\u043b\u043e \u0440\u043e\u0432\u043d\u043e \u0432 \u0441\u0435\u043c\u044c \u0447\u0430\u0441\u043e\u0432 \u0432\u0435\u0447\u0435\u0440\u0430\". \u041d\u0430 \u044f\u0449\u0438\u043a\u0435: \"\u041b\u0418\u0422\u0415\u0420\u042b: \u0410-\u042f, \u041d\u0415 \u0420\u041e\u041d\u042f\u0422\u042c\". \u041d\u0430 \u0437\u0430\u043f\u0438\u0441\u043a\u0435: \"\u0421\u0440\u043e\u0447\u043d\u043e \u043e\u0442\u043f\u0435\u0447\u0430\u0442\u0430\u0442\u044c \u0434\u043e \u0440\u0430\u0441\u0441\u0432\u0435\u0442\u0430\". \u041e\u0447\u0435\u043d\u044c \u0434\u0435\u0442\u0430\u043b\u044c\u043d\u043e, \u0431\u0435\u0437 \u043c\u0443\u043b\u044c\u0442\u044f\u0448\u043d\u043e\u0441\u0442\u0438.",
187
+ "base": {
188
+ "id": "P06",
189
+ "title": "Russian Provincial Print Shop",
190
+ "seed": 306,
191
+ "time_s": 16.744,
192
+ "image_size": [
193
+ 1440,
194
+ 1440
195
+ ],
196
+ "peak_allocated_gb": 27.467,
197
+ "peak_reserved_gb": 31.965,
198
+ "end_allocated_gb": 22.377,
199
+ "end_reserved_gb": 31.965,
200
+ "image": "/workspace/lens_sdnq_work/generated/base/p06_base.png"
201
+ },
202
+ "quant": {
203
+ "id": "P06",
204
+ "title": "Russian Provincial Print Shop",
205
+ "seed": 306,
206
+ "time_s": 18.136,
207
+ "image_size": [
208
+ 1440,
209
+ 1440
210
+ ],
211
+ "peak_allocated_gb": 23.538,
212
+ "peak_reserved_gb": 27.615,
213
+ "end_allocated_gb": 18.448,
214
+ "end_reserved_gb": 27.615,
215
+ "image": "/workspace/lens_sdnq_work/generated/quant/p06_quant.png"
216
+ }
217
+ },
218
+ {
219
+ "id": "P07",
220
+ "title": "Ocean Cartography Bakery",
221
+ "seed": 307,
222
+ "prompt": "A cozy bakery inside an old ocean cartography office, with croissants shaped like sea monsters, nautical charts dusted with flour, brass compasses, jars of ink, morning light, and a baker drawing coastlines in powdered sugar. Text elements: \"TIDAL BREAD & MAPS\" on the front sign, \"SOURDOUGH CURRENT - 6:30 AM\" on a chalkboard, \"UNCHARTED PLUM TARTS\" on a pastry label, \"DO NOT EAT THE COMPASS\" on a note, and \"NORTH SEA BATCH 12\" stamped on a paper bag. Warm, detailed, whimsical but realistic.",
223
+ "base": {
224
+ "id": "P07",
225
+ "title": "Ocean Cartography Bakery",
226
+ "seed": 307,
227
+ "time_s": 13.918,
228
+ "image_size": [
229
+ 1440,
230
+ 1440
231
+ ],
232
+ "peak_allocated_gb": 27.461,
233
+ "peak_reserved_gb": 31.74,
234
+ "end_allocated_gb": 22.377,
235
+ "end_reserved_gb": 31.74,
236
+ "image": "/workspace/lens_sdnq_work/generated/base/p07_base.png"
237
+ },
238
+ "quant": {
239
+ "id": "P07",
240
+ "title": "Ocean Cartography Bakery",
241
+ "seed": 307,
242
+ "time_s": 14.828,
243
+ "image_size": [
244
+ 1440,
245
+ 1440
246
+ ],
247
+ "peak_allocated_gb": 23.532,
248
+ "peak_reserved_gb": 27.712,
249
+ "end_allocated_gb": 18.448,
250
+ "end_reserved_gb": 27.712,
251
+ "image": "/workspace/lens_sdnq_work/generated/quant/p07_quant.png"
252
+ }
253
+ },
254
+ {
255
+ "id": "P08",
256
+ "title": "Long English Train Notice Wall",
257
+ "seed": 308,
258
+ "prompt": "A foggy Edwardian railway platform at dawn with a wall of overlapping long English notices, brass lamps, wet cobblestones, porters, suitcases, pigeons, steam, and reflections. The largest notice must read: \"IMPORTANT SERVICE CHANGE: The 6:42 express to Northbridge will depart from Platform Three after the moonlit freight has cleared the signal box.\" A second poster reads: \"LOST PROPERTY: one violin case, two blue gloves, a silver compass, and a letter never posted.\" A timetable says \"WINTER ROUTE - DELAYS EXPECTED NEAR THE MARSH\". Ultra detailed, cinematic, legible signs, natural perspective.",
259
+ "base": {
260
+ "id": "P08",
261
+ "title": "Long English Train Notice Wall",
262
+ "seed": 308,
263
+ "time_s": 13.906,
264
+ "image_size": [
265
+ 1440,
266
+ 1440
267
+ ],
268
+ "peak_allocated_gb": 27.461,
269
+ "peak_reserved_gb": 31.74,
270
+ "end_allocated_gb": 22.377,
271
+ "end_reserved_gb": 31.74,
272
+ "image": "/workspace/lens_sdnq_work/generated/base/p08_base.png"
273
+ },
274
+ "quant": {
275
+ "id": "P08",
276
+ "title": "Long English Train Notice Wall",
277
+ "seed": 308,
278
+ "time_s": 14.826,
279
+ "image_size": [
280
+ 1440,
281
+ 1440
282
+ ],
283
+ "peak_allocated_gb": 23.532,
284
+ "peak_reserved_gb": 27.712,
285
+ "end_allocated_gb": 18.448,
286
+ "end_reserved_gb": 27.712,
287
+ "image": "/workspace/lens_sdnq_work/generated/quant/p08_quant.png"
288
+ }
289
+ },
290
+ {
291
+ "id": "P09",
292
+ "title": "Orbital Botanical Courtroom",
293
+ "seed": 309,
294
+ "prompt": "A surreal but photorealistic courtroom inside an orbital botanical garden, judges in dark robes, enormous ferns, floating pollen, Earth visible through a curved window, holographic evidence screens, and a tiny robot stenographer. Required readable text: \"CASE 44-B: THE PEOPLE VS. THE SUNFLOWER\" on the main screen, \"EVIDENCE: THREE PETALS AND A BROKEN VASE\" on a side display, \"SILENCE IN THE GREENHOUSE COURT\" on a sign, \"WITNESS: DR. LYSANDER MOSS\" on a nameplate, and \"OXYGEN TAX RECEIPT\" on a paper slip. Sharp, high-detail, dramatic lighting.",
295
+ "base": {
296
+ "id": "P09",
297
+ "title": "Orbital Botanical Courtroom",
298
+ "seed": 309,
299
+ "time_s": 16.204,
300
+ "image_size": [
301
+ 1440,
302
+ 1440
303
+ ],
304
+ "peak_allocated_gb": 27.461,
305
+ "peak_reserved_gb": 31.719,
306
+ "end_allocated_gb": 22.377,
307
+ "end_reserved_gb": 31.719,
308
+ "image": "/workspace/lens_sdnq_work/generated/base/p09_base.png"
309
+ },
310
+ "quant": {
311
+ "id": "P09",
312
+ "title": "Orbital Botanical Courtroom",
313
+ "seed": 309,
314
+ "time_s": 17.74,
315
+ "image_size": [
316
+ 1440,
317
+ 1440
318
+ ],
319
+ "peak_allocated_gb": 23.533,
320
+ "peak_reserved_gb": 27.712,
321
+ "end_allocated_gb": 18.448,
322
+ "end_reserved_gb": 27.712,
323
+ "image": "/workspace/lens_sdnq_work/generated/quant/p09_quant.png"
324
+ }
325
+ },
326
+ {
327
+ "id": "P10",
328
+ "title": "Byzantine Data Center Chapel",
329
+ "seed": 310,
330
+ "prompt": "A Byzantine chapel converted into a quiet data center, gold mosaics reflecting server LEDs, incense smoke, marble floors, monks maintaining fiber cables, illuminated manuscripts next to diagnostic terminals, and beautiful cable management. Text must appear in multiple places: \"SANCTUM SERVER ROOM - AUTHORIZED MONKS ONLY\" on a bronze door, \"BACKUP PSALMS COMPLETED AT 03:12\" on a terminal, \"DO NOT UNPLUG THE RELIQUARY\" on a warning label, \"LATENCY PRAYER REQUESTS\" on a clipboard, and \"ARCHIVE NODE IX\" etched on a server rack. Rich texture, controlled highlights, realistic scale.",
331
+ "base": {
332
+ "id": "P10",
333
+ "title": "Byzantine Data Center Chapel",
334
+ "seed": 310,
335
+ "time_s": 13.703,
336
+ "image_size": [
337
+ 1440,
338
+ 1440
339
+ ],
340
+ "peak_allocated_gb": 27.461,
341
+ "peak_reserved_gb": 31.74,
342
+ "end_allocated_gb": 22.377,
343
+ "end_reserved_gb": 31.74,
344
+ "image": "/workspace/lens_sdnq_work/generated/base/p10_base.png"
345
+ },
346
+ "quant": {
347
+ "id": "P10",
348
+ "title": "Byzantine Data Center Chapel",
349
+ "seed": 310,
350
+ "time_s": 17.665,
351
+ "image_size": [
352
+ 1440,
353
+ 1440
354
+ ],
355
+ "peak_allocated_gb": 23.532,
356
+ "peak_reserved_gb": 27.712,
357
+ "end_allocated_gb": 18.448,
358
+ "end_reserved_gb": 27.712,
359
+ "image": "/workspace/lens_sdnq_work/generated/quant/p10_quant.png"
360
+ }
361
+ }
362
+ ]
model_cpu_offload_benchmark.json ADDED
@@ -0,0 +1,363 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "benchmark": "model_cpu_offload_cold_warm",
3
+ "hardware": "RunPod NVIDIA H100 80GB HBM3 (H100 SXM)",
4
+ "mode": "Diffusers enable_model_cpu_offload()",
5
+ "cache_state": "warm local HF cache; no download time included",
6
+ "process_isolation": "single model per fresh Python process",
7
+ "base_resolution": 1440,
8
+ "aspect_ratio": "1:1",
9
+ "num_inference_steps": 20,
10
+ "guidance_scale": 5.0,
11
+ "dtype": "torch.bfloat16",
12
+ "definitions": {
13
+ "load_time_s": "Pipeline load plus enable_model_cpu_offload setup from warm local HF cache; download time excluded.",
14
+ "cold_generation": "P01, first generation immediately after fresh process load/offload setup.",
15
+ "warm_generation": "P02-P10 after the cold P01 generation."
16
+ },
17
+ "models": {
18
+ "base": {
19
+ "hardware": "RunPod NVIDIA H100 80GB HBM3 (H100 SXM)",
20
+ "mode": "Diffusers enable_model_cpu_offload()",
21
+ "cache_state": "warm local HF cache; no download time included",
22
+ "process_isolation": "single model per fresh Python process",
23
+ "base_resolution": 1440,
24
+ "aspect_ratio": "1:1",
25
+ "num_inference_steps": 20,
26
+ "guidance_scale": 5.0,
27
+ "dtype": "torch.bfloat16",
28
+ "kind": "base",
29
+ "load": {
30
+ "load_time_s": 15.51,
31
+ "peak_allocated_gb": 12.582,
32
+ "peak_reserved_gb": 13.881,
33
+ "end_allocated_gb": 10.185,
34
+ "end_reserved_gb": 10.679
35
+ },
36
+ "summary": {
37
+ "cold_time_s": 26.217,
38
+ "cold_peak_allocated_gb": 19.274,
39
+ "cold_peak_reserved_gb": 19.608,
40
+ "warm_avg_time_s": 18.123,
41
+ "warm_median_time_s": 17.178,
42
+ "warm_avg_peak_allocated_gb": 19.271,
43
+ "warm_avg_peak_reserved_gb": 19.63,
44
+ "warm_max_peak_allocated_gb": 19.276,
45
+ "warm_max_peak_reserved_gb": 19.803
46
+ },
47
+ "prompts": [
48
+ {
49
+ "id": "P01",
50
+ "title": "Midnight Library Weather Station",
51
+ "seed": 301,
52
+ "time_s": 26.217,
53
+ "image_size": [
54
+ 1440,
55
+ 1440
56
+ ],
57
+ "peak_allocated_gb": 19.274,
58
+ "peak_reserved_gb": 19.608,
59
+ "end_allocated_gb": 10.221,
60
+ "end_reserved_gb": 10.884
61
+ },
62
+ {
63
+ "id": "P02",
64
+ "title": "Desert Observatory Treaty Room",
65
+ "seed": 302,
66
+ "time_s": 21.285,
67
+ "image_size": [
68
+ 1440,
69
+ 1440
70
+ ],
71
+ "peak_allocated_gb": 19.274,
72
+ "peak_reserved_gb": 19.608,
73
+ "end_allocated_gb": 10.221,
74
+ "end_reserved_gb": 10.884
75
+ },
76
+ {
77
+ "id": "P03",
78
+ "title": "Arctic Submarine Greenhouse",
79
+ "seed": 303,
80
+ "time_s": 17.271,
81
+ "image_size": [
82
+ 1440,
83
+ 1440
84
+ ],
85
+ "peak_allocated_gb": 19.275,
86
+ "peak_reserved_gb": 19.608,
87
+ "end_allocated_gb": 10.221,
88
+ "end_reserved_gb": 10.809
89
+ },
90
+ {
91
+ "id": "P04",
92
+ "title": "Long English Museum Labels",
93
+ "seed": 304,
94
+ "time_s": 17.178,
95
+ "image_size": [
96
+ 1440,
97
+ 1440
98
+ ],
99
+ "peak_allocated_gb": 19.275,
100
+ "peak_reserved_gb": 19.608,
101
+ "end_allocated_gb": 10.221,
102
+ "end_reserved_gb": 10.884
103
+ },
104
+ {
105
+ "id": "P05",
106
+ "title": "Tokyo Rooftop Repair Diner",
107
+ "seed": 305,
108
+ "time_s": 17.058,
109
+ "image_size": [
110
+ 1440,
111
+ 1440
112
+ ],
113
+ "peak_allocated_gb": 19.275,
114
+ "peak_reserved_gb": 19.608,
115
+ "end_allocated_gb": 10.221,
116
+ "end_reserved_gb": 10.813
117
+ },
118
+ {
119
+ "id": "P06",
120
+ "title": "Russian Provincial Print Shop",
121
+ "seed": 306,
122
+ "time_s": 20.163,
123
+ "image_size": [
124
+ 1440,
125
+ 1440
126
+ ],
127
+ "peak_allocated_gb": 19.242,
128
+ "peak_reserved_gb": 19.803,
129
+ "end_allocated_gb": 10.221,
130
+ "end_reserved_gb": 13.16
131
+ },
132
+ {
133
+ "id": "P07",
134
+ "title": "Ocean Cartography Bakery",
135
+ "seed": 307,
136
+ "time_s": 16.903,
137
+ "image_size": [
138
+ 1440,
139
+ 1440
140
+ ],
141
+ "peak_allocated_gb": 19.274,
142
+ "peak_reserved_gb": 19.608,
143
+ "end_allocated_gb": 10.221,
144
+ "end_reserved_gb": 10.884
145
+ },
146
+ {
147
+ "id": "P08",
148
+ "title": "Long English Train Notice Wall",
149
+ "seed": 308,
150
+ "time_s": 16.857,
151
+ "image_size": [
152
+ 1440,
153
+ 1440
154
+ ],
155
+ "peak_allocated_gb": 19.274,
156
+ "peak_reserved_gb": 19.608,
157
+ "end_allocated_gb": 10.221,
158
+ "end_reserved_gb": 10.884
159
+ },
160
+ {
161
+ "id": "P09",
162
+ "title": "Orbital Botanical Courtroom",
163
+ "seed": 309,
164
+ "time_s": 19.664,
165
+ "image_size": [
166
+ 1440,
167
+ 1440
168
+ ],
169
+ "peak_allocated_gb": 19.276,
170
+ "peak_reserved_gb": 19.61,
171
+ "end_allocated_gb": 10.221,
172
+ "end_reserved_gb": 10.909
173
+ },
174
+ {
175
+ "id": "P10",
176
+ "title": "Byzantine Data Center Chapel",
177
+ "seed": 310,
178
+ "time_s": 16.731,
179
+ "image_size": [
180
+ 1440,
181
+ 1440
182
+ ],
183
+ "peak_allocated_gb": 19.276,
184
+ "peak_reserved_gb": 19.608,
185
+ "end_allocated_gb": 10.221,
186
+ "end_reserved_gb": 10.813
187
+ }
188
+ ]
189
+ },
190
+ "quant": {
191
+ "hardware": "RunPod NVIDIA H100 80GB HBM3 (H100 SXM)",
192
+ "mode": "Diffusers enable_model_cpu_offload()",
193
+ "cache_state": "warm local HF cache; no download time included",
194
+ "process_isolation": "single model per fresh Python process",
195
+ "base_resolution": 1440,
196
+ "aspect_ratio": "1:1",
197
+ "num_inference_steps": 20,
198
+ "guidance_scale": 5.0,
199
+ "dtype": "torch.bfloat16",
200
+ "kind": "quant",
201
+ "load": {
202
+ "load_time_s": 13.573,
203
+ "peak_allocated_gb": 12.582,
204
+ "peak_reserved_gb": 13.881,
205
+ "end_allocated_gb": 10.185,
206
+ "end_reserved_gb": 10.679
207
+ },
208
+ "summary": {
209
+ "cold_time_s": 21.473,
210
+ "cold_peak_allocated_gb": 15.479,
211
+ "cold_peak_reserved_gb": 19.126,
212
+ "warm_avg_time_s": 17.65,
213
+ "warm_median_time_s": 17.519,
214
+ "warm_avg_peak_allocated_gb": 15.48,
215
+ "warm_avg_peak_reserved_gb": 18.965,
216
+ "warm_max_peak_allocated_gb": 15.482,
217
+ "warm_max_peak_reserved_gb": 19.21
218
+ },
219
+ "prompts": [
220
+ {
221
+ "id": "P01",
222
+ "title": "Midnight Library Weather Station",
223
+ "seed": 301,
224
+ "time_s": 21.473,
225
+ "image_size": [
226
+ 1440,
227
+ 1440
228
+ ],
229
+ "peak_allocated_gb": 15.479,
230
+ "peak_reserved_gb": 19.126,
231
+ "end_allocated_gb": 10.221,
232
+ "end_reserved_gb": 10.865
233
+ },
234
+ {
235
+ "id": "P02",
236
+ "title": "Desert Observatory Treaty Room",
237
+ "seed": 302,
238
+ "time_s": 19.047,
239
+ "image_size": [
240
+ 1440,
241
+ 1440
242
+ ],
243
+ "peak_allocated_gb": 15.479,
244
+ "peak_reserved_gb": 19.126,
245
+ "end_allocated_gb": 10.221,
246
+ "end_reserved_gb": 10.865
247
+ },
248
+ {
249
+ "id": "P03",
250
+ "title": "Arctic Submarine Greenhouse",
251
+ "seed": 303,
252
+ "time_s": 17.133,
253
+ "image_size": [
254
+ 1440,
255
+ 1440
256
+ ],
257
+ "peak_allocated_gb": 15.479,
258
+ "peak_reserved_gb": 19.185,
259
+ "end_allocated_gb": 10.221,
260
+ "end_reserved_gb": 10.792
261
+ },
262
+ {
263
+ "id": "P04",
264
+ "title": "Long English Museum Labels",
265
+ "seed": 304,
266
+ "time_s": 17.73,
267
+ "image_size": [
268
+ 1440,
269
+ 1440
270
+ ],
271
+ "peak_allocated_gb": 15.479,
272
+ "peak_reserved_gb": 19.126,
273
+ "end_allocated_gb": 10.221,
274
+ "end_reserved_gb": 10.863
275
+ },
276
+ {
277
+ "id": "P05",
278
+ "title": "Tokyo Rooftop Repair Diner",
279
+ "seed": 305,
280
+ "time_s": 17.332,
281
+ "image_size": [
282
+ 1440,
283
+ 1440
284
+ ],
285
+ "peak_allocated_gb": 15.479,
286
+ "peak_reserved_gb": 19.21,
287
+ "end_allocated_gb": 10.221,
288
+ "end_reserved_gb": 10.815
289
+ },
290
+ {
291
+ "id": "P06",
292
+ "title": "Russian Provincial Print Shop",
293
+ "seed": 306,
294
+ "time_s": 17.519,
295
+ "image_size": [
296
+ 1440,
297
+ 1440
298
+ ],
299
+ "peak_allocated_gb": 15.482,
300
+ "peak_reserved_gb": 17.404,
301
+ "end_allocated_gb": 10.221,
302
+ "end_reserved_gb": 13.141
303
+ },
304
+ {
305
+ "id": "P07",
306
+ "title": "Ocean Cartography Bakery",
307
+ "seed": 307,
308
+ "time_s": 17.614,
309
+ "image_size": [
310
+ 1440,
311
+ 1440
312
+ ],
313
+ "peak_allocated_gb": 15.479,
314
+ "peak_reserved_gb": 19.126,
315
+ "end_allocated_gb": 10.221,
316
+ "end_reserved_gb": 10.865
317
+ },
318
+ {
319
+ "id": "P08",
320
+ "title": "Long English Train Notice Wall",
321
+ "seed": 308,
322
+ "time_s": 17.498,
323
+ "image_size": [
324
+ 1440,
325
+ 1440
326
+ ],
327
+ "peak_allocated_gb": 15.479,
328
+ "peak_reserved_gb": 19.126,
329
+ "end_allocated_gb": 10.221,
330
+ "end_reserved_gb": 10.865
331
+ },
332
+ {
333
+ "id": "P09",
334
+ "title": "Orbital Botanical Courtroom",
335
+ "seed": 309,
336
+ "time_s": 17.546,
337
+ "image_size": [
338
+ 1440,
339
+ 1440
340
+ ],
341
+ "peak_allocated_gb": 15.481,
342
+ "peak_reserved_gb": 19.172,
343
+ "end_allocated_gb": 10.221,
344
+ "end_reserved_gb": 10.888
345
+ },
346
+ {
347
+ "id": "P10",
348
+ "title": "Byzantine Data Center Chapel",
349
+ "seed": 310,
350
+ "time_s": 17.434,
351
+ "image_size": [
352
+ 1440,
353
+ 1440
354
+ ],
355
+ "peak_allocated_gb": 15.479,
356
+ "peak_reserved_gb": 19.21,
357
+ "end_allocated_gb": 10.221,
358
+ "end_reserved_gb": 10.813
359
+ }
360
+ ]
361
+ }
362
+ }
363
+ }
model_index.json ADDED
@@ -0,0 +1,24 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_class_name": "LensPipeline",
3
+ "_diffusers_version": "0.37.1",
4
+ "scheduler": [
5
+ "diffusers",
6
+ "FlowMatchEulerDiscreteScheduler"
7
+ ],
8
+ "vae": [
9
+ "diffusers",
10
+ "AutoencoderKLFlux2"
11
+ ],
12
+ "text_encoder": [
13
+ "transformers",
14
+ "LensGptOssEncoder"
15
+ ],
16
+ "tokenizer": [
17
+ "transformers",
18
+ "PreTrainedTokenizerFast"
19
+ ],
20
+ "transformer": [
21
+ "diffusers",
22
+ "LensTransformer2DModel"
23
+ ]
24
+ }
scheduler/scheduler_config.json ADDED
@@ -0,0 +1,18 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_class_name": "FlowMatchEulerDiscreteScheduler",
3
+ "_diffusers_version": "0.37.1",
4
+ "base_image_seq_len": 256,
5
+ "base_shift": 0.5,
6
+ "invert_sigmas": false,
7
+ "max_image_seq_len": 4096,
8
+ "max_shift": 1.15,
9
+ "num_train_timesteps": 1000,
10
+ "shift": 3.0,
11
+ "shift_terminal": null,
12
+ "stochastic_sampling": false,
13
+ "time_shift_type": "exponential",
14
+ "use_beta_sigmas": false,
15
+ "use_dynamic_shifting": true,
16
+ "use_exponential_sigmas": false,
17
+ "use_karras_sigmas": false
18
+ }
sdnq_quantization_summary.json ADDED
@@ -0,0 +1,62 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "source_model": "microsoft/Lens",
3
+ "target_model": "WaveCut/Lens-SDNQ-uint4-static",
4
+ "method": "SDNQ uint4 static",
5
+ "corrected_recipe": true,
6
+ "weights_dtype": "uint4",
7
+ "quantized_matmul_dtype": "int8",
8
+ "group_size": 0,
9
+ "use_quantized_matmul": true,
10
+ "dequantize_fp32": false,
11
+ "modules_to_not_convert_user": [
12
+ ".final_layer",
13
+ "pos_embed",
14
+ ".norm_out",
15
+ ".y_embedder",
16
+ ".context_embedder",
17
+ ".condition_embedder",
18
+ ".x_embedder",
19
+ ".vid_out",
20
+ ".emb_out",
21
+ ".img_in",
22
+ "patch_embed",
23
+ ".time_embed",
24
+ ".t_embedder",
25
+ "multi_modal_projector",
26
+ "patch_emb",
27
+ "norm",
28
+ ".img_out",
29
+ "patch_embedding",
30
+ "lm_head",
31
+ ".proj_out",
32
+ ".vid_in",
33
+ ".txt_in",
34
+ "wte",
35
+ "time_text_embed",
36
+ ".txt_out",
37
+ ".emb_in",
38
+ "*.img_mod.*",
39
+ "*.txt_mod.*"
40
+ ],
41
+ "root_cause_from_turbo_ablation": "Do not quantize transformer modulation linears (*.img_mod.* and *.txt_mod.*); all-linear UINT4 caused periodic grid artifacts and text degradation on Lens-Turbo.",
42
+ "transformer_load_time_s": 3.677,
43
+ "transformer_load_peak_allocated_gb": 8.359,
44
+ "transformer_load_peak_reserved_gb": 8.424,
45
+ "quantization_time_s": 0.313,
46
+ "quantization_peak_allocated_gb": 8.425,
47
+ "quantization_peak_reserved_gb": 8.485,
48
+ "base_transformer_tensor_storage_gb": 16.417,
49
+ "quant_transformer_tensor_storage_gb": 4.301,
50
+ "transformer_storage_reduction_percent": 73.8,
51
+ "base_transformer_repo_files_gb": 16.417,
52
+ "quant_transformer_repo_files_gb": 4.302,
53
+ "base_transformer_dtypes": {
54
+ "FLOAT32": 16416900608
55
+ },
56
+ "quant_transformer_dtypes": {
57
+ "BFLOAT16": 2942501632,
58
+ "UINT8": 1358954496
59
+ },
60
+ "base_transformer_tensors": 1264,
61
+ "quant_transformer_tensors": 2224
62
+ }
text_encoder/config.json ADDED
@@ -0,0 +1,78 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "architectures": [
3
+ "GptOssForCausalLM"
4
+ ],
5
+ "attention_bias": true,
6
+ "attention_dropout": 0.0,
7
+ "bos_token_id": null,
8
+ "dtype": "bfloat16",
9
+ "eos_token_id": 200002,
10
+ "experts_per_token": 4,
11
+ "head_dim": 64,
12
+ "hidden_act": "silu",
13
+ "hidden_size": 2880,
14
+ "initial_context_length": 4096,
15
+ "initializer_range": 0.02,
16
+ "intermediate_size": 2880,
17
+ "layer_types": [
18
+ "sliding_attention",
19
+ "full_attention",
20
+ "sliding_attention",
21
+ "full_attention",
22
+ "sliding_attention",
23
+ "full_attention",
24
+ "sliding_attention",
25
+ "full_attention",
26
+ "sliding_attention",
27
+ "full_attention",
28
+ "sliding_attention",
29
+ "full_attention",
30
+ "sliding_attention",
31
+ "full_attention",
32
+ "sliding_attention",
33
+ "full_attention",
34
+ "sliding_attention",
35
+ "full_attention",
36
+ "sliding_attention",
37
+ "full_attention",
38
+ "sliding_attention",
39
+ "full_attention",
40
+ "sliding_attention",
41
+ "full_attention"
42
+ ],
43
+ "max_position_embeddings": 131072,
44
+ "model_type": "gpt_oss",
45
+ "num_attention_heads": 64,
46
+ "num_experts_per_tok": 4,
47
+ "num_hidden_layers": 24,
48
+ "num_key_value_heads": 8,
49
+ "num_local_experts": 32,
50
+ "output_router_logits": false,
51
+ "pad_token_id": 199999,
52
+ "quantization_config": {
53
+ "modules_to_not_convert": [
54
+ "model.layers.*.self_attn",
55
+ "model.layers.*.mlp.router",
56
+ "model.embed_tokens",
57
+ "lm_head"
58
+ ],
59
+ "quant_method": "mxfp4"
60
+ },
61
+ "rms_norm_eps": 1e-05,
62
+ "rope_parameters": {
63
+ "beta_fast": 32.0,
64
+ "beta_slow": 1.0,
65
+ "factor": 32.0,
66
+ "original_max_position_embeddings": 4096,
67
+ "rope_theta": 150000,
68
+ "rope_type": "yarn",
69
+ "truncate": false
70
+ },
71
+ "router_aux_loss_coef": 0.9,
72
+ "sliding_window": 128,
73
+ "swiglu_limit": 7.0,
74
+ "tie_word_embeddings": false,
75
+ "transformers_version": "5.8.0",
76
+ "use_cache": true,
77
+ "vocab_size": 201088
78
+ }
text_encoder/generation_config.json ADDED
@@ -0,0 +1,11 @@
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "bos_token_id": 199998,
3
+ "do_sample": true,
4
+ "eos_token_id": [
5
+ 200002,
6
+ 199999,
7
+ 200012
8
+ ],
9
+ "pad_token_id": 199999,
10
+ "transformers_version": "5.8.0"
11
+ }
text_encoder/model-00001-of-00003.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ec5a256b3cdeea38db22f0988f9f156554fc9753f95857f5ecaea56048f43bd7
3
+ size 4845744456
text_encoder/model-00002-of-00003.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:914d5c38cd798a3393e348942e29c38497851b38c09df529ee162f4bd1f13b64
3
+ size 4774186632
text_encoder/model-00003-of-00003.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:931a994c03fc5554d6e343d95a991ae162502459eae6035cd9cc5ea773b598e3
3
+ size 4154656824
text_encoder/model.safetensors.index.json ADDED
@@ -0,0 +1,467 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "metadata": {
3
+ "total_parameters": 1804459584,
4
+ "total_size": 13774535808
5
+ },
6
+ "weight_map": {
7
+ "lm_head.weight": "model-00001-of-00003.safetensors",
8
+ "model.embed_tokens.weight": "model-00001-of-00003.safetensors",
9
+ "model.layers.0.input_layernorm.weight": "model-00001-of-00003.safetensors",
10
+ "model.layers.0.mlp.experts.down_proj_bias": "model-00001-of-00003.safetensors",
11
+ "model.layers.0.mlp.experts.down_proj_blocks": "model-00001-of-00003.safetensors",
12
+ "model.layers.0.mlp.experts.down_proj_scales": "model-00001-of-00003.safetensors",
13
+ "model.layers.0.mlp.experts.gate_up_proj_bias": "model-00001-of-00003.safetensors",
14
+ "model.layers.0.mlp.experts.gate_up_proj_blocks": "model-00001-of-00003.safetensors",
15
+ "model.layers.0.mlp.experts.gate_up_proj_scales": "model-00001-of-00003.safetensors",
16
+ "model.layers.0.mlp.router.bias": "model-00001-of-00003.safetensors",
17
+ "model.layers.0.mlp.router.weight": "model-00001-of-00003.safetensors",
18
+ "model.layers.0.post_attention_layernorm.weight": "model-00001-of-00003.safetensors",
19
+ "model.layers.0.self_attn.k_proj.bias": "model-00001-of-00003.safetensors",
20
+ "model.layers.0.self_attn.k_proj.weight": "model-00001-of-00003.safetensors",
21
+ "model.layers.0.self_attn.o_proj.bias": "model-00001-of-00003.safetensors",
22
+ "model.layers.0.self_attn.o_proj.weight": "model-00001-of-00003.safetensors",
23
+ "model.layers.0.self_attn.q_proj.bias": "model-00001-of-00003.safetensors",
24
+ "model.layers.0.self_attn.q_proj.weight": "model-00001-of-00003.safetensors",
25
+ "model.layers.0.self_attn.sinks": "model-00001-of-00003.safetensors",
26
+ "model.layers.0.self_attn.v_proj.bias": "model-00001-of-00003.safetensors",
27
+ "model.layers.0.self_attn.v_proj.weight": "model-00001-of-00003.safetensors",
28
+ "model.layers.1.input_layernorm.weight": "model-00001-of-00003.safetensors",
29
+ "model.layers.1.mlp.experts.down_proj_bias": "model-00001-of-00003.safetensors",
30
+ "model.layers.1.mlp.experts.down_proj_blocks": "model-00001-of-00003.safetensors",
31
+ "model.layers.1.mlp.experts.down_proj_scales": "model-00001-of-00003.safetensors",
32
+ "model.layers.1.mlp.experts.gate_up_proj_bias": "model-00001-of-00003.safetensors",
33
+ "model.layers.1.mlp.experts.gate_up_proj_blocks": "model-00001-of-00003.safetensors",
34
+ "model.layers.1.mlp.experts.gate_up_proj_scales": "model-00001-of-00003.safetensors",
35
+ "model.layers.1.mlp.router.bias": "model-00001-of-00003.safetensors",
36
+ "model.layers.1.mlp.router.weight": "model-00001-of-00003.safetensors",
37
+ "model.layers.1.post_attention_layernorm.weight": "model-00001-of-00003.safetensors",
38
+ "model.layers.1.self_attn.k_proj.bias": "model-00001-of-00003.safetensors",
39
+ "model.layers.1.self_attn.k_proj.weight": "model-00001-of-00003.safetensors",
40
+ "model.layers.1.self_attn.o_proj.bias": "model-00001-of-00003.safetensors",
41
+ "model.layers.1.self_attn.o_proj.weight": "model-00001-of-00003.safetensors",
42
+ "model.layers.1.self_attn.q_proj.bias": "model-00001-of-00003.safetensors",
43
+ "model.layers.1.self_attn.q_proj.weight": "model-00001-of-00003.safetensors",
44
+ "model.layers.1.self_attn.sinks": "model-00001-of-00003.safetensors",
45
+ "model.layers.1.self_attn.v_proj.bias": "model-00001-of-00003.safetensors",
46
+ "model.layers.1.self_attn.v_proj.weight": "model-00001-of-00003.safetensors",
47
+ "model.layers.10.input_layernorm.weight": "model-00002-of-00003.safetensors",
48
+ "model.layers.10.mlp.experts.down_proj_bias": "model-00002-of-00003.safetensors",
49
+ "model.layers.10.mlp.experts.down_proj_blocks": "model-00002-of-00003.safetensors",
50
+ "model.layers.10.mlp.experts.down_proj_scales": "model-00002-of-00003.safetensors",
51
+ "model.layers.10.mlp.experts.gate_up_proj_bias": "model-00002-of-00003.safetensors",
52
+ "model.layers.10.mlp.experts.gate_up_proj_blocks": "model-00002-of-00003.safetensors",
53
+ "model.layers.10.mlp.experts.gate_up_proj_scales": "model-00002-of-00003.safetensors",
54
+ "model.layers.10.mlp.router.bias": "model-00002-of-00003.safetensors",
55
+ "model.layers.10.mlp.router.weight": "model-00002-of-00003.safetensors",
56
+ "model.layers.10.post_attention_layernorm.weight": "model-00002-of-00003.safetensors",
57
+ "model.layers.10.self_attn.k_proj.bias": "model-00002-of-00003.safetensors",
58
+ "model.layers.10.self_attn.k_proj.weight": "model-00002-of-00003.safetensors",
59
+ "model.layers.10.self_attn.o_proj.bias": "model-00002-of-00003.safetensors",
60
+ "model.layers.10.self_attn.o_proj.weight": "model-00002-of-00003.safetensors",
61
+ "model.layers.10.self_attn.q_proj.bias": "model-00002-of-00003.safetensors",
62
+ "model.layers.10.self_attn.q_proj.weight": "model-00002-of-00003.safetensors",
63
+ "model.layers.10.self_attn.sinks": "model-00002-of-00003.safetensors",
64
+ "model.layers.10.self_attn.v_proj.bias": "model-00002-of-00003.safetensors",
65
+ "model.layers.10.self_attn.v_proj.weight": "model-00002-of-00003.safetensors",
66
+ "model.layers.11.input_layernorm.weight": "model-00002-of-00003.safetensors",
67
+ "model.layers.11.mlp.experts.down_proj_bias": "model-00002-of-00003.safetensors",
68
+ "model.layers.11.mlp.experts.down_proj_blocks": "model-00002-of-00003.safetensors",
69
+ "model.layers.11.mlp.experts.down_proj_scales": "model-00002-of-00003.safetensors",
70
+ "model.layers.11.mlp.experts.gate_up_proj_bias": "model-00002-of-00003.safetensors",
71
+ "model.layers.11.mlp.experts.gate_up_proj_blocks": "model-00002-of-00003.safetensors",
72
+ "model.layers.11.mlp.experts.gate_up_proj_scales": "model-00002-of-00003.safetensors",
73
+ "model.layers.11.mlp.router.bias": "model-00002-of-00003.safetensors",
74
+ "model.layers.11.mlp.router.weight": "model-00002-of-00003.safetensors",
75
+ "model.layers.11.post_attention_layernorm.weight": "model-00002-of-00003.safetensors",
76
+ "model.layers.11.self_attn.k_proj.bias": "model-00002-of-00003.safetensors",
77
+ "model.layers.11.self_attn.k_proj.weight": "model-00002-of-00003.safetensors",
78
+ "model.layers.11.self_attn.o_proj.bias": "model-00002-of-00003.safetensors",
79
+ "model.layers.11.self_attn.o_proj.weight": "model-00002-of-00003.safetensors",
80
+ "model.layers.11.self_attn.q_proj.bias": "model-00002-of-00003.safetensors",
81
+ "model.layers.11.self_attn.q_proj.weight": "model-00002-of-00003.safetensors",
82
+ "model.layers.11.self_attn.sinks": "model-00002-of-00003.safetensors",
83
+ "model.layers.11.self_attn.v_proj.bias": "model-00002-of-00003.safetensors",
84
+ "model.layers.11.self_attn.v_proj.weight": "model-00002-of-00003.safetensors",
85
+ "model.layers.12.input_layernorm.weight": "model-00002-of-00003.safetensors",
86
+ "model.layers.12.mlp.experts.down_proj_bias": "model-00002-of-00003.safetensors",
87
+ "model.layers.12.mlp.experts.down_proj_blocks": "model-00002-of-00003.safetensors",
88
+ "model.layers.12.mlp.experts.down_proj_scales": "model-00002-of-00003.safetensors",
89
+ "model.layers.12.mlp.experts.gate_up_proj_bias": "model-00002-of-00003.safetensors",
90
+ "model.layers.12.mlp.experts.gate_up_proj_blocks": "model-00002-of-00003.safetensors",
91
+ "model.layers.12.mlp.experts.gate_up_proj_scales": "model-00002-of-00003.safetensors",
92
+ "model.layers.12.mlp.router.bias": "model-00002-of-00003.safetensors",
93
+ "model.layers.12.mlp.router.weight": "model-00002-of-00003.safetensors",
94
+ "model.layers.12.post_attention_layernorm.weight": "model-00002-of-00003.safetensors",
95
+ "model.layers.12.self_attn.k_proj.bias": "model-00002-of-00003.safetensors",
96
+ "model.layers.12.self_attn.k_proj.weight": "model-00002-of-00003.safetensors",
97
+ "model.layers.12.self_attn.o_proj.bias": "model-00002-of-00003.safetensors",
98
+ "model.layers.12.self_attn.o_proj.weight": "model-00002-of-00003.safetensors",
99
+ "model.layers.12.self_attn.q_proj.bias": "model-00002-of-00003.safetensors",
100
+ "model.layers.12.self_attn.q_proj.weight": "model-00002-of-00003.safetensors",
101
+ "model.layers.12.self_attn.sinks": "model-00002-of-00003.safetensors",
102
+ "model.layers.12.self_attn.v_proj.bias": "model-00002-of-00003.safetensors",
103
+ "model.layers.12.self_attn.v_proj.weight": "model-00002-of-00003.safetensors",
104
+ "model.layers.13.input_layernorm.weight": "model-00002-of-00003.safetensors",
105
+ "model.layers.13.mlp.experts.down_proj_bias": "model-00002-of-00003.safetensors",
106
+ "model.layers.13.mlp.experts.down_proj_blocks": "model-00002-of-00003.safetensors",
107
+ "model.layers.13.mlp.experts.down_proj_scales": "model-00002-of-00003.safetensors",
108
+ "model.layers.13.mlp.experts.gate_up_proj_bias": "model-00002-of-00003.safetensors",
109
+ "model.layers.13.mlp.experts.gate_up_proj_blocks": "model-00002-of-00003.safetensors",
110
+ "model.layers.13.mlp.experts.gate_up_proj_scales": "model-00002-of-00003.safetensors",
111
+ "model.layers.13.mlp.router.bias": "model-00002-of-00003.safetensors",
112
+ "model.layers.13.mlp.router.weight": "model-00002-of-00003.safetensors",
113
+ "model.layers.13.post_attention_layernorm.weight": "model-00002-of-00003.safetensors",
114
+ "model.layers.13.self_attn.k_proj.bias": "model-00002-of-00003.safetensors",
115
+ "model.layers.13.self_attn.k_proj.weight": "model-00002-of-00003.safetensors",
116
+ "model.layers.13.self_attn.o_proj.bias": "model-00002-of-00003.safetensors",
117
+ "model.layers.13.self_attn.o_proj.weight": "model-00002-of-00003.safetensors",
118
+ "model.layers.13.self_attn.q_proj.bias": "model-00002-of-00003.safetensors",
119
+ "model.layers.13.self_attn.q_proj.weight": "model-00002-of-00003.safetensors",
120
+ "model.layers.13.self_attn.sinks": "model-00002-of-00003.safetensors",
121
+ "model.layers.13.self_attn.v_proj.bias": "model-00002-of-00003.safetensors",
122
+ "model.layers.13.self_attn.v_proj.weight": "model-00002-of-00003.safetensors",
123
+ "model.layers.14.input_layernorm.weight": "model-00002-of-00003.safetensors",
124
+ "model.layers.14.mlp.experts.down_proj_bias": "model-00002-of-00003.safetensors",
125
+ "model.layers.14.mlp.experts.down_proj_blocks": "model-00002-of-00003.safetensors",
126
+ "model.layers.14.mlp.experts.down_proj_scales": "model-00002-of-00003.safetensors",
127
+ "model.layers.14.mlp.experts.gate_up_proj_bias": "model-00002-of-00003.safetensors",
128
+ "model.layers.14.mlp.experts.gate_up_proj_blocks": "model-00002-of-00003.safetensors",
129
+ "model.layers.14.mlp.experts.gate_up_proj_scales": "model-00002-of-00003.safetensors",
130
+ "model.layers.14.mlp.router.bias": "model-00002-of-00003.safetensors",
131
+ "model.layers.14.mlp.router.weight": "model-00002-of-00003.safetensors",
132
+ "model.layers.14.post_attention_layernorm.weight": "model-00002-of-00003.safetensors",
133
+ "model.layers.14.self_attn.k_proj.bias": "model-00002-of-00003.safetensors",
134
+ "model.layers.14.self_attn.k_proj.weight": "model-00002-of-00003.safetensors",
135
+ "model.layers.14.self_attn.o_proj.bias": "model-00002-of-00003.safetensors",
136
+ "model.layers.14.self_attn.o_proj.weight": "model-00002-of-00003.safetensors",
137
+ "model.layers.14.self_attn.q_proj.bias": "model-00002-of-00003.safetensors",
138
+ "model.layers.14.self_attn.q_proj.weight": "model-00002-of-00003.safetensors",
139
+ "model.layers.14.self_attn.sinks": "model-00002-of-00003.safetensors",
140
+ "model.layers.14.self_attn.v_proj.bias": "model-00002-of-00003.safetensors",
141
+ "model.layers.14.self_attn.v_proj.weight": "model-00002-of-00003.safetensors",
142
+ "model.layers.15.input_layernorm.weight": "model-00002-of-00003.safetensors",
143
+ "model.layers.15.mlp.experts.down_proj_bias": "model-00002-of-00003.safetensors",
144
+ "model.layers.15.mlp.experts.down_proj_blocks": "model-00002-of-00003.safetensors",
145
+ "model.layers.15.mlp.experts.down_proj_scales": "model-00002-of-00003.safetensors",
146
+ "model.layers.15.mlp.experts.gate_up_proj_bias": "model-00002-of-00003.safetensors",
147
+ "model.layers.15.mlp.experts.gate_up_proj_blocks": "model-00003-of-00003.safetensors",
148
+ "model.layers.15.mlp.experts.gate_up_proj_scales": "model-00003-of-00003.safetensors",
149
+ "model.layers.15.mlp.router.bias": "model-00003-of-00003.safetensors",
150
+ "model.layers.15.mlp.router.weight": "model-00003-of-00003.safetensors",
151
+ "model.layers.15.post_attention_layernorm.weight": "model-00003-of-00003.safetensors",
152
+ "model.layers.15.self_attn.k_proj.bias": "model-00003-of-00003.safetensors",
153
+ "model.layers.15.self_attn.k_proj.weight": "model-00003-of-00003.safetensors",
154
+ "model.layers.15.self_attn.o_proj.bias": "model-00003-of-00003.safetensors",
155
+ "model.layers.15.self_attn.o_proj.weight": "model-00003-of-00003.safetensors",
156
+ "model.layers.15.self_attn.q_proj.bias": "model-00003-of-00003.safetensors",
157
+ "model.layers.15.self_attn.q_proj.weight": "model-00003-of-00003.safetensors",
158
+ "model.layers.15.self_attn.sinks": "model-00003-of-00003.safetensors",
159
+ "model.layers.15.self_attn.v_proj.bias": "model-00003-of-00003.safetensors",
160
+ "model.layers.15.self_attn.v_proj.weight": "model-00003-of-00003.safetensors",
161
+ "model.layers.16.input_layernorm.weight": "model-00003-of-00003.safetensors",
162
+ "model.layers.16.mlp.experts.down_proj_bias": "model-00003-of-00003.safetensors",
163
+ "model.layers.16.mlp.experts.down_proj_blocks": "model-00003-of-00003.safetensors",
164
+ "model.layers.16.mlp.experts.down_proj_scales": "model-00003-of-00003.safetensors",
165
+ "model.layers.16.mlp.experts.gate_up_proj_bias": "model-00003-of-00003.safetensors",
166
+ "model.layers.16.mlp.experts.gate_up_proj_blocks": "model-00003-of-00003.safetensors",
167
+ "model.layers.16.mlp.experts.gate_up_proj_scales": "model-00003-of-00003.safetensors",
168
+ "model.layers.16.mlp.router.bias": "model-00003-of-00003.safetensors",
169
+ "model.layers.16.mlp.router.weight": "model-00003-of-00003.safetensors",
170
+ "model.layers.16.post_attention_layernorm.weight": "model-00003-of-00003.safetensors",
171
+ "model.layers.16.self_attn.k_proj.bias": "model-00003-of-00003.safetensors",
172
+ "model.layers.16.self_attn.k_proj.weight": "model-00003-of-00003.safetensors",
173
+ "model.layers.16.self_attn.o_proj.bias": "model-00003-of-00003.safetensors",
174
+ "model.layers.16.self_attn.o_proj.weight": "model-00003-of-00003.safetensors",
175
+ "model.layers.16.self_attn.q_proj.bias": "model-00003-of-00003.safetensors",
176
+ "model.layers.16.self_attn.q_proj.weight": "model-00003-of-00003.safetensors",
177
+ "model.layers.16.self_attn.sinks": "model-00003-of-00003.safetensors",
178
+ "model.layers.16.self_attn.v_proj.bias": "model-00003-of-00003.safetensors",
179
+ "model.layers.16.self_attn.v_proj.weight": "model-00003-of-00003.safetensors",
180
+ "model.layers.17.input_layernorm.weight": "model-00003-of-00003.safetensors",
181
+ "model.layers.17.mlp.experts.down_proj_bias": "model-00003-of-00003.safetensors",
182
+ "model.layers.17.mlp.experts.down_proj_blocks": "model-00003-of-00003.safetensors",
183
+ "model.layers.17.mlp.experts.down_proj_scales": "model-00003-of-00003.safetensors",
184
+ "model.layers.17.mlp.experts.gate_up_proj_bias": "model-00003-of-00003.safetensors",
185
+ "model.layers.17.mlp.experts.gate_up_proj_blocks": "model-00003-of-00003.safetensors",
186
+ "model.layers.17.mlp.experts.gate_up_proj_scales": "model-00003-of-00003.safetensors",
187
+ "model.layers.17.mlp.router.bias": "model-00003-of-00003.safetensors",
188
+ "model.layers.17.mlp.router.weight": "model-00003-of-00003.safetensors",
189
+ "model.layers.17.post_attention_layernorm.weight": "model-00003-of-00003.safetensors",
190
+ "model.layers.17.self_attn.k_proj.bias": "model-00003-of-00003.safetensors",
191
+ "model.layers.17.self_attn.k_proj.weight": "model-00003-of-00003.safetensors",
192
+ "model.layers.17.self_attn.o_proj.bias": "model-00003-of-00003.safetensors",
193
+ "model.layers.17.self_attn.o_proj.weight": "model-00003-of-00003.safetensors",
194
+ "model.layers.17.self_attn.q_proj.bias": "model-00003-of-00003.safetensors",
195
+ "model.layers.17.self_attn.q_proj.weight": "model-00003-of-00003.safetensors",
196
+ "model.layers.17.self_attn.sinks": "model-00003-of-00003.safetensors",
197
+ "model.layers.17.self_attn.v_proj.bias": "model-00003-of-00003.safetensors",
198
+ "model.layers.17.self_attn.v_proj.weight": "model-00003-of-00003.safetensors",
199
+ "model.layers.18.input_layernorm.weight": "model-00003-of-00003.safetensors",
200
+ "model.layers.18.mlp.experts.down_proj_bias": "model-00003-of-00003.safetensors",
201
+ "model.layers.18.mlp.experts.down_proj_blocks": "model-00003-of-00003.safetensors",
202
+ "model.layers.18.mlp.experts.down_proj_scales": "model-00003-of-00003.safetensors",
203
+ "model.layers.18.mlp.experts.gate_up_proj_bias": "model-00003-of-00003.safetensors",
204
+ "model.layers.18.mlp.experts.gate_up_proj_blocks": "model-00003-of-00003.safetensors",
205
+ "model.layers.18.mlp.experts.gate_up_proj_scales": "model-00003-of-00003.safetensors",
206
+ "model.layers.18.mlp.router.bias": "model-00003-of-00003.safetensors",
207
+ "model.layers.18.mlp.router.weight": "model-00003-of-00003.safetensors",
208
+ "model.layers.18.post_attention_layernorm.weight": "model-00003-of-00003.safetensors",
209
+ "model.layers.18.self_attn.k_proj.bias": "model-00003-of-00003.safetensors",
210
+ "model.layers.18.self_attn.k_proj.weight": "model-00003-of-00003.safetensors",
211
+ "model.layers.18.self_attn.o_proj.bias": "model-00003-of-00003.safetensors",
212
+ "model.layers.18.self_attn.o_proj.weight": "model-00003-of-00003.safetensors",
213
+ "model.layers.18.self_attn.q_proj.bias": "model-00003-of-00003.safetensors",
214
+ "model.layers.18.self_attn.q_proj.weight": "model-00003-of-00003.safetensors",
215
+ "model.layers.18.self_attn.sinks": "model-00003-of-00003.safetensors",
216
+ "model.layers.18.self_attn.v_proj.bias": "model-00003-of-00003.safetensors",
217
+ "model.layers.18.self_attn.v_proj.weight": "model-00003-of-00003.safetensors",
218
+ "model.layers.19.input_layernorm.weight": "model-00003-of-00003.safetensors",
219
+ "model.layers.19.mlp.experts.down_proj_bias": "model-00003-of-00003.safetensors",
220
+ "model.layers.19.mlp.experts.down_proj_blocks": "model-00003-of-00003.safetensors",
221
+ "model.layers.19.mlp.experts.down_proj_scales": "model-00003-of-00003.safetensors",
222
+ "model.layers.19.mlp.experts.gate_up_proj_bias": "model-00003-of-00003.safetensors",
223
+ "model.layers.19.mlp.experts.gate_up_proj_blocks": "model-00003-of-00003.safetensors",
224
+ "model.layers.19.mlp.experts.gate_up_proj_scales": "model-00003-of-00003.safetensors",
225
+ "model.layers.19.mlp.router.bias": "model-00003-of-00003.safetensors",
226
+ "model.layers.19.mlp.router.weight": "model-00003-of-00003.safetensors",
227
+ "model.layers.19.post_attention_layernorm.weight": "model-00003-of-00003.safetensors",
228
+ "model.layers.19.self_attn.k_proj.bias": "model-00003-of-00003.safetensors",
229
+ "model.layers.19.self_attn.k_proj.weight": "model-00003-of-00003.safetensors",
230
+ "model.layers.19.self_attn.o_proj.bias": "model-00003-of-00003.safetensors",
231
+ "model.layers.19.self_attn.o_proj.weight": "model-00003-of-00003.safetensors",
232
+ "model.layers.19.self_attn.q_proj.bias": "model-00003-of-00003.safetensors",
233
+ "model.layers.19.self_attn.q_proj.weight": "model-00003-of-00003.safetensors",
234
+ "model.layers.19.self_attn.sinks": "model-00003-of-00003.safetensors",
235
+ "model.layers.19.self_attn.v_proj.bias": "model-00003-of-00003.safetensors",
236
+ "model.layers.19.self_attn.v_proj.weight": "model-00003-of-00003.safetensors",
237
+ "model.layers.2.input_layernorm.weight": "model-00001-of-00003.safetensors",
238
+ "model.layers.2.mlp.experts.down_proj_bias": "model-00001-of-00003.safetensors",
239
+ "model.layers.2.mlp.experts.down_proj_blocks": "model-00001-of-00003.safetensors",
240
+ "model.layers.2.mlp.experts.down_proj_scales": "model-00001-of-00003.safetensors",
241
+ "model.layers.2.mlp.experts.gate_up_proj_bias": "model-00001-of-00003.safetensors",
242
+ "model.layers.2.mlp.experts.gate_up_proj_blocks": "model-00001-of-00003.safetensors",
243
+ "model.layers.2.mlp.experts.gate_up_proj_scales": "model-00001-of-00003.safetensors",
244
+ "model.layers.2.mlp.router.bias": "model-00001-of-00003.safetensors",
245
+ "model.layers.2.mlp.router.weight": "model-00001-of-00003.safetensors",
246
+ "model.layers.2.post_attention_layernorm.weight": "model-00001-of-00003.safetensors",
247
+ "model.layers.2.self_attn.k_proj.bias": "model-00001-of-00003.safetensors",
248
+ "model.layers.2.self_attn.k_proj.weight": "model-00001-of-00003.safetensors",
249
+ "model.layers.2.self_attn.o_proj.bias": "model-00001-of-00003.safetensors",
250
+ "model.layers.2.self_attn.o_proj.weight": "model-00001-of-00003.safetensors",
251
+ "model.layers.2.self_attn.q_proj.bias": "model-00001-of-00003.safetensors",
252
+ "model.layers.2.self_attn.q_proj.weight": "model-00001-of-00003.safetensors",
253
+ "model.layers.2.self_attn.sinks": "model-00001-of-00003.safetensors",
254
+ "model.layers.2.self_attn.v_proj.bias": "model-00001-of-00003.safetensors",
255
+ "model.layers.2.self_attn.v_proj.weight": "model-00001-of-00003.safetensors",
256
+ "model.layers.20.input_layernorm.weight": "model-00003-of-00003.safetensors",
257
+ "model.layers.20.mlp.experts.down_proj_bias": "model-00003-of-00003.safetensors",
258
+ "model.layers.20.mlp.experts.down_proj_blocks": "model-00003-of-00003.safetensors",
259
+ "model.layers.20.mlp.experts.down_proj_scales": "model-00003-of-00003.safetensors",
260
+ "model.layers.20.mlp.experts.gate_up_proj_bias": "model-00003-of-00003.safetensors",
261
+ "model.layers.20.mlp.experts.gate_up_proj_blocks": "model-00003-of-00003.safetensors",
262
+ "model.layers.20.mlp.experts.gate_up_proj_scales": "model-00003-of-00003.safetensors",
263
+ "model.layers.20.mlp.router.bias": "model-00003-of-00003.safetensors",
264
+ "model.layers.20.mlp.router.weight": "model-00003-of-00003.safetensors",
265
+ "model.layers.20.post_attention_layernorm.weight": "model-00003-of-00003.safetensors",
266
+ "model.layers.20.self_attn.k_proj.bias": "model-00003-of-00003.safetensors",
267
+ "model.layers.20.self_attn.k_proj.weight": "model-00003-of-00003.safetensors",
268
+ "model.layers.20.self_attn.o_proj.bias": "model-00003-of-00003.safetensors",
269
+ "model.layers.20.self_attn.o_proj.weight": "model-00003-of-00003.safetensors",
270
+ "model.layers.20.self_attn.q_proj.bias": "model-00003-of-00003.safetensors",
271
+ "model.layers.20.self_attn.q_proj.weight": "model-00003-of-00003.safetensors",
272
+ "model.layers.20.self_attn.sinks": "model-00003-of-00003.safetensors",
273
+ "model.layers.20.self_attn.v_proj.bias": "model-00003-of-00003.safetensors",
274
+ "model.layers.20.self_attn.v_proj.weight": "model-00003-of-00003.safetensors",
275
+ "model.layers.21.input_layernorm.weight": "model-00003-of-00003.safetensors",
276
+ "model.layers.21.mlp.experts.down_proj_bias": "model-00003-of-00003.safetensors",
277
+ "model.layers.21.mlp.experts.down_proj_blocks": "model-00003-of-00003.safetensors",
278
+ "model.layers.21.mlp.experts.down_proj_scales": "model-00003-of-00003.safetensors",
279
+ "model.layers.21.mlp.experts.gate_up_proj_bias": "model-00003-of-00003.safetensors",
280
+ "model.layers.21.mlp.experts.gate_up_proj_blocks": "model-00003-of-00003.safetensors",
281
+ "model.layers.21.mlp.experts.gate_up_proj_scales": "model-00003-of-00003.safetensors",
282
+ "model.layers.21.mlp.router.bias": "model-00003-of-00003.safetensors",
283
+ "model.layers.21.mlp.router.weight": "model-00003-of-00003.safetensors",
284
+ "model.layers.21.post_attention_layernorm.weight": "model-00003-of-00003.safetensors",
285
+ "model.layers.21.self_attn.k_proj.bias": "model-00003-of-00003.safetensors",
286
+ "model.layers.21.self_attn.k_proj.weight": "model-00003-of-00003.safetensors",
287
+ "model.layers.21.self_attn.o_proj.bias": "model-00003-of-00003.safetensors",
288
+ "model.layers.21.self_attn.o_proj.weight": "model-00003-of-00003.safetensors",
289
+ "model.layers.21.self_attn.q_proj.bias": "model-00003-of-00003.safetensors",
290
+ "model.layers.21.self_attn.q_proj.weight": "model-00003-of-00003.safetensors",
291
+ "model.layers.21.self_attn.sinks": "model-00003-of-00003.safetensors",
292
+ "model.layers.21.self_attn.v_proj.bias": "model-00003-of-00003.safetensors",
293
+ "model.layers.21.self_attn.v_proj.weight": "model-00003-of-00003.safetensors",
294
+ "model.layers.22.input_layernorm.weight": "model-00003-of-00003.safetensors",
295
+ "model.layers.22.mlp.experts.down_proj_bias": "model-00003-of-00003.safetensors",
296
+ "model.layers.22.mlp.experts.down_proj_blocks": "model-00003-of-00003.safetensors",
297
+ "model.layers.22.mlp.experts.down_proj_scales": "model-00003-of-00003.safetensors",
298
+ "model.layers.22.mlp.experts.gate_up_proj_bias": "model-00003-of-00003.safetensors",
299
+ "model.layers.22.mlp.experts.gate_up_proj_blocks": "model-00003-of-00003.safetensors",
300
+ "model.layers.22.mlp.experts.gate_up_proj_scales": "model-00003-of-00003.safetensors",
301
+ "model.layers.22.mlp.router.bias": "model-00003-of-00003.safetensors",
302
+ "model.layers.22.mlp.router.weight": "model-00003-of-00003.safetensors",
303
+ "model.layers.22.post_attention_layernorm.weight": "model-00003-of-00003.safetensors",
304
+ "model.layers.22.self_attn.k_proj.bias": "model-00003-of-00003.safetensors",
305
+ "model.layers.22.self_attn.k_proj.weight": "model-00003-of-00003.safetensors",
306
+ "model.layers.22.self_attn.o_proj.bias": "model-00003-of-00003.safetensors",
307
+ "model.layers.22.self_attn.o_proj.weight": "model-00003-of-00003.safetensors",
308
+ "model.layers.22.self_attn.q_proj.bias": "model-00003-of-00003.safetensors",
309
+ "model.layers.22.self_attn.q_proj.weight": "model-00003-of-00003.safetensors",
310
+ "model.layers.22.self_attn.sinks": "model-00003-of-00003.safetensors",
311
+ "model.layers.22.self_attn.v_proj.bias": "model-00003-of-00003.safetensors",
312
+ "model.layers.22.self_attn.v_proj.weight": "model-00003-of-00003.safetensors",
313
+ "model.layers.23.input_layernorm.weight": "model-00003-of-00003.safetensors",
314
+ "model.layers.23.mlp.experts.down_proj_bias": "model-00003-of-00003.safetensors",
315
+ "model.layers.23.mlp.experts.down_proj_blocks": "model-00003-of-00003.safetensors",
316
+ "model.layers.23.mlp.experts.down_proj_scales": "model-00003-of-00003.safetensors",
317
+ "model.layers.23.mlp.experts.gate_up_proj_bias": "model-00003-of-00003.safetensors",
318
+ "model.layers.23.mlp.experts.gate_up_proj_blocks": "model-00003-of-00003.safetensors",
319
+ "model.layers.23.mlp.experts.gate_up_proj_scales": "model-00003-of-00003.safetensors",
320
+ "model.layers.23.mlp.router.bias": "model-00003-of-00003.safetensors",
321
+ "model.layers.23.mlp.router.weight": "model-00003-of-00003.safetensors",
322
+ "model.layers.23.post_attention_layernorm.weight": "model-00003-of-00003.safetensors",
323
+ "model.layers.23.self_attn.k_proj.bias": "model-00003-of-00003.safetensors",
324
+ "model.layers.23.self_attn.k_proj.weight": "model-00003-of-00003.safetensors",
325
+ "model.layers.23.self_attn.o_proj.bias": "model-00003-of-00003.safetensors",
326
+ "model.layers.23.self_attn.o_proj.weight": "model-00003-of-00003.safetensors",
327
+ "model.layers.23.self_attn.q_proj.bias": "model-00003-of-00003.safetensors",
328
+ "model.layers.23.self_attn.q_proj.weight": "model-00003-of-00003.safetensors",
329
+ "model.layers.23.self_attn.sinks": "model-00003-of-00003.safetensors",
330
+ "model.layers.23.self_attn.v_proj.bias": "model-00003-of-00003.safetensors",
331
+ "model.layers.23.self_attn.v_proj.weight": "model-00003-of-00003.safetensors",
332
+ "model.layers.3.input_layernorm.weight": "model-00001-of-00003.safetensors",
333
+ "model.layers.3.mlp.experts.down_proj_bias": "model-00001-of-00003.safetensors",
334
+ "model.layers.3.mlp.experts.down_proj_blocks": "model-00001-of-00003.safetensors",
335
+ "model.layers.3.mlp.experts.down_proj_scales": "model-00001-of-00003.safetensors",
336
+ "model.layers.3.mlp.experts.gate_up_proj_bias": "model-00001-of-00003.safetensors",
337
+ "model.layers.3.mlp.experts.gate_up_proj_blocks": "model-00001-of-00003.safetensors",
338
+ "model.layers.3.mlp.experts.gate_up_proj_scales": "model-00001-of-00003.safetensors",
339
+ "model.layers.3.mlp.router.bias": "model-00001-of-00003.safetensors",
340
+ "model.layers.3.mlp.router.weight": "model-00001-of-00003.safetensors",
341
+ "model.layers.3.post_attention_layernorm.weight": "model-00001-of-00003.safetensors",
342
+ "model.layers.3.self_attn.k_proj.bias": "model-00001-of-00003.safetensors",
343
+ "model.layers.3.self_attn.k_proj.weight": "model-00001-of-00003.safetensors",
344
+ "model.layers.3.self_attn.o_proj.bias": "model-00001-of-00003.safetensors",
345
+ "model.layers.3.self_attn.o_proj.weight": "model-00001-of-00003.safetensors",
346
+ "model.layers.3.self_attn.q_proj.bias": "model-00001-of-00003.safetensors",
347
+ "model.layers.3.self_attn.q_proj.weight": "model-00001-of-00003.safetensors",
348
+ "model.layers.3.self_attn.sinks": "model-00001-of-00003.safetensors",
349
+ "model.layers.3.self_attn.v_proj.bias": "model-00001-of-00003.safetensors",
350
+ "model.layers.3.self_attn.v_proj.weight": "model-00001-of-00003.safetensors",
351
+ "model.layers.4.input_layernorm.weight": "model-00001-of-00003.safetensors",
352
+ "model.layers.4.mlp.experts.down_proj_bias": "model-00001-of-00003.safetensors",
353
+ "model.layers.4.mlp.experts.down_proj_blocks": "model-00001-of-00003.safetensors",
354
+ "model.layers.4.mlp.experts.down_proj_scales": "model-00001-of-00003.safetensors",
355
+ "model.layers.4.mlp.experts.gate_up_proj_bias": "model-00001-of-00003.safetensors",
356
+ "model.layers.4.mlp.experts.gate_up_proj_blocks": "model-00001-of-00003.safetensors",
357
+ "model.layers.4.mlp.experts.gate_up_proj_scales": "model-00001-of-00003.safetensors",
358
+ "model.layers.4.mlp.router.bias": "model-00001-of-00003.safetensors",
359
+ "model.layers.4.mlp.router.weight": "model-00001-of-00003.safetensors",
360
+ "model.layers.4.post_attention_layernorm.weight": "model-00001-of-00003.safetensors",
361
+ "model.layers.4.self_attn.k_proj.bias": "model-00001-of-00003.safetensors",
362
+ "model.layers.4.self_attn.k_proj.weight": "model-00001-of-00003.safetensors",
363
+ "model.layers.4.self_attn.o_proj.bias": "model-00001-of-00003.safetensors",
364
+ "model.layers.4.self_attn.o_proj.weight": "model-00001-of-00003.safetensors",
365
+ "model.layers.4.self_attn.q_proj.bias": "model-00001-of-00003.safetensors",
366
+ "model.layers.4.self_attn.q_proj.weight": "model-00001-of-00003.safetensors",
367
+ "model.layers.4.self_attn.sinks": "model-00001-of-00003.safetensors",
368
+ "model.layers.4.self_attn.v_proj.bias": "model-00001-of-00003.safetensors",
369
+ "model.layers.4.self_attn.v_proj.weight": "model-00001-of-00003.safetensors",
370
+ "model.layers.5.input_layernorm.weight": "model-00001-of-00003.safetensors",
371
+ "model.layers.5.mlp.experts.down_proj_bias": "model-00001-of-00003.safetensors",
372
+ "model.layers.5.mlp.experts.down_proj_blocks": "model-00001-of-00003.safetensors",
373
+ "model.layers.5.mlp.experts.down_proj_scales": "model-00001-of-00003.safetensors",
374
+ "model.layers.5.mlp.experts.gate_up_proj_bias": "model-00001-of-00003.safetensors",
375
+ "model.layers.5.mlp.experts.gate_up_proj_blocks": "model-00002-of-00003.safetensors",
376
+ "model.layers.5.mlp.experts.gate_up_proj_scales": "model-00002-of-00003.safetensors",
377
+ "model.layers.5.mlp.router.bias": "model-00002-of-00003.safetensors",
378
+ "model.layers.5.mlp.router.weight": "model-00002-of-00003.safetensors",
379
+ "model.layers.5.post_attention_layernorm.weight": "model-00002-of-00003.safetensors",
380
+ "model.layers.5.self_attn.k_proj.bias": "model-00002-of-00003.safetensors",
381
+ "model.layers.5.self_attn.k_proj.weight": "model-00002-of-00003.safetensors",
382
+ "model.layers.5.self_attn.o_proj.bias": "model-00002-of-00003.safetensors",
383
+ "model.layers.5.self_attn.o_proj.weight": "model-00002-of-00003.safetensors",
384
+ "model.layers.5.self_attn.q_proj.bias": "model-00002-of-00003.safetensors",
385
+ "model.layers.5.self_attn.q_proj.weight": "model-00002-of-00003.safetensors",
386
+ "model.layers.5.self_attn.sinks": "model-00002-of-00003.safetensors",
387
+ "model.layers.5.self_attn.v_proj.bias": "model-00002-of-00003.safetensors",
388
+ "model.layers.5.self_attn.v_proj.weight": "model-00002-of-00003.safetensors",
389
+ "model.layers.6.input_layernorm.weight": "model-00002-of-00003.safetensors",
390
+ "model.layers.6.mlp.experts.down_proj_bias": "model-00002-of-00003.safetensors",
391
+ "model.layers.6.mlp.experts.down_proj_blocks": "model-00002-of-00003.safetensors",
392
+ "model.layers.6.mlp.experts.down_proj_scales": "model-00002-of-00003.safetensors",
393
+ "model.layers.6.mlp.experts.gate_up_proj_bias": "model-00002-of-00003.safetensors",
394
+ "model.layers.6.mlp.experts.gate_up_proj_blocks": "model-00002-of-00003.safetensors",
395
+ "model.layers.6.mlp.experts.gate_up_proj_scales": "model-00002-of-00003.safetensors",
396
+ "model.layers.6.mlp.router.bias": "model-00002-of-00003.safetensors",
397
+ "model.layers.6.mlp.router.weight": "model-00002-of-00003.safetensors",
398
+ "model.layers.6.post_attention_layernorm.weight": "model-00002-of-00003.safetensors",
399
+ "model.layers.6.self_attn.k_proj.bias": "model-00002-of-00003.safetensors",
400
+ "model.layers.6.self_attn.k_proj.weight": "model-00002-of-00003.safetensors",
401
+ "model.layers.6.self_attn.o_proj.bias": "model-00002-of-00003.safetensors",
402
+ "model.layers.6.self_attn.o_proj.weight": "model-00002-of-00003.safetensors",
403
+ "model.layers.6.self_attn.q_proj.bias": "model-00002-of-00003.safetensors",
404
+ "model.layers.6.self_attn.q_proj.weight": "model-00002-of-00003.safetensors",
405
+ "model.layers.6.self_attn.sinks": "model-00002-of-00003.safetensors",
406
+ "model.layers.6.self_attn.v_proj.bias": "model-00002-of-00003.safetensors",
407
+ "model.layers.6.self_attn.v_proj.weight": "model-00002-of-00003.safetensors",
408
+ "model.layers.7.input_layernorm.weight": "model-00002-of-00003.safetensors",
409
+ "model.layers.7.mlp.experts.down_proj_bias": "model-00002-of-00003.safetensors",
410
+ "model.layers.7.mlp.experts.down_proj_blocks": "model-00002-of-00003.safetensors",
411
+ "model.layers.7.mlp.experts.down_proj_scales": "model-00002-of-00003.safetensors",
412
+ "model.layers.7.mlp.experts.gate_up_proj_bias": "model-00002-of-00003.safetensors",
413
+ "model.layers.7.mlp.experts.gate_up_proj_blocks": "model-00002-of-00003.safetensors",
414
+ "model.layers.7.mlp.experts.gate_up_proj_scales": "model-00002-of-00003.safetensors",
415
+ "model.layers.7.mlp.router.bias": "model-00002-of-00003.safetensors",
416
+ "model.layers.7.mlp.router.weight": "model-00002-of-00003.safetensors",
417
+ "model.layers.7.post_attention_layernorm.weight": "model-00002-of-00003.safetensors",
418
+ "model.layers.7.self_attn.k_proj.bias": "model-00002-of-00003.safetensors",
419
+ "model.layers.7.self_attn.k_proj.weight": "model-00002-of-00003.safetensors",
420
+ "model.layers.7.self_attn.o_proj.bias": "model-00002-of-00003.safetensors",
421
+ "model.layers.7.self_attn.o_proj.weight": "model-00002-of-00003.safetensors",
422
+ "model.layers.7.self_attn.q_proj.bias": "model-00002-of-00003.safetensors",
423
+ "model.layers.7.self_attn.q_proj.weight": "model-00002-of-00003.safetensors",
424
+ "model.layers.7.self_attn.sinks": "model-00002-of-00003.safetensors",
425
+ "model.layers.7.self_attn.v_proj.bias": "model-00002-of-00003.safetensors",
426
+ "model.layers.7.self_attn.v_proj.weight": "model-00002-of-00003.safetensors",
427
+ "model.layers.8.input_layernorm.weight": "model-00002-of-00003.safetensors",
428
+ "model.layers.8.mlp.experts.down_proj_bias": "model-00002-of-00003.safetensors",
429
+ "model.layers.8.mlp.experts.down_proj_blocks": "model-00002-of-00003.safetensors",
430
+ "model.layers.8.mlp.experts.down_proj_scales": "model-00002-of-00003.safetensors",
431
+ "model.layers.8.mlp.experts.gate_up_proj_bias": "model-00002-of-00003.safetensors",
432
+ "model.layers.8.mlp.experts.gate_up_proj_blocks": "model-00002-of-00003.safetensors",
433
+ "model.layers.8.mlp.experts.gate_up_proj_scales": "model-00002-of-00003.safetensors",
434
+ "model.layers.8.mlp.router.bias": "model-00002-of-00003.safetensors",
435
+ "model.layers.8.mlp.router.weight": "model-00002-of-00003.safetensors",
436
+ "model.layers.8.post_attention_layernorm.weight": "model-00002-of-00003.safetensors",
437
+ "model.layers.8.self_attn.k_proj.bias": "model-00002-of-00003.safetensors",
438
+ "model.layers.8.self_attn.k_proj.weight": "model-00002-of-00003.safetensors",
439
+ "model.layers.8.self_attn.o_proj.bias": "model-00002-of-00003.safetensors",
440
+ "model.layers.8.self_attn.o_proj.weight": "model-00002-of-00003.safetensors",
441
+ "model.layers.8.self_attn.q_proj.bias": "model-00002-of-00003.safetensors",
442
+ "model.layers.8.self_attn.q_proj.weight": "model-00002-of-00003.safetensors",
443
+ "model.layers.8.self_attn.sinks": "model-00002-of-00003.safetensors",
444
+ "model.layers.8.self_attn.v_proj.bias": "model-00002-of-00003.safetensors",
445
+ "model.layers.8.self_attn.v_proj.weight": "model-00002-of-00003.safetensors",
446
+ "model.layers.9.input_layernorm.weight": "model-00002-of-00003.safetensors",
447
+ "model.layers.9.mlp.experts.down_proj_bias": "model-00002-of-00003.safetensors",
448
+ "model.layers.9.mlp.experts.down_proj_blocks": "model-00002-of-00003.safetensors",
449
+ "model.layers.9.mlp.experts.down_proj_scales": "model-00002-of-00003.safetensors",
450
+ "model.layers.9.mlp.experts.gate_up_proj_bias": "model-00002-of-00003.safetensors",
451
+ "model.layers.9.mlp.experts.gate_up_proj_blocks": "model-00002-of-00003.safetensors",
452
+ "model.layers.9.mlp.experts.gate_up_proj_scales": "model-00002-of-00003.safetensors",
453
+ "model.layers.9.mlp.router.bias": "model-00002-of-00003.safetensors",
454
+ "model.layers.9.mlp.router.weight": "model-00002-of-00003.safetensors",
455
+ "model.layers.9.post_attention_layernorm.weight": "model-00002-of-00003.safetensors",
456
+ "model.layers.9.self_attn.k_proj.bias": "model-00002-of-00003.safetensors",
457
+ "model.layers.9.self_attn.k_proj.weight": "model-00002-of-00003.safetensors",
458
+ "model.layers.9.self_attn.o_proj.bias": "model-00002-of-00003.safetensors",
459
+ "model.layers.9.self_attn.o_proj.weight": "model-00002-of-00003.safetensors",
460
+ "model.layers.9.self_attn.q_proj.bias": "model-00002-of-00003.safetensors",
461
+ "model.layers.9.self_attn.q_proj.weight": "model-00002-of-00003.safetensors",
462
+ "model.layers.9.self_attn.sinks": "model-00002-of-00003.safetensors",
463
+ "model.layers.9.self_attn.v_proj.bias": "model-00002-of-00003.safetensors",
464
+ "model.layers.9.self_attn.v_proj.weight": "model-00002-of-00003.safetensors",
465
+ "model.norm.weight": "model-00003-of-00003.safetensors"
466
+ }
467
+ }
tokenizer/chat_template.jinja ADDED
@@ -0,0 +1,331 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {#-
2
+ In addition to the normal inputs of `messages` and `tools`, this template also accepts the
3
+ following kwargs:
4
+ - "builtin_tools": A list, can contain "browser" and/or "python".
5
+ - "model_identity": A string that optionally describes the model identity.
6
+ - "reasoning_effort": A string that describes the reasoning effort, defaults to "medium".
7
+ #}
8
+
9
+ {#- Tool Definition Rendering ============================================== #}
10
+ {%- macro render_typescript_type(param_spec, required_params, is_nullable=false) -%}
11
+ {%- if param_spec.type == "array" -%}
12
+ {%- if param_spec['items'] -%}
13
+ {%- if param_spec['items']['type'] == "string" -%}
14
+ {{- "string[]" }}
15
+ {%- elif param_spec['items']['type'] == "number" -%}
16
+ {{- "number[]" }}
17
+ {%- elif param_spec['items']['type'] == "integer" -%}
18
+ {{- "number[]" }}
19
+ {%- elif param_spec['items']['type'] == "boolean" -%}
20
+ {{- "boolean[]" }}
21
+ {%- else -%}
22
+ {%- set inner_type = render_typescript_type(param_spec['items'], required_params) -%}
23
+ {%- if inner_type == "object | object" or inner_type|length > 50 -%}
24
+ {{- "any[]" }}
25
+ {%- else -%}
26
+ {{- inner_type + "[]" }}
27
+ {%- endif -%}
28
+ {%- endif -%}
29
+ {%- if param_spec.nullable -%}
30
+ {{- " | null" }}
31
+ {%- endif -%}
32
+ {%- else -%}
33
+ {{- "any[]" }}
34
+ {%- if param_spec.nullable -%}
35
+ {{- " | null" }}
36
+ {%- endif -%}
37
+ {%- endif -%}
38
+ {%- elif param_spec.type is defined and param_spec.type is iterable and param_spec.type is not string and param_spec.type is not mapping and param_spec.type[0] is defined -%}
39
+ {#- Handle array of types like ["object", "object"] from Union[dict, list] #}
40
+ {%- if param_spec.type | length > 1 -%}
41
+ {{- param_spec.type | join(" | ") }}
42
+ {%- else -%}
43
+ {{- param_spec.type[0] }}
44
+ {%- endif -%}
45
+ {%- elif param_spec.oneOf -%}
46
+ {#- Handle oneOf schemas - check for complex unions and fallback to any #}
47
+ {%- set has_object_variants = false -%}
48
+ {%- for variant in param_spec.oneOf -%}
49
+ {%- if variant.type == "object" -%}
50
+ {%- set has_object_variants = true -%}
51
+ {%- endif -%}
52
+ {%- endfor -%}
53
+ {%- if has_object_variants and param_spec.oneOf|length > 1 -%}
54
+ {{- "any" }}
55
+ {%- else -%}
56
+ {%- for variant in param_spec.oneOf -%}
57
+ {{- render_typescript_type(variant, required_params) -}}
58
+ {%- if variant.description %}
59
+ {{- "// " + variant.description }}
60
+ {%- endif -%}
61
+ {%- if variant.default is defined %}
62
+ {{ "// default: " + variant.default|tojson }}
63
+ {%- endif -%}
64
+ {%- if not loop.last %}
65
+ {{- " | " }}
66
+ {% endif -%}
67
+ {%- endfor -%}
68
+ {%- endif -%}
69
+ {%- elif param_spec.type == "string" -%}
70
+ {%- if param_spec.enum -%}
71
+ {{- '"' + param_spec.enum|join('" | "') + '"' -}}
72
+ {%- else -%}
73
+ {{- "string" }}
74
+ {%- if param_spec.nullable %}
75
+ {{- " | null" }}
76
+ {%- endif -%}
77
+ {%- endif -%}
78
+ {%- elif param_spec.type == "number" -%}
79
+ {{- "number" }}
80
+ {%- elif param_spec.type == "integer" -%}
81
+ {{- "number" }}
82
+ {%- elif param_spec.type == "boolean" -%}
83
+ {{- "boolean" }}
84
+
85
+ {%- elif param_spec.type == "object" -%}
86
+ {%- if param_spec.properties -%}
87
+ {{- "{\n" }}
88
+ {%- for prop_name, prop_spec in param_spec.properties.items() -%}
89
+ {{- prop_name -}}
90
+ {%- if prop_name not in (param_spec.required or []) -%}
91
+ {{- "?" }}
92
+ {%- endif -%}
93
+ {{- ": " }}
94
+ {{ render_typescript_type(prop_spec, param_spec.required or []) }}
95
+ {%- if not loop.last -%}
96
+ {{-", " }}
97
+ {%- endif -%}
98
+ {%- endfor -%}
99
+ {{- "}" }}
100
+ {%- else -%}
101
+ {{- "object" }}
102
+ {%- endif -%}
103
+ {%- else -%}
104
+ {{- "any" }}
105
+ {%- endif -%}
106
+ {%- endmacro -%}
107
+
108
+ {%- macro render_tool_namespace(namespace_name, tools) -%}
109
+ {{- "## " + namespace_name + "\n\n" }}
110
+ {{- "namespace " + namespace_name + " {\n\n" }}
111
+ {%- for tool in tools %}
112
+ {%- set tool = tool.function %}
113
+ {{- "// " + tool.description + "\n" }}
114
+ {{- "type "+ tool.name + " = " }}
115
+ {%- if tool.parameters and tool.parameters.properties %}
116
+ {{- "(_: {\n" }}
117
+ {%- for param_name, param_spec in tool.parameters.properties.items() %}
118
+ {%- if param_spec.description %}
119
+ {{- "// " + param_spec.description + "\n" }}
120
+ {%- endif %}
121
+ {{- param_name }}
122
+ {%- if param_name not in (tool.parameters.required or []) -%}
123
+ {{- "?" }}
124
+ {%- endif -%}
125
+ {{- ": " }}
126
+ {{- render_typescript_type(param_spec, tool.parameters.required or []) }}
127
+ {%- if param_spec.default is defined -%}
128
+ {%- if param_spec.enum %}
129
+ {{- ", // default: " + param_spec.default }}
130
+ {%- elif param_spec.oneOf %}
131
+ {{- "// default: " + param_spec.default }}
132
+ {%- else %}
133
+ {{- ", // default: " + param_spec.default|tojson }}
134
+ {%- endif -%}
135
+ {%- endif -%}
136
+ {%- if not loop.last %}
137
+ {{- ",\n" }}
138
+ {%- else %}
139
+ {{- ",\n" }}
140
+ {%- endif -%}
141
+ {%- endfor %}
142
+ {{- "}) => any;\n\n" }}
143
+ {%- else -%}
144
+ {{- "() => any;\n\n" }}
145
+ {%- endif -%}
146
+ {%- endfor %}
147
+ {{- "} // namespace " + namespace_name }}
148
+ {%- endmacro -%}
149
+
150
+ {%- macro render_builtin_tools(browser_tool, python_tool) -%}
151
+ {%- if browser_tool %}
152
+ {{- "## browser\n\n" }}
153
+ {{- "// Tool for browsing.\n" }}
154
+ {{- "// The `cursor` appears in brackets before each browsing display: `[{cursor}]`.\n" }}
155
+ {{- "// Cite information from the tool using the following format:\n" }}
156
+ {{- "// `【{cursor}†L{line_start}(-L{line_end})?】`, for example: `【6†L9-L11】` or `【8†L3】`.\n" }}
157
+ {{- "// Do not quote more than 10 words directly from the tool output.\n" }}
158
+ {{- "// sources=web (default: web)\n" }}
159
+ {{- "namespace browser {\n\n" }}
160
+ {{- "// Searches for information related to `query` and displays `topn` results.\n" }}
161
+ {{- "type search = (_: {\n" }}
162
+ {{- "query: string,\n" }}
163
+ {{- "topn?: number, // default: 10\n" }}
164
+ {{- "source?: string,\n" }}
165
+ {{- "}) => any;\n\n" }}
166
+ {{- "// Opens the link `id` from the page indicated by `cursor` starting at line number `loc`, showing `num_lines` lines.\n" }}
167
+ {{- "// Valid link ids are displayed with the formatting: `【{id}†.*】`.\n" }}
168
+ {{- "// If `cursor` is not provided, the most recent page is implied.\n" }}
169
+ {{- "// If `id` is a string, it is treated as a fully qualified URL associated with `source`.\n" }}
170
+ {{- "// If `loc` is not provided, the viewport will be positioned at the beginning of the document or centered on the most relevant passage, if available.\n" }}
171
+ {{- "// Use this function without `id` to scroll to a new location of an opened page.\n" }}
172
+ {{- "type open = (_: {\n" }}
173
+ {{- "id?: number | string, // default: -1\n" }}
174
+ {{- "cursor?: number, // default: -1\n" }}
175
+ {{- "loc?: number, // default: -1\n" }}
176
+ {{- "num_lines?: number, // default: -1\n" }}
177
+ {{- "view_source?: boolean, // default: false\n" }}
178
+ {{- "source?: string,\n" }}
179
+ {{- "}) => any;\n\n" }}
180
+ {{- "// Finds exact matches of `pattern` in the current page, or the page given by `cursor`.\n" }}
181
+ {{- "type find = (_: {\n" }}
182
+ {{- "pattern: string,\n" }}
183
+ {{- "cursor?: number, // default: -1\n" }}
184
+ {{- "}) => any;\n\n" }}
185
+ {{- "} // namespace browser\n\n" }}
186
+ {%- endif -%}
187
+
188
+ {%- if python_tool %}
189
+ {{- "## python\n\n" }}
190
+ {{- "Use this tool to execute Python code in your chain of thought. The code will not be shown to the user. This tool should be used for internal reasoning, but not for code that is intended to be visible to the user (e.g. when creating plots, tables, or files).\n\n" }}
191
+ {{- "When you send a message containing Python code to python, it will be executed in a stateful Jupyter notebook environment. python will respond with the output of the execution or time out after 120.0 seconds. The drive at '/mnt/data' can be used to save and persist user files. Internet access for this session is UNKNOWN. Depends on the cluster.\n\n" }}
192
+ {%- endif -%}
193
+ {%- endmacro -%}
194
+
195
+ {#- System Message Construction ============================================ #}
196
+ {%- macro build_system_message() -%}
197
+ {%- if model_identity is not defined %}
198
+ {%- set model_identity = "You are ChatGPT, a large language model trained by OpenAI." %}
199
+ {%- endif %}
200
+ {{- model_identity + "\n" }}
201
+ {{- "Knowledge cutoff: 2024-06\n" }}
202
+ {{- "Current date: " + strftime_now("%Y-%m-%d") + "\n\n" }}
203
+ {%- if reasoning_effort is not defined %}
204
+ {%- set reasoning_effort = "medium" %}
205
+ {%- endif %}
206
+ {{- "Reasoning: " + reasoning_effort + "\n\n" }}
207
+ {%- if builtin_tools %}
208
+ {{- "# Tools\n\n" }}
209
+ {%- set available_builtin_tools = namespace(browser=false, python=false) %}
210
+ {%- for tool in builtin_tools %}
211
+ {%- if tool == "browser" %}
212
+ {%- set available_builtin_tools.browser = true %}
213
+ {%- elif tool == "python" %}
214
+ {%- set available_builtin_tools.python = true %}
215
+ {%- endif %}
216
+ {%- endfor %}
217
+ {{- render_builtin_tools(available_builtin_tools.browser, available_builtin_tools.python) }}
218
+ {%- endif -%}
219
+ {{- "# Valid channels: analysis, commentary, final. Channel must be included for every message." }}
220
+ {%- if tools -%}
221
+ {{- "\nCalls to these tools must go to the commentary channel: 'functions'." }}
222
+ {%- endif -%}
223
+ {%- endmacro -%}
224
+
225
+ {#- Main Template Logic ================================================= #}
226
+ {#- Set defaults #}
227
+
228
+ {#- Render system message #}
229
+ {{- "<|start|>system<|message|>" }}
230
+ {{- build_system_message() }}
231
+ {{- "<|end|>" }}
232
+
233
+ {#- Extract developer message #}
234
+ {%- if messages[0].role == "developer" or messages[0].role == "system" %}
235
+ {%- set developer_message = messages[0].content %}
236
+ {%- set loop_messages = messages[1:] %}
237
+ {%- else %}
238
+ {%- set developer_message = "" %}
239
+ {%- set loop_messages = messages %}
240
+ {%- endif %}
241
+
242
+ {#- Render developer message #}
243
+ {%- if developer_message or tools %}
244
+ {{- "<|start|>developer<|message|>" }}
245
+ {%- if developer_message %}
246
+ {{- "# Instructions\n\n" }}
247
+ {{- developer_message }}
248
+ {{- "\n\n" }}
249
+ {%- endif %}
250
+ {%- if tools -%}
251
+ {{- "# Tools\n\n" }}
252
+ {{- render_tool_namespace("functions", tools) }}
253
+ {%- endif -%}
254
+ {{- "<|end|>" }}
255
+ {%- endif %}
256
+
257
+ {#- Render messages #}
258
+ {%- set last_tool_call = namespace(name=none) %}
259
+ {%- for message in loop_messages -%}
260
+ {#- At this point only assistant/user/tool messages should remain #}
261
+ {%- if message.role == 'assistant' -%}
262
+ {#- Checks to ensure the messages are being passed in the format we expect #}
263
+ {%- if "content" in message %}
264
+ {%- if "<|channel|>analysis<|message|>" in message.content or "<|channel|>final<|message|>" in message.content %}
265
+ {{- raise_exception("You have passed a message containing <|channel|> tags in the content field. Instead of doing this, you should pass analysis messages (the string between '<|message|>' and '<|end|>') in the 'thinking' field, and final messages (the string between '<|message|>' and '<|end|>') in the 'content' field.") }}
266
+ {%- endif %}
267
+ {%- endif %}
268
+ {%- if "thinking" in message %}
269
+ {%- if "<|channel|>analysis<|message|>" in message.thinking or "<|channel|>final<|message|>" in message.thinking %}
270
+ {{- raise_exception("You have passed a message containing <|channel|> tags in the thinking field. Instead of doing this, you should pass analysis messages (the string between '<|message|>' and '<|end|>') in the 'thinking' field, and final messages (the string between '<|message|>' and '<|end|>') in the 'content' field.") }}
271
+ {%- endif %}
272
+ {%- endif %}
273
+ {%- if "tool_calls" in message %}
274
+ {#- We need very careful handling here - we want to drop the tool call analysis message if the model #}
275
+ {#- has output a later <|final|> message, but otherwise we want to retain it. This is the only case #}
276
+ {#- when we render CoT/analysis messages in inference. #}
277
+ {%- set future_final_message = namespace(found=false) %}
278
+ {%- for future_message in loop_messages[loop.index:] %}
279
+ {%- if future_message.role == 'assistant' and "tool_calls" not in future_message %}
280
+ {%- set future_final_message.found = true %}
281
+ {%- endif %}
282
+ {%- endfor %}
283
+ {#- We assume max 1 tool call per message, and so we infer the tool call name #}
284
+ {#- in "tool" messages from the most recent assistant tool call name #}
285
+ {%- set tool_call = message.tool_calls[0] %}
286
+ {%- if tool_call.function %}
287
+ {%- set tool_call = tool_call.function %}
288
+ {%- endif %}
289
+ {%- if message.content and message.thinking %}
290
+ {{- raise_exception("Cannot pass both content and thinking in an assistant message with tool calls! Put the analysis message in one or the other, but not both.") }}
291
+ {%- elif message.content and not future_final_message.found %}
292
+ {{- "<|start|>assistant<|channel|>analysis<|message|>" + message.content + "<|end|>" }}
293
+ {%- elif message.thinking and not future_final_message.found %}
294
+ {{- "<|start|>assistant<|channel|>analysis<|message|>" + message.thinking + "<|end|>" }}
295
+ {%- endif %}
296
+ {{- "<|start|>assistant to=" }}
297
+ {{- "functions." + tool_call.name + "<|channel|>commentary " }}
298
+ {{- (tool_call.content_type if tool_call.content_type is defined else "json") + "<|message|>" }}
299
+ {{- tool_call.arguments|tojson }}
300
+ {{- "<|call|>" }}
301
+ {%- set last_tool_call.name = tool_call.name %}
302
+ {%- elif loop.last and not add_generation_prompt %}
303
+ {#- Only render the CoT if the final turn is an assistant turn and add_generation_prompt is false #}
304
+ {#- This is a situation that should only occur in training, never in inference. #}
305
+ {%- if "thinking" in message %}
306
+ {{- "<|start|>assistant<|channel|>analysis<|message|>" + message.thinking + "<|end|>" }}
307
+ {%- endif %}
308
+ {#- <|return|> indicates the end of generation, but <|end|> does not #}
309
+ {#- <|return|> should never be an input to the model, but we include it as the final token #}
310
+ {#- when training, so the model learns to emit it. #}
311
+ {{- "<|start|>assistant<|channel|>final<|message|>" + message.content + "<|return|>" }}
312
+ {%- else %}
313
+ {#- CoT is dropped during all previous turns, so we never render it for inference #}
314
+ {{- "<|start|>assistant<|channel|>final<|message|>" + message.content + "<|end|>" }}
315
+ {%- set last_tool_call.name = none %}
316
+ {%- endif %}
317
+ {%- elif message.role == 'tool' -%}
318
+ {%- if last_tool_call.name is none %}
319
+ {{- raise_exception("Message has tool role, but there was no previous assistant message with a tool call!") }}
320
+ {%- endif %}
321
+ {{- "<|start|>functions." + last_tool_call.name }}
322
+ {{- " to=assistant<|channel|>commentary<|message|>" + message.content|tojson + "<|end|>" }}
323
+ {%- elif message.role == 'user' -%}
324
+ {{- "<|start|>user<|message|>" + message.content + "<|end|>" }}
325
+ {%- endif -%}
326
+ {%- endfor -%}
327
+
328
+ {#- Generation prompt #}
329
+ {%- if add_generation_prompt -%}
330
+ <|start|>assistant
331
+ {%- endif -%}
tokenizer/tokenizer.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0614fe83cadab421296e664e1f48f4261fa8fef6e03e63bb75c20f38e37d07d3
3
+ size 27868174
tokenizer/tokenizer_config.json ADDED
@@ -0,0 +1,15 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "backend": "tokenizers",
3
+ "bos_token": "<|startoftext|>",
4
+ "clean_up_tokenization_spaces": false,
5
+ "eos_token": "<|return|>",
6
+ "is_local": false,
7
+ "local_files_only": false,
8
+ "model_input_names": [
9
+ "input_ids",
10
+ "attention_mask"
11
+ ],
12
+ "model_max_length": 1000000000000000019884624838656,
13
+ "pad_token": "<|endoftext|>",
14
+ "tokenizer_class": "TokenizersBackend"
15
+ }
transformer/config.json ADDED
@@ -0,0 +1,476 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_class_name": "LensTransformer2DModel",
3
+ "_diffusers_version": "0.38.0",
4
+ "_name_or_path": "microsoft/Lens",
5
+ "attention_head_dim": 64,
6
+ "axes_dims_rope": [
7
+ 8,
8
+ 28,
9
+ 28
10
+ ],
11
+ "enc_hidden_dim": 2880,
12
+ "gate_mlp": true,
13
+ "in_channels": 128,
14
+ "inner_dim": 1536,
15
+ "multi_layer_encoder_feature": true,
16
+ "num_attention_heads": 24,
17
+ "num_layers": 48,
18
+ "out_channels": 32,
19
+ "patch_size": 2,
20
+ "quantization_config": {
21
+ "add_skip_keys": false,
22
+ "dequantize_fp32": false,
23
+ "dynamic_loss_threshold": null,
24
+ "group_size": 0,
25
+ "hadamard_group_size": 128,
26
+ "is_integer": true,
27
+ "is_training": false,
28
+ "modules_dtype_dict": {},
29
+ "modules_quant_config": {},
30
+ "modules_to_not_convert": [
31
+ ".emb_in",
32
+ ".emb_out",
33
+ "norm",
34
+ ".y_embedder",
35
+ "patch_emb",
36
+ "lm_head",
37
+ ".condition_embedder",
38
+ ".norm_out",
39
+ ".t_embedder",
40
+ "patch_embedding",
41
+ ".vid_in",
42
+ ".txt_in",
43
+ ".txt_out",
44
+ ".time_embed",
45
+ "*.img_mod.*",
46
+ ".proj_out",
47
+ ".img_out",
48
+ "*.txt_mod.*",
49
+ ".context_embedder",
50
+ ".vid_out",
51
+ "time_text_embed",
52
+ "patch_embed",
53
+ "wte",
54
+ ".img_in",
55
+ ".final_layer",
56
+ ".x_embedder",
57
+ "multi_modal_projector",
58
+ "pos_embed",
59
+ "txt_norm.0.weight",
60
+ "txt_norm.1.weight",
61
+ "txt_norm.2.weight",
62
+ "txt_norm.3.weight",
63
+ "transformer_blocks.0.attn.norm_q.weight",
64
+ "transformer_blocks.0.attn.norm_k.weight",
65
+ "transformer_blocks.0.attn.norm_added_q.weight",
66
+ "transformer_blocks.0.attn.norm_added_k.weight",
67
+ "transformer_blocks.0.img_norm1.weight",
68
+ "transformer_blocks.0.img_norm2.weight",
69
+ "transformer_blocks.0.txt_norm1.weight",
70
+ "transformer_blocks.0.txt_norm2.weight",
71
+ "transformer_blocks.1.attn.norm_q.weight",
72
+ "transformer_blocks.1.attn.norm_k.weight",
73
+ "transformer_blocks.1.attn.norm_added_q.weight",
74
+ "transformer_blocks.1.attn.norm_added_k.weight",
75
+ "transformer_blocks.1.img_norm1.weight",
76
+ "transformer_blocks.1.img_norm2.weight",
77
+ "transformer_blocks.1.txt_norm1.weight",
78
+ "transformer_blocks.1.txt_norm2.weight",
79
+ "transformer_blocks.2.attn.norm_q.weight",
80
+ "transformer_blocks.2.attn.norm_k.weight",
81
+ "transformer_blocks.2.attn.norm_added_q.weight",
82
+ "transformer_blocks.2.attn.norm_added_k.weight",
83
+ "transformer_blocks.2.img_norm1.weight",
84
+ "transformer_blocks.2.img_norm2.weight",
85
+ "transformer_blocks.2.txt_norm1.weight",
86
+ "transformer_blocks.2.txt_norm2.weight",
87
+ "transformer_blocks.3.attn.norm_q.weight",
88
+ "transformer_blocks.3.attn.norm_k.weight",
89
+ "transformer_blocks.3.attn.norm_added_q.weight",
90
+ "transformer_blocks.3.attn.norm_added_k.weight",
91
+ "transformer_blocks.3.img_norm1.weight",
92
+ "transformer_blocks.3.img_norm2.weight",
93
+ "transformer_blocks.3.txt_norm1.weight",
94
+ "transformer_blocks.3.txt_norm2.weight",
95
+ "transformer_blocks.4.attn.norm_q.weight",
96
+ "transformer_blocks.4.attn.norm_k.weight",
97
+ "transformer_blocks.4.attn.norm_added_q.weight",
98
+ "transformer_blocks.4.attn.norm_added_k.weight",
99
+ "transformer_blocks.4.img_norm1.weight",
100
+ "transformer_blocks.4.img_norm2.weight",
101
+ "transformer_blocks.4.txt_norm1.weight",
102
+ "transformer_blocks.4.txt_norm2.weight",
103
+ "transformer_blocks.5.attn.norm_q.weight",
104
+ "transformer_blocks.5.attn.norm_k.weight",
105
+ "transformer_blocks.5.attn.norm_added_q.weight",
106
+ "transformer_blocks.5.attn.norm_added_k.weight",
107
+ "transformer_blocks.5.img_norm1.weight",
108
+ "transformer_blocks.5.img_norm2.weight",
109
+ "transformer_blocks.5.txt_norm1.weight",
110
+ "transformer_blocks.5.txt_norm2.weight",
111
+ "transformer_blocks.6.attn.norm_q.weight",
112
+ "transformer_blocks.6.attn.norm_k.weight",
113
+ "transformer_blocks.6.attn.norm_added_q.weight",
114
+ "transformer_blocks.6.attn.norm_added_k.weight",
115
+ "transformer_blocks.6.img_norm1.weight",
116
+ "transformer_blocks.6.img_norm2.weight",
117
+ "transformer_blocks.6.txt_norm1.weight",
118
+ "transformer_blocks.6.txt_norm2.weight",
119
+ "transformer_blocks.7.attn.norm_q.weight",
120
+ "transformer_blocks.7.attn.norm_k.weight",
121
+ "transformer_blocks.7.attn.norm_added_q.weight",
122
+ "transformer_blocks.7.attn.norm_added_k.weight",
123
+ "transformer_blocks.7.img_norm1.weight",
124
+ "transformer_blocks.7.img_norm2.weight",
125
+ "transformer_blocks.7.txt_norm1.weight",
126
+ "transformer_blocks.7.txt_norm2.weight",
127
+ "transformer_blocks.8.attn.norm_q.weight",
128
+ "transformer_blocks.8.attn.norm_k.weight",
129
+ "transformer_blocks.8.attn.norm_added_q.weight",
130
+ "transformer_blocks.8.attn.norm_added_k.weight",
131
+ "transformer_blocks.8.img_norm1.weight",
132
+ "transformer_blocks.8.img_norm2.weight",
133
+ "transformer_blocks.8.txt_norm1.weight",
134
+ "transformer_blocks.8.txt_norm2.weight",
135
+ "transformer_blocks.9.attn.norm_q.weight",
136
+ "transformer_blocks.9.attn.norm_k.weight",
137
+ "transformer_blocks.9.attn.norm_added_q.weight",
138
+ "transformer_blocks.9.attn.norm_added_k.weight",
139
+ "transformer_blocks.9.img_norm1.weight",
140
+ "transformer_blocks.9.img_norm2.weight",
141
+ "transformer_blocks.9.txt_norm1.weight",
142
+ "transformer_blocks.9.txt_norm2.weight",
143
+ "transformer_blocks.10.attn.norm_q.weight",
144
+ "transformer_blocks.10.attn.norm_k.weight",
145
+ "transformer_blocks.10.attn.norm_added_q.weight",
146
+ "transformer_blocks.10.attn.norm_added_k.weight",
147
+ "transformer_blocks.10.img_norm1.weight",
148
+ "transformer_blocks.10.img_norm2.weight",
149
+ "transformer_blocks.10.txt_norm1.weight",
150
+ "transformer_blocks.10.txt_norm2.weight",
151
+ "transformer_blocks.11.attn.norm_q.weight",
152
+ "transformer_blocks.11.attn.norm_k.weight",
153
+ "transformer_blocks.11.attn.norm_added_q.weight",
154
+ "transformer_blocks.11.attn.norm_added_k.weight",
155
+ "transformer_blocks.11.img_norm1.weight",
156
+ "transformer_blocks.11.img_norm2.weight",
157
+ "transformer_blocks.11.txt_norm1.weight",
158
+ "transformer_blocks.11.txt_norm2.weight",
159
+ "transformer_blocks.12.attn.norm_q.weight",
160
+ "transformer_blocks.12.attn.norm_k.weight",
161
+ "transformer_blocks.12.attn.norm_added_q.weight",
162
+ "transformer_blocks.12.attn.norm_added_k.weight",
163
+ "transformer_blocks.12.img_norm1.weight",
164
+ "transformer_blocks.12.img_norm2.weight",
165
+ "transformer_blocks.12.txt_norm1.weight",
166
+ "transformer_blocks.12.txt_norm2.weight",
167
+ "transformer_blocks.13.attn.norm_q.weight",
168
+ "transformer_blocks.13.attn.norm_k.weight",
169
+ "transformer_blocks.13.attn.norm_added_q.weight",
170
+ "transformer_blocks.13.attn.norm_added_k.weight",
171
+ "transformer_blocks.13.img_norm1.weight",
172
+ "transformer_blocks.13.img_norm2.weight",
173
+ "transformer_blocks.13.txt_norm1.weight",
174
+ "transformer_blocks.13.txt_norm2.weight",
175
+ "transformer_blocks.14.attn.norm_q.weight",
176
+ "transformer_blocks.14.attn.norm_k.weight",
177
+ "transformer_blocks.14.attn.norm_added_q.weight",
178
+ "transformer_blocks.14.attn.norm_added_k.weight",
179
+ "transformer_blocks.14.img_norm1.weight",
180
+ "transformer_blocks.14.img_norm2.weight",
181
+ "transformer_blocks.14.txt_norm1.weight",
182
+ "transformer_blocks.14.txt_norm2.weight",
183
+ "transformer_blocks.15.attn.norm_q.weight",
184
+ "transformer_blocks.15.attn.norm_k.weight",
185
+ "transformer_blocks.15.attn.norm_added_q.weight",
186
+ "transformer_blocks.15.attn.norm_added_k.weight",
187
+ "transformer_blocks.15.img_norm1.weight",
188
+ "transformer_blocks.15.img_norm2.weight",
189
+ "transformer_blocks.15.txt_norm1.weight",
190
+ "transformer_blocks.15.txt_norm2.weight",
191
+ "transformer_blocks.16.attn.norm_q.weight",
192
+ "transformer_blocks.16.attn.norm_k.weight",
193
+ "transformer_blocks.16.attn.norm_added_q.weight",
194
+ "transformer_blocks.16.attn.norm_added_k.weight",
195
+ "transformer_blocks.16.img_norm1.weight",
196
+ "transformer_blocks.16.img_norm2.weight",
197
+ "transformer_blocks.16.txt_norm1.weight",
198
+ "transformer_blocks.16.txt_norm2.weight",
199
+ "transformer_blocks.17.attn.norm_q.weight",
200
+ "transformer_blocks.17.attn.norm_k.weight",
201
+ "transformer_blocks.17.attn.norm_added_q.weight",
202
+ "transformer_blocks.17.attn.norm_added_k.weight",
203
+ "transformer_blocks.17.img_norm1.weight",
204
+ "transformer_blocks.17.img_norm2.weight",
205
+ "transformer_blocks.17.txt_norm1.weight",
206
+ "transformer_blocks.17.txt_norm2.weight",
207
+ "transformer_blocks.18.attn.norm_q.weight",
208
+ "transformer_blocks.18.attn.norm_k.weight",
209
+ "transformer_blocks.18.attn.norm_added_q.weight",
210
+ "transformer_blocks.18.attn.norm_added_k.weight",
211
+ "transformer_blocks.18.img_norm1.weight",
212
+ "transformer_blocks.18.img_norm2.weight",
213
+ "transformer_blocks.18.txt_norm1.weight",
214
+ "transformer_blocks.18.txt_norm2.weight",
215
+ "transformer_blocks.19.attn.norm_q.weight",
216
+ "transformer_blocks.19.attn.norm_k.weight",
217
+ "transformer_blocks.19.attn.norm_added_q.weight",
218
+ "transformer_blocks.19.attn.norm_added_k.weight",
219
+ "transformer_blocks.19.img_norm1.weight",
220
+ "transformer_blocks.19.img_norm2.weight",
221
+ "transformer_blocks.19.txt_norm1.weight",
222
+ "transformer_blocks.19.txt_norm2.weight",
223
+ "transformer_blocks.20.attn.norm_q.weight",
224
+ "transformer_blocks.20.attn.norm_k.weight",
225
+ "transformer_blocks.20.attn.norm_added_q.weight",
226
+ "transformer_blocks.20.attn.norm_added_k.weight",
227
+ "transformer_blocks.20.img_norm1.weight",
228
+ "transformer_blocks.20.img_norm2.weight",
229
+ "transformer_blocks.20.txt_norm1.weight",
230
+ "transformer_blocks.20.txt_norm2.weight",
231
+ "transformer_blocks.21.attn.norm_q.weight",
232
+ "transformer_blocks.21.attn.norm_k.weight",
233
+ "transformer_blocks.21.attn.norm_added_q.weight",
234
+ "transformer_blocks.21.attn.norm_added_k.weight",
235
+ "transformer_blocks.21.img_norm1.weight",
236
+ "transformer_blocks.21.img_norm2.weight",
237
+ "transformer_blocks.21.txt_norm1.weight",
238
+ "transformer_blocks.21.txt_norm2.weight",
239
+ "transformer_blocks.22.attn.norm_q.weight",
240
+ "transformer_blocks.22.attn.norm_k.weight",
241
+ "transformer_blocks.22.attn.norm_added_q.weight",
242
+ "transformer_blocks.22.attn.norm_added_k.weight",
243
+ "transformer_blocks.22.img_norm1.weight",
244
+ "transformer_blocks.22.img_norm2.weight",
245
+ "transformer_blocks.22.txt_norm1.weight",
246
+ "transformer_blocks.22.txt_norm2.weight",
247
+ "transformer_blocks.23.attn.norm_q.weight",
248
+ "transformer_blocks.23.attn.norm_k.weight",
249
+ "transformer_blocks.23.attn.norm_added_q.weight",
250
+ "transformer_blocks.23.attn.norm_added_k.weight",
251
+ "transformer_blocks.23.img_norm1.weight",
252
+ "transformer_blocks.23.img_norm2.weight",
253
+ "transformer_blocks.23.txt_norm1.weight",
254
+ "transformer_blocks.23.txt_norm2.weight",
255
+ "transformer_blocks.24.attn.norm_q.weight",
256
+ "transformer_blocks.24.attn.norm_k.weight",
257
+ "transformer_blocks.24.attn.norm_added_q.weight",
258
+ "transformer_blocks.24.attn.norm_added_k.weight",
259
+ "transformer_blocks.24.img_norm1.weight",
260
+ "transformer_blocks.24.img_norm2.weight",
261
+ "transformer_blocks.24.txt_norm1.weight",
262
+ "transformer_blocks.24.txt_norm2.weight",
263
+ "transformer_blocks.25.attn.norm_q.weight",
264
+ "transformer_blocks.25.attn.norm_k.weight",
265
+ "transformer_blocks.25.attn.norm_added_q.weight",
266
+ "transformer_blocks.25.attn.norm_added_k.weight",
267
+ "transformer_blocks.25.img_norm1.weight",
268
+ "transformer_blocks.25.img_norm2.weight",
269
+ "transformer_blocks.25.txt_norm1.weight",
270
+ "transformer_blocks.25.txt_norm2.weight",
271
+ "transformer_blocks.26.attn.norm_q.weight",
272
+ "transformer_blocks.26.attn.norm_k.weight",
273
+ "transformer_blocks.26.attn.norm_added_q.weight",
274
+ "transformer_blocks.26.attn.norm_added_k.weight",
275
+ "transformer_blocks.26.img_norm1.weight",
276
+ "transformer_blocks.26.img_norm2.weight",
277
+ "transformer_blocks.26.txt_norm1.weight",
278
+ "transformer_blocks.26.txt_norm2.weight",
279
+ "transformer_blocks.27.attn.norm_q.weight",
280
+ "transformer_blocks.27.attn.norm_k.weight",
281
+ "transformer_blocks.27.attn.norm_added_q.weight",
282
+ "transformer_blocks.27.attn.norm_added_k.weight",
283
+ "transformer_blocks.27.img_norm1.weight",
284
+ "transformer_blocks.27.img_norm2.weight",
285
+ "transformer_blocks.27.txt_norm1.weight",
286
+ "transformer_blocks.27.txt_norm2.weight",
287
+ "transformer_blocks.28.attn.norm_q.weight",
288
+ "transformer_blocks.28.attn.norm_k.weight",
289
+ "transformer_blocks.28.attn.norm_added_q.weight",
290
+ "transformer_blocks.28.attn.norm_added_k.weight",
291
+ "transformer_blocks.28.img_norm1.weight",
292
+ "transformer_blocks.28.img_norm2.weight",
293
+ "transformer_blocks.28.txt_norm1.weight",
294
+ "transformer_blocks.28.txt_norm2.weight",
295
+ "transformer_blocks.29.attn.norm_q.weight",
296
+ "transformer_blocks.29.attn.norm_k.weight",
297
+ "transformer_blocks.29.attn.norm_added_q.weight",
298
+ "transformer_blocks.29.attn.norm_added_k.weight",
299
+ "transformer_blocks.29.img_norm1.weight",
300
+ "transformer_blocks.29.img_norm2.weight",
301
+ "transformer_blocks.29.txt_norm1.weight",
302
+ "transformer_blocks.29.txt_norm2.weight",
303
+ "transformer_blocks.30.attn.norm_q.weight",
304
+ "transformer_blocks.30.attn.norm_k.weight",
305
+ "transformer_blocks.30.attn.norm_added_q.weight",
306
+ "transformer_blocks.30.attn.norm_added_k.weight",
307
+ "transformer_blocks.30.img_norm1.weight",
308
+ "transformer_blocks.30.img_norm2.weight",
309
+ "transformer_blocks.30.txt_norm1.weight",
310
+ "transformer_blocks.30.txt_norm2.weight",
311
+ "transformer_blocks.31.attn.norm_q.weight",
312
+ "transformer_blocks.31.attn.norm_k.weight",
313
+ "transformer_blocks.31.attn.norm_added_q.weight",
314
+ "transformer_blocks.31.attn.norm_added_k.weight",
315
+ "transformer_blocks.31.img_norm1.weight",
316
+ "transformer_blocks.31.img_norm2.weight",
317
+ "transformer_blocks.31.txt_norm1.weight",
318
+ "transformer_blocks.31.txt_norm2.weight",
319
+ "transformer_blocks.32.attn.norm_q.weight",
320
+ "transformer_blocks.32.attn.norm_k.weight",
321
+ "transformer_blocks.32.attn.norm_added_q.weight",
322
+ "transformer_blocks.32.attn.norm_added_k.weight",
323
+ "transformer_blocks.32.img_norm1.weight",
324
+ "transformer_blocks.32.img_norm2.weight",
325
+ "transformer_blocks.32.txt_norm1.weight",
326
+ "transformer_blocks.32.txt_norm2.weight",
327
+ "transformer_blocks.33.attn.norm_q.weight",
328
+ "transformer_blocks.33.attn.norm_k.weight",
329
+ "transformer_blocks.33.attn.norm_added_q.weight",
330
+ "transformer_blocks.33.attn.norm_added_k.weight",
331
+ "transformer_blocks.33.img_norm1.weight",
332
+ "transformer_blocks.33.img_norm2.weight",
333
+ "transformer_blocks.33.txt_norm1.weight",
334
+ "transformer_blocks.33.txt_norm2.weight",
335
+ "transformer_blocks.34.attn.norm_q.weight",
336
+ "transformer_blocks.34.attn.norm_k.weight",
337
+ "transformer_blocks.34.attn.norm_added_q.weight",
338
+ "transformer_blocks.34.attn.norm_added_k.weight",
339
+ "transformer_blocks.34.img_norm1.weight",
340
+ "transformer_blocks.34.img_norm2.weight",
341
+ "transformer_blocks.34.txt_norm1.weight",
342
+ "transformer_blocks.34.txt_norm2.weight",
343
+ "transformer_blocks.35.attn.norm_q.weight",
344
+ "transformer_blocks.35.attn.norm_k.weight",
345
+ "transformer_blocks.35.attn.norm_added_q.weight",
346
+ "transformer_blocks.35.attn.norm_added_k.weight",
347
+ "transformer_blocks.35.img_norm1.weight",
348
+ "transformer_blocks.35.img_norm2.weight",
349
+ "transformer_blocks.35.txt_norm1.weight",
350
+ "transformer_blocks.35.txt_norm2.weight",
351
+ "transformer_blocks.36.attn.norm_q.weight",
352
+ "transformer_blocks.36.attn.norm_k.weight",
353
+ "transformer_blocks.36.attn.norm_added_q.weight",
354
+ "transformer_blocks.36.attn.norm_added_k.weight",
355
+ "transformer_blocks.36.img_norm1.weight",
356
+ "transformer_blocks.36.img_norm2.weight",
357
+ "transformer_blocks.36.txt_norm1.weight",
358
+ "transformer_blocks.36.txt_norm2.weight",
359
+ "transformer_blocks.37.attn.norm_q.weight",
360
+ "transformer_blocks.37.attn.norm_k.weight",
361
+ "transformer_blocks.37.attn.norm_added_q.weight",
362
+ "transformer_blocks.37.attn.norm_added_k.weight",
363
+ "transformer_blocks.37.img_norm1.weight",
364
+ "transformer_blocks.37.img_norm2.weight",
365
+ "transformer_blocks.37.txt_norm1.weight",
366
+ "transformer_blocks.37.txt_norm2.weight",
367
+ "transformer_blocks.38.attn.norm_q.weight",
368
+ "transformer_blocks.38.attn.norm_k.weight",
369
+ "transformer_blocks.38.attn.norm_added_q.weight",
370
+ "transformer_blocks.38.attn.norm_added_k.weight",
371
+ "transformer_blocks.38.img_norm1.weight",
372
+ "transformer_blocks.38.img_norm2.weight",
373
+ "transformer_blocks.38.txt_norm1.weight",
374
+ "transformer_blocks.38.txt_norm2.weight",
375
+ "transformer_blocks.39.attn.norm_q.weight",
376
+ "transformer_blocks.39.attn.norm_k.weight",
377
+ "transformer_blocks.39.attn.norm_added_q.weight",
378
+ "transformer_blocks.39.attn.norm_added_k.weight",
379
+ "transformer_blocks.39.img_norm1.weight",
380
+ "transformer_blocks.39.img_norm2.weight",
381
+ "transformer_blocks.39.txt_norm1.weight",
382
+ "transformer_blocks.39.txt_norm2.weight",
383
+ "transformer_blocks.40.attn.norm_q.weight",
384
+ "transformer_blocks.40.attn.norm_k.weight",
385
+ "transformer_blocks.40.attn.norm_added_q.weight",
386
+ "transformer_blocks.40.attn.norm_added_k.weight",
387
+ "transformer_blocks.40.img_norm1.weight",
388
+ "transformer_blocks.40.img_norm2.weight",
389
+ "transformer_blocks.40.txt_norm1.weight",
390
+ "transformer_blocks.40.txt_norm2.weight",
391
+ "transformer_blocks.41.attn.norm_q.weight",
392
+ "transformer_blocks.41.attn.norm_k.weight",
393
+ "transformer_blocks.41.attn.norm_added_q.weight",
394
+ "transformer_blocks.41.attn.norm_added_k.weight",
395
+ "transformer_blocks.41.img_norm1.weight",
396
+ "transformer_blocks.41.img_norm2.weight",
397
+ "transformer_blocks.41.txt_norm1.weight",
398
+ "transformer_blocks.41.txt_norm2.weight",
399
+ "transformer_blocks.42.attn.norm_q.weight",
400
+ "transformer_blocks.42.attn.norm_k.weight",
401
+ "transformer_blocks.42.attn.norm_added_q.weight",
402
+ "transformer_blocks.42.attn.norm_added_k.weight",
403
+ "transformer_blocks.42.img_norm1.weight",
404
+ "transformer_blocks.42.img_norm2.weight",
405
+ "transformer_blocks.42.txt_norm1.weight",
406
+ "transformer_blocks.42.txt_norm2.weight",
407
+ "transformer_blocks.43.attn.norm_q.weight",
408
+ "transformer_blocks.43.attn.norm_k.weight",
409
+ "transformer_blocks.43.attn.norm_added_q.weight",
410
+ "transformer_blocks.43.attn.norm_added_k.weight",
411
+ "transformer_blocks.43.img_norm1.weight",
412
+ "transformer_blocks.43.img_norm2.weight",
413
+ "transformer_blocks.43.txt_norm1.weight",
414
+ "transformer_blocks.43.txt_norm2.weight",
415
+ "transformer_blocks.44.attn.norm_q.weight",
416
+ "transformer_blocks.44.attn.norm_k.weight",
417
+ "transformer_blocks.44.attn.norm_added_q.weight",
418
+ "transformer_blocks.44.attn.norm_added_k.weight",
419
+ "transformer_blocks.44.img_norm1.weight",
420
+ "transformer_blocks.44.img_norm2.weight",
421
+ "transformer_blocks.44.txt_norm1.weight",
422
+ "transformer_blocks.44.txt_norm2.weight",
423
+ "transformer_blocks.45.attn.norm_q.weight",
424
+ "transformer_blocks.45.attn.norm_k.weight",
425
+ "transformer_blocks.45.attn.norm_added_q.weight",
426
+ "transformer_blocks.45.attn.norm_added_k.weight",
427
+ "transformer_blocks.45.img_norm1.weight",
428
+ "transformer_blocks.45.img_norm2.weight",
429
+ "transformer_blocks.45.txt_norm1.weight",
430
+ "transformer_blocks.45.txt_norm2.weight",
431
+ "transformer_blocks.46.attn.norm_q.weight",
432
+ "transformer_blocks.46.attn.norm_k.weight",
433
+ "transformer_blocks.46.attn.norm_added_q.weight",
434
+ "transformer_blocks.46.attn.norm_added_k.weight",
435
+ "transformer_blocks.46.img_norm1.weight",
436
+ "transformer_blocks.46.img_norm2.weight",
437
+ "transformer_blocks.46.txt_norm1.weight",
438
+ "transformer_blocks.46.txt_norm2.weight",
439
+ "transformer_blocks.47.attn.norm_q.weight",
440
+ "transformer_blocks.47.attn.norm_k.weight",
441
+ "transformer_blocks.47.attn.norm_added_q.weight",
442
+ "transformer_blocks.47.attn.norm_added_k.weight",
443
+ "transformer_blocks.47.img_norm1.weight",
444
+ "transformer_blocks.47.img_norm2.weight",
445
+ "transformer_blocks.47.txt_norm1.weight",
446
+ "transformer_blocks.47.txt_norm2.weight"
447
+ ],
448
+ "modules_to_not_use_matmul": [],
449
+ "non_blocking": false,
450
+ "quant_conv": false,
451
+ "quant_embedding": false,
452
+ "quant_method": "sdnq",
453
+ "quantization_device": null,
454
+ "quantized_matmul_dtype": "int8",
455
+ "return_device": null,
456
+ "sdnq_version": "0.2.0",
457
+ "svd_rank": 32,
458
+ "svd_steps": 8,
459
+ "use_dynamic_quantization": false,
460
+ "use_grad_ckpt": true,
461
+ "use_hadamard": false,
462
+ "use_quantized_matmul": true,
463
+ "use_quantized_matmul_conv": false,
464
+ "use_static_quantization": true,
465
+ "use_stochastic_rounding": false,
466
+ "use_svd": false,
467
+ "weights_dtype": "uint4"
468
+ },
469
+ "rms_norm": true,
470
+ "selected_layer_index": [
471
+ 5,
472
+ 11,
473
+ 17,
474
+ 23
475
+ ]
476
+ }
transformer/diffusion_pytorch_model-00001-of-00002.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:abd3791d4c163f82fb8e95f7f53bd7af38043e24b19bc5bcab600e2c2633ec87
3
+ size 3987262976
transformer/diffusion_pytorch_model-00002-of-00002.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1065a7a189f5d7dbe23820538667563f615c92685e566e2c8b7d8777ea350c5e
3
+ size 314450920
transformer/diffusion_pytorch_model.safetensors.index.json ADDED
The diff for this file is too large to render. See raw diff
 
transformer/quantization_config.json ADDED
@@ -0,0 +1,449 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "add_skip_keys": false,
3
+ "dequantize_fp32": false,
4
+ "dynamic_loss_threshold": null,
5
+ "group_size": 0,
6
+ "hadamard_group_size": 128,
7
+ "is_integer": true,
8
+ "is_training": false,
9
+ "modules_dtype_dict": {},
10
+ "modules_quant_config": {},
11
+ "modules_to_not_convert": [
12
+ ".emb_in",
13
+ ".emb_out",
14
+ "norm",
15
+ ".y_embedder",
16
+ "patch_emb",
17
+ "lm_head",
18
+ ".condition_embedder",
19
+ ".norm_out",
20
+ ".t_embedder",
21
+ "patch_embedding",
22
+ ".vid_in",
23
+ ".txt_in",
24
+ ".txt_out",
25
+ ".time_embed",
26
+ "*.img_mod.*",
27
+ ".proj_out",
28
+ ".img_out",
29
+ "*.txt_mod.*",
30
+ ".context_embedder",
31
+ ".vid_out",
32
+ "time_text_embed",
33
+ "patch_embed",
34
+ "wte",
35
+ ".img_in",
36
+ ".final_layer",
37
+ ".x_embedder",
38
+ "multi_modal_projector",
39
+ "pos_embed",
40
+ "txt_norm.0.weight",
41
+ "txt_norm.1.weight",
42
+ "txt_norm.2.weight",
43
+ "txt_norm.3.weight",
44
+ "transformer_blocks.0.attn.norm_q.weight",
45
+ "transformer_blocks.0.attn.norm_k.weight",
46
+ "transformer_blocks.0.attn.norm_added_q.weight",
47
+ "transformer_blocks.0.attn.norm_added_k.weight",
48
+ "transformer_blocks.0.img_norm1.weight",
49
+ "transformer_blocks.0.img_norm2.weight",
50
+ "transformer_blocks.0.txt_norm1.weight",
51
+ "transformer_blocks.0.txt_norm2.weight",
52
+ "transformer_blocks.1.attn.norm_q.weight",
53
+ "transformer_blocks.1.attn.norm_k.weight",
54
+ "transformer_blocks.1.attn.norm_added_q.weight",
55
+ "transformer_blocks.1.attn.norm_added_k.weight",
56
+ "transformer_blocks.1.img_norm1.weight",
57
+ "transformer_blocks.1.img_norm2.weight",
58
+ "transformer_blocks.1.txt_norm1.weight",
59
+ "transformer_blocks.1.txt_norm2.weight",
60
+ "transformer_blocks.2.attn.norm_q.weight",
61
+ "transformer_blocks.2.attn.norm_k.weight",
62
+ "transformer_blocks.2.attn.norm_added_q.weight",
63
+ "transformer_blocks.2.attn.norm_added_k.weight",
64
+ "transformer_blocks.2.img_norm1.weight",
65
+ "transformer_blocks.2.img_norm2.weight",
66
+ "transformer_blocks.2.txt_norm1.weight",
67
+ "transformer_blocks.2.txt_norm2.weight",
68
+ "transformer_blocks.3.attn.norm_q.weight",
69
+ "transformer_blocks.3.attn.norm_k.weight",
70
+ "transformer_blocks.3.attn.norm_added_q.weight",
71
+ "transformer_blocks.3.attn.norm_added_k.weight",
72
+ "transformer_blocks.3.img_norm1.weight",
73
+ "transformer_blocks.3.img_norm2.weight",
74
+ "transformer_blocks.3.txt_norm1.weight",
75
+ "transformer_blocks.3.txt_norm2.weight",
76
+ "transformer_blocks.4.attn.norm_q.weight",
77
+ "transformer_blocks.4.attn.norm_k.weight",
78
+ "transformer_blocks.4.attn.norm_added_q.weight",
79
+ "transformer_blocks.4.attn.norm_added_k.weight",
80
+ "transformer_blocks.4.img_norm1.weight",
81
+ "transformer_blocks.4.img_norm2.weight",
82
+ "transformer_blocks.4.txt_norm1.weight",
83
+ "transformer_blocks.4.txt_norm2.weight",
84
+ "transformer_blocks.5.attn.norm_q.weight",
85
+ "transformer_blocks.5.attn.norm_k.weight",
86
+ "transformer_blocks.5.attn.norm_added_q.weight",
87
+ "transformer_blocks.5.attn.norm_added_k.weight",
88
+ "transformer_blocks.5.img_norm1.weight",
89
+ "transformer_blocks.5.img_norm2.weight",
90
+ "transformer_blocks.5.txt_norm1.weight",
91
+ "transformer_blocks.5.txt_norm2.weight",
92
+ "transformer_blocks.6.attn.norm_q.weight",
93
+ "transformer_blocks.6.attn.norm_k.weight",
94
+ "transformer_blocks.6.attn.norm_added_q.weight",
95
+ "transformer_blocks.6.attn.norm_added_k.weight",
96
+ "transformer_blocks.6.img_norm1.weight",
97
+ "transformer_blocks.6.img_norm2.weight",
98
+ "transformer_blocks.6.txt_norm1.weight",
99
+ "transformer_blocks.6.txt_norm2.weight",
100
+ "transformer_blocks.7.attn.norm_q.weight",
101
+ "transformer_blocks.7.attn.norm_k.weight",
102
+ "transformer_blocks.7.attn.norm_added_q.weight",
103
+ "transformer_blocks.7.attn.norm_added_k.weight",
104
+ "transformer_blocks.7.img_norm1.weight",
105
+ "transformer_blocks.7.img_norm2.weight",
106
+ "transformer_blocks.7.txt_norm1.weight",
107
+ "transformer_blocks.7.txt_norm2.weight",
108
+ "transformer_blocks.8.attn.norm_q.weight",
109
+ "transformer_blocks.8.attn.norm_k.weight",
110
+ "transformer_blocks.8.attn.norm_added_q.weight",
111
+ "transformer_blocks.8.attn.norm_added_k.weight",
112
+ "transformer_blocks.8.img_norm1.weight",
113
+ "transformer_blocks.8.img_norm2.weight",
114
+ "transformer_blocks.8.txt_norm1.weight",
115
+ "transformer_blocks.8.txt_norm2.weight",
116
+ "transformer_blocks.9.attn.norm_q.weight",
117
+ "transformer_blocks.9.attn.norm_k.weight",
118
+ "transformer_blocks.9.attn.norm_added_q.weight",
119
+ "transformer_blocks.9.attn.norm_added_k.weight",
120
+ "transformer_blocks.9.img_norm1.weight",
121
+ "transformer_blocks.9.img_norm2.weight",
122
+ "transformer_blocks.9.txt_norm1.weight",
123
+ "transformer_blocks.9.txt_norm2.weight",
124
+ "transformer_blocks.10.attn.norm_q.weight",
125
+ "transformer_blocks.10.attn.norm_k.weight",
126
+ "transformer_blocks.10.attn.norm_added_q.weight",
127
+ "transformer_blocks.10.attn.norm_added_k.weight",
128
+ "transformer_blocks.10.img_norm1.weight",
129
+ "transformer_blocks.10.img_norm2.weight",
130
+ "transformer_blocks.10.txt_norm1.weight",
131
+ "transformer_blocks.10.txt_norm2.weight",
132
+ "transformer_blocks.11.attn.norm_q.weight",
133
+ "transformer_blocks.11.attn.norm_k.weight",
134
+ "transformer_blocks.11.attn.norm_added_q.weight",
135
+ "transformer_blocks.11.attn.norm_added_k.weight",
136
+ "transformer_blocks.11.img_norm1.weight",
137
+ "transformer_blocks.11.img_norm2.weight",
138
+ "transformer_blocks.11.txt_norm1.weight",
139
+ "transformer_blocks.11.txt_norm2.weight",
140
+ "transformer_blocks.12.attn.norm_q.weight",
141
+ "transformer_blocks.12.attn.norm_k.weight",
142
+ "transformer_blocks.12.attn.norm_added_q.weight",
143
+ "transformer_blocks.12.attn.norm_added_k.weight",
144
+ "transformer_blocks.12.img_norm1.weight",
145
+ "transformer_blocks.12.img_norm2.weight",
146
+ "transformer_blocks.12.txt_norm1.weight",
147
+ "transformer_blocks.12.txt_norm2.weight",
148
+ "transformer_blocks.13.attn.norm_q.weight",
149
+ "transformer_blocks.13.attn.norm_k.weight",
150
+ "transformer_blocks.13.attn.norm_added_q.weight",
151
+ "transformer_blocks.13.attn.norm_added_k.weight",
152
+ "transformer_blocks.13.img_norm1.weight",
153
+ "transformer_blocks.13.img_norm2.weight",
154
+ "transformer_blocks.13.txt_norm1.weight",
155
+ "transformer_blocks.13.txt_norm2.weight",
156
+ "transformer_blocks.14.attn.norm_q.weight",
157
+ "transformer_blocks.14.attn.norm_k.weight",
158
+ "transformer_blocks.14.attn.norm_added_q.weight",
159
+ "transformer_blocks.14.attn.norm_added_k.weight",
160
+ "transformer_blocks.14.img_norm1.weight",
161
+ "transformer_blocks.14.img_norm2.weight",
162
+ "transformer_blocks.14.txt_norm1.weight",
163
+ "transformer_blocks.14.txt_norm2.weight",
164
+ "transformer_blocks.15.attn.norm_q.weight",
165
+ "transformer_blocks.15.attn.norm_k.weight",
166
+ "transformer_blocks.15.attn.norm_added_q.weight",
167
+ "transformer_blocks.15.attn.norm_added_k.weight",
168
+ "transformer_blocks.15.img_norm1.weight",
169
+ "transformer_blocks.15.img_norm2.weight",
170
+ "transformer_blocks.15.txt_norm1.weight",
171
+ "transformer_blocks.15.txt_norm2.weight",
172
+ "transformer_blocks.16.attn.norm_q.weight",
173
+ "transformer_blocks.16.attn.norm_k.weight",
174
+ "transformer_blocks.16.attn.norm_added_q.weight",
175
+ "transformer_blocks.16.attn.norm_added_k.weight",
176
+ "transformer_blocks.16.img_norm1.weight",
177
+ "transformer_blocks.16.img_norm2.weight",
178
+ "transformer_blocks.16.txt_norm1.weight",
179
+ "transformer_blocks.16.txt_norm2.weight",
180
+ "transformer_blocks.17.attn.norm_q.weight",
181
+ "transformer_blocks.17.attn.norm_k.weight",
182
+ "transformer_blocks.17.attn.norm_added_q.weight",
183
+ "transformer_blocks.17.attn.norm_added_k.weight",
184
+ "transformer_blocks.17.img_norm1.weight",
185
+ "transformer_blocks.17.img_norm2.weight",
186
+ "transformer_blocks.17.txt_norm1.weight",
187
+ "transformer_blocks.17.txt_norm2.weight",
188
+ "transformer_blocks.18.attn.norm_q.weight",
189
+ "transformer_blocks.18.attn.norm_k.weight",
190
+ "transformer_blocks.18.attn.norm_added_q.weight",
191
+ "transformer_blocks.18.attn.norm_added_k.weight",
192
+ "transformer_blocks.18.img_norm1.weight",
193
+ "transformer_blocks.18.img_norm2.weight",
194
+ "transformer_blocks.18.txt_norm1.weight",
195
+ "transformer_blocks.18.txt_norm2.weight",
196
+ "transformer_blocks.19.attn.norm_q.weight",
197
+ "transformer_blocks.19.attn.norm_k.weight",
198
+ "transformer_blocks.19.attn.norm_added_q.weight",
199
+ "transformer_blocks.19.attn.norm_added_k.weight",
200
+ "transformer_blocks.19.img_norm1.weight",
201
+ "transformer_blocks.19.img_norm2.weight",
202
+ "transformer_blocks.19.txt_norm1.weight",
203
+ "transformer_blocks.19.txt_norm2.weight",
204
+ "transformer_blocks.20.attn.norm_q.weight",
205
+ "transformer_blocks.20.attn.norm_k.weight",
206
+ "transformer_blocks.20.attn.norm_added_q.weight",
207
+ "transformer_blocks.20.attn.norm_added_k.weight",
208
+ "transformer_blocks.20.img_norm1.weight",
209
+ "transformer_blocks.20.img_norm2.weight",
210
+ "transformer_blocks.20.txt_norm1.weight",
211
+ "transformer_blocks.20.txt_norm2.weight",
212
+ "transformer_blocks.21.attn.norm_q.weight",
213
+ "transformer_blocks.21.attn.norm_k.weight",
214
+ "transformer_blocks.21.attn.norm_added_q.weight",
215
+ "transformer_blocks.21.attn.norm_added_k.weight",
216
+ "transformer_blocks.21.img_norm1.weight",
217
+ "transformer_blocks.21.img_norm2.weight",
218
+ "transformer_blocks.21.txt_norm1.weight",
219
+ "transformer_blocks.21.txt_norm2.weight",
220
+ "transformer_blocks.22.attn.norm_q.weight",
221
+ "transformer_blocks.22.attn.norm_k.weight",
222
+ "transformer_blocks.22.attn.norm_added_q.weight",
223
+ "transformer_blocks.22.attn.norm_added_k.weight",
224
+ "transformer_blocks.22.img_norm1.weight",
225
+ "transformer_blocks.22.img_norm2.weight",
226
+ "transformer_blocks.22.txt_norm1.weight",
227
+ "transformer_blocks.22.txt_norm2.weight",
228
+ "transformer_blocks.23.attn.norm_q.weight",
229
+ "transformer_blocks.23.attn.norm_k.weight",
230
+ "transformer_blocks.23.attn.norm_added_q.weight",
231
+ "transformer_blocks.23.attn.norm_added_k.weight",
232
+ "transformer_blocks.23.img_norm1.weight",
233
+ "transformer_blocks.23.img_norm2.weight",
234
+ "transformer_blocks.23.txt_norm1.weight",
235
+ "transformer_blocks.23.txt_norm2.weight",
236
+ "transformer_blocks.24.attn.norm_q.weight",
237
+ "transformer_blocks.24.attn.norm_k.weight",
238
+ "transformer_blocks.24.attn.norm_added_q.weight",
239
+ "transformer_blocks.24.attn.norm_added_k.weight",
240
+ "transformer_blocks.24.img_norm1.weight",
241
+ "transformer_blocks.24.img_norm2.weight",
242
+ "transformer_blocks.24.txt_norm1.weight",
243
+ "transformer_blocks.24.txt_norm2.weight",
244
+ "transformer_blocks.25.attn.norm_q.weight",
245
+ "transformer_blocks.25.attn.norm_k.weight",
246
+ "transformer_blocks.25.attn.norm_added_q.weight",
247
+ "transformer_blocks.25.attn.norm_added_k.weight",
248
+ "transformer_blocks.25.img_norm1.weight",
249
+ "transformer_blocks.25.img_norm2.weight",
250
+ "transformer_blocks.25.txt_norm1.weight",
251
+ "transformer_blocks.25.txt_norm2.weight",
252
+ "transformer_blocks.26.attn.norm_q.weight",
253
+ "transformer_blocks.26.attn.norm_k.weight",
254
+ "transformer_blocks.26.attn.norm_added_q.weight",
255
+ "transformer_blocks.26.attn.norm_added_k.weight",
256
+ "transformer_blocks.26.img_norm1.weight",
257
+ "transformer_blocks.26.img_norm2.weight",
258
+ "transformer_blocks.26.txt_norm1.weight",
259
+ "transformer_blocks.26.txt_norm2.weight",
260
+ "transformer_blocks.27.attn.norm_q.weight",
261
+ "transformer_blocks.27.attn.norm_k.weight",
262
+ "transformer_blocks.27.attn.norm_added_q.weight",
263
+ "transformer_blocks.27.attn.norm_added_k.weight",
264
+ "transformer_blocks.27.img_norm1.weight",
265
+ "transformer_blocks.27.img_norm2.weight",
266
+ "transformer_blocks.27.txt_norm1.weight",
267
+ "transformer_blocks.27.txt_norm2.weight",
268
+ "transformer_blocks.28.attn.norm_q.weight",
269
+ "transformer_blocks.28.attn.norm_k.weight",
270
+ "transformer_blocks.28.attn.norm_added_q.weight",
271
+ "transformer_blocks.28.attn.norm_added_k.weight",
272
+ "transformer_blocks.28.img_norm1.weight",
273
+ "transformer_blocks.28.img_norm2.weight",
274
+ "transformer_blocks.28.txt_norm1.weight",
275
+ "transformer_blocks.28.txt_norm2.weight",
276
+ "transformer_blocks.29.attn.norm_q.weight",
277
+ "transformer_blocks.29.attn.norm_k.weight",
278
+ "transformer_blocks.29.attn.norm_added_q.weight",
279
+ "transformer_blocks.29.attn.norm_added_k.weight",
280
+ "transformer_blocks.29.img_norm1.weight",
281
+ "transformer_blocks.29.img_norm2.weight",
282
+ "transformer_blocks.29.txt_norm1.weight",
283
+ "transformer_blocks.29.txt_norm2.weight",
284
+ "transformer_blocks.30.attn.norm_q.weight",
285
+ "transformer_blocks.30.attn.norm_k.weight",
286
+ "transformer_blocks.30.attn.norm_added_q.weight",
287
+ "transformer_blocks.30.attn.norm_added_k.weight",
288
+ "transformer_blocks.30.img_norm1.weight",
289
+ "transformer_blocks.30.img_norm2.weight",
290
+ "transformer_blocks.30.txt_norm1.weight",
291
+ "transformer_blocks.30.txt_norm2.weight",
292
+ "transformer_blocks.31.attn.norm_q.weight",
293
+ "transformer_blocks.31.attn.norm_k.weight",
294
+ "transformer_blocks.31.attn.norm_added_q.weight",
295
+ "transformer_blocks.31.attn.norm_added_k.weight",
296
+ "transformer_blocks.31.img_norm1.weight",
297
+ "transformer_blocks.31.img_norm2.weight",
298
+ "transformer_blocks.31.txt_norm1.weight",
299
+ "transformer_blocks.31.txt_norm2.weight",
300
+ "transformer_blocks.32.attn.norm_q.weight",
301
+ "transformer_blocks.32.attn.norm_k.weight",
302
+ "transformer_blocks.32.attn.norm_added_q.weight",
303
+ "transformer_blocks.32.attn.norm_added_k.weight",
304
+ "transformer_blocks.32.img_norm1.weight",
305
+ "transformer_blocks.32.img_norm2.weight",
306
+ "transformer_blocks.32.txt_norm1.weight",
307
+ "transformer_blocks.32.txt_norm2.weight",
308
+ "transformer_blocks.33.attn.norm_q.weight",
309
+ "transformer_blocks.33.attn.norm_k.weight",
310
+ "transformer_blocks.33.attn.norm_added_q.weight",
311
+ "transformer_blocks.33.attn.norm_added_k.weight",
312
+ "transformer_blocks.33.img_norm1.weight",
313
+ "transformer_blocks.33.img_norm2.weight",
314
+ "transformer_blocks.33.txt_norm1.weight",
315
+ "transformer_blocks.33.txt_norm2.weight",
316
+ "transformer_blocks.34.attn.norm_q.weight",
317
+ "transformer_blocks.34.attn.norm_k.weight",
318
+ "transformer_blocks.34.attn.norm_added_q.weight",
319
+ "transformer_blocks.34.attn.norm_added_k.weight",
320
+ "transformer_blocks.34.img_norm1.weight",
321
+ "transformer_blocks.34.img_norm2.weight",
322
+ "transformer_blocks.34.txt_norm1.weight",
323
+ "transformer_blocks.34.txt_norm2.weight",
324
+ "transformer_blocks.35.attn.norm_q.weight",
325
+ "transformer_blocks.35.attn.norm_k.weight",
326
+ "transformer_blocks.35.attn.norm_added_q.weight",
327
+ "transformer_blocks.35.attn.norm_added_k.weight",
328
+ "transformer_blocks.35.img_norm1.weight",
329
+ "transformer_blocks.35.img_norm2.weight",
330
+ "transformer_blocks.35.txt_norm1.weight",
331
+ "transformer_blocks.35.txt_norm2.weight",
332
+ "transformer_blocks.36.attn.norm_q.weight",
333
+ "transformer_blocks.36.attn.norm_k.weight",
334
+ "transformer_blocks.36.attn.norm_added_q.weight",
335
+ "transformer_blocks.36.attn.norm_added_k.weight",
336
+ "transformer_blocks.36.img_norm1.weight",
337
+ "transformer_blocks.36.img_norm2.weight",
338
+ "transformer_blocks.36.txt_norm1.weight",
339
+ "transformer_blocks.36.txt_norm2.weight",
340
+ "transformer_blocks.37.attn.norm_q.weight",
341
+ "transformer_blocks.37.attn.norm_k.weight",
342
+ "transformer_blocks.37.attn.norm_added_q.weight",
343
+ "transformer_blocks.37.attn.norm_added_k.weight",
344
+ "transformer_blocks.37.img_norm1.weight",
345
+ "transformer_blocks.37.img_norm2.weight",
346
+ "transformer_blocks.37.txt_norm1.weight",
347
+ "transformer_blocks.37.txt_norm2.weight",
348
+ "transformer_blocks.38.attn.norm_q.weight",
349
+ "transformer_blocks.38.attn.norm_k.weight",
350
+ "transformer_blocks.38.attn.norm_added_q.weight",
351
+ "transformer_blocks.38.attn.norm_added_k.weight",
352
+ "transformer_blocks.38.img_norm1.weight",
353
+ "transformer_blocks.38.img_norm2.weight",
354
+ "transformer_blocks.38.txt_norm1.weight",
355
+ "transformer_blocks.38.txt_norm2.weight",
356
+ "transformer_blocks.39.attn.norm_q.weight",
357
+ "transformer_blocks.39.attn.norm_k.weight",
358
+ "transformer_blocks.39.attn.norm_added_q.weight",
359
+ "transformer_blocks.39.attn.norm_added_k.weight",
360
+ "transformer_blocks.39.img_norm1.weight",
361
+ "transformer_blocks.39.img_norm2.weight",
362
+ "transformer_blocks.39.txt_norm1.weight",
363
+ "transformer_blocks.39.txt_norm2.weight",
364
+ "transformer_blocks.40.attn.norm_q.weight",
365
+ "transformer_blocks.40.attn.norm_k.weight",
366
+ "transformer_blocks.40.attn.norm_added_q.weight",
367
+ "transformer_blocks.40.attn.norm_added_k.weight",
368
+ "transformer_blocks.40.img_norm1.weight",
369
+ "transformer_blocks.40.img_norm2.weight",
370
+ "transformer_blocks.40.txt_norm1.weight",
371
+ "transformer_blocks.40.txt_norm2.weight",
372
+ "transformer_blocks.41.attn.norm_q.weight",
373
+ "transformer_blocks.41.attn.norm_k.weight",
374
+ "transformer_blocks.41.attn.norm_added_q.weight",
375
+ "transformer_blocks.41.attn.norm_added_k.weight",
376
+ "transformer_blocks.41.img_norm1.weight",
377
+ "transformer_blocks.41.img_norm2.weight",
378
+ "transformer_blocks.41.txt_norm1.weight",
379
+ "transformer_blocks.41.txt_norm2.weight",
380
+ "transformer_blocks.42.attn.norm_q.weight",
381
+ "transformer_blocks.42.attn.norm_k.weight",
382
+ "transformer_blocks.42.attn.norm_added_q.weight",
383
+ "transformer_blocks.42.attn.norm_added_k.weight",
384
+ "transformer_blocks.42.img_norm1.weight",
385
+ "transformer_blocks.42.img_norm2.weight",
386
+ "transformer_blocks.42.txt_norm1.weight",
387
+ "transformer_blocks.42.txt_norm2.weight",
388
+ "transformer_blocks.43.attn.norm_q.weight",
389
+ "transformer_blocks.43.attn.norm_k.weight",
390
+ "transformer_blocks.43.attn.norm_added_q.weight",
391
+ "transformer_blocks.43.attn.norm_added_k.weight",
392
+ "transformer_blocks.43.img_norm1.weight",
393
+ "transformer_blocks.43.img_norm2.weight",
394
+ "transformer_blocks.43.txt_norm1.weight",
395
+ "transformer_blocks.43.txt_norm2.weight",
396
+ "transformer_blocks.44.attn.norm_q.weight",
397
+ "transformer_blocks.44.attn.norm_k.weight",
398
+ "transformer_blocks.44.attn.norm_added_q.weight",
399
+ "transformer_blocks.44.attn.norm_added_k.weight",
400
+ "transformer_blocks.44.img_norm1.weight",
401
+ "transformer_blocks.44.img_norm2.weight",
402
+ "transformer_blocks.44.txt_norm1.weight",
403
+ "transformer_blocks.44.txt_norm2.weight",
404
+ "transformer_blocks.45.attn.norm_q.weight",
405
+ "transformer_blocks.45.attn.norm_k.weight",
406
+ "transformer_blocks.45.attn.norm_added_q.weight",
407
+ "transformer_blocks.45.attn.norm_added_k.weight",
408
+ "transformer_blocks.45.img_norm1.weight",
409
+ "transformer_blocks.45.img_norm2.weight",
410
+ "transformer_blocks.45.txt_norm1.weight",
411
+ "transformer_blocks.45.txt_norm2.weight",
412
+ "transformer_blocks.46.attn.norm_q.weight",
413
+ "transformer_blocks.46.attn.norm_k.weight",
414
+ "transformer_blocks.46.attn.norm_added_q.weight",
415
+ "transformer_blocks.46.attn.norm_added_k.weight",
416
+ "transformer_blocks.46.img_norm1.weight",
417
+ "transformer_blocks.46.img_norm2.weight",
418
+ "transformer_blocks.46.txt_norm1.weight",
419
+ "transformer_blocks.46.txt_norm2.weight",
420
+ "transformer_blocks.47.attn.norm_q.weight",
421
+ "transformer_blocks.47.attn.norm_k.weight",
422
+ "transformer_blocks.47.attn.norm_added_q.weight",
423
+ "transformer_blocks.47.attn.norm_added_k.weight",
424
+ "transformer_blocks.47.img_norm1.weight",
425
+ "transformer_blocks.47.img_norm2.weight",
426
+ "transformer_blocks.47.txt_norm1.weight",
427
+ "transformer_blocks.47.txt_norm2.weight"
428
+ ],
429
+ "modules_to_not_use_matmul": [],
430
+ "non_blocking": false,
431
+ "quant_conv": false,
432
+ "quant_embedding": false,
433
+ "quant_method": "sdnq",
434
+ "quantization_device": null,
435
+ "quantized_matmul_dtype": "int8",
436
+ "return_device": null,
437
+ "sdnq_version": "0.2.0",
438
+ "svd_rank": 32,
439
+ "svd_steps": 8,
440
+ "use_dynamic_quantization": false,
441
+ "use_grad_ckpt": true,
442
+ "use_hadamard": false,
443
+ "use_quantized_matmul": true,
444
+ "use_quantized_matmul_conv": false,
445
+ "use_static_quantization": true,
446
+ "use_stochastic_rounding": false,
447
+ "use_svd": false,
448
+ "weights_dtype": "uint4"
449
+ }
vae/config.json ADDED
@@ -0,0 +1,40 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_class_name": "AutoencoderKLFlux2",
3
+ "_diffusers_version": "0.37.1",
4
+ "_name_or_path": "black-forest-labs/FLUX.2-dev",
5
+ "act_fn": "silu",
6
+ "batch_norm_eps": 0.0001,
7
+ "batch_norm_momentum": 0.1,
8
+ "block_out_channels": [
9
+ 128,
10
+ 256,
11
+ 512,
12
+ 512
13
+ ],
14
+ "down_block_types": [
15
+ "DownEncoderBlock2D",
16
+ "DownEncoderBlock2D",
17
+ "DownEncoderBlock2D",
18
+ "DownEncoderBlock2D"
19
+ ],
20
+ "force_upcast": true,
21
+ "in_channels": 3,
22
+ "latent_channels": 32,
23
+ "layers_per_block": 2,
24
+ "mid_block_add_attention": true,
25
+ "norm_num_groups": 32,
26
+ "out_channels": 3,
27
+ "patch_size": [
28
+ 2,
29
+ 2
30
+ ],
31
+ "sample_size": 1024,
32
+ "up_block_types": [
33
+ "UpDecoderBlock2D",
34
+ "UpDecoderBlock2D",
35
+ "UpDecoderBlock2D",
36
+ "UpDecoderBlock2D"
37
+ ],
38
+ "use_post_quant_conv": true,
39
+ "use_quant_conv": true
40
+ }
vae/diffusion_pytorch_model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d64f3a68e1cc4f9f4e29b6e0da38a0204fe9a49f2d4053f0ec1fa1ca02f9c4b5
3
+ size 336213556