WaveCut commited on
Commit
09f4a4a
·
verified ·
1 Parent(s): c08ce47

Upload SDNQ Uint Static quantized Lens-Turbo

Browse files
Files changed (42) hide show
  1. .gitattributes +21 -0
  2. README.md +199 -0
  3. assets/comparison/p01_original.png +3 -0
  4. assets/comparison/p01_sdnq_uint_static.png +3 -0
  5. assets/comparison/p02_original.png +3 -0
  6. assets/comparison/p02_sdnq_uint_static.png +3 -0
  7. assets/comparison/p03_original.png +3 -0
  8. assets/comparison/p03_sdnq_uint_static.png +3 -0
  9. assets/comparison/p04_original.png +3 -0
  10. assets/comparison/p04_sdnq_uint_static.png +3 -0
  11. assets/comparison/p05_original.png +3 -0
  12. assets/comparison/p05_sdnq_uint_static.png +3 -0
  13. assets/comparison/p06_original.png +3 -0
  14. assets/comparison/p06_sdnq_uint_static.png +3 -0
  15. assets/comparison/p07_original.png +3 -0
  16. assets/comparison/p07_sdnq_uint_static.png +3 -0
  17. assets/comparison/p08_original.png +3 -0
  18. assets/comparison/p08_sdnq_uint_static.png +3 -0
  19. assets/comparison/p09_original.png +3 -0
  20. assets/comparison/p09_sdnq_uint_static.png +3 -0
  21. assets/comparison/p10_original.png +3 -0
  22. assets/comparison/p10_sdnq_uint_static.png +3 -0
  23. benchmark_metrics.json +19 -0
  24. comparison_matrix.json +312 -0
  25. model_index.json +25 -0
  26. scheduler/scheduler_config.json +18 -0
  27. sdnq_quantization_summary.json +22 -0
  28. text_encoder/config.json +78 -0
  29. text_encoder/generation_config.json +7 -0
  30. text_encoder/model-00001-of-00004.safetensors +3 -0
  31. text_encoder/model-00002-of-00004.safetensors +3 -0
  32. text_encoder/model-00003-of-00004.safetensors +3 -0
  33. text_encoder/model-00004-of-00004.safetensors +3 -0
  34. text_encoder/model.safetensors.index.json +467 -0
  35. tokenizer/chat_template.jinja +331 -0
  36. tokenizer/tokenizer.json +3 -0
  37. tokenizer/tokenizer_config.json +15 -0
  38. transformer/config.json +474 -0
  39. transformer/diffusion_pytorch_model.safetensors +3 -0
  40. transformer/quantization_config.json +447 -0
  41. vae/config.json +41 -0
  42. vae/diffusion_pytorch_model.safetensors +3 -0
.gitattributes CHANGED
@@ -33,3 +33,24 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ assets/comparison/p01_original.png filter=lfs diff=lfs merge=lfs -text
37
+ assets/comparison/p01_sdnq_uint_static.png filter=lfs diff=lfs merge=lfs -text
38
+ assets/comparison/p02_original.png filter=lfs diff=lfs merge=lfs -text
39
+ assets/comparison/p02_sdnq_uint_static.png filter=lfs diff=lfs merge=lfs -text
40
+ assets/comparison/p03_original.png filter=lfs diff=lfs merge=lfs -text
41
+ assets/comparison/p03_sdnq_uint_static.png filter=lfs diff=lfs merge=lfs -text
42
+ assets/comparison/p04_original.png filter=lfs diff=lfs merge=lfs -text
43
+ assets/comparison/p04_sdnq_uint_static.png filter=lfs diff=lfs merge=lfs -text
44
+ assets/comparison/p05_original.png filter=lfs diff=lfs merge=lfs -text
45
+ assets/comparison/p05_sdnq_uint_static.png filter=lfs diff=lfs merge=lfs -text
46
+ assets/comparison/p06_original.png filter=lfs diff=lfs merge=lfs -text
47
+ assets/comparison/p06_sdnq_uint_static.png filter=lfs diff=lfs merge=lfs -text
48
+ assets/comparison/p07_original.png filter=lfs diff=lfs merge=lfs -text
49
+ assets/comparison/p07_sdnq_uint_static.png filter=lfs diff=lfs merge=lfs -text
50
+ assets/comparison/p08_original.png filter=lfs diff=lfs merge=lfs -text
51
+ assets/comparison/p08_sdnq_uint_static.png filter=lfs diff=lfs merge=lfs -text
52
+ assets/comparison/p09_original.png filter=lfs diff=lfs merge=lfs -text
53
+ assets/comparison/p09_sdnq_uint_static.png filter=lfs diff=lfs merge=lfs -text
54
+ assets/comparison/p10_original.png filter=lfs diff=lfs merge=lfs -text
55
+ assets/comparison/p10_sdnq_uint_static.png filter=lfs diff=lfs merge=lfs -text
56
+ tokenizer/tokenizer.json filter=lfs diff=lfs merge=lfs -text
README.md ADDED
@@ -0,0 +1,199 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ license: mit
3
+ language:
4
+ - en
5
+ - ru
6
+ pipeline_tag: text-to-image
7
+ tags:
8
+ - diffusers
9
+ - safetensors
10
+ - text-to-image
11
+ - LensPipeline
12
+ - sdnq
13
+ - quantized
14
+ - uint4
15
+ - static-quantization
16
+ base_model: microsoft/Lens-Turbo
17
+ ---
18
+
19
+ # Lens-Turbo SDNQ Uint Static
20
+
21
+ This is an SDNQ static UINT4 quantized variant of [microsoft/Lens-Turbo](https://huggingface.co/microsoft/Lens-Turbo).
22
+ It keeps the Lens pipeline structure intact and focuses quantization on the denoising transformer, which is the main generation component.
23
+
24
+ The original Lens card describes Lens as a 3.8B-parameter text-to-image model using dense-caption training, GPT-OSS multi-layer text features, and the FLUX.2 semantic VAE. Lens-Turbo is the distilled 4-step variant.
25
+
26
+ ## Quantization
27
+
28
+ | Field | Value |
29
+ | --- | --- |
30
+ | Method | SDNQ Uint Static |
31
+ | Quantized component | `transformer` / `LensTransformer2DModel` |
32
+ | Weight dtype | `uint4` |
33
+ | Quantized matmul | enabled |
34
+ | Quantized matmul dtype | `int8` |
35
+ | Static quantization | enabled |
36
+ | Dynamic quantization | disabled |
37
+ | SVDQuant | disabled |
38
+ | Hadamard rotation | disabled |
39
+ | Convolution quantization | disabled |
40
+ | Embedding quantization | disabled |
41
+ | Text encoder | unchanged from source checkpoint |
42
+ | VAE | unchanged from source checkpoint |
43
+ | Compute dtype | `torch.bfloat16` |
44
+
45
+ Raw config:
46
+
47
+ ```json
48
+ {
49
+ "weights_dtype": "uint4",
50
+ "quantized_matmul_dtype": "int8",
51
+ "group_size": "0",
52
+ "use_static_quantization": "True",
53
+ "use_dynamic_quantization": "False",
54
+ "use_quantized_matmul": "True",
55
+ "use_svd": "False",
56
+ "use_hadamard": "False",
57
+ "quant_conv": "False",
58
+ "quant_embedding": "False",
59
+ "dequantize_fp32": "False",
60
+ "quantization_device": "cuda",
61
+ "return_device": "cuda"
62
+ }
63
+ ```
64
+
65
+ ## Usage
66
+
67
+ Install the Lens inference code and SDNQ, then download the repo snapshot and load the quantized transformer explicitly:
68
+
69
+ ```python
70
+ import torch
71
+ from huggingface_hub import snapshot_download
72
+ from lens import LensPipeline, LensTransformer2DModel
73
+ from sdnq import load_sdnq_model
74
+
75
+ repo_id = "WaveCut/Lens-Turbo-SDNQ-Uint-Static"
76
+ model_dir = snapshot_download(repo_id)
77
+
78
+ transformer = load_sdnq_model(
79
+ model_dir + "/transformer",
80
+ model_cls=LensTransformer2DModel,
81
+ dtype=torch.bfloat16,
82
+ device=torch.device("cuda"),
83
+ dequantize_fp32=False,
84
+ use_quantized_matmul=True,
85
+ )
86
+
87
+ pipe = LensPipeline.from_pretrained(
88
+ model_dir,
89
+ transformer=transformer,
90
+ torch_dtype=torch.bfloat16,
91
+ ).to("cuda")
92
+
93
+ image = pipe(
94
+ "A cat holding a sign that says hello world",
95
+ base_resolution=1024,
96
+ aspect_ratio="1:1",
97
+ num_inference_steps=4,
98
+ guidance_scale=1.0,
99
+ generator=torch.Generator("cuda").manual_seed(0),
100
+ ).images[0]
101
+ ```
102
+
103
+ ## Benchmark
104
+
105
+ Benchmark date: 2026-05-24. Hardware: RunPod NVIDIA H100 80GB HBM3, PyTorch 2.8.0 CUDA 12.8 container, no network volume, local container disk only.
106
+ Each prompt used `base_resolution=1024`, `aspect_ratio="1:1"`, `num_inference_steps=4`, `guidance_scale=1.0`, `torch.bfloat16`, and a fixed CUDA seed.
107
+
108
+ | Metric | Original Lens-Turbo | SDNQ Uint Static |
109
+ | --- | ---: | ---: |
110
+ | Load time, seconds | 59.316 | 16.861 |
111
+ | Load peak allocated VRAM, GB | 20.807 | 15.281 |
112
+ | Load peak reserved VRAM, GB | 20.928 | 15.344 |
113
+ | Load end allocated VRAM, GB | 20.807 | 15.281 |
114
+ | Average prompt runtime, seconds | 2.206 | 3.394 |
115
+ | Average runtime delta | baseline | +53.8% |
116
+
117
+ ## 10-Prompt Comparison Matrix
118
+
119
+ | ID | Scenario | Seed | Original time, s | Quant time, s | Delta | Original peak reserved VRAM, GB | Quant peak reserved VRAM, GB | Original | Quant |
120
+ | --- | --- | ---: | ---: | ---: | ---: | ---: | ---: | --- | --- |
121
+ | P01 | Orbital Night Market | 101 | 6.902 | 7.980 | +15.6% | 25.438 | 19.746 | ![](assets/comparison/p01_original.png) | ![](assets/comparison/p01_sdnq_uint_static.png) |
122
+ | P02 | Arctic Research Desk | 102 | 1.347 | 3.126 | +132.1% | 25.434 | 19.740 | ![](assets/comparison/p02_original.png) | ![](assets/comparison/p02_sdnq_uint_static.png) |
123
+ | P03 | Victorian Automaton Repair | 103 | 2.901 | 2.846 | -1.9% | 25.438 | 19.744 | ![](assets/comparison/p03_original.png) | ![](assets/comparison/p03_sdnq_uint_static.png) |
124
+ | P04 | Mars Greenhouse Control Room | 104 | 1.186 | 2.846 | +140.0% | 25.438 | 19.725 | ![](assets/comparison/p04_original.png) | ![](assets/comparison/p04_sdnq_uint_static.png) |
125
+ | P05 | Lost Railway Poster Wall | 105 | 1.185 | 2.877 | +142.8% | 25.438 | 19.725 | ![](assets/comparison/p05_original.png) | ![](assets/comparison/p05_sdnq_uint_static.png) |
126
+ | P06 | Miniature Courtroom Diorama | 106 | 1.186 | 2.836 | +139.1% | 25.438 | 19.744 | ![](assets/comparison/p06_original.png) | ![](assets/comparison/p06_sdnq_uint_static.png) |
127
+ | P07 | Rainy Seoul Book Cafe | 107 | 1.243 | 2.835 | +128.1% | 25.438 | 19.744 | ![](assets/comparison/p07_original.png) | ![](assets/comparison/p07_sdnq_uint_static.png) |
128
+ | P08 | Oceanographic Expedition Map | 108 | 1.181 | 2.847 | +141.1% | 25.438 | 19.744 | ![](assets/comparison/p08_original.png) | ![](assets/comparison/p08_sdnq_uint_static.png) |
129
+ | P09 | Renaissance Lab Notebook | 109 | 1.180 | 2.855 | +141.9% | 25.438 | 19.719 | ![](assets/comparison/p09_original.png) | ![](assets/comparison/p09_sdnq_uint_static.png) |
130
+ | P10 | Russian Provincial Print Shop | 110 | 3.749 | 2.888 | -23.0% | 25.459 | 19.766 | ![](assets/comparison/p10_original.png) | ![](assets/comparison/p10_sdnq_uint_static.png) |
131
+
132
+ ## Full Prompts
133
+
134
+ <details><summary>P01 - Orbital Night Market</summary>
135
+
136
+ A dense cinematic night market inside a transparent orbital habitat, with Earth curving below the glass floor, vendors selling glowing algae noodles and tiny repair drones, rain droplets floating in zero gravity, reflections on wet metal, and at least six readable signs in different places: a vertical neon sign saying "ORBITAL TEA HOUSE", a handwritten chalk menu saying "NO GRAVITY REFUNDS", a yellow safety placard saying "MAG BOOTS REQUIRED", a small receipt printer label saying "BAY 12 PICKUP", a red banner saying "FRESH SYNTH-MANGO", and a blue customs notice saying "DECLARE ALL MOON ROCKS". Ultra detailed, wide angle, layered crowd, realistic lens flare, crisp small typography.
137
+
138
+ </details>
139
+ <details><summary>P02 - Arctic Research Desk</summary>
140
+
141
+ A top-down documentary photo of an Arctic climate research desk inside a weather station during a blizzard, with ice crystals on the window, a rugged laptop displaying a complex map, three paper field notebooks, sample vials, a steaming enamel mug, and long English text on multiple objects: the notebook cover reads "FIELD LOG: STATION NORD, WEEK 17", a whiteboard in the background reads "CORE DEPTH 42.8m / TEMP -31C / WIND 62 km/h", a red tag on a sample tube reads "DO NOT THAW", and a printed memo reads "CALIBRATE SENSORS BEFORE SUNRISE". Natural cold light, precise shadows, photorealistic texture, no blurry text.
142
+
143
+ </details>
144
+ <details><summary>P03 - Victorian Automaton Repair</summary>
145
+
146
+ A richly detailed Victorian workshop where a brass clockwork automaton is being repaired under green banker lamps, with tiny gears, pearl inlays, oiled leather belts, smoke from a soldering iron, magnifying glass distortion, and handwritten labels everywhere. The main blueprint title must read "AUTOMATON HAND ASSEMBLY REV. C", a drawer label says "SPRINGS / EYES / MEMORY CAMS", a dangling tag says "CLIENT: LADY ADA", and a note pinned to the wall says "DO NOT WIND PAST MIDNIGHT". Moody chiaroscuro, shallow depth of field, extremely fine mechanical detail.
147
+
148
+ </details>
149
+ <details><summary>P04 - Mars Greenhouse Control Room</summary>
150
+
151
+ A believable Mars greenhouse control room at dawn, red dust outside the curved windows, rows of tomatoes and dwarf wheat under violet grow lights, condensation on transparent tubes, a tired botanist reflected in a touchscreen, and several readable UI panels in English: "OXYGEN LOOP STABLE", "WATER RECOVERY 98.4%", "SECTOR C: POLLINATION DRONES ACTIVE", and a sticky note saying "Tell Earth the basil survived". Technical but warm, high resolution, realistic sci-fi, detailed glass and plant textures.
152
+
153
+ </details>
154
+ <details><summary>P05 - Lost Railway Poster Wall</summary>
155
+
156
+ An abandoned underground railway platform turned into an accidental archive of travel posters, peeling ceramic tiles, puddles reflecting amber emergency lights, old suitcases, vines growing through cracked concrete, and five large posters with distinct readable titles: "THE NORTHERN COMET EXPRESS", "SLEEPER TO ISTANBUL", "MIDNIGHT PLATFORM 7", "COASTAL ROUTE REOPENING SOON", and "KEEP YOUR TICKET VISIBLE". Cinematic composition, wet surfaces, layered typography, realistic grime, strong perspective down the tracks.
157
+
158
+ </details>
159
+ <details><summary>P06 - Miniature Courtroom Diorama</summary>
160
+
161
+ A hyperreal macro photograph of a miniature courtroom diorama built inside an antique wooden drawer, with tiny judge bench, brass lamps, dust motes, paper exhibits smaller than postage stamps, a mouse-sized witness chair, and readable text on tiny documents: a case file labeled "CASE 1842-B: THE MISSING ORRERY", an evidence tag saying "EXHIBIT C", a court calendar reading "HEARING AT 9:30", and a placard on the judge bench saying "TRUTH IN SMALL THINGS". Macro lens, tactile materials, careful scale cues.
162
+
163
+ </details>
164
+ <details><summary>P07 - Rainy Seoul Book Cafe</summary>
165
+
166
+ A cozy but complex rainy evening scene in a narrow Seoul book cafe, viewed through a window covered in raindrops, shelves packed with art books, two students annotating a map, a barista steaming milk, warm tungsten light, street reflections, and multiple readable English text elements: a chalkboard says "TONIGHT: QUIET READING CLUB", a receipt says "OAT LATTE / CINNAMON BUN", a book spine says "ARCHITECTURE OF DREAMS", and a window sticker says "OPEN UNTIL THE LAST TRAIN". Photorealistic, cinematic, intricate reflections.
167
+
168
+ </details>
169
+ <details><summary>P08 - Oceanographic Expedition Map</summary>
170
+
171
+ A dramatic captain's table aboard a storm-tossed oceanographic research vessel, with a wet nautical chart, brass dividers, sonar printouts, bioluminescent plankton glowing in a glass jar, a cracked tablet, and readable labels distributed across the image: "TRENCH SURVEY LINE B", "DEPTH 10,928m", "ROV SIGNAL WEAK", "SAMPLE: BLUE VENT WATER", and a torn note saying "If the lights pulse twice, turn back". High detail, realistic water droplets, dark blue-green atmosphere, sharp text.
172
+
173
+ </details>
174
+ <details><summary>P09 - Renaissance Lab Notebook</summary>
175
+
176
+ An alternate-history Renaissance laboratory where an astronomer-painter is combining oil pigments with early electrical apparatus, with celestial globes, copper coils, stained glass sunlight, anatomical sketches, a half-finished portrait, and Latin-English notebook text visible on several pages: "LIGHT STUDY: BLUE VERDITER", "GALVANIC TEST NO. 8", "VENUS RISES BEFORE DAWN", and a folded letter sealed in wax reading "FOR THE WORKSHOP MASTER ONLY". Painterly realism, ornate detail, coherent objects, readable calligraphy.
177
+
178
+ </details>
179
+ <details><summary>P10 - Russian Provincial Print Shop</summary>
180
+
181
+ Сложная фотореалистичная сцена в старой провинциальной типографии поздним зимним вечером: за большим деревянным столом лежат металлические литеры, корректурные листы, линейки, чашка крепкого чая, заснеженное окно, тусклая лампа и следы типографской краски на пальцах наборщика. На разных элементах изображения должен быть длинный и хорошо читаемый русский текст: на вывеске над дверью написано "ТИПОГРАФИЯ СЕВЕРНЫЙ ЛИСТОК", на корректуре заголовок "СРОЧНО В НОМЕР: ГОРОДСКОЙ СОВЕТ ОТКРЫВАЕТ НОВУЮ БИБЛИОТЕКУ", на маленькой записке фраза "Проверить букву Ё во втором абзаце", а на календаре дата "Пятница, 24 января". Много бытовых деталей, глубокие тени, реалистичная кириллица, никакой размытой каши вместо текста.
182
+
183
+ </details>
184
+
185
+ ## Notes
186
+
187
+ This checkpoint is intended for research and evaluation. It inherits the upstream Lens limitations and responsible AI considerations from the source model.
188
+ The comparison images are deterministic for the listed seeds under this environment but may vary across driver, PyTorch, SDNQ, or kernel versions.
189
+
190
+ ## Citation
191
+
192
+ ```bibtex
193
+ @article{zhao2026lens,
194
+ title = {Lens: Rethinking Training Efficiency for Foundational Text-to-Image Models},
195
+ author = {Guo, Baining and Luo, Chong and Chen, Dong and Chen, Dongdong and Wei, Fangyun and Li, Ji and Bao, Jianmin and Zhang, Jiawei and Zhao, Jinjing and Shi, Lei and Yang, Qinhong and Zhang, Sirui and Wu, Xiuyu and Feng, Xuelu and Lu, Yan and Dong, Yanchen and Yue, Yang and Wang, Yitong and Chen, Yunuo and Liang, Zhiyang and Wan, Ziyu},
196
+ journal = {arXiv preprint arXiv:2605.21573},
197
+ year = {2026}
198
+ }
199
+ ```
assets/comparison/p01_original.png ADDED

Git LFS Details

  • SHA256: 07ff62c7bd7c8a35f8eeb59342a7272d1948e3c3615779a31f14745f1ba50bcc
  • Pointer size: 132 Bytes
  • Size of remote file: 1.69 MB
assets/comparison/p01_sdnq_uint_static.png ADDED

Git LFS Details

  • SHA256: e51440ee27c7fa8463bb345547d8045ac84dfb834dfccd092b07cd27e70caf6a
  • Pointer size: 132 Bytes
  • Size of remote file: 1.88 MB
assets/comparison/p02_original.png ADDED

Git LFS Details

  • SHA256: 7bef1fb076bfbc7f9872a658f8756da47bb1b2ed454053dc52369377be5dd7b6
  • Pointer size: 132 Bytes
  • Size of remote file: 1.39 MB
assets/comparison/p02_sdnq_uint_static.png ADDED

Git LFS Details

  • SHA256: 74f0d22281206e9ec86514b0ce2752830d9833c222a14c509954d31406d02ac3
  • Pointer size: 132 Bytes
  • Size of remote file: 1.64 MB
assets/comparison/p03_original.png ADDED

Git LFS Details

  • SHA256: f75a4fc927983a265c911da0149fc5120517f96bfbb7de2516182fdde5f5b71e
  • Pointer size: 132 Bytes
  • Size of remote file: 1.37 MB
assets/comparison/p03_sdnq_uint_static.png ADDED

Git LFS Details

  • SHA256: bbffa720e5133ec44269490a73544426fcb391aae1b728142a319fea0ba473c1
  • Pointer size: 132 Bytes
  • Size of remote file: 1.69 MB
assets/comparison/p04_original.png ADDED

Git LFS Details

  • SHA256: fd53585d228c6633ed66382be44bfdbaea130cf259be40f7299e04ec320fbfa8
  • Pointer size: 132 Bytes
  • Size of remote file: 1.5 MB
assets/comparison/p04_sdnq_uint_static.png ADDED

Git LFS Details

  • SHA256: 4c1325ccb6a5022e5d3383d0ae3529a29974deddccb22778468a080f43210ba0
  • Pointer size: 132 Bytes
  • Size of remote file: 1.65 MB
assets/comparison/p05_original.png ADDED

Git LFS Details

  • SHA256: 6b709ef1033189c919f46ac737cf8b1d475cffd09c1d4c78f762e1e7d9218dcd
  • Pointer size: 132 Bytes
  • Size of remote file: 1.6 MB
assets/comparison/p05_sdnq_uint_static.png ADDED

Git LFS Details

  • SHA256: 6186beff60be0902f10d1ea877eb13cc323caec81dd24f569803304e14e38f42
  • Pointer size: 132 Bytes
  • Size of remote file: 1.84 MB
assets/comparison/p06_original.png ADDED

Git LFS Details

  • SHA256: fb24a667dd4616cf8e2b9e6b6a0db37b0f3b8e32f43ebdc86d00f9e9d8806a19
  • Pointer size: 132 Bytes
  • Size of remote file: 1.34 MB
assets/comparison/p06_sdnq_uint_static.png ADDED

Git LFS Details

  • SHA256: 54c3f8a94a143bc6fa7851b5f360d4bca2216630c0cab69d5dae24ed3418f0a0
  • Pointer size: 132 Bytes
  • Size of remote file: 1.62 MB
assets/comparison/p07_original.png ADDED

Git LFS Details

  • SHA256: 0087c5ffd383a45982ad64b7aa7ccd132ba59fbbc71d995c075f6c9758549f71
  • Pointer size: 132 Bytes
  • Size of remote file: 1.52 MB
assets/comparison/p07_sdnq_uint_static.png ADDED

Git LFS Details

  • SHA256: 04e4a7d5892c4f66dfaaa6aeb2e0798dfd01910aea9f39441fa85ccd71d93b84
  • Pointer size: 132 Bytes
  • Size of remote file: 1.8 MB
assets/comparison/p08_original.png ADDED

Git LFS Details

  • SHA256: 43902d8261a3517d8448f343967f11c8cb44085d6601d14d4bc125506fbd76b4
  • Pointer size: 132 Bytes
  • Size of remote file: 1.53 MB
assets/comparison/p08_sdnq_uint_static.png ADDED

Git LFS Details

  • SHA256: 3dc804aa79a395734a2f8d9ecbf2e7ab2423a24ed55d806cc05a2292f4567a0b
  • Pointer size: 132 Bytes
  • Size of remote file: 1.77 MB
assets/comparison/p09_original.png ADDED

Git LFS Details

  • SHA256: fcaadea6c20013b256216763a0929a8d053e7f2666e2eb9d2c3ee49ddca85642
  • Pointer size: 132 Bytes
  • Size of remote file: 1.62 MB
assets/comparison/p09_sdnq_uint_static.png ADDED

Git LFS Details

  • SHA256: ad479c80be3979906974c820ed598d5e07197e0e24f482a24075ec348b470e15
  • Pointer size: 132 Bytes
  • Size of remote file: 1.91 MB
assets/comparison/p10_original.png ADDED

Git LFS Details

  • SHA256: 5cfd2d364f77a951479c1a41b8ce171d48367889cf355e999ea149aaa56085e4
  • Pointer size: 132 Bytes
  • Size of remote file: 1.34 MB
assets/comparison/p10_sdnq_uint_static.png ADDED

Git LFS Details

  • SHA256: 832c210e821c44af361b96e592f46ef4e2913db92e4dc1c08528de06819f728b
  • Pointer size: 132 Bytes
  • Size of remote file: 1.63 MB
benchmark_metrics.json ADDED
@@ -0,0 +1,19 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "load": {
3
+ "base": {
4
+ "load_time_s": 59.316,
5
+ "peak_allocated_gb": 20.807,
6
+ "peak_reserved_gb": 20.928,
7
+ "end_allocated_gb": 20.807,
8
+ "end_reserved_gb": 20.928
9
+ },
10
+ "quant": {
11
+ "load_time_s": 16.861,
12
+ "peak_allocated_gb": 15.281,
13
+ "peak_reserved_gb": 15.344,
14
+ "end_allocated_gb": 15.281,
15
+ "end_reserved_gb": 15.344
16
+ }
17
+ },
18
+ "quantization_time_s": null
19
+ }
comparison_matrix.json ADDED
@@ -0,0 +1,312 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ [
2
+ {
3
+ "id": "P01",
4
+ "title": "Orbital Night Market",
5
+ "seed": 101,
6
+ "prompt": "A dense cinematic night market inside a transparent orbital habitat, with Earth curving below the glass floor, vendors selling glowing algae noodles and tiny repair drones, rain droplets floating in zero gravity, reflections on wet metal, and at least six readable signs in different places: a vertical neon sign saying \"ORBITAL TEA HOUSE\", a handwritten chalk menu saying \"NO GRAVITY REFUNDS\", a yellow safety placard saying \"MAG BOOTS REQUIRED\", a small receipt printer label saying \"BAY 12 PICKUP\", a red banner saying \"FRESH SYNTH-MANGO\", and a blue customs notice saying \"DECLARE ALL MOON ROCKS\". Ultra detailed, wide angle, layered crowd, realistic lens flare, crisp small typography.",
7
+ "base": {
8
+ "id": "P01",
9
+ "title": "Orbital Night Market",
10
+ "seed": 101,
11
+ "prompt": "A dense cinematic night market inside a transparent orbital habitat, with Earth curving below the glass floor, vendors selling glowing algae noodles and tiny repair drones, rain droplets floating in zero gravity, reflections on wet metal, and at least six readable signs in different places: a vertical neon sign saying \"ORBITAL TEA HOUSE\", a handwritten chalk menu saying \"NO GRAVITY REFUNDS\", a yellow safety placard saying \"MAG BOOTS REQUIRED\", a small receipt printer label saying \"BAY 12 PICKUP\", a red banner saying \"FRESH SYNTH-MANGO\", and a blue customs notice saying \"DECLARE ALL MOON ROCKS\". Ultra detailed, wide angle, layered crowd, realistic lens flare, crisp small typography.",
12
+ "image": "assets/comparison/p01_original.png",
13
+ "time_s": 6.902,
14
+ "peak_allocated_gb": 23.245,
15
+ "peak_reserved_gb": 25.438,
16
+ "end_allocated_gb": 20.841,
17
+ "end_reserved_gb": 25.438
18
+ },
19
+ "quant": {
20
+ "id": "P01",
21
+ "title": "Orbital Night Market",
22
+ "seed": 101,
23
+ "prompt": "A dense cinematic night market inside a transparent orbital habitat, with Earth curving below the glass floor, vendors selling glowing algae noodles and tiny repair drones, rain droplets floating in zero gravity, reflections on wet metal, and at least six readable signs in different places: a vertical neon sign saying \"ORBITAL TEA HOUSE\", a handwritten chalk menu saying \"NO GRAVITY REFUNDS\", a yellow safety placard saying \"MAG BOOTS REQUIRED\", a small receipt printer label saying \"BAY 12 PICKUP\", a red banner saying \"FRESH SYNTH-MANGO\", and a blue customs notice saying \"DECLARE ALL MOON ROCKS\". Ultra detailed, wide angle, layered crowd, realistic lens flare, crisp small typography.",
24
+ "image": "assets/comparison/p01_sdnq_uint_static.png",
25
+ "time_s": 7.98,
26
+ "peak_allocated_gb": 17.687,
27
+ "peak_reserved_gb": 19.746,
28
+ "end_allocated_gb": 15.283,
29
+ "end_reserved_gb": 19.746
30
+ },
31
+ "speed_delta_pct": 15.6
32
+ },
33
+ {
34
+ "id": "P02",
35
+ "title": "Arctic Research Desk",
36
+ "seed": 102,
37
+ "prompt": "A top-down documentary photo of an Arctic climate research desk inside a weather station during a blizzard, with ice crystals on the window, a rugged laptop displaying a complex map, three paper field notebooks, sample vials, a steaming enamel mug, and long English text on multiple objects: the notebook cover reads \"FIELD LOG: STATION NORD, WEEK 17\", a whiteboard in the background reads \"CORE DEPTH 42.8m / TEMP -31C / WIND 62 km/h\", a red tag on a sample tube reads \"DO NOT THAW\", and a printed memo reads \"CALIBRATE SENSORS BEFORE SUNRISE\". Natural cold light, precise shadows, photorealistic texture, no blurry text.",
38
+ "base": {
39
+ "id": "P02",
40
+ "title": "Arctic Research Desk",
41
+ "seed": 102,
42
+ "prompt": "A top-down documentary photo of an Arctic climate research desk inside a weather station during a blizzard, with ice crystals on the window, a rugged laptop displaying a complex map, three paper field notebooks, sample vials, a steaming enamel mug, and long English text on multiple objects: the notebook cover reads \"FIELD LOG: STATION NORD, WEEK 17\", a whiteboard in the background reads \"CORE DEPTH 42.8m / TEMP -31C / WIND 62 km/h\", a red tag on a sample tube reads \"DO NOT THAW\", and a printed memo reads \"CALIBRATE SENSORS BEFORE SUNRISE\". Natural cold light, precise shadows, photorealistic texture, no blurry text.",
43
+ "image": "assets/comparison/p02_original.png",
44
+ "time_s": 1.347,
45
+ "peak_allocated_gb": 23.245,
46
+ "peak_reserved_gb": 25.434,
47
+ "end_allocated_gb": 20.841,
48
+ "end_reserved_gb": 25.434
49
+ },
50
+ "quant": {
51
+ "id": "P02",
52
+ "title": "Arctic Research Desk",
53
+ "seed": 102,
54
+ "prompt": "A top-down documentary photo of an Arctic climate research desk inside a weather station during a blizzard, with ice crystals on the window, a rugged laptop displaying a complex map, three paper field notebooks, sample vials, a steaming enamel mug, and long English text on multiple objects: the notebook cover reads \"FIELD LOG: STATION NORD, WEEK 17\", a whiteboard in the background reads \"CORE DEPTH 42.8m / TEMP -31C / WIND 62 km/h\", a red tag on a sample tube reads \"DO NOT THAW\", and a printed memo reads \"CALIBRATE SENSORS BEFORE SUNRISE\". Natural cold light, precise shadows, photorealistic texture, no blurry text.",
55
+ "image": "assets/comparison/p02_sdnq_uint_static.png",
56
+ "time_s": 3.126,
57
+ "peak_allocated_gb": 17.687,
58
+ "peak_reserved_gb": 19.74,
59
+ "end_allocated_gb": 15.283,
60
+ "end_reserved_gb": 19.74
61
+ },
62
+ "speed_delta_pct": 132.1
63
+ },
64
+ {
65
+ "id": "P03",
66
+ "title": "Victorian Automaton Repair",
67
+ "seed": 103,
68
+ "prompt": "A richly detailed Victorian workshop where a brass clockwork automaton is being repaired under green banker lamps, with tiny gears, pearl inlays, oiled leather belts, smoke from a soldering iron, magnifying glass distortion, and handwritten labels everywhere. The main blueprint title must read \"AUTOMATON HAND ASSEMBLY REV. C\", a drawer label says \"SPRINGS / EYES / MEMORY CAMS\", a dangling tag says \"CLIENT: LADY ADA\", and a note pinned to the wall says \"DO NOT WIND PAST MIDNIGHT\". Moody chiaroscuro, shallow depth of field, extremely fine mechanical detail.",
69
+ "base": {
70
+ "id": "P03",
71
+ "title": "Victorian Automaton Repair",
72
+ "seed": 103,
73
+ "prompt": "A richly detailed Victorian workshop where a brass clockwork automaton is being repaired under green banker lamps, with tiny gears, pearl inlays, oiled leather belts, smoke from a soldering iron, magnifying glass distortion, and handwritten labels everywhere. The main blueprint title must read \"AUTOMATON HAND ASSEMBLY REV. C\", a drawer label says \"SPRINGS / EYES / MEMORY CAMS\", a dangling tag says \"CLIENT: LADY ADA\", and a note pinned to the wall says \"DO NOT WIND PAST MIDNIGHT\". Moody chiaroscuro, shallow depth of field, extremely fine mechanical detail.",
74
+ "image": "assets/comparison/p03_original.png",
75
+ "time_s": 2.901,
76
+ "peak_allocated_gb": 23.244,
77
+ "peak_reserved_gb": 25.438,
78
+ "end_allocated_gb": 20.841,
79
+ "end_reserved_gb": 25.438
80
+ },
81
+ "quant": {
82
+ "id": "P03",
83
+ "title": "Victorian Automaton Repair",
84
+ "seed": 103,
85
+ "prompt": "A richly detailed Victorian workshop where a brass clockwork automaton is being repaired under green banker lamps, with tiny gears, pearl inlays, oiled leather belts, smoke from a soldering iron, magnifying glass distortion, and handwritten labels everywhere. The main blueprint title must read \"AUTOMATON HAND ASSEMBLY REV. C\", a drawer label says \"SPRINGS / EYES / MEMORY CAMS\", a dangling tag says \"CLIENT: LADY ADA\", and a note pinned to the wall says \"DO NOT WIND PAST MIDNIGHT\". Moody chiaroscuro, shallow depth of field, extremely fine mechanical detail.",
86
+ "image": "assets/comparison/p03_sdnq_uint_static.png",
87
+ "time_s": 2.846,
88
+ "peak_allocated_gb": 17.686,
89
+ "peak_reserved_gb": 19.744,
90
+ "end_allocated_gb": 15.283,
91
+ "end_reserved_gb": 19.744
92
+ },
93
+ "speed_delta_pct": -1.9
94
+ },
95
+ {
96
+ "id": "P04",
97
+ "title": "Mars Greenhouse Control Room",
98
+ "seed": 104,
99
+ "prompt": "A believable Mars greenhouse control room at dawn, red dust outside the curved windows, rows of tomatoes and dwarf wheat under violet grow lights, condensation on transparent tubes, a tired botanist reflected in a touchscreen, and several readable UI panels in English: \"OXYGEN LOOP STABLE\", \"WATER RECOVERY 98.4%\", \"SECTOR C: POLLINATION DRONES ACTIVE\", and a sticky note saying \"Tell Earth the basil survived\". Technical but warm, high resolution, realistic sci-fi, detailed glass and plant textures.",
100
+ "base": {
101
+ "id": "P04",
102
+ "title": "Mars Greenhouse Control Room",
103
+ "seed": 104,
104
+ "prompt": "A believable Mars greenhouse control room at dawn, red dust outside the curved windows, rows of tomatoes and dwarf wheat under violet grow lights, condensation on transparent tubes, a tired botanist reflected in a touchscreen, and several readable UI panels in English: \"OXYGEN LOOP STABLE\", \"WATER RECOVERY 98.4%\", \"SECTOR C: POLLINATION DRONES ACTIVE\", and a sticky note saying \"Tell Earth the basil survived\". Technical but warm, high resolution, realistic sci-fi, detailed glass and plant textures.",
105
+ "image": "assets/comparison/p04_original.png",
106
+ "time_s": 1.186,
107
+ "peak_allocated_gb": 23.242,
108
+ "peak_reserved_gb": 25.438,
109
+ "end_allocated_gb": 20.841,
110
+ "end_reserved_gb": 25.438
111
+ },
112
+ "quant": {
113
+ "id": "P04",
114
+ "title": "Mars Greenhouse Control Room",
115
+ "seed": 104,
116
+ "prompt": "A believable Mars greenhouse control room at dawn, red dust outside the curved windows, rows of tomatoes and dwarf wheat under violet grow lights, condensation on transparent tubes, a tired botanist reflected in a touchscreen, and several readable UI panels in English: \"OXYGEN LOOP STABLE\", \"WATER RECOVERY 98.4%\", \"SECTOR C: POLLINATION DRONES ACTIVE\", and a sticky note saying \"Tell Earth the basil survived\". Technical but warm, high resolution, realistic sci-fi, detailed glass and plant textures.",
117
+ "image": "assets/comparison/p04_sdnq_uint_static.png",
118
+ "time_s": 2.846,
119
+ "peak_allocated_gb": 17.684,
120
+ "peak_reserved_gb": 19.725,
121
+ "end_allocated_gb": 15.283,
122
+ "end_reserved_gb": 19.725
123
+ },
124
+ "speed_delta_pct": 140.0
125
+ },
126
+ {
127
+ "id": "P05",
128
+ "title": "Lost Railway Poster Wall",
129
+ "seed": 105,
130
+ "prompt": "An abandoned underground railway platform turned into an accidental archive of travel posters, peeling ceramic tiles, puddles reflecting amber emergency lights, old suitcases, vines growing through cracked concrete, and five large posters with distinct readable titles: \"THE NORTHERN COMET EXPRESS\", \"SLEEPER TO ISTANBUL\", \"MIDNIGHT PLATFORM 7\", \"COASTAL ROUTE REOPENING SOON\", and \"KEEP YOUR TICKET VISIBLE\". Cinematic composition, wet surfaces, layered typography, realistic grime, strong perspective down the tracks.",
131
+ "base": {
132
+ "id": "P05",
133
+ "title": "Lost Railway Poster Wall",
134
+ "seed": 105,
135
+ "prompt": "An abandoned underground railway platform turned into an accidental archive of travel posters, peeling ceramic tiles, puddles reflecting amber emergency lights, old suitcases, vines growing through cracked concrete, and five large posters with distinct readable titles: \"THE NORTHERN COMET EXPRESS\", \"SLEEPER TO ISTANBUL\", \"MIDNIGHT PLATFORM 7\", \"COASTAL ROUTE REOPENING SOON\", and \"KEEP YOUR TICKET VISIBLE\". Cinematic composition, wet surfaces, layered typography, realistic grime, strong perspective down the tracks.",
136
+ "image": "assets/comparison/p05_original.png",
137
+ "time_s": 1.185,
138
+ "peak_allocated_gb": 23.242,
139
+ "peak_reserved_gb": 25.438,
140
+ "end_allocated_gb": 20.841,
141
+ "end_reserved_gb": 25.438
142
+ },
143
+ "quant": {
144
+ "id": "P05",
145
+ "title": "Lost Railway Poster Wall",
146
+ "seed": 105,
147
+ "prompt": "An abandoned underground railway platform turned into an accidental archive of travel posters, peeling ceramic tiles, puddles reflecting amber emergency lights, old suitcases, vines growing through cracked concrete, and five large posters with distinct readable titles: \"THE NORTHERN COMET EXPRESS\", \"SLEEPER TO ISTANBUL\", \"MIDNIGHT PLATFORM 7\", \"COASTAL ROUTE REOPENING SOON\", and \"KEEP YOUR TICKET VISIBLE\". Cinematic composition, wet surfaces, layered typography, realistic grime, strong perspective down the tracks.",
148
+ "image": "assets/comparison/p05_sdnq_uint_static.png",
149
+ "time_s": 2.877,
150
+ "peak_allocated_gb": 17.684,
151
+ "peak_reserved_gb": 19.725,
152
+ "end_allocated_gb": 15.283,
153
+ "end_reserved_gb": 19.725
154
+ },
155
+ "speed_delta_pct": 142.8
156
+ },
157
+ {
158
+ "id": "P06",
159
+ "title": "Miniature Courtroom Diorama",
160
+ "seed": 106,
161
+ "prompt": "A hyperreal macro photograph of a miniature courtroom diorama built inside an antique wooden drawer, with tiny judge bench, brass lamps, dust motes, paper exhibits smaller than postage stamps, a mouse-sized witness chair, and readable text on tiny documents: a case file labeled \"CASE 1842-B: THE MISSING ORRERY\", an evidence tag saying \"EXHIBIT C\", a court calendar reading \"HEARING AT 9:30\", and a placard on the judge bench saying \"TRUTH IN SMALL THINGS\". Macro lens, tactile materials, careful scale cues.",
162
+ "base": {
163
+ "id": "P06",
164
+ "title": "Miniature Courtroom Diorama",
165
+ "seed": 106,
166
+ "prompt": "A hyperreal macro photograph of a miniature courtroom diorama built inside an antique wooden drawer, with tiny judge bench, brass lamps, dust motes, paper exhibits smaller than postage stamps, a mouse-sized witness chair, and readable text on tiny documents: a case file labeled \"CASE 1842-B: THE MISSING ORRERY\", an evidence tag saying \"EXHIBIT C\", a court calendar reading \"HEARING AT 9:30\", and a placard on the judge bench saying \"TRUTH IN SMALL THINGS\". Macro lens, tactile materials, careful scale cues.",
167
+ "image": "assets/comparison/p06_original.png",
168
+ "time_s": 1.186,
169
+ "peak_allocated_gb": 23.244,
170
+ "peak_reserved_gb": 25.438,
171
+ "end_allocated_gb": 20.841,
172
+ "end_reserved_gb": 25.438
173
+ },
174
+ "quant": {
175
+ "id": "P06",
176
+ "title": "Miniature Courtroom Diorama",
177
+ "seed": 106,
178
+ "prompt": "A hyperreal macro photograph of a miniature courtroom diorama built inside an antique wooden drawer, with tiny judge bench, brass lamps, dust motes, paper exhibits smaller than postage stamps, a mouse-sized witness chair, and readable text on tiny documents: a case file labeled \"CASE 1842-B: THE MISSING ORRERY\", an evidence tag saying \"EXHIBIT C\", a court calendar reading \"HEARING AT 9:30\", and a placard on the judge bench saying \"TRUTH IN SMALL THINGS\". Macro lens, tactile materials, careful scale cues.",
179
+ "image": "assets/comparison/p06_sdnq_uint_static.png",
180
+ "time_s": 2.836,
181
+ "peak_allocated_gb": 17.686,
182
+ "peak_reserved_gb": 19.744,
183
+ "end_allocated_gb": 15.283,
184
+ "end_reserved_gb": 19.744
185
+ },
186
+ "speed_delta_pct": 139.1
187
+ },
188
+ {
189
+ "id": "P07",
190
+ "title": "Rainy Seoul Book Cafe",
191
+ "seed": 107,
192
+ "prompt": "A cozy but complex rainy evening scene in a narrow Seoul book cafe, viewed through a window covered in raindrops, shelves packed with art books, two students annotating a map, a barista steaming milk, warm tungsten light, street reflections, and multiple readable English text elements: a chalkboard says \"TONIGHT: QUIET READING CLUB\", a receipt says \"OAT LATTE / CINNAMON BUN\", a book spine says \"ARCHITECTURE OF DREAMS\", and a window sticker says \"OPEN UNTIL THE LAST TRAIN\". Photorealistic, cinematic, intricate reflections.",
193
+ "base": {
194
+ "id": "P07",
195
+ "title": "Rainy Seoul Book Cafe",
196
+ "seed": 107,
197
+ "prompt": "A cozy but complex rainy evening scene in a narrow Seoul book cafe, viewed through a window covered in raindrops, shelves packed with art books, two students annotating a map, a barista steaming milk, warm tungsten light, street reflections, and multiple readable English text elements: a chalkboard says \"TONIGHT: QUIET READING CLUB\", a receipt says \"OAT LATTE / CINNAMON BUN\", a book spine says \"ARCHITECTURE OF DREAMS\", and a window sticker says \"OPEN UNTIL THE LAST TRAIN\". Photorealistic, cinematic, intricate reflections.",
198
+ "image": "assets/comparison/p07_original.png",
199
+ "time_s": 1.243,
200
+ "peak_allocated_gb": 23.244,
201
+ "peak_reserved_gb": 25.438,
202
+ "end_allocated_gb": 20.841,
203
+ "end_reserved_gb": 25.438
204
+ },
205
+ "quant": {
206
+ "id": "P07",
207
+ "title": "Rainy Seoul Book Cafe",
208
+ "seed": 107,
209
+ "prompt": "A cozy but complex rainy evening scene in a narrow Seoul book cafe, viewed through a window covered in raindrops, shelves packed with art books, two students annotating a map, a barista steaming milk, warm tungsten light, street reflections, and multiple readable English text elements: a chalkboard says \"TONIGHT: QUIET READING CLUB\", a receipt says \"OAT LATTE / CINNAMON BUN\", a book spine says \"ARCHITECTURE OF DREAMS\", and a window sticker says \"OPEN UNTIL THE LAST TRAIN\". Photorealistic, cinematic, intricate reflections.",
210
+ "image": "assets/comparison/p07_sdnq_uint_static.png",
211
+ "time_s": 2.835,
212
+ "peak_allocated_gb": 17.686,
213
+ "peak_reserved_gb": 19.744,
214
+ "end_allocated_gb": 15.283,
215
+ "end_reserved_gb": 19.744
216
+ },
217
+ "speed_delta_pct": 128.1
218
+ },
219
+ {
220
+ "id": "P08",
221
+ "title": "Oceanographic Expedition Map",
222
+ "seed": 108,
223
+ "prompt": "A dramatic captain's table aboard a storm-tossed oceanographic research vessel, with a wet nautical chart, brass dividers, sonar printouts, bioluminescent plankton glowing in a glass jar, a cracked tablet, and readable labels distributed across the image: \"TRENCH SURVEY LINE B\", \"DEPTH 10,928m\", \"ROV SIGNAL WEAK\", \"SAMPLE: BLUE VENT WATER\", and a torn note saying \"If the lights pulse twice, turn back\". High detail, realistic water droplets, dark blue-green atmosphere, sharp text.",
224
+ "base": {
225
+ "id": "P08",
226
+ "title": "Oceanographic Expedition Map",
227
+ "seed": 108,
228
+ "prompt": "A dramatic captain's table aboard a storm-tossed oceanographic research vessel, with a wet nautical chart, brass dividers, sonar printouts, bioluminescent plankton glowing in a glass jar, a cracked tablet, and readable labels distributed across the image: \"TRENCH SURVEY LINE B\", \"DEPTH 10,928m\", \"ROV SIGNAL WEAK\", \"SAMPLE: BLUE VENT WATER\", and a torn note saying \"If the lights pulse twice, turn back\". High detail, realistic water droplets, dark blue-green atmosphere, sharp text.",
229
+ "image": "assets/comparison/p08_original.png",
230
+ "time_s": 1.181,
231
+ "peak_allocated_gb": 23.244,
232
+ "peak_reserved_gb": 25.438,
233
+ "end_allocated_gb": 20.841,
234
+ "end_reserved_gb": 25.438
235
+ },
236
+ "quant": {
237
+ "id": "P08",
238
+ "title": "Oceanographic Expedition Map",
239
+ "seed": 108,
240
+ "prompt": "A dramatic captain's table aboard a storm-tossed oceanographic research vessel, with a wet nautical chart, brass dividers, sonar printouts, bioluminescent plankton glowing in a glass jar, a cracked tablet, and readable labels distributed across the image: \"TRENCH SURVEY LINE B\", \"DEPTH 10,928m\", \"ROV SIGNAL WEAK\", \"SAMPLE: BLUE VENT WATER\", and a torn note saying \"If the lights pulse twice, turn back\". High detail, realistic water droplets, dark blue-green atmosphere, sharp text.",
241
+ "image": "assets/comparison/p08_sdnq_uint_static.png",
242
+ "time_s": 2.847,
243
+ "peak_allocated_gb": 17.686,
244
+ "peak_reserved_gb": 19.744,
245
+ "end_allocated_gb": 15.283,
246
+ "end_reserved_gb": 19.744
247
+ },
248
+ "speed_delta_pct": 141.1
249
+ },
250
+ {
251
+ "id": "P09",
252
+ "title": "Renaissance Lab Notebook",
253
+ "seed": 109,
254
+ "prompt": "An alternate-history Renaissance laboratory where an astronomer-painter is combining oil pigments with early electrical apparatus, with celestial globes, copper coils, stained glass sunlight, anatomical sketches, a half-finished portrait, and Latin-English notebook text visible on several pages: \"LIGHT STUDY: BLUE VERDITER\", \"GALVANIC TEST NO. 8\", \"VENUS RISES BEFORE DAWN\", and a folded letter sealed in wax reading \"FOR THE WORKSHOP MASTER ONLY\". Painterly realism, ornate detail, coherent objects, readable calligraphy.",
255
+ "base": {
256
+ "id": "P09",
257
+ "title": "Renaissance Lab Notebook",
258
+ "seed": 109,
259
+ "prompt": "An alternate-history Renaissance laboratory where an astronomer-painter is combining oil pigments with early electrical apparatus, with celestial globes, copper coils, stained glass sunlight, anatomical sketches, a half-finished portrait, and Latin-English notebook text visible on several pages: \"LIGHT STUDY: BLUE VERDITER\", \"GALVANIC TEST NO. 8\", \"VENUS RISES BEFORE DAWN\", and a folded letter sealed in wax reading \"FOR THE WORKSHOP MASTER ONLY\". Painterly realism, ornate detail, coherent objects, readable calligraphy.",
260
+ "image": "assets/comparison/p09_original.png",
261
+ "time_s": 1.18,
262
+ "peak_allocated_gb": 23.242,
263
+ "peak_reserved_gb": 25.438,
264
+ "end_allocated_gb": 20.841,
265
+ "end_reserved_gb": 25.438
266
+ },
267
+ "quant": {
268
+ "id": "P09",
269
+ "title": "Renaissance Lab Notebook",
270
+ "seed": 109,
271
+ "prompt": "An alternate-history Renaissance laboratory where an astronomer-painter is combining oil pigments with early electrical apparatus, with celestial globes, copper coils, stained glass sunlight, anatomical sketches, a half-finished portrait, and Latin-English notebook text visible on several pages: \"LIGHT STUDY: BLUE VERDITER\", \"GALVANIC TEST NO. 8\", \"VENUS RISES BEFORE DAWN\", and a folded letter sealed in wax reading \"FOR THE WORKSHOP MASTER ONLY\". Painterly realism, ornate detail, coherent objects, readable calligraphy.",
272
+ "image": "assets/comparison/p09_sdnq_uint_static.png",
273
+ "time_s": 2.855,
274
+ "peak_allocated_gb": 17.684,
275
+ "peak_reserved_gb": 19.719,
276
+ "end_allocated_gb": 15.283,
277
+ "end_reserved_gb": 19.719
278
+ },
279
+ "speed_delta_pct": 141.9
280
+ },
281
+ {
282
+ "id": "P10",
283
+ "title": "Russian Provincial Print Shop",
284
+ "seed": 110,
285
+ "prompt": "Сложная фотореалистичная сцена в старой провинциальной типографии поздним зимним вечером: за большим деревянным столом лежат металлические литеры, корректурные листы, линейки, чашка крепкого чая, заснеженное окно, тусклая лампа и следы типографской краски на пальцах наборщика. На разных элементах изображения должен быть длинный и хорошо читаемый русский текст: на вывеске над дверью написано \"ТИПОГРАФИЯ СЕВЕРНЫЙ ЛИСТОК\", на корректуре заголовок \"СРОЧНО В НОМЕР: ГОРОДСКОЙ СОВЕТ ОТКРЫВАЕТ НОВУЮ БИБЛИОТЕКУ\", на маленькой записке фраза \"Проверить букву Ё во втором абзаце\", а на календаре дата \"Пятница, 24 января\". Много бытовых деталей, глубокие тени, реалистичная кириллица, никакой размытой каши вместо текста.",
286
+ "base": {
287
+ "id": "P10",
288
+ "title": "Russian Provincial Print Shop",
289
+ "seed": 110,
290
+ "prompt": "Сложная фотореалистичная сцена в старой провинциальной типографии поздним зимним вечером: за большим деревянным столом лежат металлические литеры, корректурные листы, линейки, чашка крепкого чая, заснеженное окно, тусклая лампа и следы типографской краски на пальцах наборщика. На разных элементах изображения должен быть длинный и хорошо читаемый русский текст: на вывеске над дверью написано \"ТИПОГРАФИЯ СЕВЕРНЫЙ ЛИСТОК\", на корректуре заголовок \"СРОЧНО В НОМЕР: ГОРОДСКОЙ СОВЕТ ОТКРЫВАЕТ НОВУЮ БИБЛИОТЕКУ\", на маленькой записке фраза \"Проверить букву Ё во втором абзаце\", а на календаре дата \"Пятница, 24 января\". Много бытовых деталей, глубокие тени, реалистичная кириллица, никакой размытой каши вместо текста.",
291
+ "image": "assets/comparison/p10_original.png",
292
+ "time_s": 3.749,
293
+ "peak_allocated_gb": 23.252,
294
+ "peak_reserved_gb": 25.459,
295
+ "end_allocated_gb": 20.841,
296
+ "end_reserved_gb": 25.459
297
+ },
298
+ "quant": {
299
+ "id": "P10",
300
+ "title": "Russian Provincial Print Shop",
301
+ "seed": 110,
302
+ "prompt": "Сложная фотореалистичная сцена в старой провинциальной типографии поздним зимним вечером: за большим деревянным столом лежат металлические литеры, корректурные листы, линейки, чашка крепкого чая, заснеженное окно, тусклая лампа и следы типографской краски на пальцах наборщика. На разных элементах изображения должен быть длинный и хорошо читаемый русский текст: на вывеске над дверью написано \"ТИПОГРАФИЯ СЕВЕРНЫЙ ЛИСТОК\", на корректуре заголовок \"СРОЧНО В НОМЕР: ГОРОДСКОЙ СОВЕТ ОТКРЫВАЕТ НОВУЮ БИБЛИОТЕКУ\", на маленькой записке фраза \"Проверить букву Ё во втором абзаце\", а на календаре дата \"Пятница, 24 января\". Много бытовых деталей, глубокие тени, реалистичная кириллица, никакой размытой каши вместо текста.",
303
+ "image": "assets/comparison/p10_sdnq_uint_static.png",
304
+ "time_s": 2.888,
305
+ "peak_allocated_gb": 17.695,
306
+ "peak_reserved_gb": 19.766,
307
+ "end_allocated_gb": 15.283,
308
+ "end_reserved_gb": 19.766
309
+ },
310
+ "speed_delta_pct": -23.0
311
+ }
312
+ ]
model_index.json ADDED
@@ -0,0 +1,25 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_class_name": "LensPipeline",
3
+ "_diffusers_version": "0.38.0",
4
+ "_name_or_path": "microsoft/Lens-Turbo",
5
+ "scheduler": [
6
+ "diffusers",
7
+ "FlowMatchEulerDiscreteScheduler"
8
+ ],
9
+ "text_encoder": [
10
+ "transformers",
11
+ "LensGptOssEncoder"
12
+ ],
13
+ "tokenizer": [
14
+ "transformers",
15
+ "PreTrainedTokenizerFast"
16
+ ],
17
+ "transformer": [
18
+ "diffusers",
19
+ "LensTransformer2DModel"
20
+ ],
21
+ "vae": [
22
+ "diffusers",
23
+ "AutoencoderKLFlux2"
24
+ ]
25
+ }
scheduler/scheduler_config.json ADDED
@@ -0,0 +1,18 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_class_name": "FlowMatchEulerDiscreteScheduler",
3
+ "_diffusers_version": "0.38.0",
4
+ "base_image_seq_len": 256,
5
+ "base_shift": 0.5,
6
+ "invert_sigmas": false,
7
+ "max_image_seq_len": 4096,
8
+ "max_shift": 1.15,
9
+ "num_train_timesteps": 1000,
10
+ "shift": 3.0,
11
+ "shift_terminal": null,
12
+ "stochastic_sampling": false,
13
+ "time_shift_type": "exponential",
14
+ "use_beta_sigmas": false,
15
+ "use_dynamic_shifting": true,
16
+ "use_exponential_sigmas": false,
17
+ "use_karras_sigmas": false
18
+ }
sdnq_quantization_summary.json ADDED
@@ -0,0 +1,22 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "source_model": "microsoft/Lens-Turbo",
3
+ "method": "SDNQ Uint Static",
4
+ "scope": "transformer only",
5
+ "text_encoder": "kept as provided by source checkpoint (GPT-OSS / MXFP4 path)",
6
+ "vae": "kept in bfloat16",
7
+ "config": {
8
+ "weights_dtype": "uint4",
9
+ "quantized_matmul_dtype": "int8",
10
+ "group_size": "0",
11
+ "use_static_quantization": "True",
12
+ "use_dynamic_quantization": "False",
13
+ "use_quantized_matmul": "True",
14
+ "use_svd": "False",
15
+ "use_hadamard": "False",
16
+ "quant_conv": "False",
17
+ "quant_embedding": "False",
18
+ "dequantize_fp32": "False",
19
+ "quantization_device": "cuda",
20
+ "return_device": "cuda"
21
+ }
22
+ }
text_encoder/config.json ADDED
@@ -0,0 +1,78 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "architectures": [
3
+ "LensGptOssEncoder"
4
+ ],
5
+ "attention_bias": true,
6
+ "attention_dropout": 0.0,
7
+ "bos_token_id": null,
8
+ "dtype": "bfloat16",
9
+ "eos_token_id": 200002,
10
+ "experts_per_token": 4,
11
+ "head_dim": 64,
12
+ "hidden_act": "silu",
13
+ "hidden_size": 2880,
14
+ "initial_context_length": 4096,
15
+ "initializer_range": 0.02,
16
+ "intermediate_size": 2880,
17
+ "layer_types": [
18
+ "sliding_attention",
19
+ "full_attention",
20
+ "sliding_attention",
21
+ "full_attention",
22
+ "sliding_attention",
23
+ "full_attention",
24
+ "sliding_attention",
25
+ "full_attention",
26
+ "sliding_attention",
27
+ "full_attention",
28
+ "sliding_attention",
29
+ "full_attention",
30
+ "sliding_attention",
31
+ "full_attention",
32
+ "sliding_attention",
33
+ "full_attention",
34
+ "sliding_attention",
35
+ "full_attention",
36
+ "sliding_attention",
37
+ "full_attention",
38
+ "sliding_attention",
39
+ "full_attention",
40
+ "sliding_attention",
41
+ "full_attention"
42
+ ],
43
+ "max_position_embeddings": 131072,
44
+ "model_type": "gpt_oss",
45
+ "num_attention_heads": 64,
46
+ "num_experts_per_tok": 4,
47
+ "num_hidden_layers": 24,
48
+ "num_key_value_heads": 8,
49
+ "num_local_experts": 32,
50
+ "output_router_logits": false,
51
+ "pad_token_id": 199999,
52
+ "quantization_config": {
53
+ "modules_to_not_convert": [
54
+ "model.layers.*.self_attn",
55
+ "model.layers.*.mlp.router",
56
+ "model.embed_tokens",
57
+ "lm_head"
58
+ ],
59
+ "quant_method": "mxfp4"
60
+ },
61
+ "rms_norm_eps": 1e-05,
62
+ "rope_parameters": {
63
+ "beta_fast": 32.0,
64
+ "beta_slow": 1.0,
65
+ "factor": 32.0,
66
+ "original_max_position_embeddings": 4096,
67
+ "rope_theta": 150000,
68
+ "rope_type": "yarn",
69
+ "truncate": false
70
+ },
71
+ "router_aux_loss_coef": 0.9,
72
+ "sliding_window": 128,
73
+ "swiglu_limit": 7.0,
74
+ "tie_word_embeddings": false,
75
+ "transformers_version": "5.8.0",
76
+ "use_cache": true,
77
+ "vocab_size": 201088
78
+ }
text_encoder/generation_config.json ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ {
2
+ "_from_model_config": true,
3
+ "eos_token_id": 200002,
4
+ "pad_token_id": 199999,
5
+ "transformers_version": "5.8.0",
6
+ "use_cache": true
7
+ }
text_encoder/model-00001-of-00004.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:417c7e4acfe883a1b65991f8be06f1bcbc09cf8b4d86c92330a0ad6b58b75029
3
+ size 3890907096
text_encoder/model-00002-of-00004.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c13b97cbe252920b15f21d3aa400ae35fb32775081d69b8d3bccc8f71eaf00e6
3
+ size 3819349232
text_encoder/model-00003-of-00004.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0be677cf3d3500be5e93e4e66f331c827dc6a36db407f75a1ae569b75da6a646
3
+ size 3819349368
text_encoder/model-00004-of-00004.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:48bbcc91f726dc52c0577b773a00222ed89c17a8c947b20570c514fa4b93f1a5
3
+ size 2244982120
text_encoder/model.safetensors.index.json ADDED
@@ -0,0 +1,467 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "metadata": {
3
+ "total_parameters": 1804459584,
4
+ "total_size": 13774535808
5
+ },
6
+ "weight_map": {
7
+ "lm_head.weight": "model-00001-of-00004.safetensors",
8
+ "model.embed_tokens.weight": "model-00001-of-00004.safetensors",
9
+ "model.layers.0.input_layernorm.weight": "model-00001-of-00004.safetensors",
10
+ "model.layers.0.mlp.experts.down_proj_bias": "model-00001-of-00004.safetensors",
11
+ "model.layers.0.mlp.experts.down_proj_blocks": "model-00001-of-00004.safetensors",
12
+ "model.layers.0.mlp.experts.down_proj_scales": "model-00001-of-00004.safetensors",
13
+ "model.layers.0.mlp.experts.gate_up_proj_bias": "model-00001-of-00004.safetensors",
14
+ "model.layers.0.mlp.experts.gate_up_proj_blocks": "model-00001-of-00004.safetensors",
15
+ "model.layers.0.mlp.experts.gate_up_proj_scales": "model-00001-of-00004.safetensors",
16
+ "model.layers.0.mlp.router.bias": "model-00001-of-00004.safetensors",
17
+ "model.layers.0.mlp.router.weight": "model-00001-of-00004.safetensors",
18
+ "model.layers.0.post_attention_layernorm.weight": "model-00001-of-00004.safetensors",
19
+ "model.layers.0.self_attn.k_proj.bias": "model-00001-of-00004.safetensors",
20
+ "model.layers.0.self_attn.k_proj.weight": "model-00001-of-00004.safetensors",
21
+ "model.layers.0.self_attn.o_proj.bias": "model-00001-of-00004.safetensors",
22
+ "model.layers.0.self_attn.o_proj.weight": "model-00001-of-00004.safetensors",
23
+ "model.layers.0.self_attn.q_proj.bias": "model-00001-of-00004.safetensors",
24
+ "model.layers.0.self_attn.q_proj.weight": "model-00001-of-00004.safetensors",
25
+ "model.layers.0.self_attn.sinks": "model-00001-of-00004.safetensors",
26
+ "model.layers.0.self_attn.v_proj.bias": "model-00001-of-00004.safetensors",
27
+ "model.layers.0.self_attn.v_proj.weight": "model-00001-of-00004.safetensors",
28
+ "model.layers.1.input_layernorm.weight": "model-00001-of-00004.safetensors",
29
+ "model.layers.1.mlp.experts.down_proj_bias": "model-00001-of-00004.safetensors",
30
+ "model.layers.1.mlp.experts.down_proj_blocks": "model-00001-of-00004.safetensors",
31
+ "model.layers.1.mlp.experts.down_proj_scales": "model-00001-of-00004.safetensors",
32
+ "model.layers.1.mlp.experts.gate_up_proj_bias": "model-00001-of-00004.safetensors",
33
+ "model.layers.1.mlp.experts.gate_up_proj_blocks": "model-00001-of-00004.safetensors",
34
+ "model.layers.1.mlp.experts.gate_up_proj_scales": "model-00001-of-00004.safetensors",
35
+ "model.layers.1.mlp.router.bias": "model-00001-of-00004.safetensors",
36
+ "model.layers.1.mlp.router.weight": "model-00001-of-00004.safetensors",
37
+ "model.layers.1.post_attention_layernorm.weight": "model-00001-of-00004.safetensors",
38
+ "model.layers.1.self_attn.k_proj.bias": "model-00001-of-00004.safetensors",
39
+ "model.layers.1.self_attn.k_proj.weight": "model-00001-of-00004.safetensors",
40
+ "model.layers.1.self_attn.o_proj.bias": "model-00001-of-00004.safetensors",
41
+ "model.layers.1.self_attn.o_proj.weight": "model-00001-of-00004.safetensors",
42
+ "model.layers.1.self_attn.q_proj.bias": "model-00001-of-00004.safetensors",
43
+ "model.layers.1.self_attn.q_proj.weight": "model-00001-of-00004.safetensors",
44
+ "model.layers.1.self_attn.sinks": "model-00001-of-00004.safetensors",
45
+ "model.layers.1.self_attn.v_proj.bias": "model-00001-of-00004.safetensors",
46
+ "model.layers.1.self_attn.v_proj.weight": "model-00001-of-00004.safetensors",
47
+ "model.layers.10.input_layernorm.weight": "model-00002-of-00004.safetensors",
48
+ "model.layers.10.mlp.experts.down_proj_bias": "model-00002-of-00004.safetensors",
49
+ "model.layers.10.mlp.experts.down_proj_blocks": "model-00002-of-00004.safetensors",
50
+ "model.layers.10.mlp.experts.down_proj_scales": "model-00002-of-00004.safetensors",
51
+ "model.layers.10.mlp.experts.gate_up_proj_bias": "model-00002-of-00004.safetensors",
52
+ "model.layers.10.mlp.experts.gate_up_proj_blocks": "model-00002-of-00004.safetensors",
53
+ "model.layers.10.mlp.experts.gate_up_proj_scales": "model-00002-of-00004.safetensors",
54
+ "model.layers.10.mlp.router.bias": "model-00002-of-00004.safetensors",
55
+ "model.layers.10.mlp.router.weight": "model-00002-of-00004.safetensors",
56
+ "model.layers.10.post_attention_layernorm.weight": "model-00002-of-00004.safetensors",
57
+ "model.layers.10.self_attn.k_proj.bias": "model-00002-of-00004.safetensors",
58
+ "model.layers.10.self_attn.k_proj.weight": "model-00002-of-00004.safetensors",
59
+ "model.layers.10.self_attn.o_proj.bias": "model-00002-of-00004.safetensors",
60
+ "model.layers.10.self_attn.o_proj.weight": "model-00002-of-00004.safetensors",
61
+ "model.layers.10.self_attn.q_proj.bias": "model-00002-of-00004.safetensors",
62
+ "model.layers.10.self_attn.q_proj.weight": "model-00002-of-00004.safetensors",
63
+ "model.layers.10.self_attn.sinks": "model-00002-of-00004.safetensors",
64
+ "model.layers.10.self_attn.v_proj.bias": "model-00002-of-00004.safetensors",
65
+ "model.layers.10.self_attn.v_proj.weight": "model-00002-of-00004.safetensors",
66
+ "model.layers.11.input_layernorm.weight": "model-00002-of-00004.safetensors",
67
+ "model.layers.11.mlp.experts.down_proj_bias": "model-00002-of-00004.safetensors",
68
+ "model.layers.11.mlp.experts.down_proj_blocks": "model-00002-of-00004.safetensors",
69
+ "model.layers.11.mlp.experts.down_proj_scales": "model-00002-of-00004.safetensors",
70
+ "model.layers.11.mlp.experts.gate_up_proj_bias": "model-00002-of-00004.safetensors",
71
+ "model.layers.11.mlp.experts.gate_up_proj_blocks": "model-00003-of-00004.safetensors",
72
+ "model.layers.11.mlp.experts.gate_up_proj_scales": "model-00003-of-00004.safetensors",
73
+ "model.layers.11.mlp.router.bias": "model-00003-of-00004.safetensors",
74
+ "model.layers.11.mlp.router.weight": "model-00003-of-00004.safetensors",
75
+ "model.layers.11.post_attention_layernorm.weight": "model-00003-of-00004.safetensors",
76
+ "model.layers.11.self_attn.k_proj.bias": "model-00003-of-00004.safetensors",
77
+ "model.layers.11.self_attn.k_proj.weight": "model-00003-of-00004.safetensors",
78
+ "model.layers.11.self_attn.o_proj.bias": "model-00003-of-00004.safetensors",
79
+ "model.layers.11.self_attn.o_proj.weight": "model-00003-of-00004.safetensors",
80
+ "model.layers.11.self_attn.q_proj.bias": "model-00003-of-00004.safetensors",
81
+ "model.layers.11.self_attn.q_proj.weight": "model-00003-of-00004.safetensors",
82
+ "model.layers.11.self_attn.sinks": "model-00003-of-00004.safetensors",
83
+ "model.layers.11.self_attn.v_proj.bias": "model-00003-of-00004.safetensors",
84
+ "model.layers.11.self_attn.v_proj.weight": "model-00003-of-00004.safetensors",
85
+ "model.layers.12.input_layernorm.weight": "model-00003-of-00004.safetensors",
86
+ "model.layers.12.mlp.experts.down_proj_bias": "model-00003-of-00004.safetensors",
87
+ "model.layers.12.mlp.experts.down_proj_blocks": "model-00003-of-00004.safetensors",
88
+ "model.layers.12.mlp.experts.down_proj_scales": "model-00003-of-00004.safetensors",
89
+ "model.layers.12.mlp.experts.gate_up_proj_bias": "model-00003-of-00004.safetensors",
90
+ "model.layers.12.mlp.experts.gate_up_proj_blocks": "model-00003-of-00004.safetensors",
91
+ "model.layers.12.mlp.experts.gate_up_proj_scales": "model-00003-of-00004.safetensors",
92
+ "model.layers.12.mlp.router.bias": "model-00003-of-00004.safetensors",
93
+ "model.layers.12.mlp.router.weight": "model-00003-of-00004.safetensors",
94
+ "model.layers.12.post_attention_layernorm.weight": "model-00003-of-00004.safetensors",
95
+ "model.layers.12.self_attn.k_proj.bias": "model-00003-of-00004.safetensors",
96
+ "model.layers.12.self_attn.k_proj.weight": "model-00003-of-00004.safetensors",
97
+ "model.layers.12.self_attn.o_proj.bias": "model-00003-of-00004.safetensors",
98
+ "model.layers.12.self_attn.o_proj.weight": "model-00003-of-00004.safetensors",
99
+ "model.layers.12.self_attn.q_proj.bias": "model-00003-of-00004.safetensors",
100
+ "model.layers.12.self_attn.q_proj.weight": "model-00003-of-00004.safetensors",
101
+ "model.layers.12.self_attn.sinks": "model-00003-of-00004.safetensors",
102
+ "model.layers.12.self_attn.v_proj.bias": "model-00003-of-00004.safetensors",
103
+ "model.layers.12.self_attn.v_proj.weight": "model-00003-of-00004.safetensors",
104
+ "model.layers.13.input_layernorm.weight": "model-00003-of-00004.safetensors",
105
+ "model.layers.13.mlp.experts.down_proj_bias": "model-00003-of-00004.safetensors",
106
+ "model.layers.13.mlp.experts.down_proj_blocks": "model-00003-of-00004.safetensors",
107
+ "model.layers.13.mlp.experts.down_proj_scales": "model-00003-of-00004.safetensors",
108
+ "model.layers.13.mlp.experts.gate_up_proj_bias": "model-00003-of-00004.safetensors",
109
+ "model.layers.13.mlp.experts.gate_up_proj_blocks": "model-00003-of-00004.safetensors",
110
+ "model.layers.13.mlp.experts.gate_up_proj_scales": "model-00003-of-00004.safetensors",
111
+ "model.layers.13.mlp.router.bias": "model-00003-of-00004.safetensors",
112
+ "model.layers.13.mlp.router.weight": "model-00003-of-00004.safetensors",
113
+ "model.layers.13.post_attention_layernorm.weight": "model-00003-of-00004.safetensors",
114
+ "model.layers.13.self_attn.k_proj.bias": "model-00003-of-00004.safetensors",
115
+ "model.layers.13.self_attn.k_proj.weight": "model-00003-of-00004.safetensors",
116
+ "model.layers.13.self_attn.o_proj.bias": "model-00003-of-00004.safetensors",
117
+ "model.layers.13.self_attn.o_proj.weight": "model-00003-of-00004.safetensors",
118
+ "model.layers.13.self_attn.q_proj.bias": "model-00003-of-00004.safetensors",
119
+ "model.layers.13.self_attn.q_proj.weight": "model-00003-of-00004.safetensors",
120
+ "model.layers.13.self_attn.sinks": "model-00003-of-00004.safetensors",
121
+ "model.layers.13.self_attn.v_proj.bias": "model-00003-of-00004.safetensors",
122
+ "model.layers.13.self_attn.v_proj.weight": "model-00003-of-00004.safetensors",
123
+ "model.layers.14.input_layernorm.weight": "model-00003-of-00004.safetensors",
124
+ "model.layers.14.mlp.experts.down_proj_bias": "model-00003-of-00004.safetensors",
125
+ "model.layers.14.mlp.experts.down_proj_blocks": "model-00003-of-00004.safetensors",
126
+ "model.layers.14.mlp.experts.down_proj_scales": "model-00003-of-00004.safetensors",
127
+ "model.layers.14.mlp.experts.gate_up_proj_bias": "model-00003-of-00004.safetensors",
128
+ "model.layers.14.mlp.experts.gate_up_proj_blocks": "model-00003-of-00004.safetensors",
129
+ "model.layers.14.mlp.experts.gate_up_proj_scales": "model-00003-of-00004.safetensors",
130
+ "model.layers.14.mlp.router.bias": "model-00003-of-00004.safetensors",
131
+ "model.layers.14.mlp.router.weight": "model-00003-of-00004.safetensors",
132
+ "model.layers.14.post_attention_layernorm.weight": "model-00003-of-00004.safetensors",
133
+ "model.layers.14.self_attn.k_proj.bias": "model-00003-of-00004.safetensors",
134
+ "model.layers.14.self_attn.k_proj.weight": "model-00003-of-00004.safetensors",
135
+ "model.layers.14.self_attn.o_proj.bias": "model-00003-of-00004.safetensors",
136
+ "model.layers.14.self_attn.o_proj.weight": "model-00003-of-00004.safetensors",
137
+ "model.layers.14.self_attn.q_proj.bias": "model-00003-of-00004.safetensors",
138
+ "model.layers.14.self_attn.q_proj.weight": "model-00003-of-00004.safetensors",
139
+ "model.layers.14.self_attn.sinks": "model-00003-of-00004.safetensors",
140
+ "model.layers.14.self_attn.v_proj.bias": "model-00003-of-00004.safetensors",
141
+ "model.layers.14.self_attn.v_proj.weight": "model-00003-of-00004.safetensors",
142
+ "model.layers.15.input_layernorm.weight": "model-00003-of-00004.safetensors",
143
+ "model.layers.15.mlp.experts.down_proj_bias": "model-00003-of-00004.safetensors",
144
+ "model.layers.15.mlp.experts.down_proj_blocks": "model-00003-of-00004.safetensors",
145
+ "model.layers.15.mlp.experts.down_proj_scales": "model-00003-of-00004.safetensors",
146
+ "model.layers.15.mlp.experts.gate_up_proj_bias": "model-00003-of-00004.safetensors",
147
+ "model.layers.15.mlp.experts.gate_up_proj_blocks": "model-00003-of-00004.safetensors",
148
+ "model.layers.15.mlp.experts.gate_up_proj_scales": "model-00003-of-00004.safetensors",
149
+ "model.layers.15.mlp.router.bias": "model-00003-of-00004.safetensors",
150
+ "model.layers.15.mlp.router.weight": "model-00003-of-00004.safetensors",
151
+ "model.layers.15.post_attention_layernorm.weight": "model-00003-of-00004.safetensors",
152
+ "model.layers.15.self_attn.k_proj.bias": "model-00003-of-00004.safetensors",
153
+ "model.layers.15.self_attn.k_proj.weight": "model-00003-of-00004.safetensors",
154
+ "model.layers.15.self_attn.o_proj.bias": "model-00003-of-00004.safetensors",
155
+ "model.layers.15.self_attn.o_proj.weight": "model-00003-of-00004.safetensors",
156
+ "model.layers.15.self_attn.q_proj.bias": "model-00003-of-00004.safetensors",
157
+ "model.layers.15.self_attn.q_proj.weight": "model-00003-of-00004.safetensors",
158
+ "model.layers.15.self_attn.sinks": "model-00003-of-00004.safetensors",
159
+ "model.layers.15.self_attn.v_proj.bias": "model-00003-of-00004.safetensors",
160
+ "model.layers.15.self_attn.v_proj.weight": "model-00003-of-00004.safetensors",
161
+ "model.layers.16.input_layernorm.weight": "model-00003-of-00004.safetensors",
162
+ "model.layers.16.mlp.experts.down_proj_bias": "model-00003-of-00004.safetensors",
163
+ "model.layers.16.mlp.experts.down_proj_blocks": "model-00003-of-00004.safetensors",
164
+ "model.layers.16.mlp.experts.down_proj_scales": "model-00003-of-00004.safetensors",
165
+ "model.layers.16.mlp.experts.gate_up_proj_bias": "model-00003-of-00004.safetensors",
166
+ "model.layers.16.mlp.experts.gate_up_proj_blocks": "model-00003-of-00004.safetensors",
167
+ "model.layers.16.mlp.experts.gate_up_proj_scales": "model-00003-of-00004.safetensors",
168
+ "model.layers.16.mlp.router.bias": "model-00003-of-00004.safetensors",
169
+ "model.layers.16.mlp.router.weight": "model-00003-of-00004.safetensors",
170
+ "model.layers.16.post_attention_layernorm.weight": "model-00003-of-00004.safetensors",
171
+ "model.layers.16.self_attn.k_proj.bias": "model-00003-of-00004.safetensors",
172
+ "model.layers.16.self_attn.k_proj.weight": "model-00003-of-00004.safetensors",
173
+ "model.layers.16.self_attn.o_proj.bias": "model-00003-of-00004.safetensors",
174
+ "model.layers.16.self_attn.o_proj.weight": "model-00003-of-00004.safetensors",
175
+ "model.layers.16.self_attn.q_proj.bias": "model-00003-of-00004.safetensors",
176
+ "model.layers.16.self_attn.q_proj.weight": "model-00003-of-00004.safetensors",
177
+ "model.layers.16.self_attn.sinks": "model-00003-of-00004.safetensors",
178
+ "model.layers.16.self_attn.v_proj.bias": "model-00003-of-00004.safetensors",
179
+ "model.layers.16.self_attn.v_proj.weight": "model-00003-of-00004.safetensors",
180
+ "model.layers.17.input_layernorm.weight": "model-00003-of-00004.safetensors",
181
+ "model.layers.17.mlp.experts.down_proj_bias": "model-00003-of-00004.safetensors",
182
+ "model.layers.17.mlp.experts.down_proj_blocks": "model-00003-of-00004.safetensors",
183
+ "model.layers.17.mlp.experts.down_proj_scales": "model-00003-of-00004.safetensors",
184
+ "model.layers.17.mlp.experts.gate_up_proj_bias": "model-00003-of-00004.safetensors",
185
+ "model.layers.17.mlp.experts.gate_up_proj_blocks": "model-00003-of-00004.safetensors",
186
+ "model.layers.17.mlp.experts.gate_up_proj_scales": "model-00003-of-00004.safetensors",
187
+ "model.layers.17.mlp.router.bias": "model-00003-of-00004.safetensors",
188
+ "model.layers.17.mlp.router.weight": "model-00003-of-00004.safetensors",
189
+ "model.layers.17.post_attention_layernorm.weight": "model-00003-of-00004.safetensors",
190
+ "model.layers.17.self_attn.k_proj.bias": "model-00003-of-00004.safetensors",
191
+ "model.layers.17.self_attn.k_proj.weight": "model-00003-of-00004.safetensors",
192
+ "model.layers.17.self_attn.o_proj.bias": "model-00003-of-00004.safetensors",
193
+ "model.layers.17.self_attn.o_proj.weight": "model-00003-of-00004.safetensors",
194
+ "model.layers.17.self_attn.q_proj.bias": "model-00003-of-00004.safetensors",
195
+ "model.layers.17.self_attn.q_proj.weight": "model-00003-of-00004.safetensors",
196
+ "model.layers.17.self_attn.sinks": "model-00003-of-00004.safetensors",
197
+ "model.layers.17.self_attn.v_proj.bias": "model-00003-of-00004.safetensors",
198
+ "model.layers.17.self_attn.v_proj.weight": "model-00003-of-00004.safetensors",
199
+ "model.layers.18.input_layernorm.weight": "model-00003-of-00004.safetensors",
200
+ "model.layers.18.mlp.experts.down_proj_bias": "model-00003-of-00004.safetensors",
201
+ "model.layers.18.mlp.experts.down_proj_blocks": "model-00003-of-00004.safetensors",
202
+ "model.layers.18.mlp.experts.down_proj_scales": "model-00003-of-00004.safetensors",
203
+ "model.layers.18.mlp.experts.gate_up_proj_bias": "model-00003-of-00004.safetensors",
204
+ "model.layers.18.mlp.experts.gate_up_proj_blocks": "model-00003-of-00004.safetensors",
205
+ "model.layers.18.mlp.experts.gate_up_proj_scales": "model-00003-of-00004.safetensors",
206
+ "model.layers.18.mlp.router.bias": "model-00003-of-00004.safetensors",
207
+ "model.layers.18.mlp.router.weight": "model-00003-of-00004.safetensors",
208
+ "model.layers.18.post_attention_layernorm.weight": "model-00003-of-00004.safetensors",
209
+ "model.layers.18.self_attn.k_proj.bias": "model-00003-of-00004.safetensors",
210
+ "model.layers.18.self_attn.k_proj.weight": "model-00003-of-00004.safetensors",
211
+ "model.layers.18.self_attn.o_proj.bias": "model-00003-of-00004.safetensors",
212
+ "model.layers.18.self_attn.o_proj.weight": "model-00003-of-00004.safetensors",
213
+ "model.layers.18.self_attn.q_proj.bias": "model-00003-of-00004.safetensors",
214
+ "model.layers.18.self_attn.q_proj.weight": "model-00003-of-00004.safetensors",
215
+ "model.layers.18.self_attn.sinks": "model-00003-of-00004.safetensors",
216
+ "model.layers.18.self_attn.v_proj.bias": "model-00003-of-00004.safetensors",
217
+ "model.layers.18.self_attn.v_proj.weight": "model-00003-of-00004.safetensors",
218
+ "model.layers.19.input_layernorm.weight": "model-00003-of-00004.safetensors",
219
+ "model.layers.19.mlp.experts.down_proj_bias": "model-00003-of-00004.safetensors",
220
+ "model.layers.19.mlp.experts.down_proj_blocks": "model-00003-of-00004.safetensors",
221
+ "model.layers.19.mlp.experts.down_proj_scales": "model-00003-of-00004.safetensors",
222
+ "model.layers.19.mlp.experts.gate_up_proj_bias": "model-00003-of-00004.safetensors",
223
+ "model.layers.19.mlp.experts.gate_up_proj_blocks": "model-00004-of-00004.safetensors",
224
+ "model.layers.19.mlp.experts.gate_up_proj_scales": "model-00004-of-00004.safetensors",
225
+ "model.layers.19.mlp.router.bias": "model-00004-of-00004.safetensors",
226
+ "model.layers.19.mlp.router.weight": "model-00004-of-00004.safetensors",
227
+ "model.layers.19.post_attention_layernorm.weight": "model-00004-of-00004.safetensors",
228
+ "model.layers.19.self_attn.k_proj.bias": "model-00004-of-00004.safetensors",
229
+ "model.layers.19.self_attn.k_proj.weight": "model-00004-of-00004.safetensors",
230
+ "model.layers.19.self_attn.o_proj.bias": "model-00004-of-00004.safetensors",
231
+ "model.layers.19.self_attn.o_proj.weight": "model-00004-of-00004.safetensors",
232
+ "model.layers.19.self_attn.q_proj.bias": "model-00004-of-00004.safetensors",
233
+ "model.layers.19.self_attn.q_proj.weight": "model-00004-of-00004.safetensors",
234
+ "model.layers.19.self_attn.sinks": "model-00004-of-00004.safetensors",
235
+ "model.layers.19.self_attn.v_proj.bias": "model-00004-of-00004.safetensors",
236
+ "model.layers.19.self_attn.v_proj.weight": "model-00004-of-00004.safetensors",
237
+ "model.layers.2.input_layernorm.weight": "model-00001-of-00004.safetensors",
238
+ "model.layers.2.mlp.experts.down_proj_bias": "model-00001-of-00004.safetensors",
239
+ "model.layers.2.mlp.experts.down_proj_blocks": "model-00001-of-00004.safetensors",
240
+ "model.layers.2.mlp.experts.down_proj_scales": "model-00001-of-00004.safetensors",
241
+ "model.layers.2.mlp.experts.gate_up_proj_bias": "model-00001-of-00004.safetensors",
242
+ "model.layers.2.mlp.experts.gate_up_proj_blocks": "model-00001-of-00004.safetensors",
243
+ "model.layers.2.mlp.experts.gate_up_proj_scales": "model-00001-of-00004.safetensors",
244
+ "model.layers.2.mlp.router.bias": "model-00001-of-00004.safetensors",
245
+ "model.layers.2.mlp.router.weight": "model-00001-of-00004.safetensors",
246
+ "model.layers.2.post_attention_layernorm.weight": "model-00001-of-00004.safetensors",
247
+ "model.layers.2.self_attn.k_proj.bias": "model-00001-of-00004.safetensors",
248
+ "model.layers.2.self_attn.k_proj.weight": "model-00001-of-00004.safetensors",
249
+ "model.layers.2.self_attn.o_proj.bias": "model-00001-of-00004.safetensors",
250
+ "model.layers.2.self_attn.o_proj.weight": "model-00001-of-00004.safetensors",
251
+ "model.layers.2.self_attn.q_proj.bias": "model-00001-of-00004.safetensors",
252
+ "model.layers.2.self_attn.q_proj.weight": "model-00001-of-00004.safetensors",
253
+ "model.layers.2.self_attn.sinks": "model-00001-of-00004.safetensors",
254
+ "model.layers.2.self_attn.v_proj.bias": "model-00001-of-00004.safetensors",
255
+ "model.layers.2.self_attn.v_proj.weight": "model-00001-of-00004.safetensors",
256
+ "model.layers.20.input_layernorm.weight": "model-00004-of-00004.safetensors",
257
+ "model.layers.20.mlp.experts.down_proj_bias": "model-00004-of-00004.safetensors",
258
+ "model.layers.20.mlp.experts.down_proj_blocks": "model-00004-of-00004.safetensors",
259
+ "model.layers.20.mlp.experts.down_proj_scales": "model-00004-of-00004.safetensors",
260
+ "model.layers.20.mlp.experts.gate_up_proj_bias": "model-00004-of-00004.safetensors",
261
+ "model.layers.20.mlp.experts.gate_up_proj_blocks": "model-00004-of-00004.safetensors",
262
+ "model.layers.20.mlp.experts.gate_up_proj_scales": "model-00004-of-00004.safetensors",
263
+ "model.layers.20.mlp.router.bias": "model-00004-of-00004.safetensors",
264
+ "model.layers.20.mlp.router.weight": "model-00004-of-00004.safetensors",
265
+ "model.layers.20.post_attention_layernorm.weight": "model-00004-of-00004.safetensors",
266
+ "model.layers.20.self_attn.k_proj.bias": "model-00004-of-00004.safetensors",
267
+ "model.layers.20.self_attn.k_proj.weight": "model-00004-of-00004.safetensors",
268
+ "model.layers.20.self_attn.o_proj.bias": "model-00004-of-00004.safetensors",
269
+ "model.layers.20.self_attn.o_proj.weight": "model-00004-of-00004.safetensors",
270
+ "model.layers.20.self_attn.q_proj.bias": "model-00004-of-00004.safetensors",
271
+ "model.layers.20.self_attn.q_proj.weight": "model-00004-of-00004.safetensors",
272
+ "model.layers.20.self_attn.sinks": "model-00004-of-00004.safetensors",
273
+ "model.layers.20.self_attn.v_proj.bias": "model-00004-of-00004.safetensors",
274
+ "model.layers.20.self_attn.v_proj.weight": "model-00004-of-00004.safetensors",
275
+ "model.layers.21.input_layernorm.weight": "model-00004-of-00004.safetensors",
276
+ "model.layers.21.mlp.experts.down_proj_bias": "model-00004-of-00004.safetensors",
277
+ "model.layers.21.mlp.experts.down_proj_blocks": "model-00004-of-00004.safetensors",
278
+ "model.layers.21.mlp.experts.down_proj_scales": "model-00004-of-00004.safetensors",
279
+ "model.layers.21.mlp.experts.gate_up_proj_bias": "model-00004-of-00004.safetensors",
280
+ "model.layers.21.mlp.experts.gate_up_proj_blocks": "model-00004-of-00004.safetensors",
281
+ "model.layers.21.mlp.experts.gate_up_proj_scales": "model-00004-of-00004.safetensors",
282
+ "model.layers.21.mlp.router.bias": "model-00004-of-00004.safetensors",
283
+ "model.layers.21.mlp.router.weight": "model-00004-of-00004.safetensors",
284
+ "model.layers.21.post_attention_layernorm.weight": "model-00004-of-00004.safetensors",
285
+ "model.layers.21.self_attn.k_proj.bias": "model-00004-of-00004.safetensors",
286
+ "model.layers.21.self_attn.k_proj.weight": "model-00004-of-00004.safetensors",
287
+ "model.layers.21.self_attn.o_proj.bias": "model-00004-of-00004.safetensors",
288
+ "model.layers.21.self_attn.o_proj.weight": "model-00004-of-00004.safetensors",
289
+ "model.layers.21.self_attn.q_proj.bias": "model-00004-of-00004.safetensors",
290
+ "model.layers.21.self_attn.q_proj.weight": "model-00004-of-00004.safetensors",
291
+ "model.layers.21.self_attn.sinks": "model-00004-of-00004.safetensors",
292
+ "model.layers.21.self_attn.v_proj.bias": "model-00004-of-00004.safetensors",
293
+ "model.layers.21.self_attn.v_proj.weight": "model-00004-of-00004.safetensors",
294
+ "model.layers.22.input_layernorm.weight": "model-00004-of-00004.safetensors",
295
+ "model.layers.22.mlp.experts.down_proj_bias": "model-00004-of-00004.safetensors",
296
+ "model.layers.22.mlp.experts.down_proj_blocks": "model-00004-of-00004.safetensors",
297
+ "model.layers.22.mlp.experts.down_proj_scales": "model-00004-of-00004.safetensors",
298
+ "model.layers.22.mlp.experts.gate_up_proj_bias": "model-00004-of-00004.safetensors",
299
+ "model.layers.22.mlp.experts.gate_up_proj_blocks": "model-00004-of-00004.safetensors",
300
+ "model.layers.22.mlp.experts.gate_up_proj_scales": "model-00004-of-00004.safetensors",
301
+ "model.layers.22.mlp.router.bias": "model-00004-of-00004.safetensors",
302
+ "model.layers.22.mlp.router.weight": "model-00004-of-00004.safetensors",
303
+ "model.layers.22.post_attention_layernorm.weight": "model-00004-of-00004.safetensors",
304
+ "model.layers.22.self_attn.k_proj.bias": "model-00004-of-00004.safetensors",
305
+ "model.layers.22.self_attn.k_proj.weight": "model-00004-of-00004.safetensors",
306
+ "model.layers.22.self_attn.o_proj.bias": "model-00004-of-00004.safetensors",
307
+ "model.layers.22.self_attn.o_proj.weight": "model-00004-of-00004.safetensors",
308
+ "model.layers.22.self_attn.q_proj.bias": "model-00004-of-00004.safetensors",
309
+ "model.layers.22.self_attn.q_proj.weight": "model-00004-of-00004.safetensors",
310
+ "model.layers.22.self_attn.sinks": "model-00004-of-00004.safetensors",
311
+ "model.layers.22.self_attn.v_proj.bias": "model-00004-of-00004.safetensors",
312
+ "model.layers.22.self_attn.v_proj.weight": "model-00004-of-00004.safetensors",
313
+ "model.layers.23.input_layernorm.weight": "model-00004-of-00004.safetensors",
314
+ "model.layers.23.mlp.experts.down_proj_bias": "model-00004-of-00004.safetensors",
315
+ "model.layers.23.mlp.experts.down_proj_blocks": "model-00004-of-00004.safetensors",
316
+ "model.layers.23.mlp.experts.down_proj_scales": "model-00004-of-00004.safetensors",
317
+ "model.layers.23.mlp.experts.gate_up_proj_bias": "model-00004-of-00004.safetensors",
318
+ "model.layers.23.mlp.experts.gate_up_proj_blocks": "model-00004-of-00004.safetensors",
319
+ "model.layers.23.mlp.experts.gate_up_proj_scales": "model-00004-of-00004.safetensors",
320
+ "model.layers.23.mlp.router.bias": "model-00004-of-00004.safetensors",
321
+ "model.layers.23.mlp.router.weight": "model-00004-of-00004.safetensors",
322
+ "model.layers.23.post_attention_layernorm.weight": "model-00004-of-00004.safetensors",
323
+ "model.layers.23.self_attn.k_proj.bias": "model-00004-of-00004.safetensors",
324
+ "model.layers.23.self_attn.k_proj.weight": "model-00004-of-00004.safetensors",
325
+ "model.layers.23.self_attn.o_proj.bias": "model-00004-of-00004.safetensors",
326
+ "model.layers.23.self_attn.o_proj.weight": "model-00004-of-00004.safetensors",
327
+ "model.layers.23.self_attn.q_proj.bias": "model-00004-of-00004.safetensors",
328
+ "model.layers.23.self_attn.q_proj.weight": "model-00004-of-00004.safetensors",
329
+ "model.layers.23.self_attn.sinks": "model-00004-of-00004.safetensors",
330
+ "model.layers.23.self_attn.v_proj.bias": "model-00004-of-00004.safetensors",
331
+ "model.layers.23.self_attn.v_proj.weight": "model-00004-of-00004.safetensors",
332
+ "model.layers.3.input_layernorm.weight": "model-00001-of-00004.safetensors",
333
+ "model.layers.3.mlp.experts.down_proj_bias": "model-00001-of-00004.safetensors",
334
+ "model.layers.3.mlp.experts.down_proj_blocks": "model-00001-of-00004.safetensors",
335
+ "model.layers.3.mlp.experts.down_proj_scales": "model-00001-of-00004.safetensors",
336
+ "model.layers.3.mlp.experts.gate_up_proj_bias": "model-00001-of-00004.safetensors",
337
+ "model.layers.3.mlp.experts.gate_up_proj_blocks": "model-00002-of-00004.safetensors",
338
+ "model.layers.3.mlp.experts.gate_up_proj_scales": "model-00002-of-00004.safetensors",
339
+ "model.layers.3.mlp.router.bias": "model-00002-of-00004.safetensors",
340
+ "model.layers.3.mlp.router.weight": "model-00002-of-00004.safetensors",
341
+ "model.layers.3.post_attention_layernorm.weight": "model-00002-of-00004.safetensors",
342
+ "model.layers.3.self_attn.k_proj.bias": "model-00002-of-00004.safetensors",
343
+ "model.layers.3.self_attn.k_proj.weight": "model-00002-of-00004.safetensors",
344
+ "model.layers.3.self_attn.o_proj.bias": "model-00002-of-00004.safetensors",
345
+ "model.layers.3.self_attn.o_proj.weight": "model-00002-of-00004.safetensors",
346
+ "model.layers.3.self_attn.q_proj.bias": "model-00002-of-00004.safetensors",
347
+ "model.layers.3.self_attn.q_proj.weight": "model-00002-of-00004.safetensors",
348
+ "model.layers.3.self_attn.sinks": "model-00002-of-00004.safetensors",
349
+ "model.layers.3.self_attn.v_proj.bias": "model-00002-of-00004.safetensors",
350
+ "model.layers.3.self_attn.v_proj.weight": "model-00002-of-00004.safetensors",
351
+ "model.layers.4.input_layernorm.weight": "model-00002-of-00004.safetensors",
352
+ "model.layers.4.mlp.experts.down_proj_bias": "model-00002-of-00004.safetensors",
353
+ "model.layers.4.mlp.experts.down_proj_blocks": "model-00002-of-00004.safetensors",
354
+ "model.layers.4.mlp.experts.down_proj_scales": "model-00002-of-00004.safetensors",
355
+ "model.layers.4.mlp.experts.gate_up_proj_bias": "model-00002-of-00004.safetensors",
356
+ "model.layers.4.mlp.experts.gate_up_proj_blocks": "model-00002-of-00004.safetensors",
357
+ "model.layers.4.mlp.experts.gate_up_proj_scales": "model-00002-of-00004.safetensors",
358
+ "model.layers.4.mlp.router.bias": "model-00002-of-00004.safetensors",
359
+ "model.layers.4.mlp.router.weight": "model-00002-of-00004.safetensors",
360
+ "model.layers.4.post_attention_layernorm.weight": "model-00002-of-00004.safetensors",
361
+ "model.layers.4.self_attn.k_proj.bias": "model-00002-of-00004.safetensors",
362
+ "model.layers.4.self_attn.k_proj.weight": "model-00002-of-00004.safetensors",
363
+ "model.layers.4.self_attn.o_proj.bias": "model-00002-of-00004.safetensors",
364
+ "model.layers.4.self_attn.o_proj.weight": "model-00002-of-00004.safetensors",
365
+ "model.layers.4.self_attn.q_proj.bias": "model-00002-of-00004.safetensors",
366
+ "model.layers.4.self_attn.q_proj.weight": "model-00002-of-00004.safetensors",
367
+ "model.layers.4.self_attn.sinks": "model-00002-of-00004.safetensors",
368
+ "model.layers.4.self_attn.v_proj.bias": "model-00002-of-00004.safetensors",
369
+ "model.layers.4.self_attn.v_proj.weight": "model-00002-of-00004.safetensors",
370
+ "model.layers.5.input_layernorm.weight": "model-00002-of-00004.safetensors",
371
+ "model.layers.5.mlp.experts.down_proj_bias": "model-00002-of-00004.safetensors",
372
+ "model.layers.5.mlp.experts.down_proj_blocks": "model-00002-of-00004.safetensors",
373
+ "model.layers.5.mlp.experts.down_proj_scales": "model-00002-of-00004.safetensors",
374
+ "model.layers.5.mlp.experts.gate_up_proj_bias": "model-00002-of-00004.safetensors",
375
+ "model.layers.5.mlp.experts.gate_up_proj_blocks": "model-00002-of-00004.safetensors",
376
+ "model.layers.5.mlp.experts.gate_up_proj_scales": "model-00002-of-00004.safetensors",
377
+ "model.layers.5.mlp.router.bias": "model-00002-of-00004.safetensors",
378
+ "model.layers.5.mlp.router.weight": "model-00002-of-00004.safetensors",
379
+ "model.layers.5.post_attention_layernorm.weight": "model-00002-of-00004.safetensors",
380
+ "model.layers.5.self_attn.k_proj.bias": "model-00002-of-00004.safetensors",
381
+ "model.layers.5.self_attn.k_proj.weight": "model-00002-of-00004.safetensors",
382
+ "model.layers.5.self_attn.o_proj.bias": "model-00002-of-00004.safetensors",
383
+ "model.layers.5.self_attn.o_proj.weight": "model-00002-of-00004.safetensors",
384
+ "model.layers.5.self_attn.q_proj.bias": "model-00002-of-00004.safetensors",
385
+ "model.layers.5.self_attn.q_proj.weight": "model-00002-of-00004.safetensors",
386
+ "model.layers.5.self_attn.sinks": "model-00002-of-00004.safetensors",
387
+ "model.layers.5.self_attn.v_proj.bias": "model-00002-of-00004.safetensors",
388
+ "model.layers.5.self_attn.v_proj.weight": "model-00002-of-00004.safetensors",
389
+ "model.layers.6.input_layernorm.weight": "model-00002-of-00004.safetensors",
390
+ "model.layers.6.mlp.experts.down_proj_bias": "model-00002-of-00004.safetensors",
391
+ "model.layers.6.mlp.experts.down_proj_blocks": "model-00002-of-00004.safetensors",
392
+ "model.layers.6.mlp.experts.down_proj_scales": "model-00002-of-00004.safetensors",
393
+ "model.layers.6.mlp.experts.gate_up_proj_bias": "model-00002-of-00004.safetensors",
394
+ "model.layers.6.mlp.experts.gate_up_proj_blocks": "model-00002-of-00004.safetensors",
395
+ "model.layers.6.mlp.experts.gate_up_proj_scales": "model-00002-of-00004.safetensors",
396
+ "model.layers.6.mlp.router.bias": "model-00002-of-00004.safetensors",
397
+ "model.layers.6.mlp.router.weight": "model-00002-of-00004.safetensors",
398
+ "model.layers.6.post_attention_layernorm.weight": "model-00002-of-00004.safetensors",
399
+ "model.layers.6.self_attn.k_proj.bias": "model-00002-of-00004.safetensors",
400
+ "model.layers.6.self_attn.k_proj.weight": "model-00002-of-00004.safetensors",
401
+ "model.layers.6.self_attn.o_proj.bias": "model-00002-of-00004.safetensors",
402
+ "model.layers.6.self_attn.o_proj.weight": "model-00002-of-00004.safetensors",
403
+ "model.layers.6.self_attn.q_proj.bias": "model-00002-of-00004.safetensors",
404
+ "model.layers.6.self_attn.q_proj.weight": "model-00002-of-00004.safetensors",
405
+ "model.layers.6.self_attn.sinks": "model-00002-of-00004.safetensors",
406
+ "model.layers.6.self_attn.v_proj.bias": "model-00002-of-00004.safetensors",
407
+ "model.layers.6.self_attn.v_proj.weight": "model-00002-of-00004.safetensors",
408
+ "model.layers.7.input_layernorm.weight": "model-00002-of-00004.safetensors",
409
+ "model.layers.7.mlp.experts.down_proj_bias": "model-00002-of-00004.safetensors",
410
+ "model.layers.7.mlp.experts.down_proj_blocks": "model-00002-of-00004.safetensors",
411
+ "model.layers.7.mlp.experts.down_proj_scales": "model-00002-of-00004.safetensors",
412
+ "model.layers.7.mlp.experts.gate_up_proj_bias": "model-00002-of-00004.safetensors",
413
+ "model.layers.7.mlp.experts.gate_up_proj_blocks": "model-00002-of-00004.safetensors",
414
+ "model.layers.7.mlp.experts.gate_up_proj_scales": "model-00002-of-00004.safetensors",
415
+ "model.layers.7.mlp.router.bias": "model-00002-of-00004.safetensors",
416
+ "model.layers.7.mlp.router.weight": "model-00002-of-00004.safetensors",
417
+ "model.layers.7.post_attention_layernorm.weight": "model-00002-of-00004.safetensors",
418
+ "model.layers.7.self_attn.k_proj.bias": "model-00002-of-00004.safetensors",
419
+ "model.layers.7.self_attn.k_proj.weight": "model-00002-of-00004.safetensors",
420
+ "model.layers.7.self_attn.o_proj.bias": "model-00002-of-00004.safetensors",
421
+ "model.layers.7.self_attn.o_proj.weight": "model-00002-of-00004.safetensors",
422
+ "model.layers.7.self_attn.q_proj.bias": "model-00002-of-00004.safetensors",
423
+ "model.layers.7.self_attn.q_proj.weight": "model-00002-of-00004.safetensors",
424
+ "model.layers.7.self_attn.sinks": "model-00002-of-00004.safetensors",
425
+ "model.layers.7.self_attn.v_proj.bias": "model-00002-of-00004.safetensors",
426
+ "model.layers.7.self_attn.v_proj.weight": "model-00002-of-00004.safetensors",
427
+ "model.layers.8.input_layernorm.weight": "model-00002-of-00004.safetensors",
428
+ "model.layers.8.mlp.experts.down_proj_bias": "model-00002-of-00004.safetensors",
429
+ "model.layers.8.mlp.experts.down_proj_blocks": "model-00002-of-00004.safetensors",
430
+ "model.layers.8.mlp.experts.down_proj_scales": "model-00002-of-00004.safetensors",
431
+ "model.layers.8.mlp.experts.gate_up_proj_bias": "model-00002-of-00004.safetensors",
432
+ "model.layers.8.mlp.experts.gate_up_proj_blocks": "model-00002-of-00004.safetensors",
433
+ "model.layers.8.mlp.experts.gate_up_proj_scales": "model-00002-of-00004.safetensors",
434
+ "model.layers.8.mlp.router.bias": "model-00002-of-00004.safetensors",
435
+ "model.layers.8.mlp.router.weight": "model-00002-of-00004.safetensors",
436
+ "model.layers.8.post_attention_layernorm.weight": "model-00002-of-00004.safetensors",
437
+ "model.layers.8.self_attn.k_proj.bias": "model-00002-of-00004.safetensors",
438
+ "model.layers.8.self_attn.k_proj.weight": "model-00002-of-00004.safetensors",
439
+ "model.layers.8.self_attn.o_proj.bias": "model-00002-of-00004.safetensors",
440
+ "model.layers.8.self_attn.o_proj.weight": "model-00002-of-00004.safetensors",
441
+ "model.layers.8.self_attn.q_proj.bias": "model-00002-of-00004.safetensors",
442
+ "model.layers.8.self_attn.q_proj.weight": "model-00002-of-00004.safetensors",
443
+ "model.layers.8.self_attn.sinks": "model-00002-of-00004.safetensors",
444
+ "model.layers.8.self_attn.v_proj.bias": "model-00002-of-00004.safetensors",
445
+ "model.layers.8.self_attn.v_proj.weight": "model-00002-of-00004.safetensors",
446
+ "model.layers.9.input_layernorm.weight": "model-00002-of-00004.safetensors",
447
+ "model.layers.9.mlp.experts.down_proj_bias": "model-00002-of-00004.safetensors",
448
+ "model.layers.9.mlp.experts.down_proj_blocks": "model-00002-of-00004.safetensors",
449
+ "model.layers.9.mlp.experts.down_proj_scales": "model-00002-of-00004.safetensors",
450
+ "model.layers.9.mlp.experts.gate_up_proj_bias": "model-00002-of-00004.safetensors",
451
+ "model.layers.9.mlp.experts.gate_up_proj_blocks": "model-00002-of-00004.safetensors",
452
+ "model.layers.9.mlp.experts.gate_up_proj_scales": "model-00002-of-00004.safetensors",
453
+ "model.layers.9.mlp.router.bias": "model-00002-of-00004.safetensors",
454
+ "model.layers.9.mlp.router.weight": "model-00002-of-00004.safetensors",
455
+ "model.layers.9.post_attention_layernorm.weight": "model-00002-of-00004.safetensors",
456
+ "model.layers.9.self_attn.k_proj.bias": "model-00002-of-00004.safetensors",
457
+ "model.layers.9.self_attn.k_proj.weight": "model-00002-of-00004.safetensors",
458
+ "model.layers.9.self_attn.o_proj.bias": "model-00002-of-00004.safetensors",
459
+ "model.layers.9.self_attn.o_proj.weight": "model-00002-of-00004.safetensors",
460
+ "model.layers.9.self_attn.q_proj.bias": "model-00002-of-00004.safetensors",
461
+ "model.layers.9.self_attn.q_proj.weight": "model-00002-of-00004.safetensors",
462
+ "model.layers.9.self_attn.sinks": "model-00002-of-00004.safetensors",
463
+ "model.layers.9.self_attn.v_proj.bias": "model-00002-of-00004.safetensors",
464
+ "model.layers.9.self_attn.v_proj.weight": "model-00002-of-00004.safetensors",
465
+ "model.norm.weight": "model-00004-of-00004.safetensors"
466
+ }
467
+ }
tokenizer/chat_template.jinja ADDED
@@ -0,0 +1,331 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {#-
2
+ In addition to the normal inputs of `messages` and `tools`, this template also accepts the
3
+ following kwargs:
4
+ - "builtin_tools": A list, can contain "browser" and/or "python".
5
+ - "model_identity": A string that optionally describes the model identity.
6
+ - "reasoning_effort": A string that describes the reasoning effort, defaults to "medium".
7
+ #}
8
+
9
+ {#- Tool Definition Rendering ============================================== #}
10
+ {%- macro render_typescript_type(param_spec, required_params, is_nullable=false) -%}
11
+ {%- if param_spec.type == "array" -%}
12
+ {%- if param_spec['items'] -%}
13
+ {%- if param_spec['items']['type'] == "string" -%}
14
+ {{- "string[]" }}
15
+ {%- elif param_spec['items']['type'] == "number" -%}
16
+ {{- "number[]" }}
17
+ {%- elif param_spec['items']['type'] == "integer" -%}
18
+ {{- "number[]" }}
19
+ {%- elif param_spec['items']['type'] == "boolean" -%}
20
+ {{- "boolean[]" }}
21
+ {%- else -%}
22
+ {%- set inner_type = render_typescript_type(param_spec['items'], required_params) -%}
23
+ {%- if inner_type == "object | object" or inner_type|length > 50 -%}
24
+ {{- "any[]" }}
25
+ {%- else -%}
26
+ {{- inner_type + "[]" }}
27
+ {%- endif -%}
28
+ {%- endif -%}
29
+ {%- if param_spec.nullable -%}
30
+ {{- " | null" }}
31
+ {%- endif -%}
32
+ {%- else -%}
33
+ {{- "any[]" }}
34
+ {%- if param_spec.nullable -%}
35
+ {{- " | null" }}
36
+ {%- endif -%}
37
+ {%- endif -%}
38
+ {%- elif param_spec.type is defined and param_spec.type is iterable and param_spec.type is not string and param_spec.type is not mapping and param_spec.type[0] is defined -%}
39
+ {#- Handle array of types like ["object", "object"] from Union[dict, list] #}
40
+ {%- if param_spec.type | length > 1 -%}
41
+ {{- param_spec.type | join(" | ") }}
42
+ {%- else -%}
43
+ {{- param_spec.type[0] }}
44
+ {%- endif -%}
45
+ {%- elif param_spec.oneOf -%}
46
+ {#- Handle oneOf schemas - check for complex unions and fallback to any #}
47
+ {%- set has_object_variants = false -%}
48
+ {%- for variant in param_spec.oneOf -%}
49
+ {%- if variant.type == "object" -%}
50
+ {%- set has_object_variants = true -%}
51
+ {%- endif -%}
52
+ {%- endfor -%}
53
+ {%- if has_object_variants and param_spec.oneOf|length > 1 -%}
54
+ {{- "any" }}
55
+ {%- else -%}
56
+ {%- for variant in param_spec.oneOf -%}
57
+ {{- render_typescript_type(variant, required_params) -}}
58
+ {%- if variant.description %}
59
+ {{- "// " + variant.description }}
60
+ {%- endif -%}
61
+ {%- if variant.default is defined %}
62
+ {{ "// default: " + variant.default|tojson }}
63
+ {%- endif -%}
64
+ {%- if not loop.last %}
65
+ {{- " | " }}
66
+ {% endif -%}
67
+ {%- endfor -%}
68
+ {%- endif -%}
69
+ {%- elif param_spec.type == "string" -%}
70
+ {%- if param_spec.enum -%}
71
+ {{- '"' + param_spec.enum|join('" | "') + '"' -}}
72
+ {%- else -%}
73
+ {{- "string" }}
74
+ {%- if param_spec.nullable %}
75
+ {{- " | null" }}
76
+ {%- endif -%}
77
+ {%- endif -%}
78
+ {%- elif param_spec.type == "number" -%}
79
+ {{- "number" }}
80
+ {%- elif param_spec.type == "integer" -%}
81
+ {{- "number" }}
82
+ {%- elif param_spec.type == "boolean" -%}
83
+ {{- "boolean" }}
84
+
85
+ {%- elif param_spec.type == "object" -%}
86
+ {%- if param_spec.properties -%}
87
+ {{- "{\n" }}
88
+ {%- for prop_name, prop_spec in param_spec.properties.items() -%}
89
+ {{- prop_name -}}
90
+ {%- if prop_name not in (param_spec.required or []) -%}
91
+ {{- "?" }}
92
+ {%- endif -%}
93
+ {{- ": " }}
94
+ {{ render_typescript_type(prop_spec, param_spec.required or []) }}
95
+ {%- if not loop.last -%}
96
+ {{-", " }}
97
+ {%- endif -%}
98
+ {%- endfor -%}
99
+ {{- "}" }}
100
+ {%- else -%}
101
+ {{- "object" }}
102
+ {%- endif -%}
103
+ {%- else -%}
104
+ {{- "any" }}
105
+ {%- endif -%}
106
+ {%- endmacro -%}
107
+
108
+ {%- macro render_tool_namespace(namespace_name, tools) -%}
109
+ {{- "## " + namespace_name + "\n\n" }}
110
+ {{- "namespace " + namespace_name + " {\n\n" }}
111
+ {%- for tool in tools %}
112
+ {%- set tool = tool.function %}
113
+ {{- "// " + tool.description + "\n" }}
114
+ {{- "type "+ tool.name + " = " }}
115
+ {%- if tool.parameters and tool.parameters.properties %}
116
+ {{- "(_: {\n" }}
117
+ {%- for param_name, param_spec in tool.parameters.properties.items() %}
118
+ {%- if param_spec.description %}
119
+ {{- "// " + param_spec.description + "\n" }}
120
+ {%- endif %}
121
+ {{- param_name }}
122
+ {%- if param_name not in (tool.parameters.required or []) -%}
123
+ {{- "?" }}
124
+ {%- endif -%}
125
+ {{- ": " }}
126
+ {{- render_typescript_type(param_spec, tool.parameters.required or []) }}
127
+ {%- if param_spec.default is defined -%}
128
+ {%- if param_spec.enum %}
129
+ {{- ", // default: " + param_spec.default }}
130
+ {%- elif param_spec.oneOf %}
131
+ {{- "// default: " + param_spec.default }}
132
+ {%- else %}
133
+ {{- ", // default: " + param_spec.default|tojson }}
134
+ {%- endif -%}
135
+ {%- endif -%}
136
+ {%- if not loop.last %}
137
+ {{- ",\n" }}
138
+ {%- else %}
139
+ {{- ",\n" }}
140
+ {%- endif -%}
141
+ {%- endfor %}
142
+ {{- "}) => any;\n\n" }}
143
+ {%- else -%}
144
+ {{- "() => any;\n\n" }}
145
+ {%- endif -%}
146
+ {%- endfor %}
147
+ {{- "} // namespace " + namespace_name }}
148
+ {%- endmacro -%}
149
+
150
+ {%- macro render_builtin_tools(browser_tool, python_tool) -%}
151
+ {%- if browser_tool %}
152
+ {{- "## browser\n\n" }}
153
+ {{- "// Tool for browsing.\n" }}
154
+ {{- "// The `cursor` appears in brackets before each browsing display: `[{cursor}]`.\n" }}
155
+ {{- "// Cite information from the tool using the following format:\n" }}
156
+ {{- "// `【{cursor}†L{line_start}(-L{line_end})?】`, for example: `【6†L9-L11】` or `【8†L3】`.\n" }}
157
+ {{- "// Do not quote more than 10 words directly from the tool output.\n" }}
158
+ {{- "// sources=web (default: web)\n" }}
159
+ {{- "namespace browser {\n\n" }}
160
+ {{- "// Searches for information related to `query` and displays `topn` results.\n" }}
161
+ {{- "type search = (_: {\n" }}
162
+ {{- "query: string,\n" }}
163
+ {{- "topn?: number, // default: 10\n" }}
164
+ {{- "source?: string,\n" }}
165
+ {{- "}) => any;\n\n" }}
166
+ {{- "// Opens the link `id` from the page indicated by `cursor` starting at line number `loc`, showing `num_lines` lines.\n" }}
167
+ {{- "// Valid link ids are displayed with the formatting: `【{id}†.*】`.\n" }}
168
+ {{- "// If `cursor` is not provided, the most recent page is implied.\n" }}
169
+ {{- "// If `id` is a string, it is treated as a fully qualified URL associated with `source`.\n" }}
170
+ {{- "// If `loc` is not provided, the viewport will be positioned at the beginning of the document or centered on the most relevant passage, if available.\n" }}
171
+ {{- "// Use this function without `id` to scroll to a new location of an opened page.\n" }}
172
+ {{- "type open = (_: {\n" }}
173
+ {{- "id?: number | string, // default: -1\n" }}
174
+ {{- "cursor?: number, // default: -1\n" }}
175
+ {{- "loc?: number, // default: -1\n" }}
176
+ {{- "num_lines?: number, // default: -1\n" }}
177
+ {{- "view_source?: boolean, // default: false\n" }}
178
+ {{- "source?: string,\n" }}
179
+ {{- "}) => any;\n\n" }}
180
+ {{- "// Finds exact matches of `pattern` in the current page, or the page given by `cursor`.\n" }}
181
+ {{- "type find = (_: {\n" }}
182
+ {{- "pattern: string,\n" }}
183
+ {{- "cursor?: number, // default: -1\n" }}
184
+ {{- "}) => any;\n\n" }}
185
+ {{- "} // namespace browser\n\n" }}
186
+ {%- endif -%}
187
+
188
+ {%- if python_tool %}
189
+ {{- "## python\n\n" }}
190
+ {{- "Use this tool to execute Python code in your chain of thought. The code will not be shown to the user. This tool should be used for internal reasoning, but not for code that is intended to be visible to the user (e.g. when creating plots, tables, or files).\n\n" }}
191
+ {{- "When you send a message containing Python code to python, it will be executed in a stateful Jupyter notebook environment. python will respond with the output of the execution or time out after 120.0 seconds. The drive at '/mnt/data' can be used to save and persist user files. Internet access for this session is UNKNOWN. Depends on the cluster.\n\n" }}
192
+ {%- endif -%}
193
+ {%- endmacro -%}
194
+
195
+ {#- System Message Construction ============================================ #}
196
+ {%- macro build_system_message() -%}
197
+ {%- if model_identity is not defined %}
198
+ {%- set model_identity = "You are ChatGPT, a large language model trained by OpenAI." %}
199
+ {%- endif %}
200
+ {{- model_identity + "\n" }}
201
+ {{- "Knowledge cutoff: 2024-06\n" }}
202
+ {{- "Current date: " + strftime_now("%Y-%m-%d") + "\n\n" }}
203
+ {%- if reasoning_effort is not defined %}
204
+ {%- set reasoning_effort = "medium" %}
205
+ {%- endif %}
206
+ {{- "Reasoning: " + reasoning_effort + "\n\n" }}
207
+ {%- if builtin_tools %}
208
+ {{- "# Tools\n\n" }}
209
+ {%- set available_builtin_tools = namespace(browser=false, python=false) %}
210
+ {%- for tool in builtin_tools %}
211
+ {%- if tool == "browser" %}
212
+ {%- set available_builtin_tools.browser = true %}
213
+ {%- elif tool == "python" %}
214
+ {%- set available_builtin_tools.python = true %}
215
+ {%- endif %}
216
+ {%- endfor %}
217
+ {{- render_builtin_tools(available_builtin_tools.browser, available_builtin_tools.python) }}
218
+ {%- endif -%}
219
+ {{- "# Valid channels: analysis, commentary, final. Channel must be included for every message." }}
220
+ {%- if tools -%}
221
+ {{- "\nCalls to these tools must go to the commentary channel: 'functions'." }}
222
+ {%- endif -%}
223
+ {%- endmacro -%}
224
+
225
+ {#- Main Template Logic ================================================= #}
226
+ {#- Set defaults #}
227
+
228
+ {#- Render system message #}
229
+ {{- "<|start|>system<|message|>" }}
230
+ {{- build_system_message() }}
231
+ {{- "<|end|>" }}
232
+
233
+ {#- Extract developer message #}
234
+ {%- if messages[0].role == "developer" or messages[0].role == "system" %}
235
+ {%- set developer_message = messages[0].content %}
236
+ {%- set loop_messages = messages[1:] %}
237
+ {%- else %}
238
+ {%- set developer_message = "" %}
239
+ {%- set loop_messages = messages %}
240
+ {%- endif %}
241
+
242
+ {#- Render developer message #}
243
+ {%- if developer_message or tools %}
244
+ {{- "<|start|>developer<|message|>" }}
245
+ {%- if developer_message %}
246
+ {{- "# Instructions\n\n" }}
247
+ {{- developer_message }}
248
+ {{- "\n\n" }}
249
+ {%- endif %}
250
+ {%- if tools -%}
251
+ {{- "# Tools\n\n" }}
252
+ {{- render_tool_namespace("functions", tools) }}
253
+ {%- endif -%}
254
+ {{- "<|end|>" }}
255
+ {%- endif %}
256
+
257
+ {#- Render messages #}
258
+ {%- set last_tool_call = namespace(name=none) %}
259
+ {%- for message in loop_messages -%}
260
+ {#- At this point only assistant/user/tool messages should remain #}
261
+ {%- if message.role == 'assistant' -%}
262
+ {#- Checks to ensure the messages are being passed in the format we expect #}
263
+ {%- if "content" in message %}
264
+ {%- if "<|channel|>analysis<|message|>" in message.content or "<|channel|>final<|message|>" in message.content %}
265
+ {{- raise_exception("You have passed a message containing <|channel|> tags in the content field. Instead of doing this, you should pass analysis messages (the string between '<|message|>' and '<|end|>') in the 'thinking' field, and final messages (the string between '<|message|>' and '<|end|>') in the 'content' field.") }}
266
+ {%- endif %}
267
+ {%- endif %}
268
+ {%- if "thinking" in message %}
269
+ {%- if "<|channel|>analysis<|message|>" in message.thinking or "<|channel|>final<|message|>" in message.thinking %}
270
+ {{- raise_exception("You have passed a message containing <|channel|> tags in the thinking field. Instead of doing this, you should pass analysis messages (the string between '<|message|>' and '<|end|>') in the 'thinking' field, and final messages (the string between '<|message|>' and '<|end|>') in the 'content' field.") }}
271
+ {%- endif %}
272
+ {%- endif %}
273
+ {%- if "tool_calls" in message %}
274
+ {#- We need very careful handling here - we want to drop the tool call analysis message if the model #}
275
+ {#- has output a later <|final|> message, but otherwise we want to retain it. This is the only case #}
276
+ {#- when we render CoT/analysis messages in inference. #}
277
+ {%- set future_final_message = namespace(found=false) %}
278
+ {%- for future_message in loop_messages[loop.index:] %}
279
+ {%- if future_message.role == 'assistant' and "tool_calls" not in future_message %}
280
+ {%- set future_final_message.found = true %}
281
+ {%- endif %}
282
+ {%- endfor %}
283
+ {#- We assume max 1 tool call per message, and so we infer the tool call name #}
284
+ {#- in "tool" messages from the most recent assistant tool call name #}
285
+ {%- set tool_call = message.tool_calls[0] %}
286
+ {%- if tool_call.function %}
287
+ {%- set tool_call = tool_call.function %}
288
+ {%- endif %}
289
+ {%- if message.content and message.thinking %}
290
+ {{- raise_exception("Cannot pass both content and thinking in an assistant message with tool calls! Put the analysis message in one or the other, but not both.") }}
291
+ {%- elif message.content and not future_final_message.found %}
292
+ {{- "<|start|>assistant<|channel|>analysis<|message|>" + message.content + "<|end|>" }}
293
+ {%- elif message.thinking and not future_final_message.found %}
294
+ {{- "<|start|>assistant<|channel|>analysis<|message|>" + message.thinking + "<|end|>" }}
295
+ {%- endif %}
296
+ {{- "<|start|>assistant to=" }}
297
+ {{- "functions." + tool_call.name + "<|channel|>commentary " }}
298
+ {{- (tool_call.content_type if tool_call.content_type is defined else "json") + "<|message|>" }}
299
+ {{- tool_call.arguments|tojson }}
300
+ {{- "<|call|>" }}
301
+ {%- set last_tool_call.name = tool_call.name %}
302
+ {%- elif loop.last and not add_generation_prompt %}
303
+ {#- Only render the CoT if the final turn is an assistant turn and add_generation_prompt is false #}
304
+ {#- This is a situation that should only occur in training, never in inference. #}
305
+ {%- if "thinking" in message %}
306
+ {{- "<|start|>assistant<|channel|>analysis<|message|>" + message.thinking + "<|end|>" }}
307
+ {%- endif %}
308
+ {#- <|return|> indicates the end of generation, but <|end|> does not #}
309
+ {#- <|return|> should never be an input to the model, but we include it as the final token #}
310
+ {#- when training, so the model learns to emit it. #}
311
+ {{- "<|start|>assistant<|channel|>final<|message|>" + message.content + "<|return|>" }}
312
+ {%- else %}
313
+ {#- CoT is dropped during all previous turns, so we never render it for inference #}
314
+ {{- "<|start|>assistant<|channel|>final<|message|>" + message.content + "<|end|>" }}
315
+ {%- set last_tool_call.name = none %}
316
+ {%- endif %}
317
+ {%- elif message.role == 'tool' -%}
318
+ {%- if last_tool_call.name is none %}
319
+ {{- raise_exception("Message has tool role, but there was no previous assistant message with a tool call!") }}
320
+ {%- endif %}
321
+ {{- "<|start|>functions." + last_tool_call.name }}
322
+ {{- " to=assistant<|channel|>commentary<|message|>" + message.content|tojson + "<|end|>" }}
323
+ {%- elif message.role == 'user' -%}
324
+ {{- "<|start|>user<|message|>" + message.content + "<|end|>" }}
325
+ {%- endif -%}
326
+ {%- endfor -%}
327
+
328
+ {#- Generation prompt #}
329
+ {%- if add_generation_prompt -%}
330
+ <|start|>assistant
331
+ {%- endif -%}
tokenizer/tokenizer.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:928addc4a139e5382c06af49ebd495a4aa2aca99d13b872873e27bcbacc3ae4d
3
+ size 27868440
tokenizer/tokenizer_config.json ADDED
@@ -0,0 +1,15 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "backend": "tokenizers",
3
+ "bos_token": "<|startoftext|>",
4
+ "clean_up_tokenization_spaces": false,
5
+ "eos_token": "<|return|>",
6
+ "is_local": true,
7
+ "local_files_only": false,
8
+ "model_input_names": [
9
+ "input_ids",
10
+ "attention_mask"
11
+ ],
12
+ "model_max_length": 1000000000000000019884624838656,
13
+ "pad_token": "<|endoftext|>",
14
+ "tokenizer_class": "TokenizersBackend"
15
+ }
transformer/config.json ADDED
@@ -0,0 +1,474 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_class_name": "LensTransformer2DModel",
3
+ "_diffusers_version": "0.38.0",
4
+ "_name_or_path": "/workspace/.cache/huggingface/hub/models--microsoft--Lens-Turbo/snapshots/f21b81bed3bae7f93f16f5fd300af9c408f5816a/transformer",
5
+ "attention_head_dim": 64,
6
+ "axes_dims_rope": [
7
+ 8,
8
+ 28,
9
+ 28
10
+ ],
11
+ "enc_hidden_dim": 2880,
12
+ "gate_mlp": true,
13
+ "in_channels": 128,
14
+ "inner_dim": 1536,
15
+ "multi_layer_encoder_feature": true,
16
+ "num_attention_heads": 24,
17
+ "num_layers": 48,
18
+ "out_channels": 32,
19
+ "patch_size": 2,
20
+ "quantization_config": {
21
+ "add_skip_keys": false,
22
+ "dequantize_fp32": false,
23
+ "dynamic_loss_threshold": null,
24
+ "group_size": 0,
25
+ "hadamard_group_size": 128,
26
+ "is_integer": true,
27
+ "is_training": false,
28
+ "modules_dtype_dict": {},
29
+ "modules_quant_config": {},
30
+ "modules_to_not_convert": [
31
+ "wte",
32
+ "norm",
33
+ ".img_out",
34
+ "multi_modal_projector",
35
+ ".norm_out",
36
+ "patch_embedding",
37
+ ".img_in",
38
+ ".context_embedder",
39
+ ".txt_out",
40
+ "patch_embed",
41
+ ".vid_in",
42
+ ".final_layer",
43
+ "time_text_embed",
44
+ "pos_embed",
45
+ "lm_head",
46
+ ".vid_out",
47
+ ".txt_in",
48
+ ".t_embedder",
49
+ ".x_embedder",
50
+ "patch_emb",
51
+ ".y_embedder",
52
+ ".condition_embedder",
53
+ ".proj_out",
54
+ ".time_embed",
55
+ ".emb_out",
56
+ ".emb_in",
57
+ "txt_norm.0.weight",
58
+ "txt_norm.1.weight",
59
+ "txt_norm.2.weight",
60
+ "txt_norm.3.weight",
61
+ "transformer_blocks.0.attn.norm_q.weight",
62
+ "transformer_blocks.0.attn.norm_k.weight",
63
+ "transformer_blocks.0.attn.norm_added_q.weight",
64
+ "transformer_blocks.0.attn.norm_added_k.weight",
65
+ "transformer_blocks.0.img_norm1.weight",
66
+ "transformer_blocks.0.img_norm2.weight",
67
+ "transformer_blocks.0.txt_norm1.weight",
68
+ "transformer_blocks.0.txt_norm2.weight",
69
+ "transformer_blocks.1.attn.norm_q.weight",
70
+ "transformer_blocks.1.attn.norm_k.weight",
71
+ "transformer_blocks.1.attn.norm_added_q.weight",
72
+ "transformer_blocks.1.attn.norm_added_k.weight",
73
+ "transformer_blocks.1.img_norm1.weight",
74
+ "transformer_blocks.1.img_norm2.weight",
75
+ "transformer_blocks.1.txt_norm1.weight",
76
+ "transformer_blocks.1.txt_norm2.weight",
77
+ "transformer_blocks.2.attn.norm_q.weight",
78
+ "transformer_blocks.2.attn.norm_k.weight",
79
+ "transformer_blocks.2.attn.norm_added_q.weight",
80
+ "transformer_blocks.2.attn.norm_added_k.weight",
81
+ "transformer_blocks.2.img_norm1.weight",
82
+ "transformer_blocks.2.img_norm2.weight",
83
+ "transformer_blocks.2.txt_norm1.weight",
84
+ "transformer_blocks.2.txt_norm2.weight",
85
+ "transformer_blocks.3.attn.norm_q.weight",
86
+ "transformer_blocks.3.attn.norm_k.weight",
87
+ "transformer_blocks.3.attn.norm_added_q.weight",
88
+ "transformer_blocks.3.attn.norm_added_k.weight",
89
+ "transformer_blocks.3.img_norm1.weight",
90
+ "transformer_blocks.3.img_norm2.weight",
91
+ "transformer_blocks.3.txt_norm1.weight",
92
+ "transformer_blocks.3.txt_norm2.weight",
93
+ "transformer_blocks.4.attn.norm_q.weight",
94
+ "transformer_blocks.4.attn.norm_k.weight",
95
+ "transformer_blocks.4.attn.norm_added_q.weight",
96
+ "transformer_blocks.4.attn.norm_added_k.weight",
97
+ "transformer_blocks.4.img_norm1.weight",
98
+ "transformer_blocks.4.img_norm2.weight",
99
+ "transformer_blocks.4.txt_norm1.weight",
100
+ "transformer_blocks.4.txt_norm2.weight",
101
+ "transformer_blocks.5.attn.norm_q.weight",
102
+ "transformer_blocks.5.attn.norm_k.weight",
103
+ "transformer_blocks.5.attn.norm_added_q.weight",
104
+ "transformer_blocks.5.attn.norm_added_k.weight",
105
+ "transformer_blocks.5.img_norm1.weight",
106
+ "transformer_blocks.5.img_norm2.weight",
107
+ "transformer_blocks.5.txt_norm1.weight",
108
+ "transformer_blocks.5.txt_norm2.weight",
109
+ "transformer_blocks.6.attn.norm_q.weight",
110
+ "transformer_blocks.6.attn.norm_k.weight",
111
+ "transformer_blocks.6.attn.norm_added_q.weight",
112
+ "transformer_blocks.6.attn.norm_added_k.weight",
113
+ "transformer_blocks.6.img_norm1.weight",
114
+ "transformer_blocks.6.img_norm2.weight",
115
+ "transformer_blocks.6.txt_norm1.weight",
116
+ "transformer_blocks.6.txt_norm2.weight",
117
+ "transformer_blocks.7.attn.norm_q.weight",
118
+ "transformer_blocks.7.attn.norm_k.weight",
119
+ "transformer_blocks.7.attn.norm_added_q.weight",
120
+ "transformer_blocks.7.attn.norm_added_k.weight",
121
+ "transformer_blocks.7.img_norm1.weight",
122
+ "transformer_blocks.7.img_norm2.weight",
123
+ "transformer_blocks.7.txt_norm1.weight",
124
+ "transformer_blocks.7.txt_norm2.weight",
125
+ "transformer_blocks.8.attn.norm_q.weight",
126
+ "transformer_blocks.8.attn.norm_k.weight",
127
+ "transformer_blocks.8.attn.norm_added_q.weight",
128
+ "transformer_blocks.8.attn.norm_added_k.weight",
129
+ "transformer_blocks.8.img_norm1.weight",
130
+ "transformer_blocks.8.img_norm2.weight",
131
+ "transformer_blocks.8.txt_norm1.weight",
132
+ "transformer_blocks.8.txt_norm2.weight",
133
+ "transformer_blocks.9.attn.norm_q.weight",
134
+ "transformer_blocks.9.attn.norm_k.weight",
135
+ "transformer_blocks.9.attn.norm_added_q.weight",
136
+ "transformer_blocks.9.attn.norm_added_k.weight",
137
+ "transformer_blocks.9.img_norm1.weight",
138
+ "transformer_blocks.9.img_norm2.weight",
139
+ "transformer_blocks.9.txt_norm1.weight",
140
+ "transformer_blocks.9.txt_norm2.weight",
141
+ "transformer_blocks.10.attn.norm_q.weight",
142
+ "transformer_blocks.10.attn.norm_k.weight",
143
+ "transformer_blocks.10.attn.norm_added_q.weight",
144
+ "transformer_blocks.10.attn.norm_added_k.weight",
145
+ "transformer_blocks.10.img_norm1.weight",
146
+ "transformer_blocks.10.img_norm2.weight",
147
+ "transformer_blocks.10.txt_norm1.weight",
148
+ "transformer_blocks.10.txt_norm2.weight",
149
+ "transformer_blocks.11.attn.norm_q.weight",
150
+ "transformer_blocks.11.attn.norm_k.weight",
151
+ "transformer_blocks.11.attn.norm_added_q.weight",
152
+ "transformer_blocks.11.attn.norm_added_k.weight",
153
+ "transformer_blocks.11.img_norm1.weight",
154
+ "transformer_blocks.11.img_norm2.weight",
155
+ "transformer_blocks.11.txt_norm1.weight",
156
+ "transformer_blocks.11.txt_norm2.weight",
157
+ "transformer_blocks.12.attn.norm_q.weight",
158
+ "transformer_blocks.12.attn.norm_k.weight",
159
+ "transformer_blocks.12.attn.norm_added_q.weight",
160
+ "transformer_blocks.12.attn.norm_added_k.weight",
161
+ "transformer_blocks.12.img_norm1.weight",
162
+ "transformer_blocks.12.img_norm2.weight",
163
+ "transformer_blocks.12.txt_norm1.weight",
164
+ "transformer_blocks.12.txt_norm2.weight",
165
+ "transformer_blocks.13.attn.norm_q.weight",
166
+ "transformer_blocks.13.attn.norm_k.weight",
167
+ "transformer_blocks.13.attn.norm_added_q.weight",
168
+ "transformer_blocks.13.attn.norm_added_k.weight",
169
+ "transformer_blocks.13.img_norm1.weight",
170
+ "transformer_blocks.13.img_norm2.weight",
171
+ "transformer_blocks.13.txt_norm1.weight",
172
+ "transformer_blocks.13.txt_norm2.weight",
173
+ "transformer_blocks.14.attn.norm_q.weight",
174
+ "transformer_blocks.14.attn.norm_k.weight",
175
+ "transformer_blocks.14.attn.norm_added_q.weight",
176
+ "transformer_blocks.14.attn.norm_added_k.weight",
177
+ "transformer_blocks.14.img_norm1.weight",
178
+ "transformer_blocks.14.img_norm2.weight",
179
+ "transformer_blocks.14.txt_norm1.weight",
180
+ "transformer_blocks.14.txt_norm2.weight",
181
+ "transformer_blocks.15.attn.norm_q.weight",
182
+ "transformer_blocks.15.attn.norm_k.weight",
183
+ "transformer_blocks.15.attn.norm_added_q.weight",
184
+ "transformer_blocks.15.attn.norm_added_k.weight",
185
+ "transformer_blocks.15.img_norm1.weight",
186
+ "transformer_blocks.15.img_norm2.weight",
187
+ "transformer_blocks.15.txt_norm1.weight",
188
+ "transformer_blocks.15.txt_norm2.weight",
189
+ "transformer_blocks.16.attn.norm_q.weight",
190
+ "transformer_blocks.16.attn.norm_k.weight",
191
+ "transformer_blocks.16.attn.norm_added_q.weight",
192
+ "transformer_blocks.16.attn.norm_added_k.weight",
193
+ "transformer_blocks.16.img_norm1.weight",
194
+ "transformer_blocks.16.img_norm2.weight",
195
+ "transformer_blocks.16.txt_norm1.weight",
196
+ "transformer_blocks.16.txt_norm2.weight",
197
+ "transformer_blocks.17.attn.norm_q.weight",
198
+ "transformer_blocks.17.attn.norm_k.weight",
199
+ "transformer_blocks.17.attn.norm_added_q.weight",
200
+ "transformer_blocks.17.attn.norm_added_k.weight",
201
+ "transformer_blocks.17.img_norm1.weight",
202
+ "transformer_blocks.17.img_norm2.weight",
203
+ "transformer_blocks.17.txt_norm1.weight",
204
+ "transformer_blocks.17.txt_norm2.weight",
205
+ "transformer_blocks.18.attn.norm_q.weight",
206
+ "transformer_blocks.18.attn.norm_k.weight",
207
+ "transformer_blocks.18.attn.norm_added_q.weight",
208
+ "transformer_blocks.18.attn.norm_added_k.weight",
209
+ "transformer_blocks.18.img_norm1.weight",
210
+ "transformer_blocks.18.img_norm2.weight",
211
+ "transformer_blocks.18.txt_norm1.weight",
212
+ "transformer_blocks.18.txt_norm2.weight",
213
+ "transformer_blocks.19.attn.norm_q.weight",
214
+ "transformer_blocks.19.attn.norm_k.weight",
215
+ "transformer_blocks.19.attn.norm_added_q.weight",
216
+ "transformer_blocks.19.attn.norm_added_k.weight",
217
+ "transformer_blocks.19.img_norm1.weight",
218
+ "transformer_blocks.19.img_norm2.weight",
219
+ "transformer_blocks.19.txt_norm1.weight",
220
+ "transformer_blocks.19.txt_norm2.weight",
221
+ "transformer_blocks.20.attn.norm_q.weight",
222
+ "transformer_blocks.20.attn.norm_k.weight",
223
+ "transformer_blocks.20.attn.norm_added_q.weight",
224
+ "transformer_blocks.20.attn.norm_added_k.weight",
225
+ "transformer_blocks.20.img_norm1.weight",
226
+ "transformer_blocks.20.img_norm2.weight",
227
+ "transformer_blocks.20.txt_norm1.weight",
228
+ "transformer_blocks.20.txt_norm2.weight",
229
+ "transformer_blocks.21.attn.norm_q.weight",
230
+ "transformer_blocks.21.attn.norm_k.weight",
231
+ "transformer_blocks.21.attn.norm_added_q.weight",
232
+ "transformer_blocks.21.attn.norm_added_k.weight",
233
+ "transformer_blocks.21.img_norm1.weight",
234
+ "transformer_blocks.21.img_norm2.weight",
235
+ "transformer_blocks.21.txt_norm1.weight",
236
+ "transformer_blocks.21.txt_norm2.weight",
237
+ "transformer_blocks.22.attn.norm_q.weight",
238
+ "transformer_blocks.22.attn.norm_k.weight",
239
+ "transformer_blocks.22.attn.norm_added_q.weight",
240
+ "transformer_blocks.22.attn.norm_added_k.weight",
241
+ "transformer_blocks.22.img_norm1.weight",
242
+ "transformer_blocks.22.img_norm2.weight",
243
+ "transformer_blocks.22.txt_norm1.weight",
244
+ "transformer_blocks.22.txt_norm2.weight",
245
+ "transformer_blocks.23.attn.norm_q.weight",
246
+ "transformer_blocks.23.attn.norm_k.weight",
247
+ "transformer_blocks.23.attn.norm_added_q.weight",
248
+ "transformer_blocks.23.attn.norm_added_k.weight",
249
+ "transformer_blocks.23.img_norm1.weight",
250
+ "transformer_blocks.23.img_norm2.weight",
251
+ "transformer_blocks.23.txt_norm1.weight",
252
+ "transformer_blocks.23.txt_norm2.weight",
253
+ "transformer_blocks.24.attn.norm_q.weight",
254
+ "transformer_blocks.24.attn.norm_k.weight",
255
+ "transformer_blocks.24.attn.norm_added_q.weight",
256
+ "transformer_blocks.24.attn.norm_added_k.weight",
257
+ "transformer_blocks.24.img_norm1.weight",
258
+ "transformer_blocks.24.img_norm2.weight",
259
+ "transformer_blocks.24.txt_norm1.weight",
260
+ "transformer_blocks.24.txt_norm2.weight",
261
+ "transformer_blocks.25.attn.norm_q.weight",
262
+ "transformer_blocks.25.attn.norm_k.weight",
263
+ "transformer_blocks.25.attn.norm_added_q.weight",
264
+ "transformer_blocks.25.attn.norm_added_k.weight",
265
+ "transformer_blocks.25.img_norm1.weight",
266
+ "transformer_blocks.25.img_norm2.weight",
267
+ "transformer_blocks.25.txt_norm1.weight",
268
+ "transformer_blocks.25.txt_norm2.weight",
269
+ "transformer_blocks.26.attn.norm_q.weight",
270
+ "transformer_blocks.26.attn.norm_k.weight",
271
+ "transformer_blocks.26.attn.norm_added_q.weight",
272
+ "transformer_blocks.26.attn.norm_added_k.weight",
273
+ "transformer_blocks.26.img_norm1.weight",
274
+ "transformer_blocks.26.img_norm2.weight",
275
+ "transformer_blocks.26.txt_norm1.weight",
276
+ "transformer_blocks.26.txt_norm2.weight",
277
+ "transformer_blocks.27.attn.norm_q.weight",
278
+ "transformer_blocks.27.attn.norm_k.weight",
279
+ "transformer_blocks.27.attn.norm_added_q.weight",
280
+ "transformer_blocks.27.attn.norm_added_k.weight",
281
+ "transformer_blocks.27.img_norm1.weight",
282
+ "transformer_blocks.27.img_norm2.weight",
283
+ "transformer_blocks.27.txt_norm1.weight",
284
+ "transformer_blocks.27.txt_norm2.weight",
285
+ "transformer_blocks.28.attn.norm_q.weight",
286
+ "transformer_blocks.28.attn.norm_k.weight",
287
+ "transformer_blocks.28.attn.norm_added_q.weight",
288
+ "transformer_blocks.28.attn.norm_added_k.weight",
289
+ "transformer_blocks.28.img_norm1.weight",
290
+ "transformer_blocks.28.img_norm2.weight",
291
+ "transformer_blocks.28.txt_norm1.weight",
292
+ "transformer_blocks.28.txt_norm2.weight",
293
+ "transformer_blocks.29.attn.norm_q.weight",
294
+ "transformer_blocks.29.attn.norm_k.weight",
295
+ "transformer_blocks.29.attn.norm_added_q.weight",
296
+ "transformer_blocks.29.attn.norm_added_k.weight",
297
+ "transformer_blocks.29.img_norm1.weight",
298
+ "transformer_blocks.29.img_norm2.weight",
299
+ "transformer_blocks.29.txt_norm1.weight",
300
+ "transformer_blocks.29.txt_norm2.weight",
301
+ "transformer_blocks.30.attn.norm_q.weight",
302
+ "transformer_blocks.30.attn.norm_k.weight",
303
+ "transformer_blocks.30.attn.norm_added_q.weight",
304
+ "transformer_blocks.30.attn.norm_added_k.weight",
305
+ "transformer_blocks.30.img_norm1.weight",
306
+ "transformer_blocks.30.img_norm2.weight",
307
+ "transformer_blocks.30.txt_norm1.weight",
308
+ "transformer_blocks.30.txt_norm2.weight",
309
+ "transformer_blocks.31.attn.norm_q.weight",
310
+ "transformer_blocks.31.attn.norm_k.weight",
311
+ "transformer_blocks.31.attn.norm_added_q.weight",
312
+ "transformer_blocks.31.attn.norm_added_k.weight",
313
+ "transformer_blocks.31.img_norm1.weight",
314
+ "transformer_blocks.31.img_norm2.weight",
315
+ "transformer_blocks.31.txt_norm1.weight",
316
+ "transformer_blocks.31.txt_norm2.weight",
317
+ "transformer_blocks.32.attn.norm_q.weight",
318
+ "transformer_blocks.32.attn.norm_k.weight",
319
+ "transformer_blocks.32.attn.norm_added_q.weight",
320
+ "transformer_blocks.32.attn.norm_added_k.weight",
321
+ "transformer_blocks.32.img_norm1.weight",
322
+ "transformer_blocks.32.img_norm2.weight",
323
+ "transformer_blocks.32.txt_norm1.weight",
324
+ "transformer_blocks.32.txt_norm2.weight",
325
+ "transformer_blocks.33.attn.norm_q.weight",
326
+ "transformer_blocks.33.attn.norm_k.weight",
327
+ "transformer_blocks.33.attn.norm_added_q.weight",
328
+ "transformer_blocks.33.attn.norm_added_k.weight",
329
+ "transformer_blocks.33.img_norm1.weight",
330
+ "transformer_blocks.33.img_norm2.weight",
331
+ "transformer_blocks.33.txt_norm1.weight",
332
+ "transformer_blocks.33.txt_norm2.weight",
333
+ "transformer_blocks.34.attn.norm_q.weight",
334
+ "transformer_blocks.34.attn.norm_k.weight",
335
+ "transformer_blocks.34.attn.norm_added_q.weight",
336
+ "transformer_blocks.34.attn.norm_added_k.weight",
337
+ "transformer_blocks.34.img_norm1.weight",
338
+ "transformer_blocks.34.img_norm2.weight",
339
+ "transformer_blocks.34.txt_norm1.weight",
340
+ "transformer_blocks.34.txt_norm2.weight",
341
+ "transformer_blocks.35.attn.norm_q.weight",
342
+ "transformer_blocks.35.attn.norm_k.weight",
343
+ "transformer_blocks.35.attn.norm_added_q.weight",
344
+ "transformer_blocks.35.attn.norm_added_k.weight",
345
+ "transformer_blocks.35.img_norm1.weight",
346
+ "transformer_blocks.35.img_norm2.weight",
347
+ "transformer_blocks.35.txt_norm1.weight",
348
+ "transformer_blocks.35.txt_norm2.weight",
349
+ "transformer_blocks.36.attn.norm_q.weight",
350
+ "transformer_blocks.36.attn.norm_k.weight",
351
+ "transformer_blocks.36.attn.norm_added_q.weight",
352
+ "transformer_blocks.36.attn.norm_added_k.weight",
353
+ "transformer_blocks.36.img_norm1.weight",
354
+ "transformer_blocks.36.img_norm2.weight",
355
+ "transformer_blocks.36.txt_norm1.weight",
356
+ "transformer_blocks.36.txt_norm2.weight",
357
+ "transformer_blocks.37.attn.norm_q.weight",
358
+ "transformer_blocks.37.attn.norm_k.weight",
359
+ "transformer_blocks.37.attn.norm_added_q.weight",
360
+ "transformer_blocks.37.attn.norm_added_k.weight",
361
+ "transformer_blocks.37.img_norm1.weight",
362
+ "transformer_blocks.37.img_norm2.weight",
363
+ "transformer_blocks.37.txt_norm1.weight",
364
+ "transformer_blocks.37.txt_norm2.weight",
365
+ "transformer_blocks.38.attn.norm_q.weight",
366
+ "transformer_blocks.38.attn.norm_k.weight",
367
+ "transformer_blocks.38.attn.norm_added_q.weight",
368
+ "transformer_blocks.38.attn.norm_added_k.weight",
369
+ "transformer_blocks.38.img_norm1.weight",
370
+ "transformer_blocks.38.img_norm2.weight",
371
+ "transformer_blocks.38.txt_norm1.weight",
372
+ "transformer_blocks.38.txt_norm2.weight",
373
+ "transformer_blocks.39.attn.norm_q.weight",
374
+ "transformer_blocks.39.attn.norm_k.weight",
375
+ "transformer_blocks.39.attn.norm_added_q.weight",
376
+ "transformer_blocks.39.attn.norm_added_k.weight",
377
+ "transformer_blocks.39.img_norm1.weight",
378
+ "transformer_blocks.39.img_norm2.weight",
379
+ "transformer_blocks.39.txt_norm1.weight",
380
+ "transformer_blocks.39.txt_norm2.weight",
381
+ "transformer_blocks.40.attn.norm_q.weight",
382
+ "transformer_blocks.40.attn.norm_k.weight",
383
+ "transformer_blocks.40.attn.norm_added_q.weight",
384
+ "transformer_blocks.40.attn.norm_added_k.weight",
385
+ "transformer_blocks.40.img_norm1.weight",
386
+ "transformer_blocks.40.img_norm2.weight",
387
+ "transformer_blocks.40.txt_norm1.weight",
388
+ "transformer_blocks.40.txt_norm2.weight",
389
+ "transformer_blocks.41.attn.norm_q.weight",
390
+ "transformer_blocks.41.attn.norm_k.weight",
391
+ "transformer_blocks.41.attn.norm_added_q.weight",
392
+ "transformer_blocks.41.attn.norm_added_k.weight",
393
+ "transformer_blocks.41.img_norm1.weight",
394
+ "transformer_blocks.41.img_norm2.weight",
395
+ "transformer_blocks.41.txt_norm1.weight",
396
+ "transformer_blocks.41.txt_norm2.weight",
397
+ "transformer_blocks.42.attn.norm_q.weight",
398
+ "transformer_blocks.42.attn.norm_k.weight",
399
+ "transformer_blocks.42.attn.norm_added_q.weight",
400
+ "transformer_blocks.42.attn.norm_added_k.weight",
401
+ "transformer_blocks.42.img_norm1.weight",
402
+ "transformer_blocks.42.img_norm2.weight",
403
+ "transformer_blocks.42.txt_norm1.weight",
404
+ "transformer_blocks.42.txt_norm2.weight",
405
+ "transformer_blocks.43.attn.norm_q.weight",
406
+ "transformer_blocks.43.attn.norm_k.weight",
407
+ "transformer_blocks.43.attn.norm_added_q.weight",
408
+ "transformer_blocks.43.attn.norm_added_k.weight",
409
+ "transformer_blocks.43.img_norm1.weight",
410
+ "transformer_blocks.43.img_norm2.weight",
411
+ "transformer_blocks.43.txt_norm1.weight",
412
+ "transformer_blocks.43.txt_norm2.weight",
413
+ "transformer_blocks.44.attn.norm_q.weight",
414
+ "transformer_blocks.44.attn.norm_k.weight",
415
+ "transformer_blocks.44.attn.norm_added_q.weight",
416
+ "transformer_blocks.44.attn.norm_added_k.weight",
417
+ "transformer_blocks.44.img_norm1.weight",
418
+ "transformer_blocks.44.img_norm2.weight",
419
+ "transformer_blocks.44.txt_norm1.weight",
420
+ "transformer_blocks.44.txt_norm2.weight",
421
+ "transformer_blocks.45.attn.norm_q.weight",
422
+ "transformer_blocks.45.attn.norm_k.weight",
423
+ "transformer_blocks.45.attn.norm_added_q.weight",
424
+ "transformer_blocks.45.attn.norm_added_k.weight",
425
+ "transformer_blocks.45.img_norm1.weight",
426
+ "transformer_blocks.45.img_norm2.weight",
427
+ "transformer_blocks.45.txt_norm1.weight",
428
+ "transformer_blocks.45.txt_norm2.weight",
429
+ "transformer_blocks.46.attn.norm_q.weight",
430
+ "transformer_blocks.46.attn.norm_k.weight",
431
+ "transformer_blocks.46.attn.norm_added_q.weight",
432
+ "transformer_blocks.46.attn.norm_added_k.weight",
433
+ "transformer_blocks.46.img_norm1.weight",
434
+ "transformer_blocks.46.img_norm2.weight",
435
+ "transformer_blocks.46.txt_norm1.weight",
436
+ "transformer_blocks.46.txt_norm2.weight",
437
+ "transformer_blocks.47.attn.norm_q.weight",
438
+ "transformer_blocks.47.attn.norm_k.weight",
439
+ "transformer_blocks.47.attn.norm_added_q.weight",
440
+ "transformer_blocks.47.attn.norm_added_k.weight",
441
+ "transformer_blocks.47.img_norm1.weight",
442
+ "transformer_blocks.47.img_norm2.weight",
443
+ "transformer_blocks.47.txt_norm1.weight",
444
+ "transformer_blocks.47.txt_norm2.weight"
445
+ ],
446
+ "modules_to_not_use_matmul": [],
447
+ "non_blocking": false,
448
+ "quant_conv": false,
449
+ "quant_embedding": false,
450
+ "quant_method": "sdnq",
451
+ "quantization_device": null,
452
+ "quantized_matmul_dtype": "int8",
453
+ "return_device": null,
454
+ "sdnq_version": "0.2.0",
455
+ "svd_rank": 32,
456
+ "svd_steps": 8,
457
+ "use_dynamic_quantization": false,
458
+ "use_grad_ckpt": true,
459
+ "use_hadamard": false,
460
+ "use_quantized_matmul": true,
461
+ "use_quantized_matmul_conv": false,
462
+ "use_static_quantization": true,
463
+ "use_stochastic_rounding": false,
464
+ "use_svd": false,
465
+ "weights_dtype": "uint4"
466
+ },
467
+ "rms_norm": true,
468
+ "selected_layer_index": [
469
+ 5,
470
+ 11,
471
+ 17,
472
+ 23
473
+ ]
474
+ }
transformer/diffusion_pytorch_model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fbd56f77ebef9a7b262c856e1ad3fd5b28d1c1d7f0f5a3ee341276b5243a96d6
3
+ size 2348235656
transformer/quantization_config.json ADDED
@@ -0,0 +1,447 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "add_skip_keys": false,
3
+ "dequantize_fp32": false,
4
+ "dynamic_loss_threshold": null,
5
+ "group_size": 0,
6
+ "hadamard_group_size": 128,
7
+ "is_integer": true,
8
+ "is_training": false,
9
+ "modules_dtype_dict": {},
10
+ "modules_quant_config": {},
11
+ "modules_to_not_convert": [
12
+ "wte",
13
+ "norm",
14
+ ".img_out",
15
+ "multi_modal_projector",
16
+ ".norm_out",
17
+ "patch_embedding",
18
+ ".img_in",
19
+ ".context_embedder",
20
+ ".txt_out",
21
+ "patch_embed",
22
+ ".vid_in",
23
+ ".final_layer",
24
+ "time_text_embed",
25
+ "pos_embed",
26
+ "lm_head",
27
+ ".vid_out",
28
+ ".txt_in",
29
+ ".t_embedder",
30
+ ".x_embedder",
31
+ "patch_emb",
32
+ ".y_embedder",
33
+ ".condition_embedder",
34
+ ".proj_out",
35
+ ".time_embed",
36
+ ".emb_out",
37
+ ".emb_in",
38
+ "txt_norm.0.weight",
39
+ "txt_norm.1.weight",
40
+ "txt_norm.2.weight",
41
+ "txt_norm.3.weight",
42
+ "transformer_blocks.0.attn.norm_q.weight",
43
+ "transformer_blocks.0.attn.norm_k.weight",
44
+ "transformer_blocks.0.attn.norm_added_q.weight",
45
+ "transformer_blocks.0.attn.norm_added_k.weight",
46
+ "transformer_blocks.0.img_norm1.weight",
47
+ "transformer_blocks.0.img_norm2.weight",
48
+ "transformer_blocks.0.txt_norm1.weight",
49
+ "transformer_blocks.0.txt_norm2.weight",
50
+ "transformer_blocks.1.attn.norm_q.weight",
51
+ "transformer_blocks.1.attn.norm_k.weight",
52
+ "transformer_blocks.1.attn.norm_added_q.weight",
53
+ "transformer_blocks.1.attn.norm_added_k.weight",
54
+ "transformer_blocks.1.img_norm1.weight",
55
+ "transformer_blocks.1.img_norm2.weight",
56
+ "transformer_blocks.1.txt_norm1.weight",
57
+ "transformer_blocks.1.txt_norm2.weight",
58
+ "transformer_blocks.2.attn.norm_q.weight",
59
+ "transformer_blocks.2.attn.norm_k.weight",
60
+ "transformer_blocks.2.attn.norm_added_q.weight",
61
+ "transformer_blocks.2.attn.norm_added_k.weight",
62
+ "transformer_blocks.2.img_norm1.weight",
63
+ "transformer_blocks.2.img_norm2.weight",
64
+ "transformer_blocks.2.txt_norm1.weight",
65
+ "transformer_blocks.2.txt_norm2.weight",
66
+ "transformer_blocks.3.attn.norm_q.weight",
67
+ "transformer_blocks.3.attn.norm_k.weight",
68
+ "transformer_blocks.3.attn.norm_added_q.weight",
69
+ "transformer_blocks.3.attn.norm_added_k.weight",
70
+ "transformer_blocks.3.img_norm1.weight",
71
+ "transformer_blocks.3.img_norm2.weight",
72
+ "transformer_blocks.3.txt_norm1.weight",
73
+ "transformer_blocks.3.txt_norm2.weight",
74
+ "transformer_blocks.4.attn.norm_q.weight",
75
+ "transformer_blocks.4.attn.norm_k.weight",
76
+ "transformer_blocks.4.attn.norm_added_q.weight",
77
+ "transformer_blocks.4.attn.norm_added_k.weight",
78
+ "transformer_blocks.4.img_norm1.weight",
79
+ "transformer_blocks.4.img_norm2.weight",
80
+ "transformer_blocks.4.txt_norm1.weight",
81
+ "transformer_blocks.4.txt_norm2.weight",
82
+ "transformer_blocks.5.attn.norm_q.weight",
83
+ "transformer_blocks.5.attn.norm_k.weight",
84
+ "transformer_blocks.5.attn.norm_added_q.weight",
85
+ "transformer_blocks.5.attn.norm_added_k.weight",
86
+ "transformer_blocks.5.img_norm1.weight",
87
+ "transformer_blocks.5.img_norm2.weight",
88
+ "transformer_blocks.5.txt_norm1.weight",
89
+ "transformer_blocks.5.txt_norm2.weight",
90
+ "transformer_blocks.6.attn.norm_q.weight",
91
+ "transformer_blocks.6.attn.norm_k.weight",
92
+ "transformer_blocks.6.attn.norm_added_q.weight",
93
+ "transformer_blocks.6.attn.norm_added_k.weight",
94
+ "transformer_blocks.6.img_norm1.weight",
95
+ "transformer_blocks.6.img_norm2.weight",
96
+ "transformer_blocks.6.txt_norm1.weight",
97
+ "transformer_blocks.6.txt_norm2.weight",
98
+ "transformer_blocks.7.attn.norm_q.weight",
99
+ "transformer_blocks.7.attn.norm_k.weight",
100
+ "transformer_blocks.7.attn.norm_added_q.weight",
101
+ "transformer_blocks.7.attn.norm_added_k.weight",
102
+ "transformer_blocks.7.img_norm1.weight",
103
+ "transformer_blocks.7.img_norm2.weight",
104
+ "transformer_blocks.7.txt_norm1.weight",
105
+ "transformer_blocks.7.txt_norm2.weight",
106
+ "transformer_blocks.8.attn.norm_q.weight",
107
+ "transformer_blocks.8.attn.norm_k.weight",
108
+ "transformer_blocks.8.attn.norm_added_q.weight",
109
+ "transformer_blocks.8.attn.norm_added_k.weight",
110
+ "transformer_blocks.8.img_norm1.weight",
111
+ "transformer_blocks.8.img_norm2.weight",
112
+ "transformer_blocks.8.txt_norm1.weight",
113
+ "transformer_blocks.8.txt_norm2.weight",
114
+ "transformer_blocks.9.attn.norm_q.weight",
115
+ "transformer_blocks.9.attn.norm_k.weight",
116
+ "transformer_blocks.9.attn.norm_added_q.weight",
117
+ "transformer_blocks.9.attn.norm_added_k.weight",
118
+ "transformer_blocks.9.img_norm1.weight",
119
+ "transformer_blocks.9.img_norm2.weight",
120
+ "transformer_blocks.9.txt_norm1.weight",
121
+ "transformer_blocks.9.txt_norm2.weight",
122
+ "transformer_blocks.10.attn.norm_q.weight",
123
+ "transformer_blocks.10.attn.norm_k.weight",
124
+ "transformer_blocks.10.attn.norm_added_q.weight",
125
+ "transformer_blocks.10.attn.norm_added_k.weight",
126
+ "transformer_blocks.10.img_norm1.weight",
127
+ "transformer_blocks.10.img_norm2.weight",
128
+ "transformer_blocks.10.txt_norm1.weight",
129
+ "transformer_blocks.10.txt_norm2.weight",
130
+ "transformer_blocks.11.attn.norm_q.weight",
131
+ "transformer_blocks.11.attn.norm_k.weight",
132
+ "transformer_blocks.11.attn.norm_added_q.weight",
133
+ "transformer_blocks.11.attn.norm_added_k.weight",
134
+ "transformer_blocks.11.img_norm1.weight",
135
+ "transformer_blocks.11.img_norm2.weight",
136
+ "transformer_blocks.11.txt_norm1.weight",
137
+ "transformer_blocks.11.txt_norm2.weight",
138
+ "transformer_blocks.12.attn.norm_q.weight",
139
+ "transformer_blocks.12.attn.norm_k.weight",
140
+ "transformer_blocks.12.attn.norm_added_q.weight",
141
+ "transformer_blocks.12.attn.norm_added_k.weight",
142
+ "transformer_blocks.12.img_norm1.weight",
143
+ "transformer_blocks.12.img_norm2.weight",
144
+ "transformer_blocks.12.txt_norm1.weight",
145
+ "transformer_blocks.12.txt_norm2.weight",
146
+ "transformer_blocks.13.attn.norm_q.weight",
147
+ "transformer_blocks.13.attn.norm_k.weight",
148
+ "transformer_blocks.13.attn.norm_added_q.weight",
149
+ "transformer_blocks.13.attn.norm_added_k.weight",
150
+ "transformer_blocks.13.img_norm1.weight",
151
+ "transformer_blocks.13.img_norm2.weight",
152
+ "transformer_blocks.13.txt_norm1.weight",
153
+ "transformer_blocks.13.txt_norm2.weight",
154
+ "transformer_blocks.14.attn.norm_q.weight",
155
+ "transformer_blocks.14.attn.norm_k.weight",
156
+ "transformer_blocks.14.attn.norm_added_q.weight",
157
+ "transformer_blocks.14.attn.norm_added_k.weight",
158
+ "transformer_blocks.14.img_norm1.weight",
159
+ "transformer_blocks.14.img_norm2.weight",
160
+ "transformer_blocks.14.txt_norm1.weight",
161
+ "transformer_blocks.14.txt_norm2.weight",
162
+ "transformer_blocks.15.attn.norm_q.weight",
163
+ "transformer_blocks.15.attn.norm_k.weight",
164
+ "transformer_blocks.15.attn.norm_added_q.weight",
165
+ "transformer_blocks.15.attn.norm_added_k.weight",
166
+ "transformer_blocks.15.img_norm1.weight",
167
+ "transformer_blocks.15.img_norm2.weight",
168
+ "transformer_blocks.15.txt_norm1.weight",
169
+ "transformer_blocks.15.txt_norm2.weight",
170
+ "transformer_blocks.16.attn.norm_q.weight",
171
+ "transformer_blocks.16.attn.norm_k.weight",
172
+ "transformer_blocks.16.attn.norm_added_q.weight",
173
+ "transformer_blocks.16.attn.norm_added_k.weight",
174
+ "transformer_blocks.16.img_norm1.weight",
175
+ "transformer_blocks.16.img_norm2.weight",
176
+ "transformer_blocks.16.txt_norm1.weight",
177
+ "transformer_blocks.16.txt_norm2.weight",
178
+ "transformer_blocks.17.attn.norm_q.weight",
179
+ "transformer_blocks.17.attn.norm_k.weight",
180
+ "transformer_blocks.17.attn.norm_added_q.weight",
181
+ "transformer_blocks.17.attn.norm_added_k.weight",
182
+ "transformer_blocks.17.img_norm1.weight",
183
+ "transformer_blocks.17.img_norm2.weight",
184
+ "transformer_blocks.17.txt_norm1.weight",
185
+ "transformer_blocks.17.txt_norm2.weight",
186
+ "transformer_blocks.18.attn.norm_q.weight",
187
+ "transformer_blocks.18.attn.norm_k.weight",
188
+ "transformer_blocks.18.attn.norm_added_q.weight",
189
+ "transformer_blocks.18.attn.norm_added_k.weight",
190
+ "transformer_blocks.18.img_norm1.weight",
191
+ "transformer_blocks.18.img_norm2.weight",
192
+ "transformer_blocks.18.txt_norm1.weight",
193
+ "transformer_blocks.18.txt_norm2.weight",
194
+ "transformer_blocks.19.attn.norm_q.weight",
195
+ "transformer_blocks.19.attn.norm_k.weight",
196
+ "transformer_blocks.19.attn.norm_added_q.weight",
197
+ "transformer_blocks.19.attn.norm_added_k.weight",
198
+ "transformer_blocks.19.img_norm1.weight",
199
+ "transformer_blocks.19.img_norm2.weight",
200
+ "transformer_blocks.19.txt_norm1.weight",
201
+ "transformer_blocks.19.txt_norm2.weight",
202
+ "transformer_blocks.20.attn.norm_q.weight",
203
+ "transformer_blocks.20.attn.norm_k.weight",
204
+ "transformer_blocks.20.attn.norm_added_q.weight",
205
+ "transformer_blocks.20.attn.norm_added_k.weight",
206
+ "transformer_blocks.20.img_norm1.weight",
207
+ "transformer_blocks.20.img_norm2.weight",
208
+ "transformer_blocks.20.txt_norm1.weight",
209
+ "transformer_blocks.20.txt_norm2.weight",
210
+ "transformer_blocks.21.attn.norm_q.weight",
211
+ "transformer_blocks.21.attn.norm_k.weight",
212
+ "transformer_blocks.21.attn.norm_added_q.weight",
213
+ "transformer_blocks.21.attn.norm_added_k.weight",
214
+ "transformer_blocks.21.img_norm1.weight",
215
+ "transformer_blocks.21.img_norm2.weight",
216
+ "transformer_blocks.21.txt_norm1.weight",
217
+ "transformer_blocks.21.txt_norm2.weight",
218
+ "transformer_blocks.22.attn.norm_q.weight",
219
+ "transformer_blocks.22.attn.norm_k.weight",
220
+ "transformer_blocks.22.attn.norm_added_q.weight",
221
+ "transformer_blocks.22.attn.norm_added_k.weight",
222
+ "transformer_blocks.22.img_norm1.weight",
223
+ "transformer_blocks.22.img_norm2.weight",
224
+ "transformer_blocks.22.txt_norm1.weight",
225
+ "transformer_blocks.22.txt_norm2.weight",
226
+ "transformer_blocks.23.attn.norm_q.weight",
227
+ "transformer_blocks.23.attn.norm_k.weight",
228
+ "transformer_blocks.23.attn.norm_added_q.weight",
229
+ "transformer_blocks.23.attn.norm_added_k.weight",
230
+ "transformer_blocks.23.img_norm1.weight",
231
+ "transformer_blocks.23.img_norm2.weight",
232
+ "transformer_blocks.23.txt_norm1.weight",
233
+ "transformer_blocks.23.txt_norm2.weight",
234
+ "transformer_blocks.24.attn.norm_q.weight",
235
+ "transformer_blocks.24.attn.norm_k.weight",
236
+ "transformer_blocks.24.attn.norm_added_q.weight",
237
+ "transformer_blocks.24.attn.norm_added_k.weight",
238
+ "transformer_blocks.24.img_norm1.weight",
239
+ "transformer_blocks.24.img_norm2.weight",
240
+ "transformer_blocks.24.txt_norm1.weight",
241
+ "transformer_blocks.24.txt_norm2.weight",
242
+ "transformer_blocks.25.attn.norm_q.weight",
243
+ "transformer_blocks.25.attn.norm_k.weight",
244
+ "transformer_blocks.25.attn.norm_added_q.weight",
245
+ "transformer_blocks.25.attn.norm_added_k.weight",
246
+ "transformer_blocks.25.img_norm1.weight",
247
+ "transformer_blocks.25.img_norm2.weight",
248
+ "transformer_blocks.25.txt_norm1.weight",
249
+ "transformer_blocks.25.txt_norm2.weight",
250
+ "transformer_blocks.26.attn.norm_q.weight",
251
+ "transformer_blocks.26.attn.norm_k.weight",
252
+ "transformer_blocks.26.attn.norm_added_q.weight",
253
+ "transformer_blocks.26.attn.norm_added_k.weight",
254
+ "transformer_blocks.26.img_norm1.weight",
255
+ "transformer_blocks.26.img_norm2.weight",
256
+ "transformer_blocks.26.txt_norm1.weight",
257
+ "transformer_blocks.26.txt_norm2.weight",
258
+ "transformer_blocks.27.attn.norm_q.weight",
259
+ "transformer_blocks.27.attn.norm_k.weight",
260
+ "transformer_blocks.27.attn.norm_added_q.weight",
261
+ "transformer_blocks.27.attn.norm_added_k.weight",
262
+ "transformer_blocks.27.img_norm1.weight",
263
+ "transformer_blocks.27.img_norm2.weight",
264
+ "transformer_blocks.27.txt_norm1.weight",
265
+ "transformer_blocks.27.txt_norm2.weight",
266
+ "transformer_blocks.28.attn.norm_q.weight",
267
+ "transformer_blocks.28.attn.norm_k.weight",
268
+ "transformer_blocks.28.attn.norm_added_q.weight",
269
+ "transformer_blocks.28.attn.norm_added_k.weight",
270
+ "transformer_blocks.28.img_norm1.weight",
271
+ "transformer_blocks.28.img_norm2.weight",
272
+ "transformer_blocks.28.txt_norm1.weight",
273
+ "transformer_blocks.28.txt_norm2.weight",
274
+ "transformer_blocks.29.attn.norm_q.weight",
275
+ "transformer_blocks.29.attn.norm_k.weight",
276
+ "transformer_blocks.29.attn.norm_added_q.weight",
277
+ "transformer_blocks.29.attn.norm_added_k.weight",
278
+ "transformer_blocks.29.img_norm1.weight",
279
+ "transformer_blocks.29.img_norm2.weight",
280
+ "transformer_blocks.29.txt_norm1.weight",
281
+ "transformer_blocks.29.txt_norm2.weight",
282
+ "transformer_blocks.30.attn.norm_q.weight",
283
+ "transformer_blocks.30.attn.norm_k.weight",
284
+ "transformer_blocks.30.attn.norm_added_q.weight",
285
+ "transformer_blocks.30.attn.norm_added_k.weight",
286
+ "transformer_blocks.30.img_norm1.weight",
287
+ "transformer_blocks.30.img_norm2.weight",
288
+ "transformer_blocks.30.txt_norm1.weight",
289
+ "transformer_blocks.30.txt_norm2.weight",
290
+ "transformer_blocks.31.attn.norm_q.weight",
291
+ "transformer_blocks.31.attn.norm_k.weight",
292
+ "transformer_blocks.31.attn.norm_added_q.weight",
293
+ "transformer_blocks.31.attn.norm_added_k.weight",
294
+ "transformer_blocks.31.img_norm1.weight",
295
+ "transformer_blocks.31.img_norm2.weight",
296
+ "transformer_blocks.31.txt_norm1.weight",
297
+ "transformer_blocks.31.txt_norm2.weight",
298
+ "transformer_blocks.32.attn.norm_q.weight",
299
+ "transformer_blocks.32.attn.norm_k.weight",
300
+ "transformer_blocks.32.attn.norm_added_q.weight",
301
+ "transformer_blocks.32.attn.norm_added_k.weight",
302
+ "transformer_blocks.32.img_norm1.weight",
303
+ "transformer_blocks.32.img_norm2.weight",
304
+ "transformer_blocks.32.txt_norm1.weight",
305
+ "transformer_blocks.32.txt_norm2.weight",
306
+ "transformer_blocks.33.attn.norm_q.weight",
307
+ "transformer_blocks.33.attn.norm_k.weight",
308
+ "transformer_blocks.33.attn.norm_added_q.weight",
309
+ "transformer_blocks.33.attn.norm_added_k.weight",
310
+ "transformer_blocks.33.img_norm1.weight",
311
+ "transformer_blocks.33.img_norm2.weight",
312
+ "transformer_blocks.33.txt_norm1.weight",
313
+ "transformer_blocks.33.txt_norm2.weight",
314
+ "transformer_blocks.34.attn.norm_q.weight",
315
+ "transformer_blocks.34.attn.norm_k.weight",
316
+ "transformer_blocks.34.attn.norm_added_q.weight",
317
+ "transformer_blocks.34.attn.norm_added_k.weight",
318
+ "transformer_blocks.34.img_norm1.weight",
319
+ "transformer_blocks.34.img_norm2.weight",
320
+ "transformer_blocks.34.txt_norm1.weight",
321
+ "transformer_blocks.34.txt_norm2.weight",
322
+ "transformer_blocks.35.attn.norm_q.weight",
323
+ "transformer_blocks.35.attn.norm_k.weight",
324
+ "transformer_blocks.35.attn.norm_added_q.weight",
325
+ "transformer_blocks.35.attn.norm_added_k.weight",
326
+ "transformer_blocks.35.img_norm1.weight",
327
+ "transformer_blocks.35.img_norm2.weight",
328
+ "transformer_blocks.35.txt_norm1.weight",
329
+ "transformer_blocks.35.txt_norm2.weight",
330
+ "transformer_blocks.36.attn.norm_q.weight",
331
+ "transformer_blocks.36.attn.norm_k.weight",
332
+ "transformer_blocks.36.attn.norm_added_q.weight",
333
+ "transformer_blocks.36.attn.norm_added_k.weight",
334
+ "transformer_blocks.36.img_norm1.weight",
335
+ "transformer_blocks.36.img_norm2.weight",
336
+ "transformer_blocks.36.txt_norm1.weight",
337
+ "transformer_blocks.36.txt_norm2.weight",
338
+ "transformer_blocks.37.attn.norm_q.weight",
339
+ "transformer_blocks.37.attn.norm_k.weight",
340
+ "transformer_blocks.37.attn.norm_added_q.weight",
341
+ "transformer_blocks.37.attn.norm_added_k.weight",
342
+ "transformer_blocks.37.img_norm1.weight",
343
+ "transformer_blocks.37.img_norm2.weight",
344
+ "transformer_blocks.37.txt_norm1.weight",
345
+ "transformer_blocks.37.txt_norm2.weight",
346
+ "transformer_blocks.38.attn.norm_q.weight",
347
+ "transformer_blocks.38.attn.norm_k.weight",
348
+ "transformer_blocks.38.attn.norm_added_q.weight",
349
+ "transformer_blocks.38.attn.norm_added_k.weight",
350
+ "transformer_blocks.38.img_norm1.weight",
351
+ "transformer_blocks.38.img_norm2.weight",
352
+ "transformer_blocks.38.txt_norm1.weight",
353
+ "transformer_blocks.38.txt_norm2.weight",
354
+ "transformer_blocks.39.attn.norm_q.weight",
355
+ "transformer_blocks.39.attn.norm_k.weight",
356
+ "transformer_blocks.39.attn.norm_added_q.weight",
357
+ "transformer_blocks.39.attn.norm_added_k.weight",
358
+ "transformer_blocks.39.img_norm1.weight",
359
+ "transformer_blocks.39.img_norm2.weight",
360
+ "transformer_blocks.39.txt_norm1.weight",
361
+ "transformer_blocks.39.txt_norm2.weight",
362
+ "transformer_blocks.40.attn.norm_q.weight",
363
+ "transformer_blocks.40.attn.norm_k.weight",
364
+ "transformer_blocks.40.attn.norm_added_q.weight",
365
+ "transformer_blocks.40.attn.norm_added_k.weight",
366
+ "transformer_blocks.40.img_norm1.weight",
367
+ "transformer_blocks.40.img_norm2.weight",
368
+ "transformer_blocks.40.txt_norm1.weight",
369
+ "transformer_blocks.40.txt_norm2.weight",
370
+ "transformer_blocks.41.attn.norm_q.weight",
371
+ "transformer_blocks.41.attn.norm_k.weight",
372
+ "transformer_blocks.41.attn.norm_added_q.weight",
373
+ "transformer_blocks.41.attn.norm_added_k.weight",
374
+ "transformer_blocks.41.img_norm1.weight",
375
+ "transformer_blocks.41.img_norm2.weight",
376
+ "transformer_blocks.41.txt_norm1.weight",
377
+ "transformer_blocks.41.txt_norm2.weight",
378
+ "transformer_blocks.42.attn.norm_q.weight",
379
+ "transformer_blocks.42.attn.norm_k.weight",
380
+ "transformer_blocks.42.attn.norm_added_q.weight",
381
+ "transformer_blocks.42.attn.norm_added_k.weight",
382
+ "transformer_blocks.42.img_norm1.weight",
383
+ "transformer_blocks.42.img_norm2.weight",
384
+ "transformer_blocks.42.txt_norm1.weight",
385
+ "transformer_blocks.42.txt_norm2.weight",
386
+ "transformer_blocks.43.attn.norm_q.weight",
387
+ "transformer_blocks.43.attn.norm_k.weight",
388
+ "transformer_blocks.43.attn.norm_added_q.weight",
389
+ "transformer_blocks.43.attn.norm_added_k.weight",
390
+ "transformer_blocks.43.img_norm1.weight",
391
+ "transformer_blocks.43.img_norm2.weight",
392
+ "transformer_blocks.43.txt_norm1.weight",
393
+ "transformer_blocks.43.txt_norm2.weight",
394
+ "transformer_blocks.44.attn.norm_q.weight",
395
+ "transformer_blocks.44.attn.norm_k.weight",
396
+ "transformer_blocks.44.attn.norm_added_q.weight",
397
+ "transformer_blocks.44.attn.norm_added_k.weight",
398
+ "transformer_blocks.44.img_norm1.weight",
399
+ "transformer_blocks.44.img_norm2.weight",
400
+ "transformer_blocks.44.txt_norm1.weight",
401
+ "transformer_blocks.44.txt_norm2.weight",
402
+ "transformer_blocks.45.attn.norm_q.weight",
403
+ "transformer_blocks.45.attn.norm_k.weight",
404
+ "transformer_blocks.45.attn.norm_added_q.weight",
405
+ "transformer_blocks.45.attn.norm_added_k.weight",
406
+ "transformer_blocks.45.img_norm1.weight",
407
+ "transformer_blocks.45.img_norm2.weight",
408
+ "transformer_blocks.45.txt_norm1.weight",
409
+ "transformer_blocks.45.txt_norm2.weight",
410
+ "transformer_blocks.46.attn.norm_q.weight",
411
+ "transformer_blocks.46.attn.norm_k.weight",
412
+ "transformer_blocks.46.attn.norm_added_q.weight",
413
+ "transformer_blocks.46.attn.norm_added_k.weight",
414
+ "transformer_blocks.46.img_norm1.weight",
415
+ "transformer_blocks.46.img_norm2.weight",
416
+ "transformer_blocks.46.txt_norm1.weight",
417
+ "transformer_blocks.46.txt_norm2.weight",
418
+ "transformer_blocks.47.attn.norm_q.weight",
419
+ "transformer_blocks.47.attn.norm_k.weight",
420
+ "transformer_blocks.47.attn.norm_added_q.weight",
421
+ "transformer_blocks.47.attn.norm_added_k.weight",
422
+ "transformer_blocks.47.img_norm1.weight",
423
+ "transformer_blocks.47.img_norm2.weight",
424
+ "transformer_blocks.47.txt_norm1.weight",
425
+ "transformer_blocks.47.txt_norm2.weight"
426
+ ],
427
+ "modules_to_not_use_matmul": [],
428
+ "non_blocking": false,
429
+ "quant_conv": false,
430
+ "quant_embedding": false,
431
+ "quant_method": "sdnq",
432
+ "quantization_device": null,
433
+ "quantized_matmul_dtype": "int8",
434
+ "return_device": null,
435
+ "sdnq_version": "0.2.0",
436
+ "svd_rank": 32,
437
+ "svd_steps": 8,
438
+ "use_dynamic_quantization": false,
439
+ "use_grad_ckpt": true,
440
+ "use_hadamard": false,
441
+ "use_quantized_matmul": true,
442
+ "use_quantized_matmul_conv": false,
443
+ "use_static_quantization": true,
444
+ "use_stochastic_rounding": false,
445
+ "use_svd": false,
446
+ "weights_dtype": "uint4"
447
+ }
vae/config.json ADDED
@@ -0,0 +1,41 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_class_name": "AutoencoderKLFlux2",
3
+ "_diffusers_version": "0.38.0",
4
+ "_name_or_path": "/workspace/.cache/huggingface/hub/models--microsoft--Lens-Turbo/snapshots/f21b81bed3bae7f93f16f5fd300af9c408f5816a/vae",
5
+ "act_fn": "silu",
6
+ "batch_norm_eps": 0.0001,
7
+ "batch_norm_momentum": 0.1,
8
+ "block_out_channels": [
9
+ 128,
10
+ 256,
11
+ 512,
12
+ 512
13
+ ],
14
+ "decoder_block_out_channels": null,
15
+ "down_block_types": [
16
+ "DownEncoderBlock2D",
17
+ "DownEncoderBlock2D",
18
+ "DownEncoderBlock2D",
19
+ "DownEncoderBlock2D"
20
+ ],
21
+ "force_upcast": true,
22
+ "in_channels": 3,
23
+ "latent_channels": 32,
24
+ "layers_per_block": 2,
25
+ "mid_block_add_attention": true,
26
+ "norm_num_groups": 32,
27
+ "out_channels": 3,
28
+ "patch_size": [
29
+ 2,
30
+ 2
31
+ ],
32
+ "sample_size": 1024,
33
+ "up_block_types": [
34
+ "UpDecoderBlock2D",
35
+ "UpDecoderBlock2D",
36
+ "UpDecoderBlock2D",
37
+ "UpDecoderBlock2D"
38
+ ],
39
+ "use_post_quant_conv": true,
40
+ "use_quant_conv": true
41
+ }
vae/diffusion_pytorch_model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ca70d2202afe6415bdbcb8793ba8cd99fd159cfe6192381504d6c4d3036e0f04
3
+ size 168120878