cocktailpeanut committed on
Commit
e0a0fb2
·
verified ·
1 Parent(s): 35dfe54

Upload folder using huggingface_hub

Browse files
.gitattributes CHANGED
@@ -33,3 +33,11 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
 
 
 
 
 
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ tokenizer/tokenizer.json filter=lfs diff=lfs merge=lfs -text
37
+ assets/benchmarks/design_arena.png filter=lfs diff=lfs merge=lfs -text
38
+ assets/benchmarks/design_arena2.png filter=lfs diff=lfs merge=lfs -text
39
+ assets/benchmarks/ideogram_benchmark.png filter=lfs diff=lfs merge=lfs -text
40
+ assets/benchmarks/lmarena_benchmark.png filter=lfs diff=lfs merge=lfs -text
41
+ assets/benchmarks/opensource.png filter=lfs diff=lfs merge=lfs -text
42
+ assets/benchmarks/opensource2.png filter=lfs diff=lfs merge=lfs -text
43
+ assets/samples/collage_landscape.jpg filter=lfs diff=lfs merge=lfs -text
LICENSE.md ADDED
@@ -0,0 +1,55 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ Ideogram Non-Commercial Model Agreement
2
+
3
+ Last Updated: June 3, 2026
4
+
5
+ This Ideogram Non-Commercial Model Agreement (“Agreement”) is a legal agreement between you and Ideogram, Inc. (“Company”, “we” or “us”). This Agreement governs your access to and use of the Models (as defined below) that we make available to you under this Agreement. You expressly agree that if you accept the terms of this Agreement or if you otherwise download, access, use or Distribute any portion of the Model or Model Derivatives, then you agree to be bound by this Agreement. Company may designate certain materials that are designed to be used with the Models (such as related inference code) under a separate license or agreement, and nothing in this Agreement will be deemed to restrict or limit any other rights or licenses granted by Company in such other materials.
6
+
7
+ If you are entering into this Agreement on behalf of an entity, then “you” means that entity, and you represent and warrant that (a) you are an authorized representative of the entity with the authority to bind the entity to this Agreement and (b) you agree to this Agreement on the entity’s behalf.
8
+
9
+ 1. Definitions.
10
+
11
+ (a) “Distribution” or “Distribute” means any distribution, making available, transmission, publication or other sharing of the Model or any Model Derivative with or to a third party, including by providing or making the Model or its functionality available as a hosted service via API, web access or any other electronic or remote means (“Hosted Service”), and including by incorporating the Model into products or services that you make available to third parties.
12
+
13
+ (b) “Model” means the machine learning model, software, algorithms, trained model weights, parameters and documentation that Company designates as subject to this Agreement. For clarity, the following are considered Models subject to this Agreement: Ideogram 4.
14
+
15
+ (c) “Model Derivative” means all (i) modifications to, and fine-tuned versions of, the Model, (ii) any other machine learning model which is created by transferring the weights and parameters of the Model (or patterns thereof) to such model in a manner that causes it to perform similar to the Model, or (iii) any other derivatives of the Model. For clarity, an Output is not a Model Derivative.
16
+
17
+ (d) “Non-Commercial Purposes” means activity or use that fits in any of the following categories: (i) use that does not directly or indirectly generate revenue and is not otherwise intended for or directed towards commercial advantage or monetary compensation, (ii) use by a for-profit entity solely for testing, evaluation, or research and development in a “non-production environment” (an environment that is not deployed in live systems, customer-facing applications or any other environment beyond internal development, testing or prototyping), (iii) personal use for research, experimentation, testing purposes as part of a personal study, private entertainment or hobby project, or (iv) use by a charitable organization for charitable purposes. Without limiting the foregoing, any use that involves training, fine tuning, or distilling AI models for commercial use or that involves generating Output to include in, or to advertise or promote, revenue-generating products or services, in each case, is not a Non-Commercial Purpose.
18
+
19
+ (e) “Output” means any content or other output generated by the inference operation of the Model or any Model Derivative, in response to an input or prompt provided by the user. For the avoidance of doubt, Outputs do not include any components of a Model, such as any fine-tuned versions of the Model, the weights, or parameters.
20
+
21
+ 2. Grant of Rights.
22
+
23
+ We hereby permit you to use, reproduce, Distribute, copy, create derivative works of (including Model Derivatives), and make modifications to the Model for Non-Commercial Purposes subject to the terms of this Agreement, including any use restrictions set forth below. For clarity, you are authorized to exercise the rights under this Agreement for Non-Commercial Purposes only, and may not exercise any of the rights under this Agreement for other purposes unless or until Company otherwise expressly grants you such rights in a separate agreement, which Company may grant or not grant in its sole discretion.
24
+
25
+ 3. Redistribution and Use.
26
+
27
+ You may reproduce or Distribute copies of the Model or Model Derivatives only if you meet all of the following conditions: (i) all permitted use of the reproduced and re-Distributed Model or Model Derivatives must be on terms that are no less restrictive than those set forth in this Agreement for the Model (e.g., including the same standards for Non-Commercial Purposes as set forth in Section 2 above and at least the same use restrictions set forth in Section 4 below), (ii) you provide all third party recipients of the Model or Model Derivative a copy of this Agreement; (iii) you retain in all copies of the Model or Model Derivatives that you Distribute the following attribution notice within a “Notice” text file that accompanies such copy: “Ideogram 4 is provided under and subject to the Ideogram Non-Commercial Model Agreement available at https://github.com/ideogram-oss/ideogram-4/model_licenses/LICENSE-IDEOGRAM-4-NON-COMMERCIAL. All rights reserved. Copyright © Ideogram, Inc.”; (iv) you cause any modified files to carry prominent notices stating that you modified the files; (v) any terms and conditions you impose on third-party recipients must include a disclaimer of warranties and limitation of liability provisions that are at least as protective of Company as those set forth herein; and (vi) you must not misrepresent or imply that any Model Derivative made by you is an official product of Company or has been endorsed, approved or validated by Company.
28
+
29
+ 4. Use Restrictions.
30
+
31
+ Your use of the Model and any Model Derivative must comply with applicable laws and regulations (including trade compliance laws and regulations) and adhere to the Acceptable Use Policy available at https://ideogram.ai/legal/usage-policy, which is hereby incorporated by reference into this Agreement. Without limiting the foregoing, you will not (and will not permit or enable any third party to) use the Model or any Model Derivative: (a) for military purposes or purposes of surveillance, including any research or development relating to surveillance; (b) for biometric processing; (c) in any manner that infringes, misappropriates, or otherwise violates any third party’s legal rights, including rights of publicity; (d) to generate unlawful content, including child sexual abuse material or non-consensual intimate images; (e) in any manner that violates any applicable privacy or data protection laws; or (f) to make automated decisions in domains that affect material or individual rights or well-being (e.g., finance, legal, employment, healthcare, housing, insurance and social welfare) or otherwise in a manner that poses a significant risk of harm to the health, safety or fundamental rights of persons, including to influence any “consequential decision” under applicable law or for any other use case that is categorized as “high risk” under applicable law (“High Risk Use Cases”). You are responsible for implementing appropriate safety measures, including content filters and human oversight, suitable for your use case and to prevent the creation, display, generation or reproduction of unlawful or infringing content, and for including any legally required disclosure (or other provenance measures) to disclose that the Output was generated or modified using artificial intelligence technologies. 
However, we may also implement certain safety measures, content protections and other technological measures for the Model, including content filters and watermarking, and you agree that you will not circumvent, remove, alter, deactivate, degrade or thwart any such measures. To the extent required under applicable law, you must ensure any Output includes disclosure or other indication that the Output was generated or modified using artificial intelligence technologies.
32
+
33
+ 5. Disclaimer of Warranty.
34
+
35
+ UNLESS REQUIRED BY APPLICABLE LAW, THE MODEL, ANY MODEL DERIVATIVE AND ANY OUTPUT AND RESULTS THEREFROM ARE PROVIDED ON AN “AS IS” BASIS, WITHOUT WARRANTIES OF ANY KIND, AND WE DISCLAIM ALL WARRANTIES OF ANY KIND, BOTH EXPRESS AND IMPLIED, INCLUDING, WITHOUT LIMITATION, ANY WARRANTIES OF TITLE, NON-INFRINGEMENT, MERCHANTABILITY, OR FITNESS FOR A PARTICULAR PURPOSE. YOU ARE SOLELY RESPONSIBLE FOR DETERMINING THE APPROPRIATENESS OF, AND ASSUME ALL RISKS ASSOCIATED WITH, USING, REPRODUCING, MODIFYING, PERFORMING, DISPLAYING OR DISTRIBUTING THE MODEL, ANY MODEL DERIVATIVE OR ANY OUTPUT. YOU AGREE THAT THE MODEL AND ANY MODEL DERIVATIVE ARE NOT DESIGNED OR INTENDED FOR HIGH RISK USE CASES OR AS PART OF HIGH RISK AI SYSTEMS (AS DEFINED UNDER APPLICABLE LAWS), AND ANY SUCH USE IS IN VIOLATION OF THIS AGREEMENT AND AT YOUR OWN RISK.
36
+
37
+ 6. Limitation of Liability.
38
+
39
+ IN NO EVENT WILL COMPANY OR ITS AFFILIATES BE LIABLE UNDER ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, TORT, NEGLIGENCE, PRODUCTS LIABILITY, OR OTHERWISE, ARISING OUT OF THIS AGREEMENT, FOR DAMAGES OF ANY KIND, INCLUDING DIRECT, INDIRECT, SPECIAL, CONSEQUENTIAL, INCIDENTAL, EXEMPLARY OR PUNITIVE DAMAGES OR LOST PROFITS OF ANY KIND, EVEN IF COMPANY OR ITS AFFILIATES HAVE BEEN ADVISED OF THE POSSIBILITY OF ANY OF THE FOREGOING.
40
+
41
+ 7. Intellectual Property.
42
+
43
+ Company reserves any rights not expressly granted herein. Nothing in this Agreement grants you any rights to use Company’s trademarks, trade names, or logos (except as required for the attribution described above). Subject to Company’s ownership of the Model and Model Derivatives made by or for Company, with respect to any Model Derivatives that are made by you, as between you and Company, you own any incremental rights in such Model Derivatives beyond Company’s rights in the underlying Model or its own Model Derivatives. We claim no rights in outputs you generate using the Model. You are responsible for outputs and their subsequent uses. You may not use any Output to develop, train, fine-tune or distill a model or other product or service that is competitive with the Model or any of Company’s other products or services.
44
+
45
+ 8. Indemnification.
46
+
47
+ You will indemnify and hold harmless the Company and its affiliates and each of their respective shareholders, directors, officers, employees, agents, successors, and assigns (collectively, the “Company Parties”) from and against any losses, liabilities, damages, fines, penalties, and expenses (including reasonable attorneys’ fees) incurred by any Company Party in connection with any claim, demand, allegation, lawsuit, proceeding, or investigation arising out of or related to your use, access, hosting or Distribution of the Model or Model Derivatives or any Outputs or your breach of this Agreement.
48
+
49
+ 9. Term and Termination.
50
+
51
+ This Agreement continues in full force and effect until terminated in accordance with the terms and conditions herein. We may terminate this Agreement at any time upon notice to you. We may also terminate this Agreement if you are in breach of any term or condition of this Agreement. If you institute litigation or other proceedings against Company or any entity (including a cross-claim or counterclaim in a lawsuit) alleging that the Model, Model Derivative or output, or any portion of any of the foregoing, constitutes infringement of intellectual property or other rights owned or licensable by you, then any licenses granted to you under this Agreement shall terminate as of the date such litigation or claim is filed or instituted. Upon termination of this Agreement, you shall delete and cease use or Distribution of the Model and any Model Derivative. Sections 5–10 shall survive the termination of this Agreement.
52
+
53
+ 10. General.
54
+
55
+ This Agreement will be governed and construed under the laws of the State of New York without regard to conflicts of law provisions. If any provision or part of a provision of this Agreement is unlawful, void or unenforceable, that provision or part of the provision is deemed severed from this Agreement, and will not affect the validity and enforceability of any remaining provisions. The failure of Company to exercise or enforce any right or provision of this Agreement will not operate as a waiver of such right or provision. This Agreement does not confer any third-party beneficiary rights upon any other person or entity. This Agreement contains the entire understanding between you and Company regarding the subject matter of this Agreement, and supersedes all other written or oral agreements and understandings between you and Company regarding such subject matter. You may not assign or transfer this Agreement, including any of your rights or obligations hereunder, without the prior written consent of Company. Any purported assignment not in accordance with this Section will be null and void. We may modify this Agreement from time to time in which case we will update the “Last Updated” date at the top of these Terms. It is your sole responsibility to review this Agreement from time to time to view any such changes. The updated Agreement will be effective as of the time of posting, or such later date as may be specified in the updated Agreement. Your continued access or use of the Model or any Model Derivatives after the modifications have become effective will be deemed your acceptance of the modified Agreement.
README.md ADDED
@@ -0,0 +1,329 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ license: other
3
+ license_name: ideogram-4-non-commercial
4
+ license_link: https://huggingface.co/ideogram-ai/ideogram-4-fp8/blob/main/LICENSE.md
5
+ pipeline_tag: text-to-image
6
+ tags:
7
+ - text-to-image
8
+ - image-generation
9
+ - diffusion
10
+ - flow-matching
11
+ - dit
12
+ - ideogram
13
+ ---
14
+
15
+ <p align="center"><a href="https://ideogram.ai/" target="_blank" rel="noopener noreferrer"><img src="assets/ideogram_logo.svg" alt="Ideogram" width="500"></a></p>
16
+
17
+ <p align="center"><em>Ideogram 4: Open image model at the forefront of design</em></p>
18
+
19
+ <p align="center">
20
+ <a href="https://ideogram.ai/blog/ideogram-4.0/" target="_blank" rel="noopener noreferrer"><img src="https://img.shields.io/badge/Blog-Post-orange" alt="Blog Post"></a>
21
+ <a href="https://github.com/ideogram-oss/ideogram4" target="_blank" rel="noopener noreferrer"><img src="https://img.shields.io/badge/Code-GitHub-181717?logo=github" alt="Code"></a>
22
+ <a href="https://huggingface.co/collections/ideogram-ai/ideogram-4" target="_blank" rel="noopener noreferrer"><img src="https://img.shields.io/badge/Model-HuggingFace-blue?logo=huggingface" alt="Model"></a>
23
+ <a href="https://developer.ideogram.ai/" target="_blank" rel="noopener noreferrer"><img src="https://img.shields.io/badge/API-developer.ideogram.ai-purple" alt="API"></a>
24
+ <a href="https://ideogram.ai/" target="_blank" rel="noopener noreferrer"><img src="https://img.shields.io/badge/Official%20Site-ideogram.ai-ff69b4" alt="Official Site"></a>
25
+ </p>
26
+
27
+ <p align="center">
28
+ <img src="assets/samples/collage_landscape.jpg" alt="A collage of Ideogram 4 samples spanning photorealism, illustration, typography, and poster design">
29
+ </p>
30
+
31
+
32
+ Ideogram 4 is **[Ideogram](https://ideogram.ai)'s first open-source text-to-image model**. It is a **state-of-the-art foundation model trained from scratch** — not a fine-tune of any existing model. It introduces a new structured JSON prompting interface, with best-in-class multilingual text rendering, deep language understanding, explicit bounding-box layout and color-palette controls, and native 2k resolution images. The easiest way to try the model is online at **[ideogram.ai](https://ideogram.ai/)**.
33
+
34
+ We believe openness drives innovation, and we invite the research community to innovate with us on the forefront of visual intelligence.
35
+
36
+ ## Table of Contents
37
+
38
+ 1. [News](#news)
39
+ 2. [Model Zoo](#model-zoo)
40
+ 3. [Performance](#performance)
41
+ 4. [Quick Start](#quick-start)
42
+ 5. [Model Summary](#model-summary)
43
+ 6. [Prompting Guide](#prompting-guide)
44
+ 7. [Documentation](#documentation)
45
+ 8. [Citation](#citation)
46
+
47
+ ## News
48
+
49
+ * **[2026-06-03]** **Ideogram 4 released!** Inference code and weights
50
+ are now public, and our [technical blog post](https://ideogram.ai/blog/ideogram-4.0/) is live. See the
51
+ [Quick Start](#quick-start) section to generate your first image, or try the
52
+ model online at [ideogram.ai](https://ideogram.ai/).
53
+
54
+ ## Model Zoo
55
+
56
+ | Model | Params | Weight Quantization | Supported Hardware | Diffusers Support | License |
57
+ | :--- | :---: | :---: | :---: | :---: | :---: |
58
+ | **[Ideogram 4 (nf4)](https://huggingface.co/ideogram-ai/ideogram-4-nf4)** | 9.3B | nf4 | CUDA | Yes | [Ideogram 4 Non-Commercial](https://huggingface.co/ideogram-ai/ideogram-4-nf4/blob/main/LICENSE.md) |
59
+ | **[Ideogram 4 (fp8)](https://huggingface.co/ideogram-ai/ideogram-4-fp8)** | 9.3B | fp8 | All | No | [Ideogram 4 Non-Commercial](https://huggingface.co/ideogram-ai/ideogram-4-fp8/blob/main/LICENSE.md) |
60
+
61
+ We plan to support more quantizations in the future.
62
+
63
+
64
+ ## Performance
65
+
66
+ We evaluate Ideogram 4 across third-party arenas and benchmarks, standard
67
+ open-source benchmarks, and our own internal human-preference benchmark. Across
68
+ all of them, **Ideogram 4 is the best open-weight image model by far, and sits
69
+ at the frontier of design.**
70
+
71
+ ### Design Arena
72
+
73
+ [Design Arena](https://www.designarena.ai/) is a third-party image Elo
74
+ leaderboard focused specifically on design-oriented generation. On the overall
75
+ board, Ideogram 4 is the top-ranked open-weight model, trailing only proprietary
76
+ GPT and Gemini models:
77
+
78
+ <p align="center">
79
+ <img src="assets/benchmarks/design_arena.png" alt="Design Arena overall image Elo leaderboard with Ideogram 4.0 as the top open-weight model">
80
+ </p>
81
+
82
+ Filtered to open-weight models only, Ideogram 4 leads by a commanding margin,
83
+ well ahead of the next-best open model:
84
+
85
+ <p align="center">
86
+ <img src="assets/benchmarks/design_arena2.png" alt="Design Arena open-weight image Elo leaderboard, with Ideogram 4.0 well ahead of all other open models">
87
+ </p>
88
+
89
+ ### ContraLabs
90
+
91
+ [ContraLabs](https://contralabs.com/research) ran a blind typography evaluation judged by
92
+ ten professional designers from Contra's top-earning talent. Ideogram 4 leads on
93
+ first-place win rate, picked as the best of four models 47.9% of the time
94
+ overall — well ahead of Gemini 3.1 Flash Image Preview (Nano Banana 2) at 30.0%,
95
+ FLUX.2 [max] (15.5%), and Grok Imagine 1.0 (15.0%):
96
+
97
+ <p align="center">
98
+ <img src="assets/benchmarks/contralabs_typography.png" alt="ContraLabs typography first-place win rate, with Ideogram v4 leading">
99
+ </p>
100
+
101
+ It also wins on practical usability: asked "Would you use this in real client
102
+ work?", the same designers rated Ideogram 4 highest at 3.55 / 5 — significantly
103
+ above Nano Banana 2 (2.84), Grok Imagine 1.0 (2.61), and FLUX.2 [max] (2.49):
104
+
105
+ <p align="center">
106
+ <img src="assets/benchmarks/contralabs_typography2.png" alt="ContraLabs 'would you use this in real client work?' rating, with Ideogram v4 leading">
107
+ </p>
108
+
109
+ ### LMArena
110
+
111
+ On [LMArena](https://lmarena.ai/), a third-party text-to-image leaderboard that
112
+ measures general-purpose text-to-image use cases, Ideogram is the top-ranked
113
+ open-weight lab and a top-5 image generation lab overall — beaten only by giant
114
+ companies with vastly larger budgets and resources:
115
+
116
+ <p align="center">
117
+ <img src="assets/benchmarks/lmarena_benchmark.png" alt="LMArena text-to-image lab leaderboard with Ideogram">
118
+ </p>
119
+
120
+ ### Ideogram internal eval
121
+
122
+ For our internal human-preference benchmark, focused on graphic design and
123
+ photography, we had graphic designers deeply familiar with professional design
124
+ work do the rating blind. Bradley-Terry scores rank Ideogram 4 #2 overall —
125
+ behind only GPT Image 2 medium — and the top open-weight model:
126
+
127
+ <p align="center">
128
+ <img src="assets/benchmarks/ideogram_benchmark.png" alt="Ideogram internal design leaderboard with Ideogram 4.0">
129
+ </p>
130
+
131
+ ### Open-source benchmarks
132
+
133
+ On standard open-source benchmarks measuring core capabilities — layout control
134
+ (7Bench), spatial reasoning and object fidelity (SpatialGenEval), text rendering
135
+ (X-Omni OCR), and prompt alignment (Prism) — Ideogram 4 closes the gap to the
136
+ leading closed-source models across every axis. On layout control (7Bench), it
137
+ is significantly better than all closed-source models:
138
+
139
+ <p align="center">
140
+ <img src="assets/benchmarks/opensource.png" alt="Five-axis capability radar comparing Ideogram 4.0 to leading closed-source models on layout control, spatial reasoning, object fidelity, prompt alignment, and text rendering">
141
+ </p>
142
+
143
+ At 9.3B parameters, Ideogram 4 delivers the best text rendering of any open-weight
144
+ release we benchmarked — ahead of much larger models like Qwen-Image (20B),
145
+ FLUX.2 [dev] (32B), and HunyuanImage 3.0 (80B MoE):
146
+
147
+ <p align="center">
148
+ <img src="assets/benchmarks/opensource2.png" alt="Parameter-efficiency scatter plot showing Ideogram 4.0 at 9.3B parameters leading all other open-weight models on text rendering">
149
+ </p>
150
+
151
+
152
+ ## Quick Start
153
+
154
+ ### Install
155
+
156
+ The inference code lives in the [`ideogram4`](https://github.com/ideogram-oss/ideogram4) GitHub repo. Clone it, then from the repo root:
157
+
158
+ ```bash
159
+ pip install .
160
+ ```
161
+
162
+ If you plan to modify the code, install in editable mode instead so changes
163
+ under `src/ideogram4/` take effect without reinstalling:
164
+
165
+ ```bash
166
+ pip install -e .
167
+ ```
168
+
169
+ ### CLI
170
+
171
+ The plain `--prompt` is rewritten into the structured JSON caption the model
172
+ expects by a "magic prompt" LLM. By default this uses Ideogram's hosted
173
+ magic-prompt API, which is **free** and does the expansion server-side (no local
174
+ model or system prompt needed). It reads `IDEOGRAM_API_KEY` — get a key at
175
+ [developer.ideogram.ai](https://developer.ideogram.ai/):
176
+
177
+ ```bash
178
+ python run_inference.py \
179
+ --prompt "a ginger cat wearing a tiny wizard hat reading a spellbook" \
180
+ --output out.png \
181
+ --quantization "nf4" \
182
+ --magic-prompt-key "$IDEOGRAM_API_KEY"
183
+ ```
184
+
185
+ You can also run the expansion through your own LLM provider — one of our magic-prompt
186
+ system prompts is **open source**. See the
187
+ [Prompting Guide](https://github.com/ideogram-oss/ideogram4/blob/main/docs/prompting.md#magic-prompt) for details.
188
+
189
+ For the highest-quality images, set `--height 2048 --width 2048` and
190
+ `--sampler-preset V4_QUALITY_48`.
191
+
192
+ #### Safety screening with Hive
193
+
194
+ Prompt and output safety screening is performed via [Hive](https://thehive.ai/).
195
+ Sign up and create a Text Moderation key and a Visual Content Moderation key,
196
+ then export them as `HIVE_TEXT_MODERATION_KEY` and `HIVE_VISUAL_MODERATION_KEY`
197
+ (or pass them via `--hive-text-key` / `--hive-visual-key`).
198
+
199
+ ```bash
200
+ python run_inference.py \
201
+ --prompt "an isometric illustration of a tiny city floating in the clouds" \
202
+ --output out.png \
203
+ --quantization "nf4" \
204
+ --magic-prompt-key "$IDEOGRAM_API_KEY" \
205
+ --hive-text-key "$HIVE_TEXT_MODERATION_KEY" \
206
+ --hive-visual-key "$HIVE_VISUAL_MODERATION_KEY"
207
+ ```
208
+
209
+ For sampler presets, parameter reference, and optimization tips, see
210
+ [docs/inference.md](https://github.com/ideogram-oss/ideogram4/blob/main/docs/inference.md).
211
+
212
+ ## Model Summary
213
+
214
+ Ideogram 4 is a **foundation model trained entirely from scratch**, not a
215
+ fine-tune or distillation of any existing checkpoint. It is a flow-matching
216
+ text-to-image model built on a **fully single-stream** Diffusion Transformer
217
+ (DiT) architecture.
218
+
219
+ **Architecture:**
220
+ - **Fully single-stream DiT.** Text and image tokens are concatenated into one
221
+ unified sequence and processed through the same 34-layer transformer, with no
222
+ separate text or image branches. This enables deep cross-modal interaction at
223
+ every layer.
224
+ - **Vision-language model as text encoder.** Instead of a text-only encoder
225
+ like CLIP or T5, Ideogram 4 uses
226
+ [Qwen3-VL-8B-Instruct](https://huggingface.co/Qwen/Qwen3-VL-8B-Instruct),
227
+ a full vision-language model that provides far richer understanding of visual
228
+ concepts. Hidden states are extracted from **13 intermediate layers** and
229
+ concatenated, giving the model multi-scale semantic features ranging from
230
+ surface-level token information to deep compositional understanding.
231
+ - **Dual-branch classifier-free guidance.** The conditional (positive) and
232
+ unconditional (negative) branches can be independently refined, enabling
233
+ separate control over prompt adherence and image quality.
234
+ - **Flexible resolution.** Native support for any resolution from 256 to 2048
235
+ (multiples of 16), with aspect ratios up to 6:1. A single model handles
236
+ everything from square thumbnails to ultrawide banners, with the noise
237
+ schedule auto-adjusting per resolution.
238
+
239
+ **Key Capabilities:**
240
+ - **Extreme controllability.** Ideogram 4 is trained on structured JSON
241
+ captions, giving users unprecedented control over composition, style,
242
+ lighting, color palette, typography, and spatial layout, all from a single
243
+ prompt.
244
+ - **State-of-the-art text rendering.** Ideogram 4 delivers best-in-class
245
+ in-image text generation (signage, logos, captions, watermarks, multi-line
246
+ text) with high fidelity directly from the prompt.
247
+ - **Spatial layout control.** Bounding-box coordinates in the prompt allow
248
+ explicit placement of subjects, text elements, and background regions.
249
+ - **Color palette conditioning.** Specify hex colors in the prompt to steer the
250
+ image's dominant color scheme.
251
+
252
+ For full architecture details, see
253
+ [docs/model_architecture.md](https://github.com/ideogram-oss/ideogram4/blob/main/docs/model_architecture.md). For a walkthrough of
254
+ how the pipeline components fit together, see
255
+ [docs/pipeline.md](https://github.com/ideogram-oss/ideogram4/blob/main/docs/pipeline.md).
256
+
257
+ ## Prompting Guide
258
+
259
+ Ideogram 4 is trained exclusively on **structured JSON captions**. While
260
+ plain-text prompts work, you will get the best results by providing a JSON
261
+ object that follows our caption schema.
262
+
263
+
264
+ Key points:
265
+
266
+ - **Use JSON prompts** for maximum controllability — the model was trained on
267
+ them and understands the structure natively.
268
+ - **Color palette conditioning** — specify a `colour_palette` array of hex
269
+ colors in the style description to steer the image's color scheme.
270
+ - **Aspect ratio flexibility** — Ideogram 4 supports a wide range of aspect
271
+ ratios (any multiple-of-16 resolution from 256 to 2048 on each side). This
272
+ is a key advantage for practical use: portraits, landscapes, banners,
273
+ phone wallpapers, social media formats, etc.
274
+ - **Bounding-box layout** — specify `bbox` coordinates in the prompt to
275
+ explicitly place subjects, text elements, and background regions.
276
+ - **Compositional control** — use `compositional_deconstruction` with bounding
277
+ boxes and per-element descriptions for precise spatial layout.
278
+
279
+
280
+ **Why JSON-only training?** We train exclusively on JSON so that training
281
+ and inference share a single, common prompt format. The training captions themselves are deliberately
282
+ **extremely descriptive**: each JSON exhaustively describes everything in
283
+ the image to maximize training efficiency. The more
284
+ text-to-image relationships each caption pins down, the more grounded
285
+ supervision the model extracts from a single training pair, rather than
286
+ having to infer those relationships across many sparsely-captioned samples.
287
+
288
+ **Why JSON at inference time?** Because the model was trained on captions
289
+ that name every object explicitly, the most reliable way to get every
290
+ requested object rendered is to mirror that pattern. Plain-text prompts still work, but
291
+ won't perform as well since the model was only trained on structured JSON captions.
292
+
293
+ **Don't want to write JSON by hand?** That's what *magic prompt* is for: it uses
294
+ an LLM to expand a plain-text prompt into a full structured caption before
295
+ generation, so you get JSON-quality results from a casual prompt. It runs by
296
+ default in `run_inference.py` (see the [CLI](#cli) section).
297
+
298
+ See [docs/prompting.md](https://github.com/ideogram-oss/ideogram4/blob/main/docs/prompting.md) for a full guide.
299
+
300
+ ## Documentation
301
+
302
+ | Document | Description |
303
+ | :------- | :---------- |
304
+ | [docs/prompting.md](https://github.com/ideogram-oss/ideogram4/blob/main/docs/prompting.md) | How to write JSON prompts, color palette conditioning, aspect ratios |
305
+ | [docs/inference.md](https://github.com/ideogram-oss/ideogram4/blob/main/docs/inference.md) | Sampler presets, parameter reference, resolutions, optimization tips |
306
+ | [docs/model_architecture.md](https://github.com/ideogram-oss/ideogram4/blob/main/docs/model_architecture.md) | Architecture diagram, DiT spec, component details |
307
+ | [docs/pipeline.md](https://github.com/ideogram-oss/ideogram4/blob/main/docs/pipeline.md) | Conceptual pipeline walkthrough — how all components fit together |
308
+ | [docs/development.md](https://github.com/ideogram-oss/ideogram4/blob/main/docs/development.md) | Dev setup, pre-commit hooks, contributing |
309
+ | [docs/safety.md](https://github.com/ideogram-oss/ideogram4/blob/main/docs/safety.md) | Pre-training, post-training, and inference-time safety mitigations; how to report violations |
310
+
311
+ ## Citation
312
+
313
+ If you find the provided code or models useful for your research, consider citing them as:
314
+
315
+
316
+ ```bibtex
317
+ @misc{ideogram-4-2026,
318
+ author={{Ideogram AI}},
319
+ title={{Ideogram 4}},
320
+ year={2026},
321
+ howpublished={\url{https://ideogram.ai/blog/ideogram-4.0/}},
322
+ }
323
+ ```
324
+
325
+ ## We're Hiring!
326
+
327
+ We're looking for **Research Scientists** and **Research Engineers** to
328
+ work on next-generation generative models and the products built on top of
329
+ them. Interested candidates, please apply at <https://jobs.ashbyhq.com/ideogram>.
assets/benchmarks/contralabs_typography.png ADDED
assets/benchmarks/contralabs_typography2.png ADDED
assets/benchmarks/design_arena.png ADDED

Git LFS Details

  • SHA256: 7c4aa9ba1d97567072ab743c8d3404b37da9099d389d43d329a7dd9a3e6faa43
  • Pointer size: 131 Bytes
  • Size of remote file: 927 kB
assets/benchmarks/design_arena2.png ADDED

Git LFS Details

  • SHA256: b388372b6b3d00dfacccd3dc7b587e19918018109f7d066487f03d2f9745329c
  • Pointer size: 131 Bytes
  • Size of remote file: 798 kB
assets/benchmarks/ideogram_benchmark.png ADDED

Git LFS Details

  • SHA256: 695fa3419503880acc1ce7f25c259ed41d5276cf7c3f297b896fda56adea993c
  • Pointer size: 131 Bytes
  • Size of remote file: 216 kB
assets/benchmarks/lmarena_benchmark.png ADDED

Git LFS Details

  • SHA256: e8a852a2ea0b71e227d254aa1488eaea223fbe9e61371a64f413678976a443e3
  • Pointer size: 131 Bytes
  • Size of remote file: 198 kB
assets/benchmarks/opensource.png ADDED

Git LFS Details

  • SHA256: d8d0b2dc5a5813dc1b4707e8d6f54f4a75ecab2feb30dda2327fc58b0f3dc253
  • Pointer size: 131 Bytes
  • Size of remote file: 328 kB
assets/benchmarks/opensource2.png ADDED

Git LFS Details

  • SHA256: d5bce23395cad5c65539c29c084e1cf1511431a14efda283377f049d6d439e37
  • Pointer size: 131 Bytes
  • Size of remote file: 163 kB
assets/ideogram_logo.svg ADDED
assets/ideogram_logo_darkmode.svg ADDED
assets/samples/collage_landscape.jpg ADDED

Git LFS Details

  • SHA256: b98b2d7cde3e24c1f28341fb531898e0b09cfe03ccbdc978a14cf87ef8bb1987
  • Pointer size: 132 Bytes
  • Size of remote file: 8.18 MB
model_index.json ADDED
@@ -0,0 +1,29 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_class_name": "Ideogram4Pipeline",
3
+ "_diffusers_version": "0.39.0.dev0",
4
+ "_name_or_path": "ideogram-ai/debug-ideogram-v4",
5
+ "scheduler": [
6
+ "diffusers",
7
+ "FlowMatchEulerDiscreteScheduler"
8
+ ],
9
+ "text_encoder": [
10
+ "transformers",
11
+ "Qwen3VLModel"
12
+ ],
13
+ "tokenizer": [
14
+ "transformers",
15
+ "Qwen2Tokenizer"
16
+ ],
17
+ "transformer": [
18
+ "diffusers",
19
+ "Ideogram4Transformer2DModel"
20
+ ],
21
+ "unconditional_transformer": [
22
+ "diffusers",
23
+ "Ideogram4Transformer2DModel"
24
+ ],
25
+ "vae": [
26
+ "diffusers",
27
+ "AutoencoderKLFlux2"
28
+ ]
29
+ }
scheduler/scheduler_config.json ADDED
@@ -0,0 +1,18 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_class_name": "FlowMatchEulerDiscreteScheduler",
3
+ "_diffusers_version": "0.39.0.dev0",
4
+ "base_image_seq_len": 256,
5
+ "base_shift": 0.5,
6
+ "invert_sigmas": false,
7
+ "max_image_seq_len": 4096,
8
+ "max_shift": 1.15,
9
+ "num_train_timesteps": 1000,
10
+ "shift": 1.0,
11
+ "shift_terminal": null,
12
+ "stochastic_sampling": false,
13
+ "time_shift_type": "exponential",
14
+ "use_beta_sigmas": false,
15
+ "use_dynamic_shifting": false,
16
+ "use_exponential_sigmas": false,
17
+ "use_karras_sigmas": false
18
+ }
text_encoder/config.json ADDED
@@ -0,0 +1,66 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "architectures": [
3
+ "Qwen3VLModel"
4
+ ],
5
+ "dtype": "bfloat16",
6
+ "image_token_id": 151655,
7
+ "model_type": "qwen3_vl",
8
+ "text_config": {
9
+ "attention_bias": false,
10
+ "attention_dropout": 0.0,
11
+ "bos_token_id": 151643,
12
+ "dtype": "bfloat16",
13
+ "eos_token_id": 151645,
14
+ "head_dim": 128,
15
+ "hidden_act": "silu",
16
+ "hidden_size": 4096,
17
+ "initializer_range": 0.02,
18
+ "intermediate_size": 12288,
19
+ "max_position_embeddings": 262144,
20
+ "model_type": "qwen3_vl_text",
21
+ "num_attention_heads": 32,
22
+ "num_hidden_layers": 36,
23
+ "num_key_value_heads": 8,
24
+ "pad_token_id": null,
25
+ "rms_norm_eps": 1e-06,
26
+ "rope_parameters": {
27
+ "mrope_interleaved": true,
28
+ "mrope_section": [
29
+ 24,
30
+ 20,
31
+ 20
32
+ ],
33
+ "rope_theta": 5000000,
34
+ "rope_type": "default"
35
+ },
36
+ "use_cache": true,
37
+ "vocab_size": 151936
38
+ },
39
+ "tie_word_embeddings": false,
40
+ "transformers_version": "5.8.0",
41
+ "video_token_id": 151656,
42
+ "vision_config": {
43
+ "deepstack_visual_indexes": [
44
+ 8,
45
+ 16,
46
+ 24
47
+ ],
48
+ "depth": 27,
49
+ "dtype": "bfloat16",
50
+ "hidden_act": "gelu_pytorch_tanh",
51
+ "hidden_size": 1152,
52
+ "in_channels": 3,
53
+ "initializer_range": 0.02,
54
+ "intermediate_size": 4304,
55
+ "model_type": "qwen3_vl_vision",
56
+ "num_heads": 16,
57
+ "num_position_embeddings": 2304,
58
+ "out_hidden_size": 4096,
59
+ "patch_size": 16,
60
+ "spatial_merge_size": 2,
61
+ "temporal_patch_size": 2
62
+ },
63
+ "vision_end_token_id": 151653,
64
+ "vision_start_token_id": 151652,
65
+ "ideogram_fp8_weight_only": true
66
+ }
text_encoder/model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b094e8be345fc602b79eae674004cf44078e511f03d200980095244a0d1bcf46
3
+ size 8779278400
text_encoder/model.safetensors.index.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"metadata": {"total_size": 8779147168}, "weight_map": {"language_model.embed_tokens.weight": "model.safetensors", "language_model.layers.0.input_layernorm.weight": "model.safetensors", "language_model.layers.0.mlp.down_proj.weight": "model.safetensors", "language_model.layers.0.mlp.down_proj.weight_scale": "model.safetensors", "language_model.layers.0.mlp.gate_proj.weight": "model.safetensors", "language_model.layers.0.mlp.gate_proj.weight_scale": "model.safetensors", "language_model.layers.0.mlp.up_proj.weight": "model.safetensors", "language_model.layers.0.mlp.up_proj.weight_scale": "model.safetensors", "language_model.layers.0.post_attention_layernorm.weight": "model.safetensors", "language_model.layers.0.self_attn.k_norm.weight": "model.safetensors", "language_model.layers.0.self_attn.k_proj.weight": "model.safetensors", "language_model.layers.0.self_attn.k_proj.weight_scale": "model.safetensors", "language_model.layers.0.self_attn.o_proj.weight": "model.safetensors", "language_model.layers.0.self_attn.o_proj.weight_scale": "model.safetensors", "language_model.layers.0.self_attn.q_norm.weight": "model.safetensors", "language_model.layers.0.self_attn.q_proj.weight": "model.safetensors", "language_model.layers.0.self_attn.q_proj.weight_scale": "model.safetensors", "language_model.layers.0.self_attn.v_proj.weight": "model.safetensors", "language_model.layers.0.self_attn.v_proj.weight_scale": "model.safetensors", "language_model.layers.1.input_layernorm.weight": "model.safetensors", "language_model.layers.1.mlp.down_proj.weight": "model.safetensors", "language_model.layers.1.mlp.down_proj.weight_scale": "model.safetensors", "language_model.layers.1.mlp.gate_proj.weight": "model.safetensors", "language_model.layers.1.mlp.gate_proj.weight_scale": "model.safetensors", "language_model.layers.1.mlp.up_proj.weight": "model.safetensors", "language_model.layers.1.mlp.up_proj.weight_scale": "model.safetensors", "language_model.layers.1.post_attention_layernorm.weight": 
"model.safetensors", "language_model.layers.1.self_attn.k_norm.weight": "model.safetensors", "language_model.layers.1.self_attn.k_proj.weight": "model.safetensors", "language_model.layers.1.self_attn.k_proj.weight_scale": "model.safetensors", "language_model.layers.1.self_attn.o_proj.weight": "model.safetensors", "language_model.layers.1.self_attn.o_proj.weight_scale": "model.safetensors", "language_model.layers.1.self_attn.q_norm.weight": "model.safetensors", "language_model.layers.1.self_attn.q_proj.weight": "model.safetensors", "language_model.layers.1.self_attn.q_proj.weight_scale": "model.safetensors", "language_model.layers.1.self_attn.v_proj.weight": "model.safetensors", "language_model.layers.1.self_attn.v_proj.weight_scale": "model.safetensors", "language_model.layers.10.input_layernorm.weight": "model.safetensors", "language_model.layers.10.mlp.down_proj.weight": "model.safetensors", "language_model.layers.10.mlp.down_proj.weight_scale": "model.safetensors", "language_model.layers.10.mlp.gate_proj.weight": "model.safetensors", "language_model.layers.10.mlp.gate_proj.weight_scale": "model.safetensors", "language_model.layers.10.mlp.up_proj.weight": "model.safetensors", "language_model.layers.10.mlp.up_proj.weight_scale": "model.safetensors", "language_model.layers.10.post_attention_layernorm.weight": "model.safetensors", "language_model.layers.10.self_attn.k_norm.weight": "model.safetensors", "language_model.layers.10.self_attn.k_proj.weight": "model.safetensors", "language_model.layers.10.self_attn.k_proj.weight_scale": "model.safetensors", "language_model.layers.10.self_attn.o_proj.weight": "model.safetensors", "language_model.layers.10.self_attn.o_proj.weight_scale": "model.safetensors", "language_model.layers.10.self_attn.q_norm.weight": "model.safetensors", "language_model.layers.10.self_attn.q_proj.weight": "model.safetensors", "language_model.layers.10.self_attn.q_proj.weight_scale": "model.safetensors", 
"language_model.layers.10.self_attn.v_proj.weight": "model.safetensors", "language_model.layers.10.self_attn.v_proj.weight_scale": "model.safetensors", "language_model.layers.11.input_layernorm.weight": "model.safetensors", "language_model.layers.11.mlp.down_proj.weight": "model.safetensors", "language_model.layers.11.mlp.down_proj.weight_scale": "model.safetensors", "language_model.layers.11.mlp.gate_proj.weight": "model.safetensors", "language_model.layers.11.mlp.gate_proj.weight_scale": "model.safetensors", "language_model.layers.11.mlp.up_proj.weight": "model.safetensors", "language_model.layers.11.mlp.up_proj.weight_scale": "model.safetensors", "language_model.layers.11.post_attention_layernorm.weight": "model.safetensors", "language_model.layers.11.self_attn.k_norm.weight": "model.safetensors", "language_model.layers.11.self_attn.k_proj.weight": "model.safetensors", "language_model.layers.11.self_attn.k_proj.weight_scale": "model.safetensors", "language_model.layers.11.self_attn.o_proj.weight": "model.safetensors", "language_model.layers.11.self_attn.o_proj.weight_scale": "model.safetensors", "language_model.layers.11.self_attn.q_norm.weight": "model.safetensors", "language_model.layers.11.self_attn.q_proj.weight": "model.safetensors", "language_model.layers.11.self_attn.q_proj.weight_scale": "model.safetensors", "language_model.layers.11.self_attn.v_proj.weight": "model.safetensors", "language_model.layers.11.self_attn.v_proj.weight_scale": "model.safetensors", "language_model.layers.12.input_layernorm.weight": "model.safetensors", "language_model.layers.12.mlp.down_proj.weight": "model.safetensors", "language_model.layers.12.mlp.down_proj.weight_scale": "model.safetensors", "language_model.layers.12.mlp.gate_proj.weight": "model.safetensors", "language_model.layers.12.mlp.gate_proj.weight_scale": "model.safetensors", "language_model.layers.12.mlp.up_proj.weight": "model.safetensors", "language_model.layers.12.mlp.up_proj.weight_scale": "model.safetensors", 
"language_model.layers.12.post_attention_layernorm.weight": "model.safetensors", "language_model.layers.12.self_attn.k_norm.weight": "model.safetensors", "language_model.layers.12.self_attn.k_proj.weight": "model.safetensors", "language_model.layers.12.self_attn.k_proj.weight_scale": "model.safetensors", "language_model.layers.12.self_attn.o_proj.weight": "model.safetensors", "language_model.layers.12.self_attn.o_proj.weight_scale": "model.safetensors", "language_model.layers.12.self_attn.q_norm.weight": "model.safetensors", "language_model.layers.12.self_attn.q_proj.weight": "model.safetensors", "language_model.layers.12.self_attn.q_proj.weight_scale": "model.safetensors", "language_model.layers.12.self_attn.v_proj.weight": "model.safetensors", "language_model.layers.12.self_attn.v_proj.weight_scale": "model.safetensors", "language_model.layers.13.input_layernorm.weight": "model.safetensors", "language_model.layers.13.mlp.down_proj.weight": "model.safetensors", "language_model.layers.13.mlp.down_proj.weight_scale": "model.safetensors", "language_model.layers.13.mlp.gate_proj.weight": "model.safetensors", "language_model.layers.13.mlp.gate_proj.weight_scale": "model.safetensors", "language_model.layers.13.mlp.up_proj.weight": "model.safetensors", "language_model.layers.13.mlp.up_proj.weight_scale": "model.safetensors", "language_model.layers.13.post_attention_layernorm.weight": "model.safetensors", "language_model.layers.13.self_attn.k_norm.weight": "model.safetensors", "language_model.layers.13.self_attn.k_proj.weight": "model.safetensors", "language_model.layers.13.self_attn.k_proj.weight_scale": "model.safetensors", "language_model.layers.13.self_attn.o_proj.weight": "model.safetensors", "language_model.layers.13.self_attn.o_proj.weight_scale": "model.safetensors", "language_model.layers.13.self_attn.q_norm.weight": "model.safetensors", "language_model.layers.13.self_attn.q_proj.weight": "model.safetensors", 
"language_model.layers.13.self_attn.q_proj.weight_scale": "model.safetensors", "language_model.layers.13.self_attn.v_proj.weight": "model.safetensors", "language_model.layers.13.self_attn.v_proj.weight_scale": "model.safetensors", "language_model.layers.14.input_layernorm.weight": "model.safetensors", "language_model.layers.14.mlp.down_proj.weight": "model.safetensors", "language_model.layers.14.mlp.down_proj.weight_scale": "model.safetensors", "language_model.layers.14.mlp.gate_proj.weight": "model.safetensors", "language_model.layers.14.mlp.gate_proj.weight_scale": "model.safetensors", "language_model.layers.14.mlp.up_proj.weight": "model.safetensors", "language_model.layers.14.mlp.up_proj.weight_scale": "model.safetensors", "language_model.layers.14.post_attention_layernorm.weight": "model.safetensors", "language_model.layers.14.self_attn.k_norm.weight": "model.safetensors", "language_model.layers.14.self_attn.k_proj.weight": "model.safetensors", "language_model.layers.14.self_attn.k_proj.weight_scale": "model.safetensors", "language_model.layers.14.self_attn.o_proj.weight": "model.safetensors", "language_model.layers.14.self_attn.o_proj.weight_scale": "model.safetensors", "language_model.layers.14.self_attn.q_norm.weight": "model.safetensors", "language_model.layers.14.self_attn.q_proj.weight": "model.safetensors", "language_model.layers.14.self_attn.q_proj.weight_scale": "model.safetensors", "language_model.layers.14.self_attn.v_proj.weight": "model.safetensors", "language_model.layers.14.self_attn.v_proj.weight_scale": "model.safetensors", "language_model.layers.15.input_layernorm.weight": "model.safetensors", "language_model.layers.15.mlp.down_proj.weight": "model.safetensors", "language_model.layers.15.mlp.down_proj.weight_scale": "model.safetensors", "language_model.layers.15.mlp.gate_proj.weight": "model.safetensors", "language_model.layers.15.mlp.gate_proj.weight_scale": "model.safetensors", "language_model.layers.15.mlp.up_proj.weight": 
"model.safetensors", "language_model.layers.15.mlp.up_proj.weight_scale": "model.safetensors", "language_model.layers.15.post_attention_layernorm.weight": "model.safetensors", "language_model.layers.15.self_attn.k_norm.weight": "model.safetensors", "language_model.layers.15.self_attn.k_proj.weight": "model.safetensors", "language_model.layers.15.self_attn.k_proj.weight_scale": "model.safetensors", "language_model.layers.15.self_attn.o_proj.weight": "model.safetensors", "language_model.layers.15.self_attn.o_proj.weight_scale": "model.safetensors", "language_model.layers.15.self_attn.q_norm.weight": "model.safetensors", "language_model.layers.15.self_attn.q_proj.weight": "model.safetensors", "language_model.layers.15.self_attn.q_proj.weight_scale": "model.safetensors", "language_model.layers.15.self_attn.v_proj.weight": "model.safetensors", "language_model.layers.15.self_attn.v_proj.weight_scale": "model.safetensors", "language_model.layers.16.input_layernorm.weight": "model.safetensors", "language_model.layers.16.mlp.down_proj.weight": "model.safetensors", "language_model.layers.16.mlp.down_proj.weight_scale": "model.safetensors", "language_model.layers.16.mlp.gate_proj.weight": "model.safetensors", "language_model.layers.16.mlp.gate_proj.weight_scale": "model.safetensors", "language_model.layers.16.mlp.up_proj.weight": "model.safetensors", "language_model.layers.16.mlp.up_proj.weight_scale": "model.safetensors", "language_model.layers.16.post_attention_layernorm.weight": "model.safetensors", "language_model.layers.16.self_attn.k_norm.weight": "model.safetensors", "language_model.layers.16.self_attn.k_proj.weight": "model.safetensors", "language_model.layers.16.self_attn.k_proj.weight_scale": "model.safetensors", "language_model.layers.16.self_attn.o_proj.weight": "model.safetensors", "language_model.layers.16.self_attn.o_proj.weight_scale": "model.safetensors", "language_model.layers.16.self_attn.q_norm.weight": "model.safetensors", 
"language_model.layers.16.self_attn.q_proj.weight": "model.safetensors", "language_model.layers.16.self_attn.q_proj.weight_scale": "model.safetensors", "language_model.layers.16.self_attn.v_proj.weight": "model.safetensors", "language_model.layers.16.self_attn.v_proj.weight_scale": "model.safetensors", "language_model.layers.17.input_layernorm.weight": "model.safetensors", "language_model.layers.17.mlp.down_proj.weight": "model.safetensors", "language_model.layers.17.mlp.down_proj.weight_scale": "model.safetensors", "language_model.layers.17.mlp.gate_proj.weight": "model.safetensors", "language_model.layers.17.mlp.gate_proj.weight_scale": "model.safetensors", "language_model.layers.17.mlp.up_proj.weight": "model.safetensors", "language_model.layers.17.mlp.up_proj.weight_scale": "model.safetensors", "language_model.layers.17.post_attention_layernorm.weight": "model.safetensors", "language_model.layers.17.self_attn.k_norm.weight": "model.safetensors", "language_model.layers.17.self_attn.k_proj.weight": "model.safetensors", "language_model.layers.17.self_attn.k_proj.weight_scale": "model.safetensors", "language_model.layers.17.self_attn.o_proj.weight": "model.safetensors", "language_model.layers.17.self_attn.o_proj.weight_scale": "model.safetensors", "language_model.layers.17.self_attn.q_norm.weight": "model.safetensors", "language_model.layers.17.self_attn.q_proj.weight": "model.safetensors", "language_model.layers.17.self_attn.q_proj.weight_scale": "model.safetensors", "language_model.layers.17.self_attn.v_proj.weight": "model.safetensors", "language_model.layers.17.self_attn.v_proj.weight_scale": "model.safetensors", "language_model.layers.18.input_layernorm.weight": "model.safetensors", "language_model.layers.18.mlp.down_proj.weight": "model.safetensors", "language_model.layers.18.mlp.down_proj.weight_scale": "model.safetensors", "language_model.layers.18.mlp.gate_proj.weight": "model.safetensors", "language_model.layers.18.mlp.gate_proj.weight_scale": 
"model.safetensors", "language_model.layers.18.mlp.up_proj.weight": "model.safetensors", "language_model.layers.18.mlp.up_proj.weight_scale": "model.safetensors", "language_model.layers.18.post_attention_layernorm.weight": "model.safetensors", "language_model.layers.18.self_attn.k_norm.weight": "model.safetensors", "language_model.layers.18.self_attn.k_proj.weight": "model.safetensors", "language_model.layers.18.self_attn.k_proj.weight_scale": "model.safetensors", "language_model.layers.18.self_attn.o_proj.weight": "model.safetensors", "language_model.layers.18.self_attn.o_proj.weight_scale": "model.safetensors", "language_model.layers.18.self_attn.q_norm.weight": "model.safetensors", "language_model.layers.18.self_attn.q_proj.weight": "model.safetensors", "language_model.layers.18.self_attn.q_proj.weight_scale": "model.safetensors", "language_model.layers.18.self_attn.v_proj.weight": "model.safetensors", "language_model.layers.18.self_attn.v_proj.weight_scale": "model.safetensors", "language_model.layers.19.input_layernorm.weight": "model.safetensors", "language_model.layers.19.mlp.down_proj.weight": "model.safetensors", "language_model.layers.19.mlp.down_proj.weight_scale": "model.safetensors", "language_model.layers.19.mlp.gate_proj.weight": "model.safetensors", "language_model.layers.19.mlp.gate_proj.weight_scale": "model.safetensors", "language_model.layers.19.mlp.up_proj.weight": "model.safetensors", "language_model.layers.19.mlp.up_proj.weight_scale": "model.safetensors", "language_model.layers.19.post_attention_layernorm.weight": "model.safetensors", "language_model.layers.19.self_attn.k_norm.weight": "model.safetensors", "language_model.layers.19.self_attn.k_proj.weight": "model.safetensors", "language_model.layers.19.self_attn.k_proj.weight_scale": "model.safetensors", "language_model.layers.19.self_attn.o_proj.weight": "model.safetensors", "language_model.layers.19.self_attn.o_proj.weight_scale": "model.safetensors", 
"language_model.layers.19.self_attn.q_norm.weight": "model.safetensors", "language_model.layers.19.self_attn.q_proj.weight": "model.safetensors", "language_model.layers.19.self_attn.q_proj.weight_scale": "model.safetensors", "language_model.layers.19.self_attn.v_proj.weight": "model.safetensors", "language_model.layers.19.self_attn.v_proj.weight_scale": "model.safetensors", "language_model.layers.2.input_layernorm.weight": "model.safetensors", "language_model.layers.2.mlp.down_proj.weight": "model.safetensors", "language_model.layers.2.mlp.down_proj.weight_scale": "model.safetensors", "language_model.layers.2.mlp.gate_proj.weight": "model.safetensors", "language_model.layers.2.mlp.gate_proj.weight_scale": "model.safetensors", "language_model.layers.2.mlp.up_proj.weight": "model.safetensors", "language_model.layers.2.mlp.up_proj.weight_scale": "model.safetensors", "language_model.layers.2.post_attention_layernorm.weight": "model.safetensors", "language_model.layers.2.self_attn.k_norm.weight": "model.safetensors", "language_model.layers.2.self_attn.k_proj.weight": "model.safetensors", "language_model.layers.2.self_attn.k_proj.weight_scale": "model.safetensors", "language_model.layers.2.self_attn.o_proj.weight": "model.safetensors", "language_model.layers.2.self_attn.o_proj.weight_scale": "model.safetensors", "language_model.layers.2.self_attn.q_norm.weight": "model.safetensors", "language_model.layers.2.self_attn.q_proj.weight": "model.safetensors", "language_model.layers.2.self_attn.q_proj.weight_scale": "model.safetensors", "language_model.layers.2.self_attn.v_proj.weight": "model.safetensors", "language_model.layers.2.self_attn.v_proj.weight_scale": "model.safetensors", "language_model.layers.20.input_layernorm.weight": "model.safetensors", "language_model.layers.20.mlp.down_proj.weight": "model.safetensors", "language_model.layers.20.mlp.down_proj.weight_scale": "model.safetensors", "language_model.layers.20.mlp.gate_proj.weight": "model.safetensors", 
"language_model.layers.20.mlp.gate_proj.weight_scale": "model.safetensors", "language_model.layers.20.mlp.up_proj.weight": "model.safetensors", "language_model.layers.20.mlp.up_proj.weight_scale": "model.safetensors", "language_model.layers.20.post_attention_layernorm.weight": "model.safetensors", "language_model.layers.20.self_attn.k_norm.weight": "model.safetensors", "language_model.layers.20.self_attn.k_proj.weight": "model.safetensors", "language_model.layers.20.self_attn.k_proj.weight_scale": "model.safetensors", "language_model.layers.20.self_attn.o_proj.weight": "model.safetensors", "language_model.layers.20.self_attn.o_proj.weight_scale": "model.safetensors", "language_model.layers.20.self_attn.q_norm.weight": "model.safetensors", "language_model.layers.20.self_attn.q_proj.weight": "model.safetensors", "language_model.layers.20.self_attn.q_proj.weight_scale": "model.safetensors", "language_model.layers.20.self_attn.v_proj.weight": "model.safetensors", "language_model.layers.20.self_attn.v_proj.weight_scale": "model.safetensors", "language_model.layers.21.input_layernorm.weight": "model.safetensors", "language_model.layers.21.mlp.down_proj.weight": "model.safetensors", "language_model.layers.21.mlp.down_proj.weight_scale": "model.safetensors", "language_model.layers.21.mlp.gate_proj.weight": "model.safetensors", "language_model.layers.21.mlp.gate_proj.weight_scale": "model.safetensors", "language_model.layers.21.mlp.up_proj.weight": "model.safetensors", "language_model.layers.21.mlp.up_proj.weight_scale": "model.safetensors", "language_model.layers.21.post_attention_layernorm.weight": "model.safetensors", "language_model.layers.21.self_attn.k_norm.weight": "model.safetensors", "language_model.layers.21.self_attn.k_proj.weight": "model.safetensors", "language_model.layers.21.self_attn.k_proj.weight_scale": "model.safetensors", "language_model.layers.21.self_attn.o_proj.weight": "model.safetensors", "language_model.layers.21.self_attn.o_proj.weight_scale": 
"model.safetensors", "language_model.layers.21.self_attn.q_norm.weight": "model.safetensors", "language_model.layers.21.self_attn.q_proj.weight": "model.safetensors", "language_model.layers.21.self_attn.q_proj.weight_scale": "model.safetensors", "language_model.layers.21.self_attn.v_proj.weight": "model.safetensors", "language_model.layers.21.self_attn.v_proj.weight_scale": "model.safetensors", "language_model.layers.22.input_layernorm.weight": "model.safetensors", "language_model.layers.22.mlp.down_proj.weight": "model.safetensors", "language_model.layers.22.mlp.down_proj.weight_scale": "model.safetensors", "language_model.layers.22.mlp.gate_proj.weight": "model.safetensors", "language_model.layers.22.mlp.gate_proj.weight_scale": "model.safetensors", "language_model.layers.22.mlp.up_proj.weight": "model.safetensors", "language_model.layers.22.mlp.up_proj.weight_scale": "model.safetensors", "language_model.layers.22.post_attention_layernorm.weight": "model.safetensors", "language_model.layers.22.self_attn.k_norm.weight": "model.safetensors", "language_model.layers.22.self_attn.k_proj.weight": "model.safetensors", "language_model.layers.22.self_attn.k_proj.weight_scale": "model.safetensors", "language_model.layers.22.self_attn.o_proj.weight": "model.safetensors", "language_model.layers.22.self_attn.o_proj.weight_scale": "model.safetensors", "language_model.layers.22.self_attn.q_norm.weight": "model.safetensors", "language_model.layers.22.self_attn.q_proj.weight": "model.safetensors", "language_model.layers.22.self_attn.q_proj.weight_scale": "model.safetensors", "language_model.layers.22.self_attn.v_proj.weight": "model.safetensors", "language_model.layers.22.self_attn.v_proj.weight_scale": "model.safetensors", "language_model.layers.23.input_layernorm.weight": "model.safetensors", "language_model.layers.23.mlp.down_proj.weight": "model.safetensors", "language_model.layers.23.mlp.down_proj.weight_scale": "model.safetensors", 
"language_model.layers.23.mlp.gate_proj.weight": "model.safetensors", "language_model.layers.23.mlp.gate_proj.weight_scale": "model.safetensors", "language_model.layers.23.mlp.up_proj.weight": "model.safetensors", "language_model.layers.23.mlp.up_proj.weight_scale": "model.safetensors", "language_model.layers.23.post_attention_layernorm.weight": "model.safetensors", "language_model.layers.23.self_attn.k_norm.weight": "model.safetensors", "language_model.layers.23.self_attn.k_proj.weight": "model.safetensors", "language_model.layers.23.self_attn.k_proj.weight_scale": "model.safetensors", "language_model.layers.23.self_attn.o_proj.weight": "model.safetensors", "language_model.layers.23.self_attn.o_proj.weight_scale": "model.safetensors", "language_model.layers.23.self_attn.q_norm.weight": "model.safetensors", "language_model.layers.23.self_attn.q_proj.weight": "model.safetensors", "language_model.layers.23.self_attn.q_proj.weight_scale": "model.safetensors", "language_model.layers.23.self_attn.v_proj.weight": "model.safetensors", "language_model.layers.23.self_attn.v_proj.weight_scale": "model.safetensors", "language_model.layers.24.input_layernorm.weight": "model.safetensors", "language_model.layers.24.mlp.down_proj.weight": "model.safetensors", "language_model.layers.24.mlp.down_proj.weight_scale": "model.safetensors", "language_model.layers.24.mlp.gate_proj.weight": "model.safetensors", "language_model.layers.24.mlp.gate_proj.weight_scale": "model.safetensors", "language_model.layers.24.mlp.up_proj.weight": "model.safetensors", "language_model.layers.24.mlp.up_proj.weight_scale": "model.safetensors", "language_model.layers.24.post_attention_layernorm.weight": "model.safetensors", "language_model.layers.24.self_attn.k_norm.weight": "model.safetensors", "language_model.layers.24.self_attn.k_proj.weight": "model.safetensors", "language_model.layers.24.self_attn.k_proj.weight_scale": "model.safetensors", "language_model.layers.24.self_attn.o_proj.weight": 
"model.safetensors", "language_model.layers.24.self_attn.o_proj.weight_scale": "model.safetensors", "language_model.layers.24.self_attn.q_norm.weight": "model.safetensors", "language_model.layers.24.self_attn.q_proj.weight": "model.safetensors", "language_model.layers.24.self_attn.q_proj.weight_scale": "model.safetensors", "language_model.layers.24.self_attn.v_proj.weight": "model.safetensors", "language_model.layers.24.self_attn.v_proj.weight_scale": "model.safetensors", "language_model.layers.25.input_layernorm.weight": "model.safetensors", "language_model.layers.25.mlp.down_proj.weight": "model.safetensors", "language_model.layers.25.mlp.down_proj.weight_scale": "model.safetensors", "language_model.layers.25.mlp.gate_proj.weight": "model.safetensors", "language_model.layers.25.mlp.gate_proj.weight_scale": "model.safetensors", "language_model.layers.25.mlp.up_proj.weight": "model.safetensors", "language_model.layers.25.mlp.up_proj.weight_scale": "model.safetensors", "language_model.layers.25.post_attention_layernorm.weight": "model.safetensors", "language_model.layers.25.self_attn.k_norm.weight": "model.safetensors", "language_model.layers.25.self_attn.k_proj.weight": "model.safetensors", "language_model.layers.25.self_attn.k_proj.weight_scale": "model.safetensors", "language_model.layers.25.self_attn.o_proj.weight": "model.safetensors", "language_model.layers.25.self_attn.o_proj.weight_scale": "model.safetensors", "language_model.layers.25.self_attn.q_norm.weight": "model.safetensors", "language_model.layers.25.self_attn.q_proj.weight": "model.safetensors", "language_model.layers.25.self_attn.q_proj.weight_scale": "model.safetensors", "language_model.layers.25.self_attn.v_proj.weight": "model.safetensors", "language_model.layers.25.self_attn.v_proj.weight_scale": "model.safetensors", "language_model.layers.26.input_layernorm.weight": "model.safetensors", "language_model.layers.26.mlp.down_proj.weight": "model.safetensors", 
"language_model.layers.26.mlp.down_proj.weight_scale": "model.safetensors", "language_model.layers.26.mlp.gate_proj.weight": "model.safetensors", "language_model.layers.26.mlp.gate_proj.weight_scale": "model.safetensors", "language_model.layers.26.mlp.up_proj.weight": "model.safetensors", "language_model.layers.26.mlp.up_proj.weight_scale": "model.safetensors", "language_model.layers.26.post_attention_layernorm.weight": "model.safetensors", "language_model.layers.26.self_attn.k_norm.weight": "model.safetensors", "language_model.layers.26.self_attn.k_proj.weight": "model.safetensors", "language_model.layers.26.self_attn.k_proj.weight_scale": "model.safetensors", "language_model.layers.26.self_attn.o_proj.weight": "model.safetensors", "language_model.layers.26.self_attn.o_proj.weight_scale": "model.safetensors", "language_model.layers.26.self_attn.q_norm.weight": "model.safetensors", "language_model.layers.26.self_attn.q_proj.weight": "model.safetensors", "language_model.layers.26.self_attn.q_proj.weight_scale": "model.safetensors", "language_model.layers.26.self_attn.v_proj.weight": "model.safetensors", "language_model.layers.26.self_attn.v_proj.weight_scale": "model.safetensors", "language_model.layers.27.input_layernorm.weight": "model.safetensors", "language_model.layers.27.mlp.down_proj.weight": "model.safetensors", "language_model.layers.27.mlp.down_proj.weight_scale": "model.safetensors", "language_model.layers.27.mlp.gate_proj.weight": "model.safetensors", "language_model.layers.27.mlp.gate_proj.weight_scale": "model.safetensors", "language_model.layers.27.mlp.up_proj.weight": "model.safetensors", "language_model.layers.27.mlp.up_proj.weight_scale": "model.safetensors", "language_model.layers.27.post_attention_layernorm.weight": "model.safetensors", "language_model.layers.27.self_attn.k_norm.weight": "model.safetensors", "language_model.layers.27.self_attn.k_proj.weight": "model.safetensors", "language_model.layers.27.self_attn.k_proj.weight_scale": 
"model.safetensors", "language_model.layers.27.self_attn.o_proj.weight": "model.safetensors", "language_model.layers.27.self_attn.o_proj.weight_scale": "model.safetensors", "language_model.layers.27.self_attn.q_norm.weight": "model.safetensors", "language_model.layers.27.self_attn.q_proj.weight": "model.safetensors", "language_model.layers.27.self_attn.q_proj.weight_scale": "model.safetensors", "language_model.layers.27.self_attn.v_proj.weight": "model.safetensors", "language_model.layers.27.self_attn.v_proj.weight_scale": "model.safetensors", "language_model.layers.28.input_layernorm.weight": "model.safetensors", "language_model.layers.28.mlp.down_proj.weight": "model.safetensors", "language_model.layers.28.mlp.down_proj.weight_scale": "model.safetensors", "language_model.layers.28.mlp.gate_proj.weight": "model.safetensors", "language_model.layers.28.mlp.gate_proj.weight_scale": "model.safetensors", "language_model.layers.28.mlp.up_proj.weight": "model.safetensors", "language_model.layers.28.mlp.up_proj.weight_scale": "model.safetensors", "language_model.layers.28.post_attention_layernorm.weight": "model.safetensors", "language_model.layers.28.self_attn.k_norm.weight": "model.safetensors", "language_model.layers.28.self_attn.k_proj.weight": "model.safetensors", "language_model.layers.28.self_attn.k_proj.weight_scale": "model.safetensors", "language_model.layers.28.self_attn.o_proj.weight": "model.safetensors", "language_model.layers.28.self_attn.o_proj.weight_scale": "model.safetensors", "language_model.layers.28.self_attn.q_norm.weight": "model.safetensors", "language_model.layers.28.self_attn.q_proj.weight": "model.safetensors", "language_model.layers.28.self_attn.q_proj.weight_scale": "model.safetensors", "language_model.layers.28.self_attn.v_proj.weight": "model.safetensors", "language_model.layers.28.self_attn.v_proj.weight_scale": "model.safetensors", "language_model.layers.29.input_layernorm.weight": "model.safetensors", 
"language_model.layers.29.mlp.down_proj.weight": "model.safetensors", "language_model.layers.29.mlp.down_proj.weight_scale": "model.safetensors", "language_model.layers.29.mlp.gate_proj.weight": "model.safetensors", "language_model.layers.29.mlp.gate_proj.weight_scale": "model.safetensors", "language_model.layers.29.mlp.up_proj.weight": "model.safetensors", "language_model.layers.29.mlp.up_proj.weight_scale": "model.safetensors", "language_model.layers.29.post_attention_layernorm.weight": "model.safetensors", "language_model.layers.29.self_attn.k_norm.weight": "model.safetensors", "language_model.layers.29.self_attn.k_proj.weight": "model.safetensors", "language_model.layers.29.self_attn.k_proj.weight_scale": "model.safetensors", "language_model.layers.29.self_attn.o_proj.weight": "model.safetensors", "language_model.layers.29.self_attn.o_proj.weight_scale": "model.safetensors", "language_model.layers.29.self_attn.q_norm.weight": "model.safetensors", "language_model.layers.29.self_attn.q_proj.weight": "model.safetensors", "language_model.layers.29.self_attn.q_proj.weight_scale": "model.safetensors", "language_model.layers.29.self_attn.v_proj.weight": "model.safetensors", "language_model.layers.29.self_attn.v_proj.weight_scale": "model.safetensors", "language_model.layers.3.input_layernorm.weight": "model.safetensors", "language_model.layers.3.mlp.down_proj.weight": "model.safetensors", "language_model.layers.3.mlp.down_proj.weight_scale": "model.safetensors", "language_model.layers.3.mlp.gate_proj.weight": "model.safetensors", "language_model.layers.3.mlp.gate_proj.weight_scale": "model.safetensors", "language_model.layers.3.mlp.up_proj.weight": "model.safetensors", "language_model.layers.3.mlp.up_proj.weight_scale": "model.safetensors", "language_model.layers.3.post_attention_layernorm.weight": "model.safetensors", "language_model.layers.3.self_attn.k_norm.weight": "model.safetensors", "language_model.layers.3.self_attn.k_proj.weight": "model.safetensors", 
"language_model.layers.3.self_attn.k_proj.weight_scale": "model.safetensors", "language_model.layers.3.self_attn.o_proj.weight": "model.safetensors", "language_model.layers.3.self_attn.o_proj.weight_scale": "model.safetensors", "language_model.layers.3.self_attn.q_norm.weight": "model.safetensors", "language_model.layers.3.self_attn.q_proj.weight": "model.safetensors", "language_model.layers.3.self_attn.q_proj.weight_scale": "model.safetensors", "language_model.layers.3.self_attn.v_proj.weight": "model.safetensors", "language_model.layers.3.self_attn.v_proj.weight_scale": "model.safetensors", "language_model.layers.30.input_layernorm.weight": "model.safetensors", "language_model.layers.30.mlp.down_proj.weight": "model.safetensors", "language_model.layers.30.mlp.down_proj.weight_scale": "model.safetensors", "language_model.layers.30.mlp.gate_proj.weight": "model.safetensors", "language_model.layers.30.mlp.gate_proj.weight_scale": "model.safetensors", "language_model.layers.30.mlp.up_proj.weight": "model.safetensors", "language_model.layers.30.mlp.up_proj.weight_scale": "model.safetensors", "language_model.layers.30.post_attention_layernorm.weight": "model.safetensors", "language_model.layers.30.self_attn.k_norm.weight": "model.safetensors", "language_model.layers.30.self_attn.k_proj.weight": "model.safetensors", "language_model.layers.30.self_attn.k_proj.weight_scale": "model.safetensors", "language_model.layers.30.self_attn.o_proj.weight": "model.safetensors", "language_model.layers.30.self_attn.o_proj.weight_scale": "model.safetensors", "language_model.layers.30.self_attn.q_norm.weight": "model.safetensors", "language_model.layers.30.self_attn.q_proj.weight": "model.safetensors", "language_model.layers.30.self_attn.q_proj.weight_scale": "model.safetensors", "language_model.layers.30.self_attn.v_proj.weight": "model.safetensors", "language_model.layers.30.self_attn.v_proj.weight_scale": "model.safetensors", "language_model.layers.31.input_layernorm.weight": 
"model.safetensors", "language_model.layers.31.mlp.down_proj.weight": "model.safetensors", "language_model.layers.31.mlp.down_proj.weight_scale": "model.safetensors", "language_model.layers.31.mlp.gate_proj.weight": "model.safetensors", "language_model.layers.31.mlp.gate_proj.weight_scale": "model.safetensors", "language_model.layers.31.mlp.up_proj.weight": "model.safetensors", "language_model.layers.31.mlp.up_proj.weight_scale": "model.safetensors", "language_model.layers.31.post_attention_layernorm.weight": "model.safetensors", "language_model.layers.31.self_attn.k_norm.weight": "model.safetensors", "language_model.layers.31.self_attn.k_proj.weight": "model.safetensors", "language_model.layers.31.self_attn.k_proj.weight_scale": "model.safetensors", "language_model.layers.31.self_attn.o_proj.weight": "model.safetensors", "language_model.layers.31.self_attn.o_proj.weight_scale": "model.safetensors", "language_model.layers.31.self_attn.q_norm.weight": "model.safetensors", "language_model.layers.31.self_attn.q_proj.weight": "model.safetensors", "language_model.layers.31.self_attn.q_proj.weight_scale": "model.safetensors", "language_model.layers.31.self_attn.v_proj.weight": "model.safetensors", "language_model.layers.31.self_attn.v_proj.weight_scale": "model.safetensors", "language_model.layers.32.input_layernorm.weight": "model.safetensors", "language_model.layers.32.mlp.down_proj.weight": "model.safetensors", "language_model.layers.32.mlp.down_proj.weight_scale": "model.safetensors", "language_model.layers.32.mlp.gate_proj.weight": "model.safetensors", "language_model.layers.32.mlp.gate_proj.weight_scale": "model.safetensors", "language_model.layers.32.mlp.up_proj.weight": "model.safetensors", "language_model.layers.32.mlp.up_proj.weight_scale": "model.safetensors", "language_model.layers.32.post_attention_layernorm.weight": "model.safetensors", "language_model.layers.32.self_attn.k_norm.weight": "model.safetensors", 
"language_model.layers.32.self_attn.k_proj.weight": "model.safetensors", "language_model.layers.32.self_attn.k_proj.weight_scale": "model.safetensors", "language_model.layers.32.self_attn.o_proj.weight": "model.safetensors", "language_model.layers.32.self_attn.o_proj.weight_scale": "model.safetensors", "language_model.layers.32.self_attn.q_norm.weight": "model.safetensors", "language_model.layers.32.self_attn.q_proj.weight": "model.safetensors", "language_model.layers.32.self_attn.q_proj.weight_scale": "model.safetensors", "language_model.layers.32.self_attn.v_proj.weight": "model.safetensors", "language_model.layers.32.self_attn.v_proj.weight_scale": "model.safetensors", "language_model.layers.33.input_layernorm.weight": "model.safetensors", "language_model.layers.33.mlp.down_proj.weight": "model.safetensors", "language_model.layers.33.mlp.down_proj.weight_scale": "model.safetensors", "language_model.layers.33.mlp.gate_proj.weight": "model.safetensors", "language_model.layers.33.mlp.gate_proj.weight_scale": "model.safetensors", "language_model.layers.33.mlp.up_proj.weight": "model.safetensors", "language_model.layers.33.mlp.up_proj.weight_scale": "model.safetensors", "language_model.layers.33.post_attention_layernorm.weight": "model.safetensors", "language_model.layers.33.self_attn.k_norm.weight": "model.safetensors", "language_model.layers.33.self_attn.k_proj.weight": "model.safetensors", "language_model.layers.33.self_attn.k_proj.weight_scale": "model.safetensors", "language_model.layers.33.self_attn.o_proj.weight": "model.safetensors", "language_model.layers.33.self_attn.o_proj.weight_scale": "model.safetensors", "language_model.layers.33.self_attn.q_norm.weight": "model.safetensors", "language_model.layers.33.self_attn.q_proj.weight": "model.safetensors", "language_model.layers.33.self_attn.q_proj.weight_scale": "model.safetensors", "language_model.layers.33.self_attn.v_proj.weight": "model.safetensors", 
"language_model.layers.33.self_attn.v_proj.weight_scale": "model.safetensors", "language_model.layers.34.input_layernorm.weight": "model.safetensors", "language_model.layers.34.mlp.down_proj.weight": "model.safetensors", "language_model.layers.34.mlp.down_proj.weight_scale": "model.safetensors", "language_model.layers.34.mlp.gate_proj.weight": "model.safetensors", "language_model.layers.34.mlp.gate_proj.weight_scale": "model.safetensors", "language_model.layers.34.mlp.up_proj.weight": "model.safetensors", "language_model.layers.34.mlp.up_proj.weight_scale": "model.safetensors", "language_model.layers.34.post_attention_layernorm.weight": "model.safetensors", "language_model.layers.34.self_attn.k_norm.weight": "model.safetensors", "language_model.layers.34.self_attn.k_proj.weight": "model.safetensors", "language_model.layers.34.self_attn.k_proj.weight_scale": "model.safetensors", "language_model.layers.34.self_attn.o_proj.weight": "model.safetensors", "language_model.layers.34.self_attn.o_proj.weight_scale": "model.safetensors", "language_model.layers.34.self_attn.q_norm.weight": "model.safetensors", "language_model.layers.34.self_attn.q_proj.weight": "model.safetensors", "language_model.layers.34.self_attn.q_proj.weight_scale": "model.safetensors", "language_model.layers.34.self_attn.v_proj.weight": "model.safetensors", "language_model.layers.34.self_attn.v_proj.weight_scale": "model.safetensors", "language_model.layers.35.input_layernorm.weight": "model.safetensors", "language_model.layers.35.mlp.down_proj.weight": "model.safetensors", "language_model.layers.35.mlp.down_proj.weight_scale": "model.safetensors", "language_model.layers.35.mlp.gate_proj.weight": "model.safetensors", "language_model.layers.35.mlp.gate_proj.weight_scale": "model.safetensors", "language_model.layers.35.mlp.up_proj.weight": "model.safetensors", "language_model.layers.35.mlp.up_proj.weight_scale": "model.safetensors", "language_model.layers.35.post_attention_layernorm.weight": 
"model.safetensors", "language_model.layers.35.self_attn.k_norm.weight": "model.safetensors", "language_model.layers.35.self_attn.k_proj.weight": "model.safetensors", "language_model.layers.35.self_attn.k_proj.weight_scale": "model.safetensors", "language_model.layers.35.self_attn.o_proj.weight": "model.safetensors", "language_model.layers.35.self_attn.o_proj.weight_scale": "model.safetensors", "language_model.layers.35.self_attn.q_norm.weight": "model.safetensors", "language_model.layers.35.self_attn.q_proj.weight": "model.safetensors", "language_model.layers.35.self_attn.q_proj.weight_scale": "model.safetensors", "language_model.layers.35.self_attn.v_proj.weight": "model.safetensors", "language_model.layers.35.self_attn.v_proj.weight_scale": "model.safetensors", "language_model.layers.4.input_layernorm.weight": "model.safetensors", "language_model.layers.4.mlp.down_proj.weight": "model.safetensors", "language_model.layers.4.mlp.down_proj.weight_scale": "model.safetensors", "language_model.layers.4.mlp.gate_proj.weight": "model.safetensors", "language_model.layers.4.mlp.gate_proj.weight_scale": "model.safetensors", "language_model.layers.4.mlp.up_proj.weight": "model.safetensors", "language_model.layers.4.mlp.up_proj.weight_scale": "model.safetensors", "language_model.layers.4.post_attention_layernorm.weight": "model.safetensors", "language_model.layers.4.self_attn.k_norm.weight": "model.safetensors", "language_model.layers.4.self_attn.k_proj.weight": "model.safetensors", "language_model.layers.4.self_attn.k_proj.weight_scale": "model.safetensors", "language_model.layers.4.self_attn.o_proj.weight": "model.safetensors", "language_model.layers.4.self_attn.o_proj.weight_scale": "model.safetensors", "language_model.layers.4.self_attn.q_norm.weight": "model.safetensors", "language_model.layers.4.self_attn.q_proj.weight": "model.safetensors", "language_model.layers.4.self_attn.q_proj.weight_scale": "model.safetensors", "language_model.layers.4.self_attn.v_proj.weight": 
"model.safetensors", "language_model.layers.4.self_attn.v_proj.weight_scale": "model.safetensors", "language_model.layers.5.input_layernorm.weight": "model.safetensors", "language_model.layers.5.mlp.down_proj.weight": "model.safetensors", "language_model.layers.5.mlp.down_proj.weight_scale": "model.safetensors", "language_model.layers.5.mlp.gate_proj.weight": "model.safetensors", "language_model.layers.5.mlp.gate_proj.weight_scale": "model.safetensors", "language_model.layers.5.mlp.up_proj.weight": "model.safetensors", "language_model.layers.5.mlp.up_proj.weight_scale": "model.safetensors", "language_model.layers.5.post_attention_layernorm.weight": "model.safetensors", "language_model.layers.5.self_attn.k_norm.weight": "model.safetensors", "language_model.layers.5.self_attn.k_proj.weight": "model.safetensors", "language_model.layers.5.self_attn.k_proj.weight_scale": "model.safetensors", "language_model.layers.5.self_attn.o_proj.weight": "model.safetensors", "language_model.layers.5.self_attn.o_proj.weight_scale": "model.safetensors", "language_model.layers.5.self_attn.q_norm.weight": "model.safetensors", "language_model.layers.5.self_attn.q_proj.weight": "model.safetensors", "language_model.layers.5.self_attn.q_proj.weight_scale": "model.safetensors", "language_model.layers.5.self_attn.v_proj.weight": "model.safetensors", "language_model.layers.5.self_attn.v_proj.weight_scale": "model.safetensors", "language_model.layers.6.input_layernorm.weight": "model.safetensors", "language_model.layers.6.mlp.down_proj.weight": "model.safetensors", "language_model.layers.6.mlp.down_proj.weight_scale": "model.safetensors", "language_model.layers.6.mlp.gate_proj.weight": "model.safetensors", "language_model.layers.6.mlp.gate_proj.weight_scale": "model.safetensors", "language_model.layers.6.mlp.up_proj.weight": "model.safetensors", "language_model.layers.6.mlp.up_proj.weight_scale": "model.safetensors", "language_model.layers.6.post_attention_layernorm.weight": 
"model.safetensors", "language_model.layers.6.self_attn.k_norm.weight": "model.safetensors", "language_model.layers.6.self_attn.k_proj.weight": "model.safetensors", "language_model.layers.6.self_attn.k_proj.weight_scale": "model.safetensors", "language_model.layers.6.self_attn.o_proj.weight": "model.safetensors", "language_model.layers.6.self_attn.o_proj.weight_scale": "model.safetensors", "language_model.layers.6.self_attn.q_norm.weight": "model.safetensors", "language_model.layers.6.self_attn.q_proj.weight": "model.safetensors", "language_model.layers.6.self_attn.q_proj.weight_scale": "model.safetensors", "language_model.layers.6.self_attn.v_proj.weight": "model.safetensors", "language_model.layers.6.self_attn.v_proj.weight_scale": "model.safetensors", "language_model.layers.7.input_layernorm.weight": "model.safetensors", "language_model.layers.7.mlp.down_proj.weight": "model.safetensors", "language_model.layers.7.mlp.down_proj.weight_scale": "model.safetensors", "language_model.layers.7.mlp.gate_proj.weight": "model.safetensors", "language_model.layers.7.mlp.gate_proj.weight_scale": "model.safetensors", "language_model.layers.7.mlp.up_proj.weight": "model.safetensors", "language_model.layers.7.mlp.up_proj.weight_scale": "model.safetensors", "language_model.layers.7.post_attention_layernorm.weight": "model.safetensors", "language_model.layers.7.self_attn.k_norm.weight": "model.safetensors", "language_model.layers.7.self_attn.k_proj.weight": "model.safetensors", "language_model.layers.7.self_attn.k_proj.weight_scale": "model.safetensors", "language_model.layers.7.self_attn.o_proj.weight": "model.safetensors", "language_model.layers.7.self_attn.o_proj.weight_scale": "model.safetensors", "language_model.layers.7.self_attn.q_norm.weight": "model.safetensors", "language_model.layers.7.self_attn.q_proj.weight": "model.safetensors", "language_model.layers.7.self_attn.q_proj.weight_scale": "model.safetensors", "language_model.layers.7.self_attn.v_proj.weight": 
"model.safetensors", "language_model.layers.7.self_attn.v_proj.weight_scale": "model.safetensors", "language_model.layers.8.input_layernorm.weight": "model.safetensors", "language_model.layers.8.mlp.down_proj.weight": "model.safetensors", "language_model.layers.8.mlp.down_proj.weight_scale": "model.safetensors", "language_model.layers.8.mlp.gate_proj.weight": "model.safetensors", "language_model.layers.8.mlp.gate_proj.weight_scale": "model.safetensors", "language_model.layers.8.mlp.up_proj.weight": "model.safetensors", "language_model.layers.8.mlp.up_proj.weight_scale": "model.safetensors", "language_model.layers.8.post_attention_layernorm.weight": "model.safetensors", "language_model.layers.8.self_attn.k_norm.weight": "model.safetensors", "language_model.layers.8.self_attn.k_proj.weight": "model.safetensors", "language_model.layers.8.self_attn.k_proj.weight_scale": "model.safetensors", "language_model.layers.8.self_attn.o_proj.weight": "model.safetensors", "language_model.layers.8.self_attn.o_proj.weight_scale": "model.safetensors", "language_model.layers.8.self_attn.q_norm.weight": "model.safetensors", "language_model.layers.8.self_attn.q_proj.weight": "model.safetensors", "language_model.layers.8.self_attn.q_proj.weight_scale": "model.safetensors", "language_model.layers.8.self_attn.v_proj.weight": "model.safetensors", "language_model.layers.8.self_attn.v_proj.weight_scale": "model.safetensors", "language_model.layers.9.input_layernorm.weight": "model.safetensors", "language_model.layers.9.mlp.down_proj.weight": "model.safetensors", "language_model.layers.9.mlp.down_proj.weight_scale": "model.safetensors", "language_model.layers.9.mlp.gate_proj.weight": "model.safetensors", "language_model.layers.9.mlp.gate_proj.weight_scale": "model.safetensors", "language_model.layers.9.mlp.up_proj.weight": "model.safetensors", "language_model.layers.9.mlp.up_proj.weight_scale": "model.safetensors", "language_model.layers.9.post_attention_layernorm.weight": 
"model.safetensors", "language_model.layers.9.self_attn.k_norm.weight": "model.safetensors", "language_model.layers.9.self_attn.k_proj.weight": "model.safetensors", "language_model.layers.9.self_attn.k_proj.weight_scale": "model.safetensors", "language_model.layers.9.self_attn.o_proj.weight": "model.safetensors", "language_model.layers.9.self_attn.o_proj.weight_scale": "model.safetensors", "language_model.layers.9.self_attn.q_norm.weight": "model.safetensors", "language_model.layers.9.self_attn.q_proj.weight": "model.safetensors", "language_model.layers.9.self_attn.q_proj.weight_scale": "model.safetensors", "language_model.layers.9.self_attn.v_proj.weight": "model.safetensors", "language_model.layers.9.self_attn.v_proj.weight_scale": "model.safetensors", "language_model.norm.weight": "model.safetensors", "visual.blocks.0.attn.proj.bias": "model.safetensors", "visual.blocks.0.attn.proj.weight": "model.safetensors", "visual.blocks.0.attn.proj.weight_scale": "model.safetensors", "visual.blocks.0.attn.qkv.bias": "model.safetensors", "visual.blocks.0.attn.qkv.weight": "model.safetensors", "visual.blocks.0.attn.qkv.weight_scale": "model.safetensors", "visual.blocks.0.mlp.linear_fc1.bias": "model.safetensors", "visual.blocks.0.mlp.linear_fc1.weight": "model.safetensors", "visual.blocks.0.mlp.linear_fc1.weight_scale": "model.safetensors", "visual.blocks.0.mlp.linear_fc2.bias": "model.safetensors", "visual.blocks.0.mlp.linear_fc2.weight": "model.safetensors", "visual.blocks.0.mlp.linear_fc2.weight_scale": "model.safetensors", "visual.blocks.0.norm1.bias": "model.safetensors", "visual.blocks.0.norm1.weight": "model.safetensors", "visual.blocks.0.norm2.bias": "model.safetensors", "visual.blocks.0.norm2.weight": "model.safetensors", "visual.blocks.1.attn.proj.bias": "model.safetensors", "visual.blocks.1.attn.proj.weight": "model.safetensors", "visual.blocks.1.attn.proj.weight_scale": "model.safetensors", "visual.blocks.1.attn.qkv.bias": "model.safetensors", 
"visual.blocks.1.attn.qkv.weight": "model.safetensors", "visual.blocks.1.attn.qkv.weight_scale": "model.safetensors", "visual.blocks.1.mlp.linear_fc1.bias": "model.safetensors", "visual.blocks.1.mlp.linear_fc1.weight": "model.safetensors", "visual.blocks.1.mlp.linear_fc1.weight_scale": "model.safetensors", "visual.blocks.1.mlp.linear_fc2.bias": "model.safetensors", "visual.blocks.1.mlp.linear_fc2.weight": "model.safetensors", "visual.blocks.1.mlp.linear_fc2.weight_scale": "model.safetensors", "visual.blocks.1.norm1.bias": "model.safetensors", "visual.blocks.1.norm1.weight": "model.safetensors", "visual.blocks.1.norm2.bias": "model.safetensors", "visual.blocks.1.norm2.weight": "model.safetensors", "visual.blocks.10.attn.proj.bias": "model.safetensors", "visual.blocks.10.attn.proj.weight": "model.safetensors", "visual.blocks.10.attn.proj.weight_scale": "model.safetensors", "visual.blocks.10.attn.qkv.bias": "model.safetensors", "visual.blocks.10.attn.qkv.weight": "model.safetensors", "visual.blocks.10.attn.qkv.weight_scale": "model.safetensors", "visual.blocks.10.mlp.linear_fc1.bias": "model.safetensors", "visual.blocks.10.mlp.linear_fc1.weight": "model.safetensors", "visual.blocks.10.mlp.linear_fc1.weight_scale": "model.safetensors", "visual.blocks.10.mlp.linear_fc2.bias": "model.safetensors", "visual.blocks.10.mlp.linear_fc2.weight": "model.safetensors", "visual.blocks.10.mlp.linear_fc2.weight_scale": "model.safetensors", "visual.blocks.10.norm1.bias": "model.safetensors", "visual.blocks.10.norm1.weight": "model.safetensors", "visual.blocks.10.norm2.bias": "model.safetensors", "visual.blocks.10.norm2.weight": "model.safetensors", "visual.blocks.11.attn.proj.bias": "model.safetensors", "visual.blocks.11.attn.proj.weight": "model.safetensors", "visual.blocks.11.attn.proj.weight_scale": "model.safetensors", "visual.blocks.11.attn.qkv.bias": "model.safetensors", "visual.blocks.11.attn.qkv.weight": "model.safetensors", "visual.blocks.11.attn.qkv.weight_scale": 
"model.safetensors", "visual.blocks.11.mlp.linear_fc1.bias": "model.safetensors", "visual.blocks.11.mlp.linear_fc1.weight": "model.safetensors", "visual.blocks.11.mlp.linear_fc1.weight_scale": "model.safetensors", "visual.blocks.11.mlp.linear_fc2.bias": "model.safetensors", "visual.blocks.11.mlp.linear_fc2.weight": "model.safetensors", "visual.blocks.11.mlp.linear_fc2.weight_scale": "model.safetensors", "visual.blocks.11.norm1.bias": "model.safetensors", "visual.blocks.11.norm1.weight": "model.safetensors", "visual.blocks.11.norm2.bias": "model.safetensors", "visual.blocks.11.norm2.weight": "model.safetensors", "visual.blocks.12.attn.proj.bias": "model.safetensors", "visual.blocks.12.attn.proj.weight": "model.safetensors", "visual.blocks.12.attn.proj.weight_scale": "model.safetensors", "visual.blocks.12.attn.qkv.bias": "model.safetensors", "visual.blocks.12.attn.qkv.weight": "model.safetensors", "visual.blocks.12.attn.qkv.weight_scale": "model.safetensors", "visual.blocks.12.mlp.linear_fc1.bias": "model.safetensors", "visual.blocks.12.mlp.linear_fc1.weight": "model.safetensors", "visual.blocks.12.mlp.linear_fc1.weight_scale": "model.safetensors", "visual.blocks.12.mlp.linear_fc2.bias": "model.safetensors", "visual.blocks.12.mlp.linear_fc2.weight": "model.safetensors", "visual.blocks.12.mlp.linear_fc2.weight_scale": "model.safetensors", "visual.blocks.12.norm1.bias": "model.safetensors", "visual.blocks.12.norm1.weight": "model.safetensors", "visual.blocks.12.norm2.bias": "model.safetensors", "visual.blocks.12.norm2.weight": "model.safetensors", "visual.blocks.13.attn.proj.bias": "model.safetensors", "visual.blocks.13.attn.proj.weight": "model.safetensors", "visual.blocks.13.attn.proj.weight_scale": "model.safetensors", "visual.blocks.13.attn.qkv.bias": "model.safetensors", "visual.blocks.13.attn.qkv.weight": "model.safetensors", "visual.blocks.13.attn.qkv.weight_scale": "model.safetensors", "visual.blocks.13.mlp.linear_fc1.bias": "model.safetensors", 
"visual.blocks.13.mlp.linear_fc1.weight": "model.safetensors", "visual.blocks.13.mlp.linear_fc1.weight_scale": "model.safetensors", "visual.blocks.13.mlp.linear_fc2.bias": "model.safetensors", "visual.blocks.13.mlp.linear_fc2.weight": "model.safetensors", "visual.blocks.13.mlp.linear_fc2.weight_scale": "model.safetensors", "visual.blocks.13.norm1.bias": "model.safetensors", "visual.blocks.13.norm1.weight": "model.safetensors", "visual.blocks.13.norm2.bias": "model.safetensors", "visual.blocks.13.norm2.weight": "model.safetensors", "visual.blocks.14.attn.proj.bias": "model.safetensors", "visual.blocks.14.attn.proj.weight": "model.safetensors", "visual.blocks.14.attn.proj.weight_scale": "model.safetensors", "visual.blocks.14.attn.qkv.bias": "model.safetensors", "visual.blocks.14.attn.qkv.weight": "model.safetensors", "visual.blocks.14.attn.qkv.weight_scale": "model.safetensors", "visual.blocks.14.mlp.linear_fc1.bias": "model.safetensors", "visual.blocks.14.mlp.linear_fc1.weight": "model.safetensors", "visual.blocks.14.mlp.linear_fc1.weight_scale": "model.safetensors", "visual.blocks.14.mlp.linear_fc2.bias": "model.safetensors", "visual.blocks.14.mlp.linear_fc2.weight": "model.safetensors", "visual.blocks.14.mlp.linear_fc2.weight_scale": "model.safetensors", "visual.blocks.14.norm1.bias": "model.safetensors", "visual.blocks.14.norm1.weight": "model.safetensors", "visual.blocks.14.norm2.bias": "model.safetensors", "visual.blocks.14.norm2.weight": "model.safetensors", "visual.blocks.15.attn.proj.bias": "model.safetensors", "visual.blocks.15.attn.proj.weight": "model.safetensors", "visual.blocks.15.attn.proj.weight_scale": "model.safetensors", "visual.blocks.15.attn.qkv.bias": "model.safetensors", "visual.blocks.15.attn.qkv.weight": "model.safetensors", "visual.blocks.15.attn.qkv.weight_scale": "model.safetensors", "visual.blocks.15.mlp.linear_fc1.bias": "model.safetensors", "visual.blocks.15.mlp.linear_fc1.weight": "model.safetensors", 
"visual.blocks.15.mlp.linear_fc1.weight_scale": "model.safetensors", "visual.blocks.15.mlp.linear_fc2.bias": "model.safetensors", "visual.blocks.15.mlp.linear_fc2.weight": "model.safetensors", "visual.blocks.15.mlp.linear_fc2.weight_scale": "model.safetensors", "visual.blocks.15.norm1.bias": "model.safetensors", "visual.blocks.15.norm1.weight": "model.safetensors", "visual.blocks.15.norm2.bias": "model.safetensors", "visual.blocks.15.norm2.weight": "model.safetensors", "visual.blocks.16.attn.proj.bias": "model.safetensors", "visual.blocks.16.attn.proj.weight": "model.safetensors", "visual.blocks.16.attn.proj.weight_scale": "model.safetensors", "visual.blocks.16.attn.qkv.bias": "model.safetensors", "visual.blocks.16.attn.qkv.weight": "model.safetensors", "visual.blocks.16.attn.qkv.weight_scale": "model.safetensors", "visual.blocks.16.mlp.linear_fc1.bias": "model.safetensors", "visual.blocks.16.mlp.linear_fc1.weight": "model.safetensors", "visual.blocks.16.mlp.linear_fc1.weight_scale": "model.safetensors", "visual.blocks.16.mlp.linear_fc2.bias": "model.safetensors", "visual.blocks.16.mlp.linear_fc2.weight": "model.safetensors", "visual.blocks.16.mlp.linear_fc2.weight_scale": "model.safetensors", "visual.blocks.16.norm1.bias": "model.safetensors", "visual.blocks.16.norm1.weight": "model.safetensors", "visual.blocks.16.norm2.bias": "model.safetensors", "visual.blocks.16.norm2.weight": "model.safetensors", "visual.blocks.17.attn.proj.bias": "model.safetensors", "visual.blocks.17.attn.proj.weight": "model.safetensors", "visual.blocks.17.attn.proj.weight_scale": "model.safetensors", "visual.blocks.17.attn.qkv.bias": "model.safetensors", "visual.blocks.17.attn.qkv.weight": "model.safetensors", "visual.blocks.17.attn.qkv.weight_scale": "model.safetensors", "visual.blocks.17.mlp.linear_fc1.bias": "model.safetensors", "visual.blocks.17.mlp.linear_fc1.weight": "model.safetensors", "visual.blocks.17.mlp.linear_fc1.weight_scale": "model.safetensors", 
"visual.blocks.17.mlp.linear_fc2.bias": "model.safetensors", "visual.blocks.17.mlp.linear_fc2.weight": "model.safetensors", "visual.blocks.17.mlp.linear_fc2.weight_scale": "model.safetensors", "visual.blocks.17.norm1.bias": "model.safetensors", "visual.blocks.17.norm1.weight": "model.safetensors", "visual.blocks.17.norm2.bias": "model.safetensors", "visual.blocks.17.norm2.weight": "model.safetensors", "visual.blocks.18.attn.proj.bias": "model.safetensors", "visual.blocks.18.attn.proj.weight": "model.safetensors", "visual.blocks.18.attn.proj.weight_scale": "model.safetensors", "visual.blocks.18.attn.qkv.bias": "model.safetensors", "visual.blocks.18.attn.qkv.weight": "model.safetensors", "visual.blocks.18.attn.qkv.weight_scale": "model.safetensors", "visual.blocks.18.mlp.linear_fc1.bias": "model.safetensors", "visual.blocks.18.mlp.linear_fc1.weight": "model.safetensors", "visual.blocks.18.mlp.linear_fc1.weight_scale": "model.safetensors", "visual.blocks.18.mlp.linear_fc2.bias": "model.safetensors", "visual.blocks.18.mlp.linear_fc2.weight": "model.safetensors", "visual.blocks.18.mlp.linear_fc2.weight_scale": "model.safetensors", "visual.blocks.18.norm1.bias": "model.safetensors", "visual.blocks.18.norm1.weight": "model.safetensors", "visual.blocks.18.norm2.bias": "model.safetensors", "visual.blocks.18.norm2.weight": "model.safetensors", "visual.blocks.19.attn.proj.bias": "model.safetensors", "visual.blocks.19.attn.proj.weight": "model.safetensors", "visual.blocks.19.attn.proj.weight_scale": "model.safetensors", "visual.blocks.19.attn.qkv.bias": "model.safetensors", "visual.blocks.19.attn.qkv.weight": "model.safetensors", "visual.blocks.19.attn.qkv.weight_scale": "model.safetensors", "visual.blocks.19.mlp.linear_fc1.bias": "model.safetensors", "visual.blocks.19.mlp.linear_fc1.weight": "model.safetensors", "visual.blocks.19.mlp.linear_fc1.weight_scale": "model.safetensors", "visual.blocks.19.mlp.linear_fc2.bias": "model.safetensors", 
"visual.blocks.19.mlp.linear_fc2.weight": "model.safetensors", "visual.blocks.19.mlp.linear_fc2.weight_scale": "model.safetensors", "visual.blocks.19.norm1.bias": "model.safetensors", "visual.blocks.19.norm1.weight": "model.safetensors", "visual.blocks.19.norm2.bias": "model.safetensors", "visual.blocks.19.norm2.weight": "model.safetensors", "visual.blocks.2.attn.proj.bias": "model.safetensors", "visual.blocks.2.attn.proj.weight": "model.safetensors", "visual.blocks.2.attn.proj.weight_scale": "model.safetensors", "visual.blocks.2.attn.qkv.bias": "model.safetensors", "visual.blocks.2.attn.qkv.weight": "model.safetensors", "visual.blocks.2.attn.qkv.weight_scale": "model.safetensors", "visual.blocks.2.mlp.linear_fc1.bias": "model.safetensors", "visual.blocks.2.mlp.linear_fc1.weight": "model.safetensors", "visual.blocks.2.mlp.linear_fc1.weight_scale": "model.safetensors", "visual.blocks.2.mlp.linear_fc2.bias": "model.safetensors", "visual.blocks.2.mlp.linear_fc2.weight": "model.safetensors", "visual.blocks.2.mlp.linear_fc2.weight_scale": "model.safetensors", "visual.blocks.2.norm1.bias": "model.safetensors", "visual.blocks.2.norm1.weight": "model.safetensors", "visual.blocks.2.norm2.bias": "model.safetensors", "visual.blocks.2.norm2.weight": "model.safetensors", "visual.blocks.20.attn.proj.bias": "model.safetensors", "visual.blocks.20.attn.proj.weight": "model.safetensors", "visual.blocks.20.attn.proj.weight_scale": "model.safetensors", "visual.blocks.20.attn.qkv.bias": "model.safetensors", "visual.blocks.20.attn.qkv.weight": "model.safetensors", "visual.blocks.20.attn.qkv.weight_scale": "model.safetensors", "visual.blocks.20.mlp.linear_fc1.bias": "model.safetensors", "visual.blocks.20.mlp.linear_fc1.weight": "model.safetensors", "visual.blocks.20.mlp.linear_fc1.weight_scale": "model.safetensors", "visual.blocks.20.mlp.linear_fc2.bias": "model.safetensors", "visual.blocks.20.mlp.linear_fc2.weight": "model.safetensors", "visual.blocks.20.mlp.linear_fc2.weight_scale": 
"model.safetensors", "visual.blocks.20.norm1.bias": "model.safetensors", "visual.blocks.20.norm1.weight": "model.safetensors", "visual.blocks.20.norm2.bias": "model.safetensors", "visual.blocks.20.norm2.weight": "model.safetensors", "visual.blocks.21.attn.proj.bias": "model.safetensors", "visual.blocks.21.attn.proj.weight": "model.safetensors", "visual.blocks.21.attn.proj.weight_scale": "model.safetensors", "visual.blocks.21.attn.qkv.bias": "model.safetensors", "visual.blocks.21.attn.qkv.weight": "model.safetensors", "visual.blocks.21.attn.qkv.weight_scale": "model.safetensors", "visual.blocks.21.mlp.linear_fc1.bias": "model.safetensors", "visual.blocks.21.mlp.linear_fc1.weight": "model.safetensors", "visual.blocks.21.mlp.linear_fc1.weight_scale": "model.safetensors", "visual.blocks.21.mlp.linear_fc2.bias": "model.safetensors", "visual.blocks.21.mlp.linear_fc2.weight": "model.safetensors", "visual.blocks.21.mlp.linear_fc2.weight_scale": "model.safetensors", "visual.blocks.21.norm1.bias": "model.safetensors", "visual.blocks.21.norm1.weight": "model.safetensors", "visual.blocks.21.norm2.bias": "model.safetensors", "visual.blocks.21.norm2.weight": "model.safetensors", "visual.blocks.22.attn.proj.bias": "model.safetensors", "visual.blocks.22.attn.proj.weight": "model.safetensors", "visual.blocks.22.attn.proj.weight_scale": "model.safetensors", "visual.blocks.22.attn.qkv.bias": "model.safetensors", "visual.blocks.22.attn.qkv.weight": "model.safetensors", "visual.blocks.22.attn.qkv.weight_scale": "model.safetensors", "visual.blocks.22.mlp.linear_fc1.bias": "model.safetensors", "visual.blocks.22.mlp.linear_fc1.weight": "model.safetensors", "visual.blocks.22.mlp.linear_fc1.weight_scale": "model.safetensors", "visual.blocks.22.mlp.linear_fc2.bias": "model.safetensors", "visual.blocks.22.mlp.linear_fc2.weight": "model.safetensors", "visual.blocks.22.mlp.linear_fc2.weight_scale": "model.safetensors", "visual.blocks.22.norm1.bias": "model.safetensors", 
"visual.blocks.22.norm1.weight": "model.safetensors", "visual.blocks.22.norm2.bias": "model.safetensors", "visual.blocks.22.norm2.weight": "model.safetensors", "visual.blocks.23.attn.proj.bias": "model.safetensors", "visual.blocks.23.attn.proj.weight": "model.safetensors", "visual.blocks.23.attn.proj.weight_scale": "model.safetensors", "visual.blocks.23.attn.qkv.bias": "model.safetensors", "visual.blocks.23.attn.qkv.weight": "model.safetensors", "visual.blocks.23.attn.qkv.weight_scale": "model.safetensors", "visual.blocks.23.mlp.linear_fc1.bias": "model.safetensors", "visual.blocks.23.mlp.linear_fc1.weight": "model.safetensors", "visual.blocks.23.mlp.linear_fc1.weight_scale": "model.safetensors", "visual.blocks.23.mlp.linear_fc2.bias": "model.safetensors", "visual.blocks.23.mlp.linear_fc2.weight": "model.safetensors", "visual.blocks.23.mlp.linear_fc2.weight_scale": "model.safetensors", "visual.blocks.23.norm1.bias": "model.safetensors", "visual.blocks.23.norm1.weight": "model.safetensors", "visual.blocks.23.norm2.bias": "model.safetensors", "visual.blocks.23.norm2.weight": "model.safetensors", "visual.blocks.24.attn.proj.bias": "model.safetensors", "visual.blocks.24.attn.proj.weight": "model.safetensors", "visual.blocks.24.attn.proj.weight_scale": "model.safetensors", "visual.blocks.24.attn.qkv.bias": "model.safetensors", "visual.blocks.24.attn.qkv.weight": "model.safetensors", "visual.blocks.24.attn.qkv.weight_scale": "model.safetensors", "visual.blocks.24.mlp.linear_fc1.bias": "model.safetensors", "visual.blocks.24.mlp.linear_fc1.weight": "model.safetensors", "visual.blocks.24.mlp.linear_fc1.weight_scale": "model.safetensors", "visual.blocks.24.mlp.linear_fc2.bias": "model.safetensors", "visual.blocks.24.mlp.linear_fc2.weight": "model.safetensors", "visual.blocks.24.mlp.linear_fc2.weight_scale": "model.safetensors", "visual.blocks.24.norm1.bias": "model.safetensors", "visual.blocks.24.norm1.weight": "model.safetensors", "visual.blocks.24.norm2.bias": 
"model.safetensors", "visual.blocks.24.norm2.weight": "model.safetensors", "visual.blocks.25.attn.proj.bias": "model.safetensors", "visual.blocks.25.attn.proj.weight": "model.safetensors", "visual.blocks.25.attn.proj.weight_scale": "model.safetensors", "visual.blocks.25.attn.qkv.bias": "model.safetensors", "visual.blocks.25.attn.qkv.weight": "model.safetensors", "visual.blocks.25.attn.qkv.weight_scale": "model.safetensors", "visual.blocks.25.mlp.linear_fc1.bias": "model.safetensors", "visual.blocks.25.mlp.linear_fc1.weight": "model.safetensors", "visual.blocks.25.mlp.linear_fc1.weight_scale": "model.safetensors", "visual.blocks.25.mlp.linear_fc2.bias": "model.safetensors", "visual.blocks.25.mlp.linear_fc2.weight": "model.safetensors", "visual.blocks.25.mlp.linear_fc2.weight_scale": "model.safetensors", "visual.blocks.25.norm1.bias": "model.safetensors", "visual.blocks.25.norm1.weight": "model.safetensors", "visual.blocks.25.norm2.bias": "model.safetensors", "visual.blocks.25.norm2.weight": "model.safetensors", "visual.blocks.26.attn.proj.bias": "model.safetensors", "visual.blocks.26.attn.proj.weight": "model.safetensors", "visual.blocks.26.attn.proj.weight_scale": "model.safetensors", "visual.blocks.26.attn.qkv.bias": "model.safetensors", "visual.blocks.26.attn.qkv.weight": "model.safetensors", "visual.blocks.26.attn.qkv.weight_scale": "model.safetensors", "visual.blocks.26.mlp.linear_fc1.bias": "model.safetensors", "visual.blocks.26.mlp.linear_fc1.weight": "model.safetensors", "visual.blocks.26.mlp.linear_fc1.weight_scale": "model.safetensors", "visual.blocks.26.mlp.linear_fc2.bias": "model.safetensors", "visual.blocks.26.mlp.linear_fc2.weight": "model.safetensors", "visual.blocks.26.mlp.linear_fc2.weight_scale": "model.safetensors", "visual.blocks.26.norm1.bias": "model.safetensors", "visual.blocks.26.norm1.weight": "model.safetensors", "visual.blocks.26.norm2.bias": "model.safetensors", "visual.blocks.26.norm2.weight": "model.safetensors", 
"visual.blocks.3.attn.proj.bias": "model.safetensors", "visual.blocks.3.attn.proj.weight": "model.safetensors", "visual.blocks.3.attn.proj.weight_scale": "model.safetensors", "visual.blocks.3.attn.qkv.bias": "model.safetensors", "visual.blocks.3.attn.qkv.weight": "model.safetensors", "visual.blocks.3.attn.qkv.weight_scale": "model.safetensors", "visual.blocks.3.mlp.linear_fc1.bias": "model.safetensors", "visual.blocks.3.mlp.linear_fc1.weight": "model.safetensors", "visual.blocks.3.mlp.linear_fc1.weight_scale": "model.safetensors", "visual.blocks.3.mlp.linear_fc2.bias": "model.safetensors", "visual.blocks.3.mlp.linear_fc2.weight": "model.safetensors", "visual.blocks.3.mlp.linear_fc2.weight_scale": "model.safetensors", "visual.blocks.3.norm1.bias": "model.safetensors", "visual.blocks.3.norm1.weight": "model.safetensors", "visual.blocks.3.norm2.bias": "model.safetensors", "visual.blocks.3.norm2.weight": "model.safetensors", "visual.blocks.4.attn.proj.bias": "model.safetensors", "visual.blocks.4.attn.proj.weight": "model.safetensors", "visual.blocks.4.attn.proj.weight_scale": "model.safetensors", "visual.blocks.4.attn.qkv.bias": "model.safetensors", "visual.blocks.4.attn.qkv.weight": "model.safetensors", "visual.blocks.4.attn.qkv.weight_scale": "model.safetensors", "visual.blocks.4.mlp.linear_fc1.bias": "model.safetensors", "visual.blocks.4.mlp.linear_fc1.weight": "model.safetensors", "visual.blocks.4.mlp.linear_fc1.weight_scale": "model.safetensors", "visual.blocks.4.mlp.linear_fc2.bias": "model.safetensors", "visual.blocks.4.mlp.linear_fc2.weight": "model.safetensors", "visual.blocks.4.mlp.linear_fc2.weight_scale": "model.safetensors", "visual.blocks.4.norm1.bias": "model.safetensors", "visual.blocks.4.norm1.weight": "model.safetensors", "visual.blocks.4.norm2.bias": "model.safetensors", "visual.blocks.4.norm2.weight": "model.safetensors", "visual.blocks.5.attn.proj.bias": "model.safetensors", "visual.blocks.5.attn.proj.weight": "model.safetensors", 
"visual.blocks.5.attn.proj.weight_scale": "model.safetensors", "visual.blocks.5.attn.qkv.bias": "model.safetensors", "visual.blocks.5.attn.qkv.weight": "model.safetensors", "visual.blocks.5.attn.qkv.weight_scale": "model.safetensors", "visual.blocks.5.mlp.linear_fc1.bias": "model.safetensors", "visual.blocks.5.mlp.linear_fc1.weight": "model.safetensors", "visual.blocks.5.mlp.linear_fc1.weight_scale": "model.safetensors", "visual.blocks.5.mlp.linear_fc2.bias": "model.safetensors", "visual.blocks.5.mlp.linear_fc2.weight": "model.safetensors", "visual.blocks.5.mlp.linear_fc2.weight_scale": "model.safetensors", "visual.blocks.5.norm1.bias": "model.safetensors", "visual.blocks.5.norm1.weight": "model.safetensors", "visual.blocks.5.norm2.bias": "model.safetensors", "visual.blocks.5.norm2.weight": "model.safetensors", "visual.blocks.6.attn.proj.bias": "model.safetensors", "visual.blocks.6.attn.proj.weight": "model.safetensors", "visual.blocks.6.attn.proj.weight_scale": "model.safetensors", "visual.blocks.6.attn.qkv.bias": "model.safetensors", "visual.blocks.6.attn.qkv.weight": "model.safetensors", "visual.blocks.6.attn.qkv.weight_scale": "model.safetensors", "visual.blocks.6.mlp.linear_fc1.bias": "model.safetensors", "visual.blocks.6.mlp.linear_fc1.weight": "model.safetensors", "visual.blocks.6.mlp.linear_fc1.weight_scale": "model.safetensors", "visual.blocks.6.mlp.linear_fc2.bias": "model.safetensors", "visual.blocks.6.mlp.linear_fc2.weight": "model.safetensors", "visual.blocks.6.mlp.linear_fc2.weight_scale": "model.safetensors", "visual.blocks.6.norm1.bias": "model.safetensors", "visual.blocks.6.norm1.weight": "model.safetensors", "visual.blocks.6.norm2.bias": "model.safetensors", "visual.blocks.6.norm2.weight": "model.safetensors", "visual.blocks.7.attn.proj.bias": "model.safetensors", "visual.blocks.7.attn.proj.weight": "model.safetensors", "visual.blocks.7.attn.proj.weight_scale": "model.safetensors", "visual.blocks.7.attn.qkv.bias": "model.safetensors", 
"visual.blocks.7.attn.qkv.weight": "model.safetensors", "visual.blocks.7.attn.qkv.weight_scale": "model.safetensors", "visual.blocks.7.mlp.linear_fc1.bias": "model.safetensors", "visual.blocks.7.mlp.linear_fc1.weight": "model.safetensors", "visual.blocks.7.mlp.linear_fc1.weight_scale": "model.safetensors", "visual.blocks.7.mlp.linear_fc2.bias": "model.safetensors", "visual.blocks.7.mlp.linear_fc2.weight": "model.safetensors", "visual.blocks.7.mlp.linear_fc2.weight_scale": "model.safetensors", "visual.blocks.7.norm1.bias": "model.safetensors", "visual.blocks.7.norm1.weight": "model.safetensors", "visual.blocks.7.norm2.bias": "model.safetensors", "visual.blocks.7.norm2.weight": "model.safetensors", "visual.blocks.8.attn.proj.bias": "model.safetensors", "visual.blocks.8.attn.proj.weight": "model.safetensors", "visual.blocks.8.attn.proj.weight_scale": "model.safetensors", "visual.blocks.8.attn.qkv.bias": "model.safetensors", "visual.blocks.8.attn.qkv.weight": "model.safetensors", "visual.blocks.8.attn.qkv.weight_scale": "model.safetensors", "visual.blocks.8.mlp.linear_fc1.bias": "model.safetensors", "visual.blocks.8.mlp.linear_fc1.weight": "model.safetensors", "visual.blocks.8.mlp.linear_fc1.weight_scale": "model.safetensors", "visual.blocks.8.mlp.linear_fc2.bias": "model.safetensors", "visual.blocks.8.mlp.linear_fc2.weight": "model.safetensors", "visual.blocks.8.mlp.linear_fc2.weight_scale": "model.safetensors", "visual.blocks.8.norm1.bias": "model.safetensors", "visual.blocks.8.norm1.weight": "model.safetensors", "visual.blocks.8.norm2.bias": "model.safetensors", "visual.blocks.8.norm2.weight": "model.safetensors", "visual.blocks.9.attn.proj.bias": "model.safetensors", "visual.blocks.9.attn.proj.weight": "model.safetensors", "visual.blocks.9.attn.proj.weight_scale": "model.safetensors", "visual.blocks.9.attn.qkv.bias": "model.safetensors", "visual.blocks.9.attn.qkv.weight": "model.safetensors", "visual.blocks.9.attn.qkv.weight_scale": "model.safetensors", 
"visual.blocks.9.mlp.linear_fc1.bias": "model.safetensors", "visual.blocks.9.mlp.linear_fc1.weight": "model.safetensors", "visual.blocks.9.mlp.linear_fc1.weight_scale": "model.safetensors", "visual.blocks.9.mlp.linear_fc2.bias": "model.safetensors", "visual.blocks.9.mlp.linear_fc2.weight": "model.safetensors", "visual.blocks.9.mlp.linear_fc2.weight_scale": "model.safetensors", "visual.blocks.9.norm1.bias": "model.safetensors", "visual.blocks.9.norm1.weight": "model.safetensors", "visual.blocks.9.norm2.bias": "model.safetensors", "visual.blocks.9.norm2.weight": "model.safetensors", "visual.deepstack_merger_list.0.linear_fc1.bias": "model.safetensors", "visual.deepstack_merger_list.0.linear_fc1.weight": "model.safetensors", "visual.deepstack_merger_list.0.linear_fc1.weight_scale": "model.safetensors", "visual.deepstack_merger_list.0.linear_fc2.bias": "model.safetensors", "visual.deepstack_merger_list.0.linear_fc2.weight": "model.safetensors", "visual.deepstack_merger_list.0.linear_fc2.weight_scale": "model.safetensors", "visual.deepstack_merger_list.0.norm.bias": "model.safetensors", "visual.deepstack_merger_list.0.norm.weight": "model.safetensors", "visual.deepstack_merger_list.1.linear_fc1.bias": "model.safetensors", "visual.deepstack_merger_list.1.linear_fc1.weight": "model.safetensors", "visual.deepstack_merger_list.1.linear_fc1.weight_scale": "model.safetensors", "visual.deepstack_merger_list.1.linear_fc2.bias": "model.safetensors", "visual.deepstack_merger_list.1.linear_fc2.weight": "model.safetensors", "visual.deepstack_merger_list.1.linear_fc2.weight_scale": "model.safetensors", "visual.deepstack_merger_list.1.norm.bias": "model.safetensors", "visual.deepstack_merger_list.1.norm.weight": "model.safetensors", "visual.deepstack_merger_list.2.linear_fc1.bias": "model.safetensors", "visual.deepstack_merger_list.2.linear_fc1.weight": "model.safetensors", "visual.deepstack_merger_list.2.linear_fc1.weight_scale": "model.safetensors", 
"visual.deepstack_merger_list.2.linear_fc2.bias": "model.safetensors", "visual.deepstack_merger_list.2.linear_fc2.weight": "model.safetensors", "visual.deepstack_merger_list.2.linear_fc2.weight_scale": "model.safetensors", "visual.deepstack_merger_list.2.norm.bias": "model.safetensors", "visual.deepstack_merger_list.2.norm.weight": "model.safetensors", "visual.merger.linear_fc1.bias": "model.safetensors", "visual.merger.linear_fc1.weight": "model.safetensors", "visual.merger.linear_fc1.weight_scale": "model.safetensors", "visual.merger.linear_fc2.bias": "model.safetensors", "visual.merger.linear_fc2.weight": "model.safetensors", "visual.merger.linear_fc2.weight_scale": "model.safetensors", "visual.merger.norm.bias": "model.safetensors", "visual.merger.norm.weight": "model.safetensors", "visual.patch_embed.proj.bias": "model.safetensors", "visual.patch_embed.proj.weight": "model.safetensors", "visual.pos_embed.weight": "model.safetensors"}}
tokenizer/chat_template.jinja ADDED
@@ -0,0 +1,120 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {%- if tools %}
2
+ {{- '<|im_start|>system\n' }}
3
+ {%- if messages[0].role == 'system' %}
4
+ {%- if messages[0].content is string %}
5
+ {{- messages[0].content }}
6
+ {%- else %}
7
+ {%- for content in messages[0].content %}
8
+ {%- if 'text' in content %}
9
+ {{- content.text }}
10
+ {%- endif %}
11
+ {%- endfor %}
12
+ {%- endif %}
13
+ {{- '\n\n' }}
14
+ {%- endif %}
15
+ {{- "# Tools\n\nYou may call one or more functions to assist with the user query.\n\nYou are provided with function signatures within <tools></tools> XML tags:\n<tools>" }}
16
+ {%- for tool in tools %}
17
+ {{- "\n" }}
18
+ {{- tool | tojson }}
19
+ {%- endfor %}
20
+ {{- "\n</tools>\n\nFor each function call, return a json object with function name and arguments within <tool_call></tool_call> XML tags:\n<tool_call>\n{\"name\": <function-name>, \"arguments\": <args-json-object>}\n</tool_call><|im_end|>\n" }}
21
+ {%- else %}
22
+ {%- if messages[0].role == 'system' %}
23
+ {{- '<|im_start|>system\n' }}
24
+ {%- if messages[0].content is string %}
25
+ {{- messages[0].content }}
26
+ {%- else %}
27
+ {%- for content in messages[0].content %}
28
+ {%- if 'text' in content %}
29
+ {{- content.text }}
30
+ {%- endif %}
31
+ {%- endfor %}
32
+ {%- endif %}
33
+ {{- '<|im_end|>\n' }}
34
+ {%- endif %}
35
+ {%- endif %}
36
+ {%- set image_count = namespace(value=0) %}
37
+ {%- set video_count = namespace(value=0) %}
38
+ {%- for message in messages %}
39
+ {%- if message.role == "user" %}
40
+ {{- '<|im_start|>' + message.role + '\n' }}
41
+ {%- if message.content is string %}
42
+ {{- message.content }}
43
+ {%- else %}
44
+ {%- for content in message.content %}
45
+ {%- if content.type == 'image' or 'image' in content or 'image_url' in content %}
46
+ {%- set image_count.value = image_count.value + 1 %}
47
+ {%- if add_vision_id %}Picture {{ image_count.value }}: {% endif -%}
48
+ <|vision_start|><|image_pad|><|vision_end|>
49
+ {%- elif content.type == 'video' or 'video' in content %}
50
+ {%- set video_count.value = video_count.value + 1 %}
51
+ {%- if add_vision_id %}Video {{ video_count.value }}: {% endif -%}
52
+ <|vision_start|><|video_pad|><|vision_end|>
53
+ {%- elif 'text' in content %}
54
+ {{- content.text }}
55
+ {%- endif %}
56
+ {%- endfor %}
57
+ {%- endif %}
58
+ {{- '<|im_end|>\n' }}
59
+ {%- elif message.role == "assistant" %}
60
+ {{- '<|im_start|>' + message.role + '\n' }}
61
+ {%- if message.content is string %}
62
+ {{- message.content }}
63
+ {%- else %}
64
+ {%- for content_item in message.content %}
65
+ {%- if 'text' in content_item %}
66
+ {{- content_item.text }}
67
+ {%- endif %}
68
+ {%- endfor %}
69
+ {%- endif %}
70
+ {%- if message.tool_calls %}
71
+ {%- for tool_call in message.tool_calls %}
72
+ {%- if (loop.first and message.content) or (not loop.first) %}
73
+ {{- '\n' }}
74
+ {%- endif %}
75
+ {%- if tool_call.function %}
76
+ {%- set tool_call = tool_call.function %}
77
+ {%- endif %}
78
+ {{- '<tool_call>\n{"name": "' }}
79
+ {{- tool_call.name }}
80
+ {{- '", "arguments": ' }}
81
+ {%- if tool_call.arguments is string %}
82
+ {{- tool_call.arguments }}
83
+ {%- else %}
84
+ {{- tool_call.arguments | tojson }}
85
+ {%- endif %}
86
+ {{- '}\n</tool_call>' }}
87
+ {%- endfor %}
88
+ {%- endif %}
89
+ {{- '<|im_end|>\n' }}
90
+ {%- elif message.role == "tool" %}
91
+ {%- if loop.first or (messages[loop.index0 - 1].role != "tool") %}
92
+ {{- '<|im_start|>user' }}
93
+ {%- endif %}
94
+ {{- '\n<tool_response>\n' }}
95
+ {%- if message.content is string %}
96
+ {{- message.content }}
97
+ {%- else %}
98
+ {%- for content in message.content %}
99
+ {%- if content.type == 'image' or 'image' in content or 'image_url' in content %}
100
+ {%- set image_count.value = image_count.value + 1 %}
101
+ {%- if add_vision_id %}Picture {{ image_count.value }}: {% endif -%}
102
+ <|vision_start|><|image_pad|><|vision_end|>
103
+ {%- elif content.type == 'video' or 'video' in content %}
104
+ {%- set video_count.value = video_count.value + 1 %}
105
+ {%- if add_vision_id %}Video {{ video_count.value }}: {% endif -%}
106
+ <|vision_start|><|video_pad|><|vision_end|>
107
+ {%- elif 'text' in content %}
108
+ {{- content.text }}
109
+ {%- endif %}
110
+ {%- endfor %}
111
+ {%- endif %}
112
+ {{- '\n</tool_response>' }}
113
+ {%- if loop.last or (messages[loop.index0 + 1].role != "tool") %}
114
+ {{- '<|im_end|>\n' }}
115
+ {%- endif %}
116
+ {%- endif %}
117
+ {%- endfor %}
118
+ {%- if add_generation_prompt %}
119
+ {{- '<|im_start|>assistant\n' }}
120
+ {%- endif %}
tokenizer/tokenizer.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:be75606093db2094d7cd20f3c2f385c212750648bd6ea4fb2bf507a6a4c55506
3
+ size 11422650
tokenizer/tokenizer_config.json ADDED
@@ -0,0 +1,30 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "add_prefix_space": false,
3
+ "backend": "tokenizers",
4
+ "bos_token": null,
5
+ "clean_up_tokenization_spaces": false,
6
+ "eos_token": "<|im_end|>",
7
+ "errors": "replace",
8
+ "extra_special_tokens": [
9
+ "<|im_start|>",
10
+ "<|im_end|>",
11
+ "<|object_ref_start|>",
12
+ "<|object_ref_end|>",
13
+ "<|box_start|>",
14
+ "<|box_end|>",
15
+ "<|quad_start|>",
16
+ "<|quad_end|>",
17
+ "<|vision_start|>",
18
+ "<|vision_end|>",
19
+ "<|vision_pad|>",
20
+ "<|image_pad|>",
21
+ "<|video_pad|>"
22
+ ],
23
+ "is_local": true,
24
+ "local_files_only": false,
25
+ "model_max_length": 262144,
26
+ "pad_token": "<|endoftext|>",
27
+ "split_special_tokens": false,
28
+ "tokenizer_class": "Qwen2Tokenizer",
29
+ "unk_token": null
30
+ }
transformer/config.json ADDED
@@ -0,0 +1,19 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_class_name": "Ideogram4Transformer2DModel",
3
+ "_diffusers_version": "0.39.0.dev0",
4
+ "_name_or_path": "/home/jinli/.cache/huggingface/hub/models--ideogram-ai--debug-ideogram-v4/snapshots/41af6183c9fd9b6254864b0720319ef984535bfc/transformer",
5
+ "adaln_dim": 512,
6
+ "attention_head_dim": 256,
7
+ "in_channels": 128,
8
+ "intermediate_size": 12288,
9
+ "llm_features_dim": 53248,
10
+ "mrope_section": [
11
+ 24,
12
+ 20,
13
+ 20
14
+ ],
15
+ "norm_eps": 1e-05,
16
+ "num_attention_heads": 18,
17
+ "num_layers": 34,
18
+ "rope_theta": 5000000
19
+ }
transformer/diffusion_pytorch_model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:19e12b4d5bdfcf35e17e5f4d292f5301a69a30e02336a9f8645e4b82f8319a1b
3
+ size 9289792888
transformer/diffusion_pytorch_model.safetensors.index.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"metadata": {"total_size": 9289722624}, "weight_map": {"adaln_proj.bias": "diffusion_pytorch_model.safetensors", "adaln_proj.weight": "diffusion_pytorch_model.safetensors", "adaln_proj.weight_scale": "diffusion_pytorch_model.safetensors", "embed_image_indicator.weight": "diffusion_pytorch_model.safetensors", "final_layer.adaln_modulation.bias": "diffusion_pytorch_model.safetensors", "final_layer.adaln_modulation.weight": "diffusion_pytorch_model.safetensors", "final_layer.adaln_modulation.weight_scale": "diffusion_pytorch_model.safetensors", "final_layer.linear.bias": "diffusion_pytorch_model.safetensors", "final_layer.linear.weight": "diffusion_pytorch_model.safetensors", "final_layer.linear.weight_scale": "diffusion_pytorch_model.safetensors", "input_proj.bias": "diffusion_pytorch_model.safetensors", "input_proj.weight": "diffusion_pytorch_model.safetensors", "input_proj.weight_scale": "diffusion_pytorch_model.safetensors", "layers.0.adaln_modulation.bias": "diffusion_pytorch_model.safetensors", "layers.0.adaln_modulation.weight": "diffusion_pytorch_model.safetensors", "layers.0.adaln_modulation.weight_scale": "diffusion_pytorch_model.safetensors", "layers.0.attention.norm_k.weight": "diffusion_pytorch_model.safetensors", "layers.0.attention.norm_q.weight": "diffusion_pytorch_model.safetensors", "layers.0.attention.o.weight": "diffusion_pytorch_model.safetensors", "layers.0.attention.o.weight_scale": "diffusion_pytorch_model.safetensors", "layers.0.attention.qkv.weight": "diffusion_pytorch_model.safetensors", "layers.0.attention.qkv.weight_scale": "diffusion_pytorch_model.safetensors", "layers.0.attention_norm1.weight": "diffusion_pytorch_model.safetensors", "layers.0.attention_norm2.weight": "diffusion_pytorch_model.safetensors", "layers.0.feed_forward.w1.weight": "diffusion_pytorch_model.safetensors", "layers.0.feed_forward.w1.weight_scale": "diffusion_pytorch_model.safetensors", "layers.0.feed_forward.w2.weight": "diffusion_pytorch_model.safetensors", 
"layers.0.feed_forward.w2.weight_scale": "diffusion_pytorch_model.safetensors", "layers.0.feed_forward.w3.weight": "diffusion_pytorch_model.safetensors", "layers.0.feed_forward.w3.weight_scale": "diffusion_pytorch_model.safetensors", "layers.0.ffn_norm1.weight": "diffusion_pytorch_model.safetensors", "layers.0.ffn_norm2.weight": "diffusion_pytorch_model.safetensors", "layers.1.adaln_modulation.bias": "diffusion_pytorch_model.safetensors", "layers.1.adaln_modulation.weight": "diffusion_pytorch_model.safetensors", "layers.1.adaln_modulation.weight_scale": "diffusion_pytorch_model.safetensors", "layers.1.attention.norm_k.weight": "diffusion_pytorch_model.safetensors", "layers.1.attention.norm_q.weight": "diffusion_pytorch_model.safetensors", "layers.1.attention.o.weight": "diffusion_pytorch_model.safetensors", "layers.1.attention.o.weight_scale": "diffusion_pytorch_model.safetensors", "layers.1.attention.qkv.weight": "diffusion_pytorch_model.safetensors", "layers.1.attention.qkv.weight_scale": "diffusion_pytorch_model.safetensors", "layers.1.attention_norm1.weight": "diffusion_pytorch_model.safetensors", "layers.1.attention_norm2.weight": "diffusion_pytorch_model.safetensors", "layers.1.feed_forward.w1.weight": "diffusion_pytorch_model.safetensors", "layers.1.feed_forward.w1.weight_scale": "diffusion_pytorch_model.safetensors", "layers.1.feed_forward.w2.weight": "diffusion_pytorch_model.safetensors", "layers.1.feed_forward.w2.weight_scale": "diffusion_pytorch_model.safetensors", "layers.1.feed_forward.w3.weight": "diffusion_pytorch_model.safetensors", "layers.1.feed_forward.w3.weight_scale": "diffusion_pytorch_model.safetensors", "layers.1.ffn_norm1.weight": "diffusion_pytorch_model.safetensors", "layers.1.ffn_norm2.weight": "diffusion_pytorch_model.safetensors", "layers.10.adaln_modulation.bias": "diffusion_pytorch_model.safetensors", "layers.10.adaln_modulation.weight": "diffusion_pytorch_model.safetensors", "layers.10.adaln_modulation.weight_scale": 
"diffusion_pytorch_model.safetensors", "layers.10.attention.norm_k.weight": "diffusion_pytorch_model.safetensors", "layers.10.attention.norm_q.weight": "diffusion_pytorch_model.safetensors", "layers.10.attention.o.weight": "diffusion_pytorch_model.safetensors", "layers.10.attention.o.weight_scale": "diffusion_pytorch_model.safetensors", "layers.10.attention.qkv.weight": "diffusion_pytorch_model.safetensors", "layers.10.attention.qkv.weight_scale": "diffusion_pytorch_model.safetensors", "layers.10.attention_norm1.weight": "diffusion_pytorch_model.safetensors", "layers.10.attention_norm2.weight": "diffusion_pytorch_model.safetensors", "layers.10.feed_forward.w1.weight": "diffusion_pytorch_model.safetensors", "layers.10.feed_forward.w1.weight_scale": "diffusion_pytorch_model.safetensors", "layers.10.feed_forward.w2.weight": "diffusion_pytorch_model.safetensors", "layers.10.feed_forward.w2.weight_scale": "diffusion_pytorch_model.safetensors", "layers.10.feed_forward.w3.weight": "diffusion_pytorch_model.safetensors", "layers.10.feed_forward.w3.weight_scale": "diffusion_pytorch_model.safetensors", "layers.10.ffn_norm1.weight": "diffusion_pytorch_model.safetensors", "layers.10.ffn_norm2.weight": "diffusion_pytorch_model.safetensors", "layers.11.adaln_modulation.bias": "diffusion_pytorch_model.safetensors", "layers.11.adaln_modulation.weight": "diffusion_pytorch_model.safetensors", "layers.11.adaln_modulation.weight_scale": "diffusion_pytorch_model.safetensors", "layers.11.attention.norm_k.weight": "diffusion_pytorch_model.safetensors", "layers.11.attention.norm_q.weight": "diffusion_pytorch_model.safetensors", "layers.11.attention.o.weight": "diffusion_pytorch_model.safetensors", "layers.11.attention.o.weight_scale": "diffusion_pytorch_model.safetensors", "layers.11.attention.qkv.weight": "diffusion_pytorch_model.safetensors", "layers.11.attention.qkv.weight_scale": "diffusion_pytorch_model.safetensors", "layers.11.attention_norm1.weight": 
"diffusion_pytorch_model.safetensors", "layers.11.attention_norm2.weight": "diffusion_pytorch_model.safetensors", "layers.11.feed_forward.w1.weight": "diffusion_pytorch_model.safetensors", "layers.11.feed_forward.w1.weight_scale": "diffusion_pytorch_model.safetensors", "layers.11.feed_forward.w2.weight": "diffusion_pytorch_model.safetensors", "layers.11.feed_forward.w2.weight_scale": "diffusion_pytorch_model.safetensors", "layers.11.feed_forward.w3.weight": "diffusion_pytorch_model.safetensors", "layers.11.feed_forward.w3.weight_scale": "diffusion_pytorch_model.safetensors", "layers.11.ffn_norm1.weight": "diffusion_pytorch_model.safetensors", "layers.11.ffn_norm2.weight": "diffusion_pytorch_model.safetensors", "layers.12.adaln_modulation.bias": "diffusion_pytorch_model.safetensors", "layers.12.adaln_modulation.weight": "diffusion_pytorch_model.safetensors", "layers.12.adaln_modulation.weight_scale": "diffusion_pytorch_model.safetensors", "layers.12.attention.norm_k.weight": "diffusion_pytorch_model.safetensors", "layers.12.attention.norm_q.weight": "diffusion_pytorch_model.safetensors", "layers.12.attention.o.weight": "diffusion_pytorch_model.safetensors", "layers.12.attention.o.weight_scale": "diffusion_pytorch_model.safetensors", "layers.12.attention.qkv.weight": "diffusion_pytorch_model.safetensors", "layers.12.attention.qkv.weight_scale": "diffusion_pytorch_model.safetensors", "layers.12.attention_norm1.weight": "diffusion_pytorch_model.safetensors", "layers.12.attention_norm2.weight": "diffusion_pytorch_model.safetensors", "layers.12.feed_forward.w1.weight": "diffusion_pytorch_model.safetensors", "layers.12.feed_forward.w1.weight_scale": "diffusion_pytorch_model.safetensors", "layers.12.feed_forward.w2.weight": "diffusion_pytorch_model.safetensors", "layers.12.feed_forward.w2.weight_scale": "diffusion_pytorch_model.safetensors", "layers.12.feed_forward.w3.weight": "diffusion_pytorch_model.safetensors", "layers.12.feed_forward.w3.weight_scale": 
"diffusion_pytorch_model.safetensors", "layers.12.ffn_norm1.weight": "diffusion_pytorch_model.safetensors", "layers.12.ffn_norm2.weight": "diffusion_pytorch_model.safetensors", "layers.13.adaln_modulation.bias": "diffusion_pytorch_model.safetensors", "layers.13.adaln_modulation.weight": "diffusion_pytorch_model.safetensors", "layers.13.adaln_modulation.weight_scale": "diffusion_pytorch_model.safetensors", "layers.13.attention.norm_k.weight": "diffusion_pytorch_model.safetensors", "layers.13.attention.norm_q.weight": "diffusion_pytorch_model.safetensors", "layers.13.attention.o.weight": "diffusion_pytorch_model.safetensors", "layers.13.attention.o.weight_scale": "diffusion_pytorch_model.safetensors", "layers.13.attention.qkv.weight": "diffusion_pytorch_model.safetensors", "layers.13.attention.qkv.weight_scale": "diffusion_pytorch_model.safetensors", "layers.13.attention_norm1.weight": "diffusion_pytorch_model.safetensors", "layers.13.attention_norm2.weight": "diffusion_pytorch_model.safetensors", "layers.13.feed_forward.w1.weight": "diffusion_pytorch_model.safetensors", "layers.13.feed_forward.w1.weight_scale": "diffusion_pytorch_model.safetensors", "layers.13.feed_forward.w2.weight": "diffusion_pytorch_model.safetensors", "layers.13.feed_forward.w2.weight_scale": "diffusion_pytorch_model.safetensors", "layers.13.feed_forward.w3.weight": "diffusion_pytorch_model.safetensors", "layers.13.feed_forward.w3.weight_scale": "diffusion_pytorch_model.safetensors", "layers.13.ffn_norm1.weight": "diffusion_pytorch_model.safetensors", "layers.13.ffn_norm2.weight": "diffusion_pytorch_model.safetensors", "layers.14.adaln_modulation.bias": "diffusion_pytorch_model.safetensors", "layers.14.adaln_modulation.weight": "diffusion_pytorch_model.safetensors", "layers.14.adaln_modulation.weight_scale": "diffusion_pytorch_model.safetensors", "layers.14.attention.norm_k.weight": "diffusion_pytorch_model.safetensors", "layers.14.attention.norm_q.weight": 
"diffusion_pytorch_model.safetensors", "layers.14.attention.o.weight": "diffusion_pytorch_model.safetensors", "layers.14.attention.o.weight_scale": "diffusion_pytorch_model.safetensors", "layers.14.attention.qkv.weight": "diffusion_pytorch_model.safetensors", "layers.14.attention.qkv.weight_scale": "diffusion_pytorch_model.safetensors", "layers.14.attention_norm1.weight": "diffusion_pytorch_model.safetensors", "layers.14.attention_norm2.weight": "diffusion_pytorch_model.safetensors", "layers.14.feed_forward.w1.weight": "diffusion_pytorch_model.safetensors", "layers.14.feed_forward.w1.weight_scale": "diffusion_pytorch_model.safetensors", "layers.14.feed_forward.w2.weight": "diffusion_pytorch_model.safetensors", "layers.14.feed_forward.w2.weight_scale": "diffusion_pytorch_model.safetensors", "layers.14.feed_forward.w3.weight": "diffusion_pytorch_model.safetensors", "layers.14.feed_forward.w3.weight_scale": "diffusion_pytorch_model.safetensors", "layers.14.ffn_norm1.weight": "diffusion_pytorch_model.safetensors", "layers.14.ffn_norm2.weight": "diffusion_pytorch_model.safetensors", "layers.15.adaln_modulation.bias": "diffusion_pytorch_model.safetensors", "layers.15.adaln_modulation.weight": "diffusion_pytorch_model.safetensors", "layers.15.adaln_modulation.weight_scale": "diffusion_pytorch_model.safetensors", "layers.15.attention.norm_k.weight": "diffusion_pytorch_model.safetensors", "layers.15.attention.norm_q.weight": "diffusion_pytorch_model.safetensors", "layers.15.attention.o.weight": "diffusion_pytorch_model.safetensors", "layers.15.attention.o.weight_scale": "diffusion_pytorch_model.safetensors", "layers.15.attention.qkv.weight": "diffusion_pytorch_model.safetensors", "layers.15.attention.qkv.weight_scale": "diffusion_pytorch_model.safetensors", "layers.15.attention_norm1.weight": "diffusion_pytorch_model.safetensors", "layers.15.attention_norm2.weight": "diffusion_pytorch_model.safetensors", "layers.15.feed_forward.w1.weight": 
"diffusion_pytorch_model.safetensors", "layers.15.feed_forward.w1.weight_scale": "diffusion_pytorch_model.safetensors", "layers.15.feed_forward.w2.weight": "diffusion_pytorch_model.safetensors", "layers.15.feed_forward.w2.weight_scale": "diffusion_pytorch_model.safetensors", "layers.15.feed_forward.w3.weight": "diffusion_pytorch_model.safetensors", "layers.15.feed_forward.w3.weight_scale": "diffusion_pytorch_model.safetensors", "layers.15.ffn_norm1.weight": "diffusion_pytorch_model.safetensors", "layers.15.ffn_norm2.weight": "diffusion_pytorch_model.safetensors", "layers.16.adaln_modulation.bias": "diffusion_pytorch_model.safetensors", "layers.16.adaln_modulation.weight": "diffusion_pytorch_model.safetensors", "layers.16.adaln_modulation.weight_scale": "diffusion_pytorch_model.safetensors", "layers.16.attention.norm_k.weight": "diffusion_pytorch_model.safetensors", "layers.16.attention.norm_q.weight": "diffusion_pytorch_model.safetensors", "layers.16.attention.o.weight": "diffusion_pytorch_model.safetensors", "layers.16.attention.o.weight_scale": "diffusion_pytorch_model.safetensors", "layers.16.attention.qkv.weight": "diffusion_pytorch_model.safetensors", "layers.16.attention.qkv.weight_scale": "diffusion_pytorch_model.safetensors", "layers.16.attention_norm1.weight": "diffusion_pytorch_model.safetensors", "layers.16.attention_norm2.weight": "diffusion_pytorch_model.safetensors", "layers.16.feed_forward.w1.weight": "diffusion_pytorch_model.safetensors", "layers.16.feed_forward.w1.weight_scale": "diffusion_pytorch_model.safetensors", "layers.16.feed_forward.w2.weight": "diffusion_pytorch_model.safetensors", "layers.16.feed_forward.w2.weight_scale": "diffusion_pytorch_model.safetensors", "layers.16.feed_forward.w3.weight": "diffusion_pytorch_model.safetensors", "layers.16.feed_forward.w3.weight_scale": "diffusion_pytorch_model.safetensors", "layers.16.ffn_norm1.weight": "diffusion_pytorch_model.safetensors", "layers.16.ffn_norm2.weight": 
"diffusion_pytorch_model.safetensors", "layers.17.adaln_modulation.bias": "diffusion_pytorch_model.safetensors", "layers.17.adaln_modulation.weight": "diffusion_pytorch_model.safetensors", "layers.17.adaln_modulation.weight_scale": "diffusion_pytorch_model.safetensors", "layers.17.attention.norm_k.weight": "diffusion_pytorch_model.safetensors", "layers.17.attention.norm_q.weight": "diffusion_pytorch_model.safetensors", "layers.17.attention.o.weight": "diffusion_pytorch_model.safetensors", "layers.17.attention.o.weight_scale": "diffusion_pytorch_model.safetensors", "layers.17.attention.qkv.weight": "diffusion_pytorch_model.safetensors", "layers.17.attention.qkv.weight_scale": "diffusion_pytorch_model.safetensors", "layers.17.attention_norm1.weight": "diffusion_pytorch_model.safetensors", "layers.17.attention_norm2.weight": "diffusion_pytorch_model.safetensors", "layers.17.feed_forward.w1.weight": "diffusion_pytorch_model.safetensors", "layers.17.feed_forward.w1.weight_scale": "diffusion_pytorch_model.safetensors", "layers.17.feed_forward.w2.weight": "diffusion_pytorch_model.safetensors", "layers.17.feed_forward.w2.weight_scale": "diffusion_pytorch_model.safetensors", "layers.17.feed_forward.w3.weight": "diffusion_pytorch_model.safetensors", "layers.17.feed_forward.w3.weight_scale": "diffusion_pytorch_model.safetensors", "layers.17.ffn_norm1.weight": "diffusion_pytorch_model.safetensors", "layers.17.ffn_norm2.weight": "diffusion_pytorch_model.safetensors", "layers.18.adaln_modulation.bias": "diffusion_pytorch_model.safetensors", "layers.18.adaln_modulation.weight": "diffusion_pytorch_model.safetensors", "layers.18.adaln_modulation.weight_scale": "diffusion_pytorch_model.safetensors", "layers.18.attention.norm_k.weight": "diffusion_pytorch_model.safetensors", "layers.18.attention.norm_q.weight": "diffusion_pytorch_model.safetensors", "layers.18.attention.o.weight": "diffusion_pytorch_model.safetensors", "layers.18.attention.o.weight_scale": 
"diffusion_pytorch_model.safetensors", "layers.18.attention.qkv.weight": "diffusion_pytorch_model.safetensors", "layers.18.attention.qkv.weight_scale": "diffusion_pytorch_model.safetensors", "layers.18.attention_norm1.weight": "diffusion_pytorch_model.safetensors", "layers.18.attention_norm2.weight": "diffusion_pytorch_model.safetensors", "layers.18.feed_forward.w1.weight": "diffusion_pytorch_model.safetensors", "layers.18.feed_forward.w1.weight_scale": "diffusion_pytorch_model.safetensors", "layers.18.feed_forward.w2.weight": "diffusion_pytorch_model.safetensors", "layers.18.feed_forward.w2.weight_scale": "diffusion_pytorch_model.safetensors", "layers.18.feed_forward.w3.weight": "diffusion_pytorch_model.safetensors", "layers.18.feed_forward.w3.weight_scale": "diffusion_pytorch_model.safetensors", "layers.18.ffn_norm1.weight": "diffusion_pytorch_model.safetensors", "layers.18.ffn_norm2.weight": "diffusion_pytorch_model.safetensors", "layers.19.adaln_modulation.bias": "diffusion_pytorch_model.safetensors", "layers.19.adaln_modulation.weight": "diffusion_pytorch_model.safetensors", "layers.19.adaln_modulation.weight_scale": "diffusion_pytorch_model.safetensors", "layers.19.attention.norm_k.weight": "diffusion_pytorch_model.safetensors", "layers.19.attention.norm_q.weight": "diffusion_pytorch_model.safetensors", "layers.19.attention.o.weight": "diffusion_pytorch_model.safetensors", "layers.19.attention.o.weight_scale": "diffusion_pytorch_model.safetensors", "layers.19.attention.qkv.weight": "diffusion_pytorch_model.safetensors", "layers.19.attention.qkv.weight_scale": "diffusion_pytorch_model.safetensors", "layers.19.attention_norm1.weight": "diffusion_pytorch_model.safetensors", "layers.19.attention_norm2.weight": "diffusion_pytorch_model.safetensors", "layers.19.feed_forward.w1.weight": "diffusion_pytorch_model.safetensors", "layers.19.feed_forward.w1.weight_scale": "diffusion_pytorch_model.safetensors", "layers.19.feed_forward.w2.weight": 
"diffusion_pytorch_model.safetensors", "layers.19.feed_forward.w2.weight_scale": "diffusion_pytorch_model.safetensors", "layers.19.feed_forward.w3.weight": "diffusion_pytorch_model.safetensors", "layers.19.feed_forward.w3.weight_scale": "diffusion_pytorch_model.safetensors", "layers.19.ffn_norm1.weight": "diffusion_pytorch_model.safetensors", "layers.19.ffn_norm2.weight": "diffusion_pytorch_model.safetensors", "layers.2.adaln_modulation.bias": "diffusion_pytorch_model.safetensors", "layers.2.adaln_modulation.weight": "diffusion_pytorch_model.safetensors", "layers.2.adaln_modulation.weight_scale": "diffusion_pytorch_model.safetensors", "layers.2.attention.norm_k.weight": "diffusion_pytorch_model.safetensors", "layers.2.attention.norm_q.weight": "diffusion_pytorch_model.safetensors", "layers.2.attention.o.weight": "diffusion_pytorch_model.safetensors", "layers.2.attention.o.weight_scale": "diffusion_pytorch_model.safetensors", "layers.2.attention.qkv.weight": "diffusion_pytorch_model.safetensors", "layers.2.attention.qkv.weight_scale": "diffusion_pytorch_model.safetensors", "layers.2.attention_norm1.weight": "diffusion_pytorch_model.safetensors", "layers.2.attention_norm2.weight": "diffusion_pytorch_model.safetensors", "layers.2.feed_forward.w1.weight": "diffusion_pytorch_model.safetensors", "layers.2.feed_forward.w1.weight_scale": "diffusion_pytorch_model.safetensors", "layers.2.feed_forward.w2.weight": "diffusion_pytorch_model.safetensors", "layers.2.feed_forward.w2.weight_scale": "diffusion_pytorch_model.safetensors", "layers.2.feed_forward.w3.weight": "diffusion_pytorch_model.safetensors", "layers.2.feed_forward.w3.weight_scale": "diffusion_pytorch_model.safetensors", "layers.2.ffn_norm1.weight": "diffusion_pytorch_model.safetensors", "layers.2.ffn_norm2.weight": "diffusion_pytorch_model.safetensors", "layers.20.adaln_modulation.bias": "diffusion_pytorch_model.safetensors", "layers.20.adaln_modulation.weight": "diffusion_pytorch_model.safetensors", 
"layers.20.adaln_modulation.weight_scale": "diffusion_pytorch_model.safetensors", "layers.20.attention.norm_k.weight": "diffusion_pytorch_model.safetensors", "layers.20.attention.norm_q.weight": "diffusion_pytorch_model.safetensors", "layers.20.attention.o.weight": "diffusion_pytorch_model.safetensors", "layers.20.attention.o.weight_scale": "diffusion_pytorch_model.safetensors", "layers.20.attention.qkv.weight": "diffusion_pytorch_model.safetensors", "layers.20.attention.qkv.weight_scale": "diffusion_pytorch_model.safetensors", "layers.20.attention_norm1.weight": "diffusion_pytorch_model.safetensors", "layers.20.attention_norm2.weight": "diffusion_pytorch_model.safetensors", "layers.20.feed_forward.w1.weight": "diffusion_pytorch_model.safetensors", "layers.20.feed_forward.w1.weight_scale": "diffusion_pytorch_model.safetensors", "layers.20.feed_forward.w2.weight": "diffusion_pytorch_model.safetensors", "layers.20.feed_forward.w2.weight_scale": "diffusion_pytorch_model.safetensors", "layers.20.feed_forward.w3.weight": "diffusion_pytorch_model.safetensors", "layers.20.feed_forward.w3.weight_scale": "diffusion_pytorch_model.safetensors", "layers.20.ffn_norm1.weight": "diffusion_pytorch_model.safetensors", "layers.20.ffn_norm2.weight": "diffusion_pytorch_model.safetensors", "layers.21.adaln_modulation.bias": "diffusion_pytorch_model.safetensors", "layers.21.adaln_modulation.weight": "diffusion_pytorch_model.safetensors", "layers.21.adaln_modulation.weight_scale": "diffusion_pytorch_model.safetensors", "layers.21.attention.norm_k.weight": "diffusion_pytorch_model.safetensors", "layers.21.attention.norm_q.weight": "diffusion_pytorch_model.safetensors", "layers.21.attention.o.weight": "diffusion_pytorch_model.safetensors", "layers.21.attention.o.weight_scale": "diffusion_pytorch_model.safetensors", "layers.21.attention.qkv.weight": "diffusion_pytorch_model.safetensors", "layers.21.attention.qkv.weight_scale": "diffusion_pytorch_model.safetensors", 
"layers.21.attention_norm1.weight": "diffusion_pytorch_model.safetensors", "layers.21.attention_norm2.weight": "diffusion_pytorch_model.safetensors", "layers.21.feed_forward.w1.weight": "diffusion_pytorch_model.safetensors", "layers.21.feed_forward.w1.weight_scale": "diffusion_pytorch_model.safetensors", "layers.21.feed_forward.w2.weight": "diffusion_pytorch_model.safetensors", "layers.21.feed_forward.w2.weight_scale": "diffusion_pytorch_model.safetensors", "layers.21.feed_forward.w3.weight": "diffusion_pytorch_model.safetensors", "layers.21.feed_forward.w3.weight_scale": "diffusion_pytorch_model.safetensors", "layers.21.ffn_norm1.weight": "diffusion_pytorch_model.safetensors", "layers.21.ffn_norm2.weight": "diffusion_pytorch_model.safetensors", "layers.22.adaln_modulation.bias": "diffusion_pytorch_model.safetensors", "layers.22.adaln_modulation.weight": "diffusion_pytorch_model.safetensors", "layers.22.adaln_modulation.weight_scale": "diffusion_pytorch_model.safetensors", "layers.22.attention.norm_k.weight": "diffusion_pytorch_model.safetensors", "layers.22.attention.norm_q.weight": "diffusion_pytorch_model.safetensors", "layers.22.attention.o.weight": "diffusion_pytorch_model.safetensors", "layers.22.attention.o.weight_scale": "diffusion_pytorch_model.safetensors", "layers.22.attention.qkv.weight": "diffusion_pytorch_model.safetensors", "layers.22.attention.qkv.weight_scale": "diffusion_pytorch_model.safetensors", "layers.22.attention_norm1.weight": "diffusion_pytorch_model.safetensors", "layers.22.attention_norm2.weight": "diffusion_pytorch_model.safetensors", "layers.22.feed_forward.w1.weight": "diffusion_pytorch_model.safetensors", "layers.22.feed_forward.w1.weight_scale": "diffusion_pytorch_model.safetensors", "layers.22.feed_forward.w2.weight": "diffusion_pytorch_model.safetensors", "layers.22.feed_forward.w2.weight_scale": "diffusion_pytorch_model.safetensors", "layers.22.feed_forward.w3.weight": "diffusion_pytorch_model.safetensors", 
"layers.22.feed_forward.w3.weight_scale": "diffusion_pytorch_model.safetensors", "layers.22.ffn_norm1.weight": "diffusion_pytorch_model.safetensors", "layers.22.ffn_norm2.weight": "diffusion_pytorch_model.safetensors", "layers.23.adaln_modulation.bias": "diffusion_pytorch_model.safetensors", "layers.23.adaln_modulation.weight": "diffusion_pytorch_model.safetensors", "layers.23.adaln_modulation.weight_scale": "diffusion_pytorch_model.safetensors", "layers.23.attention.norm_k.weight": "diffusion_pytorch_model.safetensors", "layers.23.attention.norm_q.weight": "diffusion_pytorch_model.safetensors", "layers.23.attention.o.weight": "diffusion_pytorch_model.safetensors", "layers.23.attention.o.weight_scale": "diffusion_pytorch_model.safetensors", "layers.23.attention.qkv.weight": "diffusion_pytorch_model.safetensors", "layers.23.attention.qkv.weight_scale": "diffusion_pytorch_model.safetensors", "layers.23.attention_norm1.weight": "diffusion_pytorch_model.safetensors", "layers.23.attention_norm2.weight": "diffusion_pytorch_model.safetensors", "layers.23.feed_forward.w1.weight": "diffusion_pytorch_model.safetensors", "layers.23.feed_forward.w1.weight_scale": "diffusion_pytorch_model.safetensors", "layers.23.feed_forward.w2.weight": "diffusion_pytorch_model.safetensors", "layers.23.feed_forward.w2.weight_scale": "diffusion_pytorch_model.safetensors", "layers.23.feed_forward.w3.weight": "diffusion_pytorch_model.safetensors", "layers.23.feed_forward.w3.weight_scale": "diffusion_pytorch_model.safetensors", "layers.23.ffn_norm1.weight": "diffusion_pytorch_model.safetensors", "layers.23.ffn_norm2.weight": "diffusion_pytorch_model.safetensors", "layers.24.adaln_modulation.bias": "diffusion_pytorch_model.safetensors", "layers.24.adaln_modulation.weight": "diffusion_pytorch_model.safetensors", "layers.24.adaln_modulation.weight_scale": "diffusion_pytorch_model.safetensors", "layers.24.attention.norm_k.weight": "diffusion_pytorch_model.safetensors", 
"layers.24.attention.norm_q.weight": "diffusion_pytorch_model.safetensors", "layers.24.attention.o.weight": "diffusion_pytorch_model.safetensors", "layers.24.attention.o.weight_scale": "diffusion_pytorch_model.safetensors", "layers.24.attention.qkv.weight": "diffusion_pytorch_model.safetensors", "layers.24.attention.qkv.weight_scale": "diffusion_pytorch_model.safetensors", "layers.24.attention_norm1.weight": "diffusion_pytorch_model.safetensors", "layers.24.attention_norm2.weight": "diffusion_pytorch_model.safetensors", "layers.24.feed_forward.w1.weight": "diffusion_pytorch_model.safetensors", "layers.24.feed_forward.w1.weight_scale": "diffusion_pytorch_model.safetensors", "layers.24.feed_forward.w2.weight": "diffusion_pytorch_model.safetensors", "layers.24.feed_forward.w2.weight_scale": "diffusion_pytorch_model.safetensors", "layers.24.feed_forward.w3.weight": "diffusion_pytorch_model.safetensors", "layers.24.feed_forward.w3.weight_scale": "diffusion_pytorch_model.safetensors", "layers.24.ffn_norm1.weight": "diffusion_pytorch_model.safetensors", "layers.24.ffn_norm2.weight": "diffusion_pytorch_model.safetensors", "layers.25.adaln_modulation.bias": "diffusion_pytorch_model.safetensors", "layers.25.adaln_modulation.weight": "diffusion_pytorch_model.safetensors", "layers.25.adaln_modulation.weight_scale": "diffusion_pytorch_model.safetensors", "layers.25.attention.norm_k.weight": "diffusion_pytorch_model.safetensors", "layers.25.attention.norm_q.weight": "diffusion_pytorch_model.safetensors", "layers.25.attention.o.weight": "diffusion_pytorch_model.safetensors", "layers.25.attention.o.weight_scale": "diffusion_pytorch_model.safetensors", "layers.25.attention.qkv.weight": "diffusion_pytorch_model.safetensors", "layers.25.attention.qkv.weight_scale": "diffusion_pytorch_model.safetensors", "layers.25.attention_norm1.weight": "diffusion_pytorch_model.safetensors", "layers.25.attention_norm2.weight": "diffusion_pytorch_model.safetensors", 
"layers.25.feed_forward.w1.weight": "diffusion_pytorch_model.safetensors", "layers.25.feed_forward.w1.weight_scale": "diffusion_pytorch_model.safetensors", "layers.25.feed_forward.w2.weight": "diffusion_pytorch_model.safetensors", "layers.25.feed_forward.w2.weight_scale": "diffusion_pytorch_model.safetensors", "layers.25.feed_forward.w3.weight": "diffusion_pytorch_model.safetensors", "layers.25.feed_forward.w3.weight_scale": "diffusion_pytorch_model.safetensors", "layers.25.ffn_norm1.weight": "diffusion_pytorch_model.safetensors", "layers.25.ffn_norm2.weight": "diffusion_pytorch_model.safetensors", "layers.26.adaln_modulation.bias": "diffusion_pytorch_model.safetensors", "layers.26.adaln_modulation.weight": "diffusion_pytorch_model.safetensors", "layers.26.adaln_modulation.weight_scale": "diffusion_pytorch_model.safetensors", "layers.26.attention.norm_k.weight": "diffusion_pytorch_model.safetensors", "layers.26.attention.norm_q.weight": "diffusion_pytorch_model.safetensors", "layers.26.attention.o.weight": "diffusion_pytorch_model.safetensors", "layers.26.attention.o.weight_scale": "diffusion_pytorch_model.safetensors", "layers.26.attention.qkv.weight": "diffusion_pytorch_model.safetensors", "layers.26.attention.qkv.weight_scale": "diffusion_pytorch_model.safetensors", "layers.26.attention_norm1.weight": "diffusion_pytorch_model.safetensors", "layers.26.attention_norm2.weight": "diffusion_pytorch_model.safetensors", "layers.26.feed_forward.w1.weight": "diffusion_pytorch_model.safetensors", "layers.26.feed_forward.w1.weight_scale": "diffusion_pytorch_model.safetensors", "layers.26.feed_forward.w2.weight": "diffusion_pytorch_model.safetensors", "layers.26.feed_forward.w2.weight_scale": "diffusion_pytorch_model.safetensors", "layers.26.feed_forward.w3.weight": "diffusion_pytorch_model.safetensors", "layers.26.feed_forward.w3.weight_scale": "diffusion_pytorch_model.safetensors", "layers.26.ffn_norm1.weight": "diffusion_pytorch_model.safetensors", 
"layers.26.ffn_norm2.weight": "diffusion_pytorch_model.safetensors", "layers.27.adaln_modulation.bias": "diffusion_pytorch_model.safetensors", "layers.27.adaln_modulation.weight": "diffusion_pytorch_model.safetensors", "layers.27.adaln_modulation.weight_scale": "diffusion_pytorch_model.safetensors", "layers.27.attention.norm_k.weight": "diffusion_pytorch_model.safetensors", "layers.27.attention.norm_q.weight": "diffusion_pytorch_model.safetensors", "layers.27.attention.o.weight": "diffusion_pytorch_model.safetensors", "layers.27.attention.o.weight_scale": "diffusion_pytorch_model.safetensors", "layers.27.attention.qkv.weight": "diffusion_pytorch_model.safetensors", "layers.27.attention.qkv.weight_scale": "diffusion_pytorch_model.safetensors", "layers.27.attention_norm1.weight": "diffusion_pytorch_model.safetensors", "layers.27.attention_norm2.weight": "diffusion_pytorch_model.safetensors", "layers.27.feed_forward.w1.weight": "diffusion_pytorch_model.safetensors", "layers.27.feed_forward.w1.weight_scale": "diffusion_pytorch_model.safetensors", "layers.27.feed_forward.w2.weight": "diffusion_pytorch_model.safetensors", "layers.27.feed_forward.w2.weight_scale": "diffusion_pytorch_model.safetensors", "layers.27.feed_forward.w3.weight": "diffusion_pytorch_model.safetensors", "layers.27.feed_forward.w3.weight_scale": "diffusion_pytorch_model.safetensors", "layers.27.ffn_norm1.weight": "diffusion_pytorch_model.safetensors", "layers.27.ffn_norm2.weight": "diffusion_pytorch_model.safetensors", "layers.28.adaln_modulation.bias": "diffusion_pytorch_model.safetensors", "layers.28.adaln_modulation.weight": "diffusion_pytorch_model.safetensors", "layers.28.adaln_modulation.weight_scale": "diffusion_pytorch_model.safetensors", "layers.28.attention.norm_k.weight": "diffusion_pytorch_model.safetensors", "layers.28.attention.norm_q.weight": "diffusion_pytorch_model.safetensors", "layers.28.attention.o.weight": "diffusion_pytorch_model.safetensors", 
"layers.28.attention.o.weight_scale": "diffusion_pytorch_model.safetensors", "layers.28.attention.qkv.weight": "diffusion_pytorch_model.safetensors", "layers.28.attention.qkv.weight_scale": "diffusion_pytorch_model.safetensors", "layers.28.attention_norm1.weight": "diffusion_pytorch_model.safetensors", "layers.28.attention_norm2.weight": "diffusion_pytorch_model.safetensors", "layers.28.feed_forward.w1.weight": "diffusion_pytorch_model.safetensors", "layers.28.feed_forward.w1.weight_scale": "diffusion_pytorch_model.safetensors", "layers.28.feed_forward.w2.weight": "diffusion_pytorch_model.safetensors", "layers.28.feed_forward.w2.weight_scale": "diffusion_pytorch_model.safetensors", "layers.28.feed_forward.w3.weight": "diffusion_pytorch_model.safetensors", "layers.28.feed_forward.w3.weight_scale": "diffusion_pytorch_model.safetensors", "layers.28.ffn_norm1.weight": "diffusion_pytorch_model.safetensors", "layers.28.ffn_norm2.weight": "diffusion_pytorch_model.safetensors", "layers.29.adaln_modulation.bias": "diffusion_pytorch_model.safetensors", "layers.29.adaln_modulation.weight": "diffusion_pytorch_model.safetensors", "layers.29.adaln_modulation.weight_scale": "diffusion_pytorch_model.safetensors", "layers.29.attention.norm_k.weight": "diffusion_pytorch_model.safetensors", "layers.29.attention.norm_q.weight": "diffusion_pytorch_model.safetensors", "layers.29.attention.o.weight": "diffusion_pytorch_model.safetensors", "layers.29.attention.o.weight_scale": "diffusion_pytorch_model.safetensors", "layers.29.attention.qkv.weight": "diffusion_pytorch_model.safetensors", "layers.29.attention.qkv.weight_scale": "diffusion_pytorch_model.safetensors", "layers.29.attention_norm1.weight": "diffusion_pytorch_model.safetensors", "layers.29.attention_norm2.weight": "diffusion_pytorch_model.safetensors", "layers.29.feed_forward.w1.weight": "diffusion_pytorch_model.safetensors", "layers.29.feed_forward.w1.weight_scale": "diffusion_pytorch_model.safetensors", 
"layers.29.feed_forward.w2.weight": "diffusion_pytorch_model.safetensors", "layers.29.feed_forward.w2.weight_scale": "diffusion_pytorch_model.safetensors", "layers.29.feed_forward.w3.weight": "diffusion_pytorch_model.safetensors", "layers.29.feed_forward.w3.weight_scale": "diffusion_pytorch_model.safetensors", "layers.29.ffn_norm1.weight": "diffusion_pytorch_model.safetensors", "layers.29.ffn_norm2.weight": "diffusion_pytorch_model.safetensors", "layers.3.adaln_modulation.bias": "diffusion_pytorch_model.safetensors", "layers.3.adaln_modulation.weight": "diffusion_pytorch_model.safetensors", "layers.3.adaln_modulation.weight_scale": "diffusion_pytorch_model.safetensors", "layers.3.attention.norm_k.weight": "diffusion_pytorch_model.safetensors", "layers.3.attention.norm_q.weight": "diffusion_pytorch_model.safetensors", "layers.3.attention.o.weight": "diffusion_pytorch_model.safetensors", "layers.3.attention.o.weight_scale": "diffusion_pytorch_model.safetensors", "layers.3.attention.qkv.weight": "diffusion_pytorch_model.safetensors", "layers.3.attention.qkv.weight_scale": "diffusion_pytorch_model.safetensors", "layers.3.attention_norm1.weight": "diffusion_pytorch_model.safetensors", "layers.3.attention_norm2.weight": "diffusion_pytorch_model.safetensors", "layers.3.feed_forward.w1.weight": "diffusion_pytorch_model.safetensors", "layers.3.feed_forward.w1.weight_scale": "diffusion_pytorch_model.safetensors", "layers.3.feed_forward.w2.weight": "diffusion_pytorch_model.safetensors", "layers.3.feed_forward.w2.weight_scale": "diffusion_pytorch_model.safetensors", "layers.3.feed_forward.w3.weight": "diffusion_pytorch_model.safetensors", "layers.3.feed_forward.w3.weight_scale": "diffusion_pytorch_model.safetensors", "layers.3.ffn_norm1.weight": "diffusion_pytorch_model.safetensors", "layers.3.ffn_norm2.weight": "diffusion_pytorch_model.safetensors", "layers.30.adaln_modulation.bias": "diffusion_pytorch_model.safetensors", "layers.30.adaln_modulation.weight": 
"diffusion_pytorch_model.safetensors", "layers.30.adaln_modulation.weight_scale": "diffusion_pytorch_model.safetensors", "layers.30.attention.norm_k.weight": "diffusion_pytorch_model.safetensors", "layers.30.attention.norm_q.weight": "diffusion_pytorch_model.safetensors", "layers.30.attention.o.weight": "diffusion_pytorch_model.safetensors", "layers.30.attention.o.weight_scale": "diffusion_pytorch_model.safetensors", "layers.30.attention.qkv.weight": "diffusion_pytorch_model.safetensors", "layers.30.attention.qkv.weight_scale": "diffusion_pytorch_model.safetensors", "layers.30.attention_norm1.weight": "diffusion_pytorch_model.safetensors", "layers.30.attention_norm2.weight": "diffusion_pytorch_model.safetensors", "layers.30.feed_forward.w1.weight": "diffusion_pytorch_model.safetensors", "layers.30.feed_forward.w1.weight_scale": "diffusion_pytorch_model.safetensors", "layers.30.feed_forward.w2.weight": "diffusion_pytorch_model.safetensors", "layers.30.feed_forward.w2.weight_scale": "diffusion_pytorch_model.safetensors", "layers.30.feed_forward.w3.weight": "diffusion_pytorch_model.safetensors", "layers.30.feed_forward.w3.weight_scale": "diffusion_pytorch_model.safetensors", "layers.30.ffn_norm1.weight": "diffusion_pytorch_model.safetensors", "layers.30.ffn_norm2.weight": "diffusion_pytorch_model.safetensors", "layers.31.adaln_modulation.bias": "diffusion_pytorch_model.safetensors", "layers.31.adaln_modulation.weight": "diffusion_pytorch_model.safetensors", "layers.31.adaln_modulation.weight_scale": "diffusion_pytorch_model.safetensors", "layers.31.attention.norm_k.weight": "diffusion_pytorch_model.safetensors", "layers.31.attention.norm_q.weight": "diffusion_pytorch_model.safetensors", "layers.31.attention.o.weight": "diffusion_pytorch_model.safetensors", "layers.31.attention.o.weight_scale": "diffusion_pytorch_model.safetensors", "layers.31.attention.qkv.weight": "diffusion_pytorch_model.safetensors", "layers.31.attention.qkv.weight_scale": 
"diffusion_pytorch_model.safetensors", "layers.31.attention_norm1.weight": "diffusion_pytorch_model.safetensors", "layers.31.attention_norm2.weight": "diffusion_pytorch_model.safetensors", "layers.31.feed_forward.w1.weight": "diffusion_pytorch_model.safetensors", "layers.31.feed_forward.w1.weight_scale": "diffusion_pytorch_model.safetensors", "layers.31.feed_forward.w2.weight": "diffusion_pytorch_model.safetensors", "layers.31.feed_forward.w2.weight_scale": "diffusion_pytorch_model.safetensors", "layers.31.feed_forward.w3.weight": "diffusion_pytorch_model.safetensors", "layers.31.feed_forward.w3.weight_scale": "diffusion_pytorch_model.safetensors", "layers.31.ffn_norm1.weight": "diffusion_pytorch_model.safetensors", "layers.31.ffn_norm2.weight": "diffusion_pytorch_model.safetensors", "layers.32.adaln_modulation.bias": "diffusion_pytorch_model.safetensors", "layers.32.adaln_modulation.weight": "diffusion_pytorch_model.safetensors", "layers.32.adaln_modulation.weight_scale": "diffusion_pytorch_model.safetensors", "layers.32.attention.norm_k.weight": "diffusion_pytorch_model.safetensors", "layers.32.attention.norm_q.weight": "diffusion_pytorch_model.safetensors", "layers.32.attention.o.weight": "diffusion_pytorch_model.safetensors", "layers.32.attention.o.weight_scale": "diffusion_pytorch_model.safetensors", "layers.32.attention.qkv.weight": "diffusion_pytorch_model.safetensors", "layers.32.attention.qkv.weight_scale": "diffusion_pytorch_model.safetensors", "layers.32.attention_norm1.weight": "diffusion_pytorch_model.safetensors", "layers.32.attention_norm2.weight": "diffusion_pytorch_model.safetensors", "layers.32.feed_forward.w1.weight": "diffusion_pytorch_model.safetensors", "layers.32.feed_forward.w1.weight_scale": "diffusion_pytorch_model.safetensors", "layers.32.feed_forward.w2.weight": "diffusion_pytorch_model.safetensors", "layers.32.feed_forward.w2.weight_scale": "diffusion_pytorch_model.safetensors", "layers.32.feed_forward.w3.weight": 
"diffusion_pytorch_model.safetensors", "layers.32.feed_forward.w3.weight_scale": "diffusion_pytorch_model.safetensors", "layers.32.ffn_norm1.weight": "diffusion_pytorch_model.safetensors", "layers.32.ffn_norm2.weight": "diffusion_pytorch_model.safetensors", "layers.33.adaln_modulation.bias": "diffusion_pytorch_model.safetensors", "layers.33.adaln_modulation.weight": "diffusion_pytorch_model.safetensors", "layers.33.adaln_modulation.weight_scale": "diffusion_pytorch_model.safetensors", "layers.33.attention.norm_k.weight": "diffusion_pytorch_model.safetensors", "layers.33.attention.norm_q.weight": "diffusion_pytorch_model.safetensors", "layers.33.attention.o.weight": "diffusion_pytorch_model.safetensors", "layers.33.attention.o.weight_scale": "diffusion_pytorch_model.safetensors", "layers.33.attention.qkv.weight": "diffusion_pytorch_model.safetensors", "layers.33.attention.qkv.weight_scale": "diffusion_pytorch_model.safetensors", "layers.33.attention_norm1.weight": "diffusion_pytorch_model.safetensors", "layers.33.attention_norm2.weight": "diffusion_pytorch_model.safetensors", "layers.33.feed_forward.w1.weight": "diffusion_pytorch_model.safetensors", "layers.33.feed_forward.w1.weight_scale": "diffusion_pytorch_model.safetensors", "layers.33.feed_forward.w2.weight": "diffusion_pytorch_model.safetensors", "layers.33.feed_forward.w2.weight_scale": "diffusion_pytorch_model.safetensors", "layers.33.feed_forward.w3.weight": "diffusion_pytorch_model.safetensors", "layers.33.feed_forward.w3.weight_scale": "diffusion_pytorch_model.safetensors", "layers.33.ffn_norm1.weight": "diffusion_pytorch_model.safetensors", "layers.33.ffn_norm2.weight": "diffusion_pytorch_model.safetensors", "layers.4.adaln_modulation.bias": "diffusion_pytorch_model.safetensors", "layers.4.adaln_modulation.weight": "diffusion_pytorch_model.safetensors", "layers.4.adaln_modulation.weight_scale": "diffusion_pytorch_model.safetensors", "layers.4.attention.norm_k.weight": 
"diffusion_pytorch_model.safetensors", "layers.4.attention.norm_q.weight": "diffusion_pytorch_model.safetensors", "layers.4.attention.o.weight": "diffusion_pytorch_model.safetensors", "layers.4.attention.o.weight_scale": "diffusion_pytorch_model.safetensors", "layers.4.attention.qkv.weight": "diffusion_pytorch_model.safetensors", "layers.4.attention.qkv.weight_scale": "diffusion_pytorch_model.safetensors", "layers.4.attention_norm1.weight": "diffusion_pytorch_model.safetensors", "layers.4.attention_norm2.weight": "diffusion_pytorch_model.safetensors", "layers.4.feed_forward.w1.weight": "diffusion_pytorch_model.safetensors", "layers.4.feed_forward.w1.weight_scale": "diffusion_pytorch_model.safetensors", "layers.4.feed_forward.w2.weight": "diffusion_pytorch_model.safetensors", "layers.4.feed_forward.w2.weight_scale": "diffusion_pytorch_model.safetensors", "layers.4.feed_forward.w3.weight": "diffusion_pytorch_model.safetensors", "layers.4.feed_forward.w3.weight_scale": "diffusion_pytorch_model.safetensors", "layers.4.ffn_norm1.weight": "diffusion_pytorch_model.safetensors", "layers.4.ffn_norm2.weight": "diffusion_pytorch_model.safetensors", "layers.5.adaln_modulation.bias": "diffusion_pytorch_model.safetensors", "layers.5.adaln_modulation.weight": "diffusion_pytorch_model.safetensors", "layers.5.adaln_modulation.weight_scale": "diffusion_pytorch_model.safetensors", "layers.5.attention.norm_k.weight": "diffusion_pytorch_model.safetensors", "layers.5.attention.norm_q.weight": "diffusion_pytorch_model.safetensors", "layers.5.attention.o.weight": "diffusion_pytorch_model.safetensors", "layers.5.attention.o.weight_scale": "diffusion_pytorch_model.safetensors", "layers.5.attention.qkv.weight": "diffusion_pytorch_model.safetensors", "layers.5.attention.qkv.weight_scale": "diffusion_pytorch_model.safetensors", "layers.5.attention_norm1.weight": "diffusion_pytorch_model.safetensors", "layers.5.attention_norm2.weight": "diffusion_pytorch_model.safetensors", 
"layers.5.feed_forward.w1.weight": "diffusion_pytorch_model.safetensors", "layers.5.feed_forward.w1.weight_scale": "diffusion_pytorch_model.safetensors", "layers.5.feed_forward.w2.weight": "diffusion_pytorch_model.safetensors", "layers.5.feed_forward.w2.weight_scale": "diffusion_pytorch_model.safetensors", "layers.5.feed_forward.w3.weight": "diffusion_pytorch_model.safetensors", "layers.5.feed_forward.w3.weight_scale": "diffusion_pytorch_model.safetensors", "layers.5.ffn_norm1.weight": "diffusion_pytorch_model.safetensors", "layers.5.ffn_norm2.weight": "diffusion_pytorch_model.safetensors", "layers.6.adaln_modulation.bias": "diffusion_pytorch_model.safetensors", "layers.6.adaln_modulation.weight": "diffusion_pytorch_model.safetensors", "layers.6.adaln_modulation.weight_scale": "diffusion_pytorch_model.safetensors", "layers.6.attention.norm_k.weight": "diffusion_pytorch_model.safetensors", "layers.6.attention.norm_q.weight": "diffusion_pytorch_model.safetensors", "layers.6.attention.o.weight": "diffusion_pytorch_model.safetensors", "layers.6.attention.o.weight_scale": "diffusion_pytorch_model.safetensors", "layers.6.attention.qkv.weight": "diffusion_pytorch_model.safetensors", "layers.6.attention.qkv.weight_scale": "diffusion_pytorch_model.safetensors", "layers.6.attention_norm1.weight": "diffusion_pytorch_model.safetensors", "layers.6.attention_norm2.weight": "diffusion_pytorch_model.safetensors", "layers.6.feed_forward.w1.weight": "diffusion_pytorch_model.safetensors", "layers.6.feed_forward.w1.weight_scale": "diffusion_pytorch_model.safetensors", "layers.6.feed_forward.w2.weight": "diffusion_pytorch_model.safetensors", "layers.6.feed_forward.w2.weight_scale": "diffusion_pytorch_model.safetensors", "layers.6.feed_forward.w3.weight": "diffusion_pytorch_model.safetensors", "layers.6.feed_forward.w3.weight_scale": "diffusion_pytorch_model.safetensors", "layers.6.ffn_norm1.weight": "diffusion_pytorch_model.safetensors", "layers.6.ffn_norm2.weight": 
"diffusion_pytorch_model.safetensors", "layers.7.adaln_modulation.bias": "diffusion_pytorch_model.safetensors", "layers.7.adaln_modulation.weight": "diffusion_pytorch_model.safetensors", "layers.7.adaln_modulation.weight_scale": "diffusion_pytorch_model.safetensors", "layers.7.attention.norm_k.weight": "diffusion_pytorch_model.safetensors", "layers.7.attention.norm_q.weight": "diffusion_pytorch_model.safetensors", "layers.7.attention.o.weight": "diffusion_pytorch_model.safetensors", "layers.7.attention.o.weight_scale": "diffusion_pytorch_model.safetensors", "layers.7.attention.qkv.weight": "diffusion_pytorch_model.safetensors", "layers.7.attention.qkv.weight_scale": "diffusion_pytorch_model.safetensors", "layers.7.attention_norm1.weight": "diffusion_pytorch_model.safetensors", "layers.7.attention_norm2.weight": "diffusion_pytorch_model.safetensors", "layers.7.feed_forward.w1.weight": "diffusion_pytorch_model.safetensors", "layers.7.feed_forward.w1.weight_scale": "diffusion_pytorch_model.safetensors", "layers.7.feed_forward.w2.weight": "diffusion_pytorch_model.safetensors", "layers.7.feed_forward.w2.weight_scale": "diffusion_pytorch_model.safetensors", "layers.7.feed_forward.w3.weight": "diffusion_pytorch_model.safetensors", "layers.7.feed_forward.w3.weight_scale": "diffusion_pytorch_model.safetensors", "layers.7.ffn_norm1.weight": "diffusion_pytorch_model.safetensors", "layers.7.ffn_norm2.weight": "diffusion_pytorch_model.safetensors", "layers.8.adaln_modulation.bias": "diffusion_pytorch_model.safetensors", "layers.8.adaln_modulation.weight": "diffusion_pytorch_model.safetensors", "layers.8.adaln_modulation.weight_scale": "diffusion_pytorch_model.safetensors", "layers.8.attention.norm_k.weight": "diffusion_pytorch_model.safetensors", "layers.8.attention.norm_q.weight": "diffusion_pytorch_model.safetensors", "layers.8.attention.o.weight": "diffusion_pytorch_model.safetensors", "layers.8.attention.o.weight_scale": "diffusion_pytorch_model.safetensors", 
"layers.8.attention.qkv.weight": "diffusion_pytorch_model.safetensors", "layers.8.attention.qkv.weight_scale": "diffusion_pytorch_model.safetensors", "layers.8.attention_norm1.weight": "diffusion_pytorch_model.safetensors", "layers.8.attention_norm2.weight": "diffusion_pytorch_model.safetensors", "layers.8.feed_forward.w1.weight": "diffusion_pytorch_model.safetensors", "layers.8.feed_forward.w1.weight_scale": "diffusion_pytorch_model.safetensors", "layers.8.feed_forward.w2.weight": "diffusion_pytorch_model.safetensors", "layers.8.feed_forward.w2.weight_scale": "diffusion_pytorch_model.safetensors", "layers.8.feed_forward.w3.weight": "diffusion_pytorch_model.safetensors", "layers.8.feed_forward.w3.weight_scale": "diffusion_pytorch_model.safetensors", "layers.8.ffn_norm1.weight": "diffusion_pytorch_model.safetensors", "layers.8.ffn_norm2.weight": "diffusion_pytorch_model.safetensors", "layers.9.adaln_modulation.bias": "diffusion_pytorch_model.safetensors", "layers.9.adaln_modulation.weight": "diffusion_pytorch_model.safetensors", "layers.9.adaln_modulation.weight_scale": "diffusion_pytorch_model.safetensors", "layers.9.attention.norm_k.weight": "diffusion_pytorch_model.safetensors", "layers.9.attention.norm_q.weight": "diffusion_pytorch_model.safetensors", "layers.9.attention.o.weight": "diffusion_pytorch_model.safetensors", "layers.9.attention.o.weight_scale": "diffusion_pytorch_model.safetensors", "layers.9.attention.qkv.weight": "diffusion_pytorch_model.safetensors", "layers.9.attention.qkv.weight_scale": "diffusion_pytorch_model.safetensors", "layers.9.attention_norm1.weight": "diffusion_pytorch_model.safetensors", "layers.9.attention_norm2.weight": "diffusion_pytorch_model.safetensors", "layers.9.feed_forward.w1.weight": "diffusion_pytorch_model.safetensors", "layers.9.feed_forward.w1.weight_scale": "diffusion_pytorch_model.safetensors", "layers.9.feed_forward.w2.weight": "diffusion_pytorch_model.safetensors", "layers.9.feed_forward.w2.weight_scale": 
"diffusion_pytorch_model.safetensors", "layers.9.feed_forward.w3.weight": "diffusion_pytorch_model.safetensors", "layers.9.feed_forward.w3.weight_scale": "diffusion_pytorch_model.safetensors", "layers.9.ffn_norm1.weight": "diffusion_pytorch_model.safetensors", "layers.9.ffn_norm2.weight": "diffusion_pytorch_model.safetensors", "llm_cond_norm.weight": "diffusion_pytorch_model.safetensors", "llm_cond_proj.bias": "diffusion_pytorch_model.safetensors", "llm_cond_proj.weight": "diffusion_pytorch_model.safetensors", "llm_cond_proj.weight_scale": "diffusion_pytorch_model.safetensors", "t_embedding.mlp_in.bias": "diffusion_pytorch_model.safetensors", "t_embedding.mlp_in.weight": "diffusion_pytorch_model.safetensors", "t_embedding.mlp_in.weight_scale": "diffusion_pytorch_model.safetensors", "t_embedding.mlp_out.bias": "diffusion_pytorch_model.safetensors", "t_embedding.mlp_out.weight": "diffusion_pytorch_model.safetensors", "t_embedding.mlp_out.weight_scale": "diffusion_pytorch_model.safetensors"}}
unconditional_transformer/config.json ADDED
@@ -0,0 +1,19 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_class_name": "Ideogram4Transformer2DModel",
3
+ "_diffusers_version": "0.39.0.dev0",
4
+ "_name_or_path": "/home/jinli/.cache/huggingface/hub/models--ideogram-ai--debug-ideogram-v4/snapshots/41af6183c9fd9b6254864b0720319ef984535bfc/unconditional_transformer",
5
+ "adaln_dim": 512,
6
+ "attention_head_dim": 256,
7
+ "in_channels": 128,
8
+ "intermediate_size": 12288,
9
+ "llm_features_dim": 53248,
10
+ "mrope_section": [
11
+ 24,
12
+ 20,
13
+ 20
14
+ ],
15
+ "norm_eps": 1e-05,
16
+ "num_attention_heads": 18,
17
+ "num_layers": 34,
18
+ "rope_theta": 5000000
19
+ }
unconditional_transformer/diffusion_pytorch_model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:83f7f7d1d0a409c1e9288b11c8ec44a03c95348d46851d6c184f054b6ec4626d
3
+ size 9289792888
unconditional_transformer/diffusion_pytorch_model.safetensors.index.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"metadata": {"total_size": 9289722624}, "weight_map": {"adaln_proj.bias": "diffusion_pytorch_model.safetensors", "adaln_proj.weight": "diffusion_pytorch_model.safetensors", "adaln_proj.weight_scale": "diffusion_pytorch_model.safetensors", "embed_image_indicator.weight": "diffusion_pytorch_model.safetensors", "final_layer.adaln_modulation.bias": "diffusion_pytorch_model.safetensors", "final_layer.adaln_modulation.weight": "diffusion_pytorch_model.safetensors", "final_layer.adaln_modulation.weight_scale": "diffusion_pytorch_model.safetensors", "final_layer.linear.bias": "diffusion_pytorch_model.safetensors", "final_layer.linear.weight": "diffusion_pytorch_model.safetensors", "final_layer.linear.weight_scale": "diffusion_pytorch_model.safetensors", "input_proj.bias": "diffusion_pytorch_model.safetensors", "input_proj.weight": "diffusion_pytorch_model.safetensors", "input_proj.weight_scale": "diffusion_pytorch_model.safetensors", "layers.0.adaln_modulation.bias": "diffusion_pytorch_model.safetensors", "layers.0.adaln_modulation.weight": "diffusion_pytorch_model.safetensors", "layers.0.adaln_modulation.weight_scale": "diffusion_pytorch_model.safetensors", "layers.0.attention.norm_k.weight": "diffusion_pytorch_model.safetensors", "layers.0.attention.norm_q.weight": "diffusion_pytorch_model.safetensors", "layers.0.attention.o.weight": "diffusion_pytorch_model.safetensors", "layers.0.attention.o.weight_scale": "diffusion_pytorch_model.safetensors", "layers.0.attention.qkv.weight": "diffusion_pytorch_model.safetensors", "layers.0.attention.qkv.weight_scale": "diffusion_pytorch_model.safetensors", "layers.0.attention_norm1.weight": "diffusion_pytorch_model.safetensors", "layers.0.attention_norm2.weight": "diffusion_pytorch_model.safetensors", "layers.0.feed_forward.w1.weight": "diffusion_pytorch_model.safetensors", "layers.0.feed_forward.w1.weight_scale": "diffusion_pytorch_model.safetensors", "layers.0.feed_forward.w2.weight": "diffusion_pytorch_model.safetensors", 
"layers.0.feed_forward.w2.weight_scale": "diffusion_pytorch_model.safetensors", "layers.0.feed_forward.w3.weight": "diffusion_pytorch_model.safetensors", "layers.0.feed_forward.w3.weight_scale": "diffusion_pytorch_model.safetensors", "layers.0.ffn_norm1.weight": "diffusion_pytorch_model.safetensors", "layers.0.ffn_norm2.weight": "diffusion_pytorch_model.safetensors", "layers.1.adaln_modulation.bias": "diffusion_pytorch_model.safetensors", "layers.1.adaln_modulation.weight": "diffusion_pytorch_model.safetensors", "layers.1.adaln_modulation.weight_scale": "diffusion_pytorch_model.safetensors", "layers.1.attention.norm_k.weight": "diffusion_pytorch_model.safetensors", "layers.1.attention.norm_q.weight": "diffusion_pytorch_model.safetensors", "layers.1.attention.o.weight": "diffusion_pytorch_model.safetensors", "layers.1.attention.o.weight_scale": "diffusion_pytorch_model.safetensors", "layers.1.attention.qkv.weight": "diffusion_pytorch_model.safetensors", "layers.1.attention.qkv.weight_scale": "diffusion_pytorch_model.safetensors", "layers.1.attention_norm1.weight": "diffusion_pytorch_model.safetensors", "layers.1.attention_norm2.weight": "diffusion_pytorch_model.safetensors", "layers.1.feed_forward.w1.weight": "diffusion_pytorch_model.safetensors", "layers.1.feed_forward.w1.weight_scale": "diffusion_pytorch_model.safetensors", "layers.1.feed_forward.w2.weight": "diffusion_pytorch_model.safetensors", "layers.1.feed_forward.w2.weight_scale": "diffusion_pytorch_model.safetensors", "layers.1.feed_forward.w3.weight": "diffusion_pytorch_model.safetensors", "layers.1.feed_forward.w3.weight_scale": "diffusion_pytorch_model.safetensors", "layers.1.ffn_norm1.weight": "diffusion_pytorch_model.safetensors", "layers.1.ffn_norm2.weight": "diffusion_pytorch_model.safetensors", "layers.10.adaln_modulation.bias": "diffusion_pytorch_model.safetensors", "layers.10.adaln_modulation.weight": "diffusion_pytorch_model.safetensors", "layers.10.adaln_modulation.weight_scale": 
"diffusion_pytorch_model.safetensors", "layers.10.attention.norm_k.weight": "diffusion_pytorch_model.safetensors", "layers.10.attention.norm_q.weight": "diffusion_pytorch_model.safetensors", "layers.10.attention.o.weight": "diffusion_pytorch_model.safetensors", "layers.10.attention.o.weight_scale": "diffusion_pytorch_model.safetensors", "layers.10.attention.qkv.weight": "diffusion_pytorch_model.safetensors", "layers.10.attention.qkv.weight_scale": "diffusion_pytorch_model.safetensors", "layers.10.attention_norm1.weight": "diffusion_pytorch_model.safetensors", "layers.10.attention_norm2.weight": "diffusion_pytorch_model.safetensors", "layers.10.feed_forward.w1.weight": "diffusion_pytorch_model.safetensors", "layers.10.feed_forward.w1.weight_scale": "diffusion_pytorch_model.safetensors", "layers.10.feed_forward.w2.weight": "diffusion_pytorch_model.safetensors", "layers.10.feed_forward.w2.weight_scale": "diffusion_pytorch_model.safetensors", "layers.10.feed_forward.w3.weight": "diffusion_pytorch_model.safetensors", "layers.10.feed_forward.w3.weight_scale": "diffusion_pytorch_model.safetensors", "layers.10.ffn_norm1.weight": "diffusion_pytorch_model.safetensors", "layers.10.ffn_norm2.weight": "diffusion_pytorch_model.safetensors", "layers.11.adaln_modulation.bias": "diffusion_pytorch_model.safetensors", "layers.11.adaln_modulation.weight": "diffusion_pytorch_model.safetensors", "layers.11.adaln_modulation.weight_scale": "diffusion_pytorch_model.safetensors", "layers.11.attention.norm_k.weight": "diffusion_pytorch_model.safetensors", "layers.11.attention.norm_q.weight": "diffusion_pytorch_model.safetensors", "layers.11.attention.o.weight": "diffusion_pytorch_model.safetensors", "layers.11.attention.o.weight_scale": "diffusion_pytorch_model.safetensors", "layers.11.attention.qkv.weight": "diffusion_pytorch_model.safetensors", "layers.11.attention.qkv.weight_scale": "diffusion_pytorch_model.safetensors", "layers.11.attention_norm1.weight": 
"diffusion_pytorch_model.safetensors", "layers.11.attention_norm2.weight": "diffusion_pytorch_model.safetensors", "layers.11.feed_forward.w1.weight": "diffusion_pytorch_model.safetensors", "layers.11.feed_forward.w1.weight_scale": "diffusion_pytorch_model.safetensors", "layers.11.feed_forward.w2.weight": "diffusion_pytorch_model.safetensors", "layers.11.feed_forward.w2.weight_scale": "diffusion_pytorch_model.safetensors", "layers.11.feed_forward.w3.weight": "diffusion_pytorch_model.safetensors", "layers.11.feed_forward.w3.weight_scale": "diffusion_pytorch_model.safetensors", "layers.11.ffn_norm1.weight": "diffusion_pytorch_model.safetensors", "layers.11.ffn_norm2.weight": "diffusion_pytorch_model.safetensors", "layers.12.adaln_modulation.bias": "diffusion_pytorch_model.safetensors", "layers.12.adaln_modulation.weight": "diffusion_pytorch_model.safetensors", "layers.12.adaln_modulation.weight_scale": "diffusion_pytorch_model.safetensors", "layers.12.attention.norm_k.weight": "diffusion_pytorch_model.safetensors", "layers.12.attention.norm_q.weight": "diffusion_pytorch_model.safetensors", "layers.12.attention.o.weight": "diffusion_pytorch_model.safetensors", "layers.12.attention.o.weight_scale": "diffusion_pytorch_model.safetensors", "layers.12.attention.qkv.weight": "diffusion_pytorch_model.safetensors", "layers.12.attention.qkv.weight_scale": "diffusion_pytorch_model.safetensors", "layers.12.attention_norm1.weight": "diffusion_pytorch_model.safetensors", "layers.12.attention_norm2.weight": "diffusion_pytorch_model.safetensors", "layers.12.feed_forward.w1.weight": "diffusion_pytorch_model.safetensors", "layers.12.feed_forward.w1.weight_scale": "diffusion_pytorch_model.safetensors", "layers.12.feed_forward.w2.weight": "diffusion_pytorch_model.safetensors", "layers.12.feed_forward.w2.weight_scale": "diffusion_pytorch_model.safetensors", "layers.12.feed_forward.w3.weight": "diffusion_pytorch_model.safetensors", "layers.12.feed_forward.w3.weight_scale": 
"diffusion_pytorch_model.safetensors", "layers.12.ffn_norm1.weight": "diffusion_pytorch_model.safetensors", "layers.12.ffn_norm2.weight": "diffusion_pytorch_model.safetensors", "layers.13.adaln_modulation.bias": "diffusion_pytorch_model.safetensors", "layers.13.adaln_modulation.weight": "diffusion_pytorch_model.safetensors", "layers.13.adaln_modulation.weight_scale": "diffusion_pytorch_model.safetensors", "layers.13.attention.norm_k.weight": "diffusion_pytorch_model.safetensors", "layers.13.attention.norm_q.weight": "diffusion_pytorch_model.safetensors", "layers.13.attention.o.weight": "diffusion_pytorch_model.safetensors", "layers.13.attention.o.weight_scale": "diffusion_pytorch_model.safetensors", "layers.13.attention.qkv.weight": "diffusion_pytorch_model.safetensors", "layers.13.attention.qkv.weight_scale": "diffusion_pytorch_model.safetensors", "layers.13.attention_norm1.weight": "diffusion_pytorch_model.safetensors", "layers.13.attention_norm2.weight": "diffusion_pytorch_model.safetensors", "layers.13.feed_forward.w1.weight": "diffusion_pytorch_model.safetensors", "layers.13.feed_forward.w1.weight_scale": "diffusion_pytorch_model.safetensors", "layers.13.feed_forward.w2.weight": "diffusion_pytorch_model.safetensors", "layers.13.feed_forward.w2.weight_scale": "diffusion_pytorch_model.safetensors", "layers.13.feed_forward.w3.weight": "diffusion_pytorch_model.safetensors", "layers.13.feed_forward.w3.weight_scale": "diffusion_pytorch_model.safetensors", "layers.13.ffn_norm1.weight": "diffusion_pytorch_model.safetensors", "layers.13.ffn_norm2.weight": "diffusion_pytorch_model.safetensors", "layers.14.adaln_modulation.bias": "diffusion_pytorch_model.safetensors", "layers.14.adaln_modulation.weight": "diffusion_pytorch_model.safetensors", "layers.14.adaln_modulation.weight_scale": "diffusion_pytorch_model.safetensors", "layers.14.attention.norm_k.weight": "diffusion_pytorch_model.safetensors", "layers.14.attention.norm_q.weight": 
"diffusion_pytorch_model.safetensors", "layers.14.attention.o.weight": "diffusion_pytorch_model.safetensors", "layers.14.attention.o.weight_scale": "diffusion_pytorch_model.safetensors", "layers.14.attention.qkv.weight": "diffusion_pytorch_model.safetensors", "layers.14.attention.qkv.weight_scale": "diffusion_pytorch_model.safetensors", "layers.14.attention_norm1.weight": "diffusion_pytorch_model.safetensors", "layers.14.attention_norm2.weight": "diffusion_pytorch_model.safetensors", "layers.14.feed_forward.w1.weight": "diffusion_pytorch_model.safetensors", "layers.14.feed_forward.w1.weight_scale": "diffusion_pytorch_model.safetensors", "layers.14.feed_forward.w2.weight": "diffusion_pytorch_model.safetensors", "layers.14.feed_forward.w2.weight_scale": "diffusion_pytorch_model.safetensors", "layers.14.feed_forward.w3.weight": "diffusion_pytorch_model.safetensors", "layers.14.feed_forward.w3.weight_scale": "diffusion_pytorch_model.safetensors", "layers.14.ffn_norm1.weight": "diffusion_pytorch_model.safetensors", "layers.14.ffn_norm2.weight": "diffusion_pytorch_model.safetensors", "layers.15.adaln_modulation.bias": "diffusion_pytorch_model.safetensors", "layers.15.adaln_modulation.weight": "diffusion_pytorch_model.safetensors", "layers.15.adaln_modulation.weight_scale": "diffusion_pytorch_model.safetensors", "layers.15.attention.norm_k.weight": "diffusion_pytorch_model.safetensors", "layers.15.attention.norm_q.weight": "diffusion_pytorch_model.safetensors", "layers.15.attention.o.weight": "diffusion_pytorch_model.safetensors", "layers.15.attention.o.weight_scale": "diffusion_pytorch_model.safetensors", "layers.15.attention.qkv.weight": "diffusion_pytorch_model.safetensors", "layers.15.attention.qkv.weight_scale": "diffusion_pytorch_model.safetensors", "layers.15.attention_norm1.weight": "diffusion_pytorch_model.safetensors", "layers.15.attention_norm2.weight": "diffusion_pytorch_model.safetensors", "layers.15.feed_forward.w1.weight": 
"diffusion_pytorch_model.safetensors", "layers.15.feed_forward.w1.weight_scale": "diffusion_pytorch_model.safetensors", "layers.15.feed_forward.w2.weight": "diffusion_pytorch_model.safetensors", "layers.15.feed_forward.w2.weight_scale": "diffusion_pytorch_model.safetensors", "layers.15.feed_forward.w3.weight": "diffusion_pytorch_model.safetensors", "layers.15.feed_forward.w3.weight_scale": "diffusion_pytorch_model.safetensors", "layers.15.ffn_norm1.weight": "diffusion_pytorch_model.safetensors", "layers.15.ffn_norm2.weight": "diffusion_pytorch_model.safetensors", "layers.16.adaln_modulation.bias": "diffusion_pytorch_model.safetensors", "layers.16.adaln_modulation.weight": "diffusion_pytorch_model.safetensors", "layers.16.adaln_modulation.weight_scale": "diffusion_pytorch_model.safetensors", "layers.16.attention.norm_k.weight": "diffusion_pytorch_model.safetensors", "layers.16.attention.norm_q.weight": "diffusion_pytorch_model.safetensors", "layers.16.attention.o.weight": "diffusion_pytorch_model.safetensors", "layers.16.attention.o.weight_scale": "diffusion_pytorch_model.safetensors", "layers.16.attention.qkv.weight": "diffusion_pytorch_model.safetensors", "layers.16.attention.qkv.weight_scale": "diffusion_pytorch_model.safetensors", "layers.16.attention_norm1.weight": "diffusion_pytorch_model.safetensors", "layers.16.attention_norm2.weight": "diffusion_pytorch_model.safetensors", "layers.16.feed_forward.w1.weight": "diffusion_pytorch_model.safetensors", "layers.16.feed_forward.w1.weight_scale": "diffusion_pytorch_model.safetensors", "layers.16.feed_forward.w2.weight": "diffusion_pytorch_model.safetensors", "layers.16.feed_forward.w2.weight_scale": "diffusion_pytorch_model.safetensors", "layers.16.feed_forward.w3.weight": "diffusion_pytorch_model.safetensors", "layers.16.feed_forward.w3.weight_scale": "diffusion_pytorch_model.safetensors", "layers.16.ffn_norm1.weight": "diffusion_pytorch_model.safetensors", "layers.16.ffn_norm2.weight": 
"diffusion_pytorch_model.safetensors", "layers.17.adaln_modulation.bias": "diffusion_pytorch_model.safetensors", "layers.17.adaln_modulation.weight": "diffusion_pytorch_model.safetensors", "layers.17.adaln_modulation.weight_scale": "diffusion_pytorch_model.safetensors", "layers.17.attention.norm_k.weight": "diffusion_pytorch_model.safetensors", "layers.17.attention.norm_q.weight": "diffusion_pytorch_model.safetensors", "layers.17.attention.o.weight": "diffusion_pytorch_model.safetensors", "layers.17.attention.o.weight_scale": "diffusion_pytorch_model.safetensors", "layers.17.attention.qkv.weight": "diffusion_pytorch_model.safetensors", "layers.17.attention.qkv.weight_scale": "diffusion_pytorch_model.safetensors", "layers.17.attention_norm1.weight": "diffusion_pytorch_model.safetensors", "layers.17.attention_norm2.weight": "diffusion_pytorch_model.safetensors", "layers.17.feed_forward.w1.weight": "diffusion_pytorch_model.safetensors", "layers.17.feed_forward.w1.weight_scale": "diffusion_pytorch_model.safetensors", "layers.17.feed_forward.w2.weight": "diffusion_pytorch_model.safetensors", "layers.17.feed_forward.w2.weight_scale": "diffusion_pytorch_model.safetensors", "layers.17.feed_forward.w3.weight": "diffusion_pytorch_model.safetensors", "layers.17.feed_forward.w3.weight_scale": "diffusion_pytorch_model.safetensors", "layers.17.ffn_norm1.weight": "diffusion_pytorch_model.safetensors", "layers.17.ffn_norm2.weight": "diffusion_pytorch_model.safetensors", "layers.18.adaln_modulation.bias": "diffusion_pytorch_model.safetensors", "layers.18.adaln_modulation.weight": "diffusion_pytorch_model.safetensors", "layers.18.adaln_modulation.weight_scale": "diffusion_pytorch_model.safetensors", "layers.18.attention.norm_k.weight": "diffusion_pytorch_model.safetensors", "layers.18.attention.norm_q.weight": "diffusion_pytorch_model.safetensors", "layers.18.attention.o.weight": "diffusion_pytorch_model.safetensors", "layers.18.attention.o.weight_scale": 
"diffusion_pytorch_model.safetensors", "layers.18.attention.qkv.weight": "diffusion_pytorch_model.safetensors", "layers.18.attention.qkv.weight_scale": "diffusion_pytorch_model.safetensors", "layers.18.attention_norm1.weight": "diffusion_pytorch_model.safetensors", "layers.18.attention_norm2.weight": "diffusion_pytorch_model.safetensors", "layers.18.feed_forward.w1.weight": "diffusion_pytorch_model.safetensors", "layers.18.feed_forward.w1.weight_scale": "diffusion_pytorch_model.safetensors", "layers.18.feed_forward.w2.weight": "diffusion_pytorch_model.safetensors", "layers.18.feed_forward.w2.weight_scale": "diffusion_pytorch_model.safetensors", "layers.18.feed_forward.w3.weight": "diffusion_pytorch_model.safetensors", "layers.18.feed_forward.w3.weight_scale": "diffusion_pytorch_model.safetensors", "layers.18.ffn_norm1.weight": "diffusion_pytorch_model.safetensors", "layers.18.ffn_norm2.weight": "diffusion_pytorch_model.safetensors", "layers.19.adaln_modulation.bias": "diffusion_pytorch_model.safetensors", "layers.19.adaln_modulation.weight": "diffusion_pytorch_model.safetensors", "layers.19.adaln_modulation.weight_scale": "diffusion_pytorch_model.safetensors", "layers.19.attention.norm_k.weight": "diffusion_pytorch_model.safetensors", "layers.19.attention.norm_q.weight": "diffusion_pytorch_model.safetensors", "layers.19.attention.o.weight": "diffusion_pytorch_model.safetensors", "layers.19.attention.o.weight_scale": "diffusion_pytorch_model.safetensors", "layers.19.attention.qkv.weight": "diffusion_pytorch_model.safetensors", "layers.19.attention.qkv.weight_scale": "diffusion_pytorch_model.safetensors", "layers.19.attention_norm1.weight": "diffusion_pytorch_model.safetensors", "layers.19.attention_norm2.weight": "diffusion_pytorch_model.safetensors", "layers.19.feed_forward.w1.weight": "diffusion_pytorch_model.safetensors", "layers.19.feed_forward.w1.weight_scale": "diffusion_pytorch_model.safetensors", "layers.19.feed_forward.w2.weight": 
"diffusion_pytorch_model.safetensors", "layers.19.feed_forward.w2.weight_scale": "diffusion_pytorch_model.safetensors", "layers.19.feed_forward.w3.weight": "diffusion_pytorch_model.safetensors", "layers.19.feed_forward.w3.weight_scale": "diffusion_pytorch_model.safetensors", "layers.19.ffn_norm1.weight": "diffusion_pytorch_model.safetensors", "layers.19.ffn_norm2.weight": "diffusion_pytorch_model.safetensors", "layers.2.adaln_modulation.bias": "diffusion_pytorch_model.safetensors", "layers.2.adaln_modulation.weight": "diffusion_pytorch_model.safetensors", "layers.2.adaln_modulation.weight_scale": "diffusion_pytorch_model.safetensors", "layers.2.attention.norm_k.weight": "diffusion_pytorch_model.safetensors", "layers.2.attention.norm_q.weight": "diffusion_pytorch_model.safetensors", "layers.2.attention.o.weight": "diffusion_pytorch_model.safetensors", "layers.2.attention.o.weight_scale": "diffusion_pytorch_model.safetensors", "layers.2.attention.qkv.weight": "diffusion_pytorch_model.safetensors", "layers.2.attention.qkv.weight_scale": "diffusion_pytorch_model.safetensors", "layers.2.attention_norm1.weight": "diffusion_pytorch_model.safetensors", "layers.2.attention_norm2.weight": "diffusion_pytorch_model.safetensors", "layers.2.feed_forward.w1.weight": "diffusion_pytorch_model.safetensors", "layers.2.feed_forward.w1.weight_scale": "diffusion_pytorch_model.safetensors", "layers.2.feed_forward.w2.weight": "diffusion_pytorch_model.safetensors", "layers.2.feed_forward.w2.weight_scale": "diffusion_pytorch_model.safetensors", "layers.2.feed_forward.w3.weight": "diffusion_pytorch_model.safetensors", "layers.2.feed_forward.w3.weight_scale": "diffusion_pytorch_model.safetensors", "layers.2.ffn_norm1.weight": "diffusion_pytorch_model.safetensors", "layers.2.ffn_norm2.weight": "diffusion_pytorch_model.safetensors", "layers.20.adaln_modulation.bias": "diffusion_pytorch_model.safetensors", "layers.20.adaln_modulation.weight": "diffusion_pytorch_model.safetensors", 
"layers.20.adaln_modulation.weight_scale": "diffusion_pytorch_model.safetensors", "layers.20.attention.norm_k.weight": "diffusion_pytorch_model.safetensors", "layers.20.attention.norm_q.weight": "diffusion_pytorch_model.safetensors", "layers.20.attention.o.weight": "diffusion_pytorch_model.safetensors", "layers.20.attention.o.weight_scale": "diffusion_pytorch_model.safetensors", "layers.20.attention.qkv.weight": "diffusion_pytorch_model.safetensors", "layers.20.attention.qkv.weight_scale": "diffusion_pytorch_model.safetensors", "layers.20.attention_norm1.weight": "diffusion_pytorch_model.safetensors", "layers.20.attention_norm2.weight": "diffusion_pytorch_model.safetensors", "layers.20.feed_forward.w1.weight": "diffusion_pytorch_model.safetensors", "layers.20.feed_forward.w1.weight_scale": "diffusion_pytorch_model.safetensors", "layers.20.feed_forward.w2.weight": "diffusion_pytorch_model.safetensors", "layers.20.feed_forward.w2.weight_scale": "diffusion_pytorch_model.safetensors", "layers.20.feed_forward.w3.weight": "diffusion_pytorch_model.safetensors", "layers.20.feed_forward.w3.weight_scale": "diffusion_pytorch_model.safetensors", "layers.20.ffn_norm1.weight": "diffusion_pytorch_model.safetensors", "layers.20.ffn_norm2.weight": "diffusion_pytorch_model.safetensors", "layers.21.adaln_modulation.bias": "diffusion_pytorch_model.safetensors", "layers.21.adaln_modulation.weight": "diffusion_pytorch_model.safetensors", "layers.21.adaln_modulation.weight_scale": "diffusion_pytorch_model.safetensors", "layers.21.attention.norm_k.weight": "diffusion_pytorch_model.safetensors", "layers.21.attention.norm_q.weight": "diffusion_pytorch_model.safetensors", "layers.21.attention.o.weight": "diffusion_pytorch_model.safetensors", "layers.21.attention.o.weight_scale": "diffusion_pytorch_model.safetensors", "layers.21.attention.qkv.weight": "diffusion_pytorch_model.safetensors", "layers.21.attention.qkv.weight_scale": "diffusion_pytorch_model.safetensors", 
"layers.21.attention_norm1.weight": "diffusion_pytorch_model.safetensors", "layers.21.attention_norm2.weight": "diffusion_pytorch_model.safetensors", "layers.21.feed_forward.w1.weight": "diffusion_pytorch_model.safetensors", "layers.21.feed_forward.w1.weight_scale": "diffusion_pytorch_model.safetensors", "layers.21.feed_forward.w2.weight": "diffusion_pytorch_model.safetensors", "layers.21.feed_forward.w2.weight_scale": "diffusion_pytorch_model.safetensors", "layers.21.feed_forward.w3.weight": "diffusion_pytorch_model.safetensors", "layers.21.feed_forward.w3.weight_scale": "diffusion_pytorch_model.safetensors", "layers.21.ffn_norm1.weight": "diffusion_pytorch_model.safetensors", "layers.21.ffn_norm2.weight": "diffusion_pytorch_model.safetensors", "layers.22.adaln_modulation.bias": "diffusion_pytorch_model.safetensors", "layers.22.adaln_modulation.weight": "diffusion_pytorch_model.safetensors", "layers.22.adaln_modulation.weight_scale": "diffusion_pytorch_model.safetensors", "layers.22.attention.norm_k.weight": "diffusion_pytorch_model.safetensors", "layers.22.attention.norm_q.weight": "diffusion_pytorch_model.safetensors", "layers.22.attention.o.weight": "diffusion_pytorch_model.safetensors", "layers.22.attention.o.weight_scale": "diffusion_pytorch_model.safetensors", "layers.22.attention.qkv.weight": "diffusion_pytorch_model.safetensors", "layers.22.attention.qkv.weight_scale": "diffusion_pytorch_model.safetensors", "layers.22.attention_norm1.weight": "diffusion_pytorch_model.safetensors", "layers.22.attention_norm2.weight": "diffusion_pytorch_model.safetensors", "layers.22.feed_forward.w1.weight": "diffusion_pytorch_model.safetensors", "layers.22.feed_forward.w1.weight_scale": "diffusion_pytorch_model.safetensors", "layers.22.feed_forward.w2.weight": "diffusion_pytorch_model.safetensors", "layers.22.feed_forward.w2.weight_scale": "diffusion_pytorch_model.safetensors", "layers.22.feed_forward.w3.weight": "diffusion_pytorch_model.safetensors", 
"layers.22.feed_forward.w3.weight_scale": "diffusion_pytorch_model.safetensors", "layers.22.ffn_norm1.weight": "diffusion_pytorch_model.safetensors", "layers.22.ffn_norm2.weight": "diffusion_pytorch_model.safetensors", "layers.23.adaln_modulation.bias": "diffusion_pytorch_model.safetensors", "layers.23.adaln_modulation.weight": "diffusion_pytorch_model.safetensors", "layers.23.adaln_modulation.weight_scale": "diffusion_pytorch_model.safetensors", "layers.23.attention.norm_k.weight": "diffusion_pytorch_model.safetensors", "layers.23.attention.norm_q.weight": "diffusion_pytorch_model.safetensors", "layers.23.attention.o.weight": "diffusion_pytorch_model.safetensors", "layers.23.attention.o.weight_scale": "diffusion_pytorch_model.safetensors", "layers.23.attention.qkv.weight": "diffusion_pytorch_model.safetensors", "layers.23.attention.qkv.weight_scale": "diffusion_pytorch_model.safetensors", "layers.23.attention_norm1.weight": "diffusion_pytorch_model.safetensors", "layers.23.attention_norm2.weight": "diffusion_pytorch_model.safetensors", "layers.23.feed_forward.w1.weight": "diffusion_pytorch_model.safetensors", "layers.23.feed_forward.w1.weight_scale": "diffusion_pytorch_model.safetensors", "layers.23.feed_forward.w2.weight": "diffusion_pytorch_model.safetensors", "layers.23.feed_forward.w2.weight_scale": "diffusion_pytorch_model.safetensors", "layers.23.feed_forward.w3.weight": "diffusion_pytorch_model.safetensors", "layers.23.feed_forward.w3.weight_scale": "diffusion_pytorch_model.safetensors", "layers.23.ffn_norm1.weight": "diffusion_pytorch_model.safetensors", "layers.23.ffn_norm2.weight": "diffusion_pytorch_model.safetensors", "layers.24.adaln_modulation.bias": "diffusion_pytorch_model.safetensors", "layers.24.adaln_modulation.weight": "diffusion_pytorch_model.safetensors", "layers.24.adaln_modulation.weight_scale": "diffusion_pytorch_model.safetensors", "layers.24.attention.norm_k.weight": "diffusion_pytorch_model.safetensors", 
"layers.24.attention.norm_q.weight": "diffusion_pytorch_model.safetensors", "layers.24.attention.o.weight": "diffusion_pytorch_model.safetensors", "layers.24.attention.o.weight_scale": "diffusion_pytorch_model.safetensors", "layers.24.attention.qkv.weight": "diffusion_pytorch_model.safetensors", "layers.24.attention.qkv.weight_scale": "diffusion_pytorch_model.safetensors", "layers.24.attention_norm1.weight": "diffusion_pytorch_model.safetensors", "layers.24.attention_norm2.weight": "diffusion_pytorch_model.safetensors", "layers.24.feed_forward.w1.weight": "diffusion_pytorch_model.safetensors", "layers.24.feed_forward.w1.weight_scale": "diffusion_pytorch_model.safetensors", "layers.24.feed_forward.w2.weight": "diffusion_pytorch_model.safetensors", "layers.24.feed_forward.w2.weight_scale": "diffusion_pytorch_model.safetensors", "layers.24.feed_forward.w3.weight": "diffusion_pytorch_model.safetensors", "layers.24.feed_forward.w3.weight_scale": "diffusion_pytorch_model.safetensors", "layers.24.ffn_norm1.weight": "diffusion_pytorch_model.safetensors", "layers.24.ffn_norm2.weight": "diffusion_pytorch_model.safetensors", "layers.25.adaln_modulation.bias": "diffusion_pytorch_model.safetensors", "layers.25.adaln_modulation.weight": "diffusion_pytorch_model.safetensors", "layers.25.adaln_modulation.weight_scale": "diffusion_pytorch_model.safetensors", "layers.25.attention.norm_k.weight": "diffusion_pytorch_model.safetensors", "layers.25.attention.norm_q.weight": "diffusion_pytorch_model.safetensors", "layers.25.attention.o.weight": "diffusion_pytorch_model.safetensors", "layers.25.attention.o.weight_scale": "diffusion_pytorch_model.safetensors", "layers.25.attention.qkv.weight": "diffusion_pytorch_model.safetensors", "layers.25.attention.qkv.weight_scale": "diffusion_pytorch_model.safetensors", "layers.25.attention_norm1.weight": "diffusion_pytorch_model.safetensors", "layers.25.attention_norm2.weight": "diffusion_pytorch_model.safetensors", 
"layers.25.feed_forward.w1.weight": "diffusion_pytorch_model.safetensors", "layers.25.feed_forward.w1.weight_scale": "diffusion_pytorch_model.safetensors", "layers.25.feed_forward.w2.weight": "diffusion_pytorch_model.safetensors", "layers.25.feed_forward.w2.weight_scale": "diffusion_pytorch_model.safetensors", "layers.25.feed_forward.w3.weight": "diffusion_pytorch_model.safetensors", "layers.25.feed_forward.w3.weight_scale": "diffusion_pytorch_model.safetensors", "layers.25.ffn_norm1.weight": "diffusion_pytorch_model.safetensors", "layers.25.ffn_norm2.weight": "diffusion_pytorch_model.safetensors", "layers.26.adaln_modulation.bias": "diffusion_pytorch_model.safetensors", "layers.26.adaln_modulation.weight": "diffusion_pytorch_model.safetensors", "layers.26.adaln_modulation.weight_scale": "diffusion_pytorch_model.safetensors", "layers.26.attention.norm_k.weight": "diffusion_pytorch_model.safetensors", "layers.26.attention.norm_q.weight": "diffusion_pytorch_model.safetensors", "layers.26.attention.o.weight": "diffusion_pytorch_model.safetensors", "layers.26.attention.o.weight_scale": "diffusion_pytorch_model.safetensors", "layers.26.attention.qkv.weight": "diffusion_pytorch_model.safetensors", "layers.26.attention.qkv.weight_scale": "diffusion_pytorch_model.safetensors", "layers.26.attention_norm1.weight": "diffusion_pytorch_model.safetensors", "layers.26.attention_norm2.weight": "diffusion_pytorch_model.safetensors", "layers.26.feed_forward.w1.weight": "diffusion_pytorch_model.safetensors", "layers.26.feed_forward.w1.weight_scale": "diffusion_pytorch_model.safetensors", "layers.26.feed_forward.w2.weight": "diffusion_pytorch_model.safetensors", "layers.26.feed_forward.w2.weight_scale": "diffusion_pytorch_model.safetensors", "layers.26.feed_forward.w3.weight": "diffusion_pytorch_model.safetensors", "layers.26.feed_forward.w3.weight_scale": "diffusion_pytorch_model.safetensors", "layers.26.ffn_norm1.weight": "diffusion_pytorch_model.safetensors", 
"layers.26.ffn_norm2.weight": "diffusion_pytorch_model.safetensors", "layers.27.adaln_modulation.bias": "diffusion_pytorch_model.safetensors", "layers.27.adaln_modulation.weight": "diffusion_pytorch_model.safetensors", "layers.27.adaln_modulation.weight_scale": "diffusion_pytorch_model.safetensors", "layers.27.attention.norm_k.weight": "diffusion_pytorch_model.safetensors", "layers.27.attention.norm_q.weight": "diffusion_pytorch_model.safetensors", "layers.27.attention.o.weight": "diffusion_pytorch_model.safetensors", "layers.27.attention.o.weight_scale": "diffusion_pytorch_model.safetensors", "layers.27.attention.qkv.weight": "diffusion_pytorch_model.safetensors", "layers.27.attention.qkv.weight_scale": "diffusion_pytorch_model.safetensors", "layers.27.attention_norm1.weight": "diffusion_pytorch_model.safetensors", "layers.27.attention_norm2.weight": "diffusion_pytorch_model.safetensors", "layers.27.feed_forward.w1.weight": "diffusion_pytorch_model.safetensors", "layers.27.feed_forward.w1.weight_scale": "diffusion_pytorch_model.safetensors", "layers.27.feed_forward.w2.weight": "diffusion_pytorch_model.safetensors", "layers.27.feed_forward.w2.weight_scale": "diffusion_pytorch_model.safetensors", "layers.27.feed_forward.w3.weight": "diffusion_pytorch_model.safetensors", "layers.27.feed_forward.w3.weight_scale": "diffusion_pytorch_model.safetensors", "layers.27.ffn_norm1.weight": "diffusion_pytorch_model.safetensors", "layers.27.ffn_norm2.weight": "diffusion_pytorch_model.safetensors", "layers.28.adaln_modulation.bias": "diffusion_pytorch_model.safetensors", "layers.28.adaln_modulation.weight": "diffusion_pytorch_model.safetensors", "layers.28.adaln_modulation.weight_scale": "diffusion_pytorch_model.safetensors", "layers.28.attention.norm_k.weight": "diffusion_pytorch_model.safetensors", "layers.28.attention.norm_q.weight": "diffusion_pytorch_model.safetensors", "layers.28.attention.o.weight": "diffusion_pytorch_model.safetensors", 
"layers.28.attention.o.weight_scale": "diffusion_pytorch_model.safetensors", "layers.28.attention.qkv.weight": "diffusion_pytorch_model.safetensors", "layers.28.attention.qkv.weight_scale": "diffusion_pytorch_model.safetensors", "layers.28.attention_norm1.weight": "diffusion_pytorch_model.safetensors", "layers.28.attention_norm2.weight": "diffusion_pytorch_model.safetensors", "layers.28.feed_forward.w1.weight": "diffusion_pytorch_model.safetensors", "layers.28.feed_forward.w1.weight_scale": "diffusion_pytorch_model.safetensors", "layers.28.feed_forward.w2.weight": "diffusion_pytorch_model.safetensors", "layers.28.feed_forward.w2.weight_scale": "diffusion_pytorch_model.safetensors", "layers.28.feed_forward.w3.weight": "diffusion_pytorch_model.safetensors", "layers.28.feed_forward.w3.weight_scale": "diffusion_pytorch_model.safetensors", "layers.28.ffn_norm1.weight": "diffusion_pytorch_model.safetensors", "layers.28.ffn_norm2.weight": "diffusion_pytorch_model.safetensors", "layers.29.adaln_modulation.bias": "diffusion_pytorch_model.safetensors", "layers.29.adaln_modulation.weight": "diffusion_pytorch_model.safetensors", "layers.29.adaln_modulation.weight_scale": "diffusion_pytorch_model.safetensors", "layers.29.attention.norm_k.weight": "diffusion_pytorch_model.safetensors", "layers.29.attention.norm_q.weight": "diffusion_pytorch_model.safetensors", "layers.29.attention.o.weight": "diffusion_pytorch_model.safetensors", "layers.29.attention.o.weight_scale": "diffusion_pytorch_model.safetensors", "layers.29.attention.qkv.weight": "diffusion_pytorch_model.safetensors", "layers.29.attention.qkv.weight_scale": "diffusion_pytorch_model.safetensors", "layers.29.attention_norm1.weight": "diffusion_pytorch_model.safetensors", "layers.29.attention_norm2.weight": "diffusion_pytorch_model.safetensors", "layers.29.feed_forward.w1.weight": "diffusion_pytorch_model.safetensors", "layers.29.feed_forward.w1.weight_scale": "diffusion_pytorch_model.safetensors", 
"layers.29.feed_forward.w2.weight": "diffusion_pytorch_model.safetensors", "layers.29.feed_forward.w2.weight_scale": "diffusion_pytorch_model.safetensors", "layers.29.feed_forward.w3.weight": "diffusion_pytorch_model.safetensors", "layers.29.feed_forward.w3.weight_scale": "diffusion_pytorch_model.safetensors", "layers.29.ffn_norm1.weight": "diffusion_pytorch_model.safetensors", "layers.29.ffn_norm2.weight": "diffusion_pytorch_model.safetensors", "layers.3.adaln_modulation.bias": "diffusion_pytorch_model.safetensors", "layers.3.adaln_modulation.weight": "diffusion_pytorch_model.safetensors", "layers.3.adaln_modulation.weight_scale": "diffusion_pytorch_model.safetensors", "layers.3.attention.norm_k.weight": "diffusion_pytorch_model.safetensors", "layers.3.attention.norm_q.weight": "diffusion_pytorch_model.safetensors", "layers.3.attention.o.weight": "diffusion_pytorch_model.safetensors", "layers.3.attention.o.weight_scale": "diffusion_pytorch_model.safetensors", "layers.3.attention.qkv.weight": "diffusion_pytorch_model.safetensors", "layers.3.attention.qkv.weight_scale": "diffusion_pytorch_model.safetensors", "layers.3.attention_norm1.weight": "diffusion_pytorch_model.safetensors", "layers.3.attention_norm2.weight": "diffusion_pytorch_model.safetensors", "layers.3.feed_forward.w1.weight": "diffusion_pytorch_model.safetensors", "layers.3.feed_forward.w1.weight_scale": "diffusion_pytorch_model.safetensors", "layers.3.feed_forward.w2.weight": "diffusion_pytorch_model.safetensors", "layers.3.feed_forward.w2.weight_scale": "diffusion_pytorch_model.safetensors", "layers.3.feed_forward.w3.weight": "diffusion_pytorch_model.safetensors", "layers.3.feed_forward.w3.weight_scale": "diffusion_pytorch_model.safetensors", "layers.3.ffn_norm1.weight": "diffusion_pytorch_model.safetensors", "layers.3.ffn_norm2.weight": "diffusion_pytorch_model.safetensors", "layers.30.adaln_modulation.bias": "diffusion_pytorch_model.safetensors", "layers.30.adaln_modulation.weight": 
"diffusion_pytorch_model.safetensors", "layers.30.adaln_modulation.weight_scale": "diffusion_pytorch_model.safetensors", "layers.30.attention.norm_k.weight": "diffusion_pytorch_model.safetensors", "layers.30.attention.norm_q.weight": "diffusion_pytorch_model.safetensors", "layers.30.attention.o.weight": "diffusion_pytorch_model.safetensors", "layers.30.attention.o.weight_scale": "diffusion_pytorch_model.safetensors", "layers.30.attention.qkv.weight": "diffusion_pytorch_model.safetensors", "layers.30.attention.qkv.weight_scale": "diffusion_pytorch_model.safetensors", "layers.30.attention_norm1.weight": "diffusion_pytorch_model.safetensors", "layers.30.attention_norm2.weight": "diffusion_pytorch_model.safetensors", "layers.30.feed_forward.w1.weight": "diffusion_pytorch_model.safetensors", "layers.30.feed_forward.w1.weight_scale": "diffusion_pytorch_model.safetensors", "layers.30.feed_forward.w2.weight": "diffusion_pytorch_model.safetensors", "layers.30.feed_forward.w2.weight_scale": "diffusion_pytorch_model.safetensors", "layers.30.feed_forward.w3.weight": "diffusion_pytorch_model.safetensors", "layers.30.feed_forward.w3.weight_scale": "diffusion_pytorch_model.safetensors", "layers.30.ffn_norm1.weight": "diffusion_pytorch_model.safetensors", "layers.30.ffn_norm2.weight": "diffusion_pytorch_model.safetensors", "layers.31.adaln_modulation.bias": "diffusion_pytorch_model.safetensors", "layers.31.adaln_modulation.weight": "diffusion_pytorch_model.safetensors", "layers.31.adaln_modulation.weight_scale": "diffusion_pytorch_model.safetensors", "layers.31.attention.norm_k.weight": "diffusion_pytorch_model.safetensors", "layers.31.attention.norm_q.weight": "diffusion_pytorch_model.safetensors", "layers.31.attention.o.weight": "diffusion_pytorch_model.safetensors", "layers.31.attention.o.weight_scale": "diffusion_pytorch_model.safetensors", "layers.31.attention.qkv.weight": "diffusion_pytorch_model.safetensors", "layers.31.attention.qkv.weight_scale": 
"diffusion_pytorch_model.safetensors", "layers.31.attention_norm1.weight": "diffusion_pytorch_model.safetensors", "layers.31.attention_norm2.weight": "diffusion_pytorch_model.safetensors", "layers.31.feed_forward.w1.weight": "diffusion_pytorch_model.safetensors", "layers.31.feed_forward.w1.weight_scale": "diffusion_pytorch_model.safetensors", "layers.31.feed_forward.w2.weight": "diffusion_pytorch_model.safetensors", "layers.31.feed_forward.w2.weight_scale": "diffusion_pytorch_model.safetensors", "layers.31.feed_forward.w3.weight": "diffusion_pytorch_model.safetensors", "layers.31.feed_forward.w3.weight_scale": "diffusion_pytorch_model.safetensors", "layers.31.ffn_norm1.weight": "diffusion_pytorch_model.safetensors", "layers.31.ffn_norm2.weight": "diffusion_pytorch_model.safetensors", "layers.32.adaln_modulation.bias": "diffusion_pytorch_model.safetensors", "layers.32.adaln_modulation.weight": "diffusion_pytorch_model.safetensors", "layers.32.adaln_modulation.weight_scale": "diffusion_pytorch_model.safetensors", "layers.32.attention.norm_k.weight": "diffusion_pytorch_model.safetensors", "layers.32.attention.norm_q.weight": "diffusion_pytorch_model.safetensors", "layers.32.attention.o.weight": "diffusion_pytorch_model.safetensors", "layers.32.attention.o.weight_scale": "diffusion_pytorch_model.safetensors", "layers.32.attention.qkv.weight": "diffusion_pytorch_model.safetensors", "layers.32.attention.qkv.weight_scale": "diffusion_pytorch_model.safetensors", "layers.32.attention_norm1.weight": "diffusion_pytorch_model.safetensors", "layers.32.attention_norm2.weight": "diffusion_pytorch_model.safetensors", "layers.32.feed_forward.w1.weight": "diffusion_pytorch_model.safetensors", "layers.32.feed_forward.w1.weight_scale": "diffusion_pytorch_model.safetensors", "layers.32.feed_forward.w2.weight": "diffusion_pytorch_model.safetensors", "layers.32.feed_forward.w2.weight_scale": "diffusion_pytorch_model.safetensors", "layers.32.feed_forward.w3.weight": 
"diffusion_pytorch_model.safetensors", "layers.32.feed_forward.w3.weight_scale": "diffusion_pytorch_model.safetensors", "layers.32.ffn_norm1.weight": "diffusion_pytorch_model.safetensors", "layers.32.ffn_norm2.weight": "diffusion_pytorch_model.safetensors", "layers.33.adaln_modulation.bias": "diffusion_pytorch_model.safetensors", "layers.33.adaln_modulation.weight": "diffusion_pytorch_model.safetensors", "layers.33.adaln_modulation.weight_scale": "diffusion_pytorch_model.safetensors", "layers.33.attention.norm_k.weight": "diffusion_pytorch_model.safetensors", "layers.33.attention.norm_q.weight": "diffusion_pytorch_model.safetensors", "layers.33.attention.o.weight": "diffusion_pytorch_model.safetensors", "layers.33.attention.o.weight_scale": "diffusion_pytorch_model.safetensors", "layers.33.attention.qkv.weight": "diffusion_pytorch_model.safetensors", "layers.33.attention.qkv.weight_scale": "diffusion_pytorch_model.safetensors", "layers.33.attention_norm1.weight": "diffusion_pytorch_model.safetensors", "layers.33.attention_norm2.weight": "diffusion_pytorch_model.safetensors", "layers.33.feed_forward.w1.weight": "diffusion_pytorch_model.safetensors", "layers.33.feed_forward.w1.weight_scale": "diffusion_pytorch_model.safetensors", "layers.33.feed_forward.w2.weight": "diffusion_pytorch_model.safetensors", "layers.33.feed_forward.w2.weight_scale": "diffusion_pytorch_model.safetensors", "layers.33.feed_forward.w3.weight": "diffusion_pytorch_model.safetensors", "layers.33.feed_forward.w3.weight_scale": "diffusion_pytorch_model.safetensors", "layers.33.ffn_norm1.weight": "diffusion_pytorch_model.safetensors", "layers.33.ffn_norm2.weight": "diffusion_pytorch_model.safetensors", "layers.4.adaln_modulation.bias": "diffusion_pytorch_model.safetensors", "layers.4.adaln_modulation.weight": "diffusion_pytorch_model.safetensors", "layers.4.adaln_modulation.weight_scale": "diffusion_pytorch_model.safetensors", "layers.4.attention.norm_k.weight": 
"diffusion_pytorch_model.safetensors", "layers.4.attention.norm_q.weight": "diffusion_pytorch_model.safetensors", "layers.4.attention.o.weight": "diffusion_pytorch_model.safetensors", "layers.4.attention.o.weight_scale": "diffusion_pytorch_model.safetensors", "layers.4.attention.qkv.weight": "diffusion_pytorch_model.safetensors", "layers.4.attention.qkv.weight_scale": "diffusion_pytorch_model.safetensors", "layers.4.attention_norm1.weight": "diffusion_pytorch_model.safetensors", "layers.4.attention_norm2.weight": "diffusion_pytorch_model.safetensors", "layers.4.feed_forward.w1.weight": "diffusion_pytorch_model.safetensors", "layers.4.feed_forward.w1.weight_scale": "diffusion_pytorch_model.safetensors", "layers.4.feed_forward.w2.weight": "diffusion_pytorch_model.safetensors", "layers.4.feed_forward.w2.weight_scale": "diffusion_pytorch_model.safetensors", "layers.4.feed_forward.w3.weight": "diffusion_pytorch_model.safetensors", "layers.4.feed_forward.w3.weight_scale": "diffusion_pytorch_model.safetensors", "layers.4.ffn_norm1.weight": "diffusion_pytorch_model.safetensors", "layers.4.ffn_norm2.weight": "diffusion_pytorch_model.safetensors", "layers.5.adaln_modulation.bias": "diffusion_pytorch_model.safetensors", "layers.5.adaln_modulation.weight": "diffusion_pytorch_model.safetensors", "layers.5.adaln_modulation.weight_scale": "diffusion_pytorch_model.safetensors", "layers.5.attention.norm_k.weight": "diffusion_pytorch_model.safetensors", "layers.5.attention.norm_q.weight": "diffusion_pytorch_model.safetensors", "layers.5.attention.o.weight": "diffusion_pytorch_model.safetensors", "layers.5.attention.o.weight_scale": "diffusion_pytorch_model.safetensors", "layers.5.attention.qkv.weight": "diffusion_pytorch_model.safetensors", "layers.5.attention.qkv.weight_scale": "diffusion_pytorch_model.safetensors", "layers.5.attention_norm1.weight": "diffusion_pytorch_model.safetensors", "layers.5.attention_norm2.weight": "diffusion_pytorch_model.safetensors", 
"layers.5.feed_forward.w1.weight": "diffusion_pytorch_model.safetensors", "layers.5.feed_forward.w1.weight_scale": "diffusion_pytorch_model.safetensors", "layers.5.feed_forward.w2.weight": "diffusion_pytorch_model.safetensors", "layers.5.feed_forward.w2.weight_scale": "diffusion_pytorch_model.safetensors", "layers.5.feed_forward.w3.weight": "diffusion_pytorch_model.safetensors", "layers.5.feed_forward.w3.weight_scale": "diffusion_pytorch_model.safetensors", "layers.5.ffn_norm1.weight": "diffusion_pytorch_model.safetensors", "layers.5.ffn_norm2.weight": "diffusion_pytorch_model.safetensors", "layers.6.adaln_modulation.bias": "diffusion_pytorch_model.safetensors", "layers.6.adaln_modulation.weight": "diffusion_pytorch_model.safetensors", "layers.6.adaln_modulation.weight_scale": "diffusion_pytorch_model.safetensors", "layers.6.attention.norm_k.weight": "diffusion_pytorch_model.safetensors", "layers.6.attention.norm_q.weight": "diffusion_pytorch_model.safetensors", "layers.6.attention.o.weight": "diffusion_pytorch_model.safetensors", "layers.6.attention.o.weight_scale": "diffusion_pytorch_model.safetensors", "layers.6.attention.qkv.weight": "diffusion_pytorch_model.safetensors", "layers.6.attention.qkv.weight_scale": "diffusion_pytorch_model.safetensors", "layers.6.attention_norm1.weight": "diffusion_pytorch_model.safetensors", "layers.6.attention_norm2.weight": "diffusion_pytorch_model.safetensors", "layers.6.feed_forward.w1.weight": "diffusion_pytorch_model.safetensors", "layers.6.feed_forward.w1.weight_scale": "diffusion_pytorch_model.safetensors", "layers.6.feed_forward.w2.weight": "diffusion_pytorch_model.safetensors", "layers.6.feed_forward.w2.weight_scale": "diffusion_pytorch_model.safetensors", "layers.6.feed_forward.w3.weight": "diffusion_pytorch_model.safetensors", "layers.6.feed_forward.w3.weight_scale": "diffusion_pytorch_model.safetensors", "layers.6.ffn_norm1.weight": "diffusion_pytorch_model.safetensors", "layers.6.ffn_norm2.weight": 
"diffusion_pytorch_model.safetensors", "layers.7.adaln_modulation.bias": "diffusion_pytorch_model.safetensors", "layers.7.adaln_modulation.weight": "diffusion_pytorch_model.safetensors", "layers.7.adaln_modulation.weight_scale": "diffusion_pytorch_model.safetensors", "layers.7.attention.norm_k.weight": "diffusion_pytorch_model.safetensors", "layers.7.attention.norm_q.weight": "diffusion_pytorch_model.safetensors", "layers.7.attention.o.weight": "diffusion_pytorch_model.safetensors", "layers.7.attention.o.weight_scale": "diffusion_pytorch_model.safetensors", "layers.7.attention.qkv.weight": "diffusion_pytorch_model.safetensors", "layers.7.attention.qkv.weight_scale": "diffusion_pytorch_model.safetensors", "layers.7.attention_norm1.weight": "diffusion_pytorch_model.safetensors", "layers.7.attention_norm2.weight": "diffusion_pytorch_model.safetensors", "layers.7.feed_forward.w1.weight": "diffusion_pytorch_model.safetensors", "layers.7.feed_forward.w1.weight_scale": "diffusion_pytorch_model.safetensors", "layers.7.feed_forward.w2.weight": "diffusion_pytorch_model.safetensors", "layers.7.feed_forward.w2.weight_scale": "diffusion_pytorch_model.safetensors", "layers.7.feed_forward.w3.weight": "diffusion_pytorch_model.safetensors", "layers.7.feed_forward.w3.weight_scale": "diffusion_pytorch_model.safetensors", "layers.7.ffn_norm1.weight": "diffusion_pytorch_model.safetensors", "layers.7.ffn_norm2.weight": "diffusion_pytorch_model.safetensors", "layers.8.adaln_modulation.bias": "diffusion_pytorch_model.safetensors", "layers.8.adaln_modulation.weight": "diffusion_pytorch_model.safetensors", "layers.8.adaln_modulation.weight_scale": "diffusion_pytorch_model.safetensors", "layers.8.attention.norm_k.weight": "diffusion_pytorch_model.safetensors", "layers.8.attention.norm_q.weight": "diffusion_pytorch_model.safetensors", "layers.8.attention.o.weight": "diffusion_pytorch_model.safetensors", "layers.8.attention.o.weight_scale": "diffusion_pytorch_model.safetensors", 
"layers.8.attention.qkv.weight": "diffusion_pytorch_model.safetensors", "layers.8.attention.qkv.weight_scale": "diffusion_pytorch_model.safetensors", "layers.8.attention_norm1.weight": "diffusion_pytorch_model.safetensors", "layers.8.attention_norm2.weight": "diffusion_pytorch_model.safetensors", "layers.8.feed_forward.w1.weight": "diffusion_pytorch_model.safetensors", "layers.8.feed_forward.w1.weight_scale": "diffusion_pytorch_model.safetensors", "layers.8.feed_forward.w2.weight": "diffusion_pytorch_model.safetensors", "layers.8.feed_forward.w2.weight_scale": "diffusion_pytorch_model.safetensors", "layers.8.feed_forward.w3.weight": "diffusion_pytorch_model.safetensors", "layers.8.feed_forward.w3.weight_scale": "diffusion_pytorch_model.safetensors", "layers.8.ffn_norm1.weight": "diffusion_pytorch_model.safetensors", "layers.8.ffn_norm2.weight": "diffusion_pytorch_model.safetensors", "layers.9.adaln_modulation.bias": "diffusion_pytorch_model.safetensors", "layers.9.adaln_modulation.weight": "diffusion_pytorch_model.safetensors", "layers.9.adaln_modulation.weight_scale": "diffusion_pytorch_model.safetensors", "layers.9.attention.norm_k.weight": "diffusion_pytorch_model.safetensors", "layers.9.attention.norm_q.weight": "diffusion_pytorch_model.safetensors", "layers.9.attention.o.weight": "diffusion_pytorch_model.safetensors", "layers.9.attention.o.weight_scale": "diffusion_pytorch_model.safetensors", "layers.9.attention.qkv.weight": "diffusion_pytorch_model.safetensors", "layers.9.attention.qkv.weight_scale": "diffusion_pytorch_model.safetensors", "layers.9.attention_norm1.weight": "diffusion_pytorch_model.safetensors", "layers.9.attention_norm2.weight": "diffusion_pytorch_model.safetensors", "layers.9.feed_forward.w1.weight": "diffusion_pytorch_model.safetensors", "layers.9.feed_forward.w1.weight_scale": "diffusion_pytorch_model.safetensors", "layers.9.feed_forward.w2.weight": "diffusion_pytorch_model.safetensors", "layers.9.feed_forward.w2.weight_scale": 
"diffusion_pytorch_model.safetensors", "layers.9.feed_forward.w3.weight": "diffusion_pytorch_model.safetensors", "layers.9.feed_forward.w3.weight_scale": "diffusion_pytorch_model.safetensors", "layers.9.ffn_norm1.weight": "diffusion_pytorch_model.safetensors", "layers.9.ffn_norm2.weight": "diffusion_pytorch_model.safetensors", "llm_cond_norm.weight": "diffusion_pytorch_model.safetensors", "llm_cond_proj.bias": "diffusion_pytorch_model.safetensors", "llm_cond_proj.weight": "diffusion_pytorch_model.safetensors", "llm_cond_proj.weight_scale": "diffusion_pytorch_model.safetensors", "t_embedding.mlp_in.bias": "diffusion_pytorch_model.safetensors", "t_embedding.mlp_in.weight": "diffusion_pytorch_model.safetensors", "t_embedding.mlp_in.weight_scale": "diffusion_pytorch_model.safetensors", "t_embedding.mlp_out.bias": "diffusion_pytorch_model.safetensors", "t_embedding.mlp_out.weight": "diffusion_pytorch_model.safetensors", "t_embedding.mlp_out.weight_scale": "diffusion_pytorch_model.safetensors"}}
vae/config.json ADDED
@@ -0,0 +1,41 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_class_name": "AutoencoderKLFlux2",
3
+ "_diffusers_version": "0.39.0.dev0",
4
+ "_name_or_path": "/home/jinli/.cache/huggingface/hub/models--ideogram-ai--debug-ideogram-v4/snapshots/41af6183c9fd9b6254864b0720319ef984535bfc/vae",
5
+ "act_fn": "silu",
6
+ "batch_norm_eps": 0.0001,
7
+ "batch_norm_momentum": 0.1,
8
+ "block_out_channels": [
9
+ 128,
10
+ 256,
11
+ 512,
12
+ 512
13
+ ],
14
+ "decoder_block_out_channels": null,
15
+ "down_block_types": [
16
+ "DownEncoderBlock2D",
17
+ "DownEncoderBlock2D",
18
+ "DownEncoderBlock2D",
19
+ "DownEncoderBlock2D"
20
+ ],
21
+ "force_upcast": true,
22
+ "in_channels": 3,
23
+ "latent_channels": 32,
24
+ "layers_per_block": 2,
25
+ "mid_block_add_attention": true,
26
+ "norm_num_groups": 32,
27
+ "out_channels": 3,
28
+ "patch_size": [
29
+ 2,
30
+ 2
31
+ ],
32
+ "sample_size": 1024,
33
+ "up_block_types": [
34
+ "UpDecoderBlock2D",
35
+ "UpDecoderBlock2D",
36
+ "UpDecoderBlock2D",
37
+ "UpDecoderBlock2D"
38
+ ],
39
+ "use_post_quant_conv": true,
40
+ "use_quant_conv": true
41
+ }
vae/diffusion_pytorch_model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:925ce3a08e8759174667f5e89384ba2b54dd81a87b7379dadb68a1a87b70b052
3
+ size 168120878