yuvraj108c commited on
Commit
f4b856c
1 Parent(s): f5febd5

Upload folder using huggingface_hub

Browse files
Files changed (41) hide show
  1. LICENSE.md +51 -0
  2. README.md +256 -0
  3. SD3.5L_plus_SD3.5M_upscaling_example_workflow.json +1235 -0
  4. SD3.5M_SLG_example_workflow.json +1006 -0
  5. SD3.5M_example_workflow.json +697 -0
  6. mmdit-x.png +0 -0
  7. model_index.json +40 -0
  8. scheduler/scheduler_config.json +6 -0
  9. sd3.5_medium.safetensors +3 -0
  10. sd3.5_medium_demo.jpg +0 -0
  11. text_encoder/config.json +24 -0
  12. text_encoder/model.fp16.safetensors +3 -0
  13. text_encoder/model.safetensors +3 -0
  14. text_encoder_2/config.json +24 -0
  15. text_encoder_2/model.fp16.safetensors +3 -0
  16. text_encoder_2/model.safetensors +3 -0
  17. text_encoder_3/config.json +31 -0
  18. text_encoder_3/model-00001-of-00002.safetensors +3 -0
  19. text_encoder_3/model-00002-of-00002.safetensors +3 -0
  20. text_encoder_3/model.fp16-00001-of-00002.safetensors +3 -0
  21. text_encoder_3/model.fp16-00002-of-00002.safetensors +3 -0
  22. text_encoder_3/model.safetensors.index.fp16.json +226 -0
  23. text_encoder_3/model.safetensors.index.json +226 -0
  24. tokenizer/merges.txt +0 -0
  25. tokenizer/special_tokens_map.json +30 -0
  26. tokenizer/tokenizer_config.json +30 -0
  27. tokenizer/vocab.json +0 -0
  28. tokenizer_2/merges.txt +0 -0
  29. tokenizer_2/special_tokens_map.json +30 -0
  30. tokenizer_2/tokenizer_config.json +38 -0
  31. tokenizer_2/vocab.json +0 -0
  32. tokenizer_3/special_tokens_map.json +125 -0
  33. tokenizer_3/spiece.model +3 -0
  34. tokenizer_3/tokenizer.json +0 -0
  35. tokenizer_3/tokenizer_config.json +940 -0
  36. transformer/config.json +31 -0
  37. transformer/diffusion_pytorch_model.safetensors +3 -0
  38. vae copy/config.json +38 -0
  39. vae copy/diffusion_pytorch_model.safetensors +3 -0
  40. vae/config.json +38 -0
  41. vae/diffusion_pytorch_model.safetensors +3 -0
LICENSE.md ADDED
@@ -0,0 +1,51 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ STABILITY AI COMMUNITY LICENSE AGREEMENT
2
+ Last Updated: July 5, 2024
3
+
4
+
5
+ I. INTRODUCTION
6
+
7
+ This Agreement applies to any individual person or entity ("You", "Your" or "Licensee") that uses or distributes any portion or element of the Stability AI Materials or Derivative Works thereof for any Research & Non-Commercial or Commercial purpose. Capitalized terms not otherwise defined herein are defined in Section V below.
8
+
9
+
10
+ This Agreement is intended to allow research, non-commercial, and limited commercial uses of the Models free of charge. In order to ensure that certain limited commercial uses of the Models continue to be allowed, this Agreement preserves free access to the Models for people or organizations generating annual revenue of less than US $1,000,000 (or local currency equivalent).
11
+
12
+
13
+ By clicking "I Accept" or by using or distributing or using any portion or element of the Stability Materials or Derivative Works, You agree that You have read, understood and are bound by the terms of this Agreement. If You are acting on behalf of a company, organization or other entity, then "You" includes you and that entity, and You agree that You: (i) are an authorized representative of such entity with the authority to bind such entity to this Agreement, and (ii) You agree to the terms of this Agreement on that entity's behalf.
14
+
15
+ II. RESEARCH & NON-COMMERCIAL USE LICENSE
16
+
17
+ Subject to the terms of this Agreement, Stability AI grants You a non-exclusive, worldwide, non-transferable, non-sublicensable, revocable and royalty-free limited license under Stability AI's intellectual property or other rights owned by Stability AI embodied in the Stability AI Materials to use, reproduce, distribute, and create Derivative Works of, and make modifications to, the Stability AI Materials for any Research or Non-Commercial Purpose. "Research Purpose" means academic or scientific advancement, and in each case, is not primarily intended for commercial advantage or monetary compensation to You or others. "Non-Commercial Purpose" means any purpose other than a Research Purpose that is not primarily intended for commercial advantage or monetary compensation to You or others, such as personal use (i.e., hobbyist) or evaluation and testing.
18
+
19
+ III. COMMERCIAL USE LICENSE
20
+
21
+ Subject to the terms of this Agreement (including the remainder of this Section III), Stability AI grants You a non-exclusive, worldwide, non-transferable, non-sublicensable, revocable and royalty-free limited license under Stability AI's intellectual property or other rights owned by Stability AI embodied in the Stability AI Materials to use, reproduce, distribute, and create Derivative Works of, and make modifications to, the Stability AI Materials for any Commercial Purpose. "Commercial Purpose" means any purpose other than a Research Purpose or Non-Commercial Purpose that is primarily intended for commercial advantage or monetary compensation to You or others, including but not limited to, (i) creating, modifying, or distributing Your product or service, including via a hosted service or application programming interface, and (ii) for Your business's or organization's internal operations.
22
+ If You are using or distributing the Stability AI Materials for a Commercial Purpose, You must register with Stability AI at (https://stability.ai/community-license). If at any time You or Your Affiliate(s), either individually or in aggregate, generate more than USD $1,000,000 in annual revenue (or the equivalent thereof in Your local currency), regardless of whether that revenue is generated directly or indirectly from the Stability AI Materials or Derivative Works, any licenses granted to You under this Agreement shall terminate as of such date. You must request a license from Stability AI at (https://stability.ai/enterprise) , which Stability AI may grant to You in its sole discretion. If you receive Stability AI Materials, or any Derivative Works thereof, from a Licensee as part of an integrated end user product, then Section III of this Agreement will not apply to you.
23
+
24
+ IV. GENERAL TERMS
25
+
26
+ Your Research, Non-Commercial, and Commercial License(s) under this Agreement are subject to the following terms.
27
+ a. Distribution & Attribution. If You distribute or make available the Stability AI Materials or a Derivative Work to a third party, or a product or service that uses any portion of them, You shall: (i) provide a copy of this Agreement to that third party, (ii) retain the following attribution notice within a "Notice" text file distributed as a part of such copies: "This Stability AI Model is licensed under the Stability AI Community License, Copyright © Stability AI Ltd. All Rights Reserved", and (iii) prominently display "Powered by Stability AI" on a related website, user interface, blogpost, about page, or product documentation. If You create a Derivative Work, You may add your own attribution notice(s) to the "Notice" text file included with that Derivative Work, provided that You clearly indicate which attributions apply to the Stability AI Materials and state in the "Notice" text file that You changed the Stability AI Materials and how it was modified.
28
+ b. Use Restrictions. Your use of the Stability AI Materials and Derivative Works, including any output or results of the Stability AI Materials or Derivative Works, must comply with applicable laws and regulations (including Trade Control Laws and equivalent regulations) and adhere to the Documentation and Stability AI's AUP, which is hereby incorporated by reference. Furthermore, You will not use the Stability AI Materials or Derivative Works, or any output or results of the Stability AI Materials or Derivative Works, to create or improve any foundational generative AI model (excluding the Models or Derivative Works).
29
+ c. Intellectual Property.
30
+ (i) Trademark License. No trademark licenses are granted under this Agreement, and in connection with the Stability AI Materials or Derivative Works, You may not use any name or mark owned by or associated with Stability AI or any of its Affiliates, except as required under Section IV(a) herein.
31
+ (ii) Ownership of Derivative Works. As between You and Stability AI, You are the owner of Derivative Works You create, subject to Stability AI's ownership of the Stability AI Materials and any Derivative Works made by or for Stability AI.
32
+ (iii) Ownership of Outputs. As between You and Stability AI, You own any outputs generated from the Models or Derivative Works to the extent permitted by applicable law.
33
+ (iv) Disputes. If You or Your Affiliate(s) institute litigation or other proceedings against Stability AI (including a cross-claim or counterclaim in a lawsuit) alleging that the Stability AI Materials, Derivative Works or associated outputs or results, or any portion of any of the foregoing, constitutes infringement of intellectual property or other rights owned or licensable by You, then any licenses granted to You under this Agreement shall terminate as of the date such litigation or claim is filed or instituted. You will indemnify and hold harmless Stability AI from and against any claim by any third party arising out of or related to Your use or distribution of the Stability AI Materials or Derivative Works in violation of this Agreement.
34
+ (v) Feedback. From time to time, You may provide Stability AI with verbal and/or written suggestions, comments or other feedback related to Stability AI's existing or prospective technology, products or services (collectively, "Feedback"). You are not obligated to provide Stability AI with Feedback, but to the extent that You do, You hereby grant Stability AI a perpetual, irrevocable, royalty-free, fully-paid, sub-licensable, transferable, non-exclusive, worldwide right and license to exploit the Feedback in any manner without restriction. Your Feedback is provided "AS IS" and You make no warranties whatsoever about any Feedback.
35
+ d. Disclaimer Of Warranty. UNLESS REQUIRED BY APPLICABLE LAW, THE STABILITY AI MATERIALS AND ANY OUTPUT AND RESULTS THEREFROM ARE PROVIDED ON AN "AS IS" BASIS, WITHOUT WARRANTIES OF ANY KIND, EITHER EXPRESS OR IMPLIED, INCLUDING, WITHOUT LIMITATION, ANY WARRANTIES OF TITLE, NON-INFRINGEMENT, MERCHANTABILITY, OR FITNESS FOR A PARTICULAR PURPOSE. YOU ARE SOLELY RESPONSIBLE FOR DETERMINING THE APPROPRIATENESS OR LAWFULNESS OF USING OR REDISTRIBUTING THE STABILITY AI MATERIALS, DERIVATIVE WORKS OR ANY OUTPUT OR RESULTS AND ASSUME ANY RISKS ASSOCIATED WITH YOUR USE OF THE STABILITY AI MATERIALS, DERIVATIVE WORKS AND ANY OUTPUT AND RESULTS.
36
+ e. Limitation Of Liability. IN NO EVENT WILL STABILITY AI OR ITS AFFILIATES BE LIABLE UNDER ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, TORT, NEGLIGENCE, PRODUCTS LIABILITY, OR OTHERWISE, ARISING OUT OF THIS AGREEMENT, FOR ANY LOST PROFITS OR ANY DIRECT, INDIRECT, SPECIAL, CONSEQUENTIAL, INCIDENTAL, EXEMPLARY OR PUNITIVE DAMAGES, EVEN IF STABILITY AI OR ITS AFFILIATES HAVE BEEN ADVISED OF THE POSSIBILITY OF ANY OF THE FOREGOING.
37
+ f. Term And Termination. The term of this Agreement will commence upon Your acceptance of this Agreement or access to the Stability AI Materials and will continue in full force and effect until terminated in accordance with the terms and conditions herein. Stability AI may terminate this Agreement if You are in breach of any term or condition of this Agreement. Upon termination of this Agreement, You shall delete and cease use of any Stability AI Materials or Derivative Works. Section IV(d), (e), and (g) shall survive the termination of this Agreement.
38
+ g. Governing Law. This Agreement will be governed by and constructed in accordance with the laws of the United States and the State of California without regard to choice of law principles, and the UN Convention on Contracts for International Sale of Goods does not apply to this Agreement.
39
+
40
+ V. DEFINITIONS
41
+
42
+ "Affiliate(s)" means any entity that directly or indirectly controls, is controlled by, or is under common control with the subject entity; for purposes of this definition, "control" means direct or indirect ownership or control of more than 50% of the voting interests of the subject entity.
43
+ "Agreement" means this Stability AI Community License Agreement.
44
+ "AUP" means the Stability AI Acceptable Use Policy available at https://stability.ai/use-policy, as may be updated from time to time.
45
+ "Derivative Work(s)" means (a) any derivative work of the Stability AI Materials as recognized by U.S. copyright laws and (b) any modifications to a Model, and any other model created which is based on or derived from the Model or the Model's output, including"fine tune" and "low-rank adaptation" models derived from a Model or a Model's output, but do not include the output of any Model.
46
+ "Documentation" means any specifications, manuals, documentation, and other written information provided by Stability AI related to the Software or Models.
47
+ "Model(s)" means, collectively, Stability AI's proprietary models and algorithms, including machine-learning models, trained model weights and other elements of the foregoing listed on Stability's Core Models Webpage available at, https://stability.ai/core-models, as may be updated from time to time.
48
+ "Stability AI" or "we" means Stability AI Ltd. and its Affiliates.
49
+ "Software" means Stability AI's proprietary software made available under this Agreement now or in the future.
50
+ "Stability AI Materials" means, collectively, Stability's proprietary Models, Software and Documentation (and any portion or combination thereof) made available under this Agreement.
51
+ "Trade Control Laws" means any applicable U.S. and non-U.S. export control and trade sanctions laws and regulations.
README.md ADDED
@@ -0,0 +1,256 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ license: other
3
+ license_name: stabilityai-ai-community
4
+ license_link: LICENSE.md
5
+ tags:
6
+ - text-to-image
7
+ - stable-diffusion
8
+ - diffusers
9
+ inference: true
10
+ extra_gated_prompt: >-
11
+ By clicking "Agree", you agree to the [License
12
+ Agreement](https://huggingface.co/stabilityai/stable-diffusion-3.5-medium/blob/main/LICENSE.md)
13
+ and acknowledge Stability AI's [Privacy
14
+ Policy](https://stability.ai/privacy-policy).
15
+ extra_gated_fields:
16
+ Name: text
17
+ Email: text
18
+ Country: country
19
+ Organization or Affiliation: text
20
+ Receive email updates and promotions on Stability AI products, services, and research?:
21
+ type: select
22
+ options:
23
+ - 'Yes'
24
+ - 'No'
25
+ What do you intend to use the model for?:
26
+ type: select
27
+ options:
28
+ - Research
29
+ - Personal use
30
+ - Creative Professional
31
+ - Startup
32
+ - Enterprise
33
+ I agree to the License Agreement and acknowledge Stability AI's Privacy Policy: checkbox
34
+
35
+ language:
36
+ - en
37
+ pipeline_tag: text-to-image
38
+ ---
39
+
40
+ # Stable Diffusion 3.5 Medium
41
+ ![3.5 Medium Demo Image](sd3.5_medium_demo.jpg)
42
+
43
+ ## Model
44
+
45
+ ![MMDiT-X](mmdit-x.png)
46
+
47
+ [Stable Diffusion 3.5 Medium](https://stability.ai/news/introducing-stable-diffusion-3-5) is a Multimodal Diffusion Transformer with improvements (MMDiT-X) text-to-image model that features improved performance in image quality, typography, complex prompt understanding, and resource-efficiency.
48
+
49
+ Please note: This model is released under the [Stability Community License](https://stability.ai/community-license-agreement). Visit [Stability AI](https://stability.ai/license) to learn more or [contact us](https://stability.ai/enterprise) for commercial licensing details.
50
+
51
+
52
+ ### Model Description
53
+
54
+ - **Developed by:** Stability AI
55
+ - **Model type:** MMDiT-X text-to-image generative model
56
+ - **Model Description:** This model generates images based on text prompts. It is a Multimodal Diffusion Transformer
57
+ (https://arxiv.org/abs/2403.03206) with improvements that use three fixed, pretrained text encoders, with QK-normalization to improve training stability, and dual attention blocks in the first 13 transformer layers.
58
+
59
+ ### License
60
+
61
+ - **Community License:** Free for research, non-commercial, and commercial use for organizations or individuals with less than $1M in total annual revenue. More details can be found in the [Community License Agreement](https://stability.ai/community-license-agreement). Read more at https://stability.ai/license.
62
+ - **For individuals and organizations with annual revenue above $1M**: please [contact us](https://stability.ai/enterprise) to get an Enterprise License.
63
+
64
+ ### Model Sources
65
+
66
+ For local or self-hosted use, we recommend [ComfyUI](https://github.com/comfyanonymous/ComfyUI) for node-based UI inference, or [diffusers](https://github.com/huggingface/diffusers) or [GitHub](https://github.com/Stability-AI/sd3.5) for programmatic use.
67
+
68
+ - **ComfyUI:** [Github](https://github.com/comfyanonymous/ComfyUI), [Example Workflow](https://comfyanonymous.github.io/ComfyUI_examples/sd3/)
69
+ - **Huggingface Space:** [Space](https://huggingface.co/spaces/stabilityai/stable-diffusion-3.5-medium)
70
+ - **Diffusers**: [See below](#using-with-diffusers).
71
+ - **GitHub**: [GitHub](https://github.com/Stability-AI/sd3.5).
72
+
73
+ - **API Endpoints:**
74
+ - [Stability AI API](https://platform.stability.ai/docs/api-reference#tag/Generate/paths/~1v2beta~1stable-image~1generate~1sd3/post)
75
+
76
+
77
+ ### Implementation Details
78
+
79
+ - **MMDiT-X:** Introduces self-attention modules in the first 13 layers of the transformer, enhancing multi-resolution generation and overall image coherence.
80
+
81
+ - **QK Normalization:** Implements the QK normalization technique to improve training stability.
82
+
83
+ - **Mixed-Resolution Training:**
84
+ - Progressive training stages: 256 → 512 → 768 → 1024 → 1440 resolution
85
+ - The final stage included mixed-scale image training to boost multi-resolution generation performance
86
+ - Extended positional embedding space to 384x384 (latent) at lower resolution stages
87
+ - Employed random crop augmentation on positional embeddings to enhance transformer layer robustness across the entire range of mixed resolutions and aspect ratios. For example, given a 64x64 latent image, we add a randomly cropped 64x64 embedding from the 192x192 embedding space during training as the input to the x stream.
88
+
89
+ These enhancements collectively contribute to the model's improved performance in multi-resolution image generation, coherence, and adaptability across various text-to-image tasks.
90
+
91
+ - **Text Encoders:**
92
+ - CLIPs: [OpenCLIP-ViT/G](https://github.com/mlfoundations/open_clip), [CLIP-ViT/L](https://github.com/openai/CLIP/tree/main), context length 77 tokens
93
+ - T5: [T5-xxl](https://huggingface.co/google/t5-v1_1-xxl), context length 77/256 tokens at different stages of training
94
+
95
+ - **Training Data and Strategy:**
96
+
97
+ This model was trained on a wide variety of data, including synthetic data and filtered publicly available data.
98
+
99
+ For more technical details of the original MMDiT architecture, please refer to the [Research paper](https://stability.ai/news/stable-diffusion-3-research-paper).
100
+
101
+ ### Usage & Limitations
102
+ - While this model can handle long prompts, you may observe artifacts on the edge of generations when T5 tokens go over 256. Pay attention to the token limits when using this model in your workflow, and shorten prompts if artifacts become too obvious.
103
+ - The medium model has a different training data distribution than the large model, so it may not respond to the same prompt similarly.
104
+ - We recommend sampling with **[Skip Layer Guidance](https://github.com/comfyanonymous/ComfyUI/pull/5404)** for better structure and anatomy coherency.
105
+
106
+ ### Model Performance
107
+
108
+ See [blog](https://stability.ai/news/introducing-stable-diffusion-3-5) for our study about comparative performance in prompt adherence and aesthetic quality.
109
+
110
+
111
+ ## File Structure
112
+
113
+ Click here to access the [Files and versions tab](https://huggingface.co/stabilityai/stable-diffusion-3.5-medium/tree/main)
114
+
115
+ ```│
116
+ ├── text_encoders/
117
+ │ ├── README.md
118
+ │ ├── clip_g.safetensors
119
+ │ ├── clip_l.safetensors
120
+ │ ├── t5xxl_fp16.safetensors
121
+ │ └── t5xxl_fp8_e4m3fn.safetensors
122
+
123
+ ├── README.md
124
+ ├── LICENSE.md
125
+ ├── sd3.5_medium.safetensors
126
+ ├── SD3.5M_example_workflow.json
127
+ ├── SD3.5M_SLG_example_workflow.json
128
+ ├── SD3.5L_plus_SD3.5M_upscaling_example_workflow.json
129
+ └── sd3.5_medium_demo.jpg
130
+
131
+ ** File structure below is for diffusers integration**
132
+ ├── scheduler/
133
+ ├── text_encoder/
134
+ ├── text_encoder_2/
135
+ ├── text_encoder_3/
136
+ ├── tokenizer/
137
+ ├── tokenizer_2/
138
+ ├── tokenizer_3/
139
+ ├── transformer/
140
+ ├── vae/
141
+ └── model_index.json
142
+ ```
143
+
144
+ ## Using with Diffusers
145
+ Upgrade to the latest version of the [🧨 diffusers library](https://github.com/huggingface/diffusers)
146
+ ```
147
+ pip install -U diffusers
148
+ ```
149
+
150
+ and then you can run
151
+ ```py
152
+ import torch
153
+ from diffusers import StableDiffusion3Pipeline
154
+
155
+ pipe = StableDiffusion3Pipeline.from_pretrained("stabilityai/stable-diffusion-3.5-medium", torch_dtype=torch.bfloat16)
156
+ pipe = pipe.to("cuda")
157
+
158
+ image = pipe(
159
+ "A capybara holding a sign that reads Hello World",
160
+ num_inference_steps=40,
161
+ guidance_scale=4.5,
162
+ ).images[0]
163
+ image.save("capybara.png")
164
+ ```
165
+
166
+ ### Quantizing the model with diffusers
167
+
168
+ Reduce your VRAM usage and have the model fit on 🤏 VRAM GPUs
169
+
170
+ ```
171
+ pip install bitsandbytes
172
+ ```
173
+
174
+ ```py
175
+ from diffusers import BitsAndBytesConfig, SD3Transformer2DModel
176
+ from diffusers import StableDiffusion3Pipeline
177
+ import torch
178
+
179
+ model_id = "stabilityai/stable-diffusion-3.5-medium"
180
+
181
+ nf4_config = BitsAndBytesConfig(
182
+ load_in_4bit=True,
183
+ bnb_4bit_quant_type="nf4",
184
+ bnb_4bit_compute_dtype=torch.bfloat16
185
+ )
186
+ model_nf4 = SD3Transformer2DModel.from_pretrained(
187
+ model_id,
188
+ subfolder="transformer",
189
+ quantization_config=nf4_config,
190
+ torch_dtype=torch.bfloat16
191
+ )
192
+
193
+ pipeline = StableDiffusion3Pipeline.from_pretrained(
194
+ model_id,
195
+ transformer=model_nf4,
196
+ torch_dtype=torch.bfloat16
197
+ )
198
+ pipeline.enable_model_cpu_offload()
199
+
200
+ prompt = "A whimsical and creative image depicting a hybrid creature that is a mix of a waffle and a hippopotamus, basking in a river of melted butter amidst a breakfast-themed landscape. It features the distinctive, bulky body shape of a hippo. However, instead of the usual grey skin, the creature's body resembles a golden-brown, crispy waffle fresh off the griddle. The skin is textured with the familiar grid pattern of a waffle, each square filled with a glistening sheen of syrup. The environment combines the natural habitat of a hippo with elements of a breakfast table setting, a river of warm, melted butter, with oversized utensils or plates peeking out from the lush, pancake-like foliage in the background, a towering pepper mill standing in for a tree. As the sun rises in this fantastical world, it casts a warm, buttery glow over the scene. The creature, content in its butter river, lets out a yawn. Nearby, a flock of birds take flight"
201
+
202
+ image = pipeline(
203
+ prompt=prompt,
204
+ num_inference_steps=40,
205
+ guidance_scale=4.5,
206
+ max_sequence_length=512,
207
+ ).images[0]
208
+ image.save("whimsical.png")
209
+ ```
210
+
211
+ ### Fine-tuning
212
+
213
+ Please see the fine-tuning guide [here](https://stabilityai.notion.site/Stable-Diffusion-3-5-Large-Fine-tuning-Tutorial-11a61cdcd1968027a15bdbd7c40be8c6).
214
+
215
+
216
+ ## Uses
217
+
218
+ ### Intended Uses
219
+
220
+ Intended uses include the following:
221
+ * Generation of artworks and use in design and other artistic processes.
222
+ * Applications in educational or creative tools.
223
+ * Research on generative models, including understanding the limitations of generative models.
224
+
225
+ All uses of the model must be in accordance with our [Acceptable Use Policy](https://stability.ai/use-policy).
226
+
227
+ ### Out-of-Scope Uses
228
+
229
+ The model was not trained to be factual or true representations of people or events. As such, using the model to generate such content is out-of-scope of the abilities of this model.
230
+
231
+ ## Safety
232
+
233
+ As part of our safety-by-design and responsible AI deployment approach, we take deliberate measures to ensure Integrity starts at the early stages of development. We implement safety measures throughout the development of our models. We have implemented safety mitigations that are intended to reduce the risk of certain harms, however we recommend that developers conduct their own testing and apply additional mitigations based on their specific use cases.
234
+ For more about our approach to Safety, please visit our [Safety page](https://stability.ai/safety).
235
+
236
+ ### Integrity Evaluation
237
+
238
+ Our integrity evaluation methods include structured evaluations and red-teaming testing for certain harms. Testing was conducted primarily in English and may not cover all possible harms.
239
+
240
+ ### Risks identified and mitigations:
241
+
242
+ * Harmful content: We have used filtered data sets when training our models and implemented safeguards that attempt to strike the right balance between usefulness and preventing harm. However, this does not guarantee that all possible harmful content has been removed. All developers and deployers should exercise caution and implement content safety guardrails based on their specific product policies and application use cases.
243
+ * Misuse: Technical limitations and developer and end-user education can help mitigate against malicious applications of models. All users are required to adhere to our [Acceptable Use Policy](https://stability.ai/use-policy), including when applying fine-tuning and prompt engineering mechanisms. Please reference the Stability AI Acceptable Use Policy for information on violative uses of our products.
244
+ * Privacy violations: Developers and deployers are encouraged to adhere to privacy regulations with techniques that respect data privacy.
245
+
246
+ ### Contact
247
+
248
+ Please report any issues with the model or contact us:
249
+
250
+ * Safety issues: safety@stability.ai
251
+ * Security issues: security@stability.ai
252
+ * Privacy issues: privacy@stability.ai
253
+ * License and general: https://stability.ai/license
254
+ * Enterprise license: https://stability.ai/enterprise
255
+
256
+
SD3.5L_plus_SD3.5M_upscaling_example_workflow.json ADDED
@@ -0,0 +1,1235 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "last_node_id": 331,
3
+ "last_link_id": 672,
4
+ "nodes": [
5
+ {
6
+ "id": 68,
7
+ "type": "ConditioningSetTimestepRange",
8
+ "pos": [
9
+ 756,
10
+ 1008
11
+ ],
12
+ "size": {
13
+ "0": 317.4000244140625,
14
+ "1": 82
15
+ },
16
+ "flags": {},
17
+ "order": 14,
18
+ "mode": 0,
19
+ "inputs": [
20
+ {
21
+ "name": "conditioning",
22
+ "type": "CONDITIONING",
23
+ "link": 90
24
+ }
25
+ ],
26
+ "outputs": [
27
+ {
28
+ "name": "CONDITIONING",
29
+ "type": "CONDITIONING",
30
+ "links": [
31
+ 91
32
+ ],
33
+ "shape": 3,
34
+ "slot_index": 0
35
+ }
36
+ ],
37
+ "properties": {
38
+ "Node name for S&R": "ConditioningSetTimestepRange"
39
+ },
40
+ "widgets_values": [
41
+ 0.1,
42
+ 1
43
+ ]
44
+ },
45
+ {
46
+ "id": 67,
47
+ "type": "ConditioningZeroOut",
48
+ "pos": [
49
+ 504,
50
+ 1008
51
+ ],
52
+ "size": {
53
+ "0": 211.60000610351562,
54
+ "1": 26
55
+ },
56
+ "flags": {},
57
+ "order": 13,
58
+ "mode": 0,
59
+ "inputs": [
60
+ {
61
+ "name": "conditioning",
62
+ "type": "CONDITIONING",
63
+ "link": 597
64
+ }
65
+ ],
66
+ "outputs": [
67
+ {
68
+ "name": "CONDITIONING",
69
+ "type": "CONDITIONING",
70
+ "links": [
71
+ 90
72
+ ],
73
+ "shape": 3,
74
+ "slot_index": 0
75
+ }
76
+ ],
77
+ "properties": {
78
+ "Node name for S&R": "ConditioningZeroOut"
79
+ }
80
+ },
81
+ {
82
+ "id": 11,
83
+ "type": "TripleCLIPLoader",
84
+ "pos": [
85
+ -1386,
86
+ 756
87
+ ],
88
+ "size": {
89
+ "0": 315,
90
+ "1": 106
91
+ },
92
+ "flags": {},
93
+ "order": 0,
94
+ "mode": 0,
95
+ "outputs": [
96
+ {
97
+ "name": "CLIP",
98
+ "type": "CLIP",
99
+ "links": [
100
+ 5,
101
+ 94,
102
+ 662
103
+ ],
104
+ "shape": 3,
105
+ "slot_index": 0
106
+ }
107
+ ],
108
+ "properties": {
109
+ "Node name for S&R": "TripleCLIPLoader"
110
+ },
111
+ "widgets_values": [
112
+ "clip_g_sdxl_base.safetensors",
113
+ "clip_l_sdxl_base.safetensors",
114
+ "t5xxl.safetensors"
115
+ ]
116
+ },
117
+ {
118
+ "id": 69,
119
+ "type": "ConditioningCombine",
120
+ "pos": [
121
+ 1134,
122
+ 1008
123
+ ],
124
+ "size": {
125
+ "0": 228.39999389648438,
126
+ "1": 46
127
+ },
128
+ "flags": {},
129
+ "order": 15,
130
+ "mode": 0,
131
+ "inputs": [
132
+ {
133
+ "name": "conditioning_1",
134
+ "type": "CONDITIONING",
135
+ "link": 91
136
+ },
137
+ {
138
+ "name": "conditioning_2",
139
+ "type": "CONDITIONING",
140
+ "link": 92
141
+ }
142
+ ],
143
+ "outputs": [
144
+ {
145
+ "name": "CONDITIONING",
146
+ "type": "CONDITIONING",
147
+ "links": [
148
+ 604,
149
+ 622
150
+ ],
151
+ "shape": 3,
152
+ "slot_index": 0
153
+ }
154
+ ],
155
+ "properties": {
156
+ "Node name for S&R": "ConditioningCombine"
157
+ }
158
+ },
159
+ {
160
+ "id": 4,
161
+ "type": "CheckpointLoaderSimple",
162
+ "pos": [
163
+ -1386,
164
+ 252
165
+ ],
166
+ "size": {
167
+ "0": 632.6060180664062,
168
+ "1": 98
169
+ },
170
+ "flags": {},
171
+ "order": 1,
172
+ "mode": 0,
173
+ "outputs": [
174
+ {
175
+ "name": "MODEL",
176
+ "type": "MODEL",
177
+ "links": [
178
+ 445
179
+ ],
180
+ "shape": 3,
181
+ "slot_index": 0
182
+ },
183
+ {
184
+ "name": "CLIP",
185
+ "type": "CLIP",
186
+ "links": null,
187
+ "shape": 3
188
+ },
189
+ {
190
+ "name": "VAE",
191
+ "type": "VAE",
192
+ "links": [
193
+ 605,
194
+ 616,
195
+ 617
196
+ ],
197
+ "shape": 3,
198
+ "slot_index": 2
199
+ }
200
+ ],
201
+ "properties": {
202
+ "Node name for S&R": "CheckpointLoaderSimple"
203
+ },
204
+ "widgets_values": [
205
+ "sd3.5_large.safetensors"
206
+ ]
207
+ },
208
+ {
209
+ "id": 8,
210
+ "type": "VAEDecode",
211
+ "pos": [
212
+ 2015,
213
+ 536
214
+ ],
215
+ "size": {
216
+ "0": 210,
217
+ "1": 46
218
+ },
219
+ "flags": {},
220
+ "order": 17,
221
+ "mode": 0,
222
+ "inputs": [
223
+ {
224
+ "name": "samples",
225
+ "type": "LATENT",
226
+ "link": 572
227
+ },
228
+ {
229
+ "name": "vae",
230
+ "type": "VAE",
231
+ "link": 605
232
+ }
233
+ ],
234
+ "outputs": [
235
+ {
236
+ "name": "IMAGE",
237
+ "type": "IMAGE",
238
+ "links": [
239
+ 274,
240
+ 660
241
+ ],
242
+ "shape": 3,
243
+ "slot_index": 0
244
+ }
245
+ ],
246
+ "properties": {
247
+ "Node name for S&R": "VAEDecode"
248
+ }
249
+ },
250
+ {
251
+ "id": 294,
252
+ "type": "KSampler",
253
+ "pos": [
254
+ 1512,
255
+ 378
256
+ ],
257
+ "size": {
258
+ "0": 378,
259
+ "1": 504
260
+ },
261
+ "flags": {},
262
+ "order": 16,
263
+ "mode": 0,
264
+ "inputs": [
265
+ {
266
+ "name": "model",
267
+ "type": "MODEL",
268
+ "link": 568
269
+ },
270
+ {
271
+ "name": "positive",
272
+ "type": "CONDITIONING",
273
+ "link": 569
274
+ },
275
+ {
276
+ "name": "negative",
277
+ "type": "CONDITIONING",
278
+ "link": 604
279
+ },
280
+ {
281
+ "name": "latent_image",
282
+ "type": "LATENT",
283
+ "link": 598
284
+ }
285
+ ],
286
+ "outputs": [
287
+ {
288
+ "name": "LATENT",
289
+ "type": "LATENT",
290
+ "links": [
291
+ 572
292
+ ],
293
+ "shape": 3,
294
+ "slot_index": 0
295
+ }
296
+ ],
297
+ "properties": {
298
+ "Node name for S&R": "KSampler"
299
+ },
300
+ "widgets_values": [
301
+ 339087769667945,
302
+ "fixed",
303
+ 40,
304
+ 4.5,
305
+ "dpmpp_2m",
306
+ "sgm_uniform",
307
+ 1
308
+ ]
309
+ },
310
+ {
311
+ "id": 70,
312
+ "type": "ConditioningSetTimestepRange",
313
+ "pos": [
314
+ 756,
315
+ 1134
316
+ ],
317
+ "size": {
318
+ "0": 317.4000244140625,
319
+ "1": 82
320
+ },
321
+ "flags": {},
322
+ "order": 12,
323
+ "mode": 0,
324
+ "inputs": [
325
+ {
326
+ "name": "conditioning",
327
+ "type": "CONDITIONING",
328
+ "link": 93,
329
+ "slot_index": 0
330
+ }
331
+ ],
332
+ "outputs": [
333
+ {
334
+ "name": "CONDITIONING",
335
+ "type": "CONDITIONING",
336
+ "links": [
337
+ 92
338
+ ],
339
+ "shape": 3,
340
+ "slot_index": 0
341
+ }
342
+ ],
343
+ "properties": {
344
+ "Node name for S&R": "ConditioningSetTimestepRange"
345
+ },
346
+ "widgets_values": [
347
+ 0,
348
+ 0.1
349
+ ]
350
+ },
351
+ {
352
+ "id": 50,
353
+ "type": "PreviewImage",
354
+ "pos": [
355
+ 2394,
356
+ 378
357
+ ],
358
+ "size": {
359
+ "0": 616.689697265625,
360
+ "1": 613.84130859375
361
+ },
362
+ "flags": {},
363
+ "order": 18,
364
+ "mode": 0,
365
+ "inputs": [
366
+ {
367
+ "name": "images",
368
+ "type": "IMAGE",
369
+ "link": 274
370
+ }
371
+ ],
372
+ "properties": {
373
+ "Node name for S&R": "PreviewImage"
374
+ }
375
+ },
376
+ {
377
+ "id": 308,
378
+ "type": "VAEEncode",
379
+ "pos": [
380
+ 3150,
381
+ 378
382
+ ],
383
+ "size": {
384
+ "0": 210,
385
+ "1": 46
386
+ },
387
+ "flags": {},
388
+ "order": 21,
389
+ "mode": 0,
390
+ "inputs": [
391
+ {
392
+ "name": "pixels",
393
+ "type": "IMAGE",
394
+ "link": 671
395
+ },
396
+ {
397
+ "name": "vae",
398
+ "type": "VAE",
399
+ "link": 616
400
+ }
401
+ ],
402
+ "outputs": [
403
+ {
404
+ "name": "LATENT",
405
+ "type": "LATENT",
406
+ "links": [
407
+ 623
408
+ ],
409
+ "shape": 3,
410
+ "slot_index": 0
411
+ }
412
+ ],
413
+ "properties": {
414
+ "Node name for S&R": "VAEEncode"
415
+ }
416
+ },
417
+ {
418
+ "id": 310,
419
+ "type": "KSamplerAdvanced",
420
+ "pos": [
421
+ 3402,
422
+ 378
423
+ ],
424
+ "size": {
425
+ "0": 378,
426
+ "1": 546
427
+ },
428
+ "flags": {},
429
+ "order": 22,
430
+ "mode": 0,
431
+ "inputs": [
432
+ {
433
+ "name": "model",
434
+ "type": "MODEL",
435
+ "link": 620
436
+ },
437
+ {
438
+ "name": "positive",
439
+ "type": "CONDITIONING",
440
+ "link": 665
441
+ },
442
+ {
443
+ "name": "negative",
444
+ "type": "CONDITIONING",
445
+ "link": 622
446
+ },
447
+ {
448
+ "name": "latent_image",
449
+ "type": "LATENT",
450
+ "link": 623
451
+ },
452
+ {
453
+ "name": "start_at_step",
454
+ "type": "INT",
455
+ "link": 672,
456
+ "widget": {
457
+ "name": "start_at_step"
458
+ }
459
+ }
460
+ ],
461
+ "outputs": [
462
+ {
463
+ "name": "LATENT",
464
+ "type": "LATENT",
465
+ "links": [
466
+ 624
467
+ ],
468
+ "shape": 3,
469
+ "slot_index": 0
470
+ }
471
+ ],
472
+ "properties": {
473
+ "Node name for S&R": "KSamplerAdvanced"
474
+ },
475
+ "widgets_values": [
476
+ "enable",
477
+ 383006107596742,
478
+ "increment",
479
+ 42,
480
+ 4.5,
481
+ "dpmpp_2m",
482
+ "sgm_uniform",
483
+ 30,
484
+ 10000,
485
+ "disable"
486
+ ]
487
+ },
488
+ {
489
+ "id": 305,
490
+ "type": "VAEDecode",
491
+ "pos": [
492
+ 3906,
493
+ 378
494
+ ],
495
+ "size": {
496
+ "0": 210,
497
+ "1": 46
498
+ },
499
+ "flags": {},
500
+ "order": 23,
501
+ "mode": 0,
502
+ "inputs": [
503
+ {
504
+ "name": "samples",
505
+ "type": "LATENT",
506
+ "link": 624
507
+ },
508
+ {
509
+ "name": "vae",
510
+ "type": "VAE",
511
+ "link": 617
512
+ }
513
+ ],
514
+ "outputs": [
515
+ {
516
+ "name": "IMAGE",
517
+ "type": "IMAGE",
518
+ "links": [
519
+ 670
520
+ ],
521
+ "shape": 3,
522
+ "slot_index": 0
523
+ }
524
+ ],
525
+ "properties": {
526
+ "Node name for S&R": "VAEDecode"
527
+ }
528
+ },
529
+ {
530
+ "id": 306,
531
+ "type": "PreviewImage",
532
+ "pos": [
533
+ 4284,
534
+ 378
535
+ ],
536
+ "size": {
537
+ "0": 616.689697265625,
538
+ "1": 613.84130859375
539
+ },
540
+ "flags": {},
541
+ "order": 24,
542
+ "mode": 0,
543
+ "inputs": [
544
+ {
545
+ "name": "images",
546
+ "type": "IMAGE",
547
+ "link": 670
548
+ }
549
+ ],
550
+ "properties": {
551
+ "Node name for S&R": "PreviewImage"
552
+ }
553
+ },
554
+ {
555
+ "id": 309,
556
+ "type": "PreviewImage",
557
+ "pos": [
558
+ 4032,
559
+ 630
560
+ ],
561
+ "size": {
562
+ "0": 210,
563
+ "1": 246
564
+ },
565
+ "flags": {},
566
+ "order": 20,
567
+ "mode": 0,
568
+ "inputs": [
569
+ {
570
+ "name": "images",
571
+ "type": "IMAGE",
572
+ "link": 619
573
+ }
574
+ ],
575
+ "properties": {
576
+ "Node name for S&R": "PreviewImage"
577
+ }
578
+ },
579
+ {
580
+ "id": 105,
581
+ "type": "Note",
582
+ "pos": [
583
+ -630,
584
+ 630
585
+ ],
586
+ "size": {
587
+ "0": 210,
588
+ "1": 110.18948364257812
589
+ },
590
+ "flags": {},
591
+ "order": 2,
592
+ "mode": 0,
593
+ "properties": {
594
+ "text": ""
595
+ },
596
+ "widgets_values": [
597
+ "Make sure the resolution is multiple of 64 pixels and adds up to around 1 megapixel. "
598
+ ],
599
+ "color": "#432",
600
+ "bgcolor": "#653"
601
+ },
602
+ {
603
+ "id": 302,
604
+ "type": "ModelSamplingSD3",
605
+ "pos": [
606
+ 756,
607
+ 504
608
+ ],
609
+ "size": {
610
+ "0": 315,
611
+ "1": 58
612
+ },
613
+ "flags": {
614
+ "collapsed": false
615
+ },
616
+ "order": 11,
617
+ "mode": 0,
618
+ "inputs": [
619
+ {
620
+ "name": "model",
621
+ "type": "MODEL",
622
+ "link": 606
623
+ }
624
+ ],
625
+ "outputs": [
626
+ {
627
+ "name": "MODEL",
628
+ "type": "MODEL",
629
+ "links": [
630
+ 620
631
+ ],
632
+ "shape": 3,
633
+ "slot_index": 0
634
+ }
635
+ ],
636
+ "properties": {
637
+ "Node name for S&R": "ModelSamplingSD3"
638
+ },
639
+ "widgets_values": [
640
+ 3
641
+ ]
642
+ },
643
+ {
644
+ "id": 13,
645
+ "type": "ModelSamplingSD3",
646
+ "pos": [
647
+ 756,
648
+ 252
649
+ ],
650
+ "size": {
651
+ "0": 315,
652
+ "1": 58
653
+ },
654
+ "flags": {
655
+ "collapsed": false
656
+ },
657
+ "order": 10,
658
+ "mode": 0,
659
+ "inputs": [
660
+ {
661
+ "name": "model",
662
+ "type": "MODEL",
663
+ "link": 445
664
+ }
665
+ ],
666
+ "outputs": [
667
+ {
668
+ "name": "MODEL",
669
+ "type": "MODEL",
670
+ "links": [
671
+ 568
672
+ ],
673
+ "shape": 3,
674
+ "slot_index": 0
675
+ }
676
+ ],
677
+ "properties": {
678
+ "Node name for S&R": "ModelSamplingSD3"
679
+ },
680
+ "widgets_values": [
681
+ 3
682
+ ]
683
+ },
684
+ {
685
+ "id": 307,
686
+ "type": "ImageScaleBy",
687
+ "pos": [
688
+ 2394,
689
+ 252
690
+ ],
691
+ "size": {
692
+ "0": 315,
693
+ "1": 82
694
+ },
695
+ "flags": {},
696
+ "order": 19,
697
+ "mode": 0,
698
+ "inputs": [
699
+ {
700
+ "name": "image",
701
+ "type": "IMAGE",
702
+ "link": 660
703
+ }
704
+ ],
705
+ "outputs": [
706
+ {
707
+ "name": "IMAGE",
708
+ "type": "IMAGE",
709
+ "links": [
710
+ 619,
711
+ 671
712
+ ],
713
+ "shape": 3,
714
+ "slot_index": 0
715
+ }
716
+ ],
717
+ "properties": {
718
+ "Node name for S&R": "ImageScaleBy"
719
+ },
720
+ "widgets_values": [
721
+ "lanczos",
722
+ 1.4000000000000001
723
+ ]
724
+ },
725
+ {
726
+ "id": 330,
727
+ "type": "PrimitiveNode",
728
+ "pos": [
729
+ 3150,
730
+ 504
731
+ ],
732
+ "size": {
733
+ "0": 210,
734
+ "1": 82
735
+ },
736
+ "flags": {},
737
+ "order": 3,
738
+ "mode": 0,
739
+ "outputs": [
740
+ {
741
+ "name": "INT",
742
+ "type": "INT",
743
+ "links": [
744
+ 672
745
+ ],
746
+ "slot_index": 0,
747
+ "widget": {
748
+ "name": "start_at_step"
749
+ }
750
+ }
751
+ ],
752
+ "title": "Start at Step",
753
+ "properties": {
754
+ "Run widget replace on values": false
755
+ },
756
+ "widgets_values": [
757
+ 30,
758
+ "fixed"
759
+ ]
760
+ },
761
+ {
762
+ "id": 135,
763
+ "type": "EmptySD3LatentImage",
764
+ "pos": [
765
+ -378,
766
+ 630
767
+ ],
768
+ "size": {
769
+ "0": 315,
770
+ "1": 106
771
+ },
772
+ "flags": {},
773
+ "order": 4,
774
+ "mode": 0,
775
+ "inputs": [],
776
+ "outputs": [
777
+ {
778
+ "name": "LATENT",
779
+ "type": "LATENT",
780
+ "links": [
781
+ 598
782
+ ],
783
+ "shape": 3,
784
+ "slot_index": 0
785
+ }
786
+ ],
787
+ "properties": {
788
+ "Node name for S&R": "EmptySD3LatentImage"
789
+ },
790
+ "widgets_values": [
791
+ 1152,
792
+ 896,
793
+ 1
794
+ ]
795
+ },
796
+ {
797
+ "id": 301,
798
+ "type": "CheckpointLoaderSimple",
799
+ "pos": [
800
+ -1386,
801
+ 504
802
+ ],
803
+ "size": {
804
+ "0": 632.6060180664062,
805
+ "1": 98
806
+ },
807
+ "flags": {},
808
+ "order": 5,
809
+ "mode": 0,
810
+ "outputs": [
811
+ {
812
+ "name": "MODEL",
813
+ "type": "MODEL",
814
+ "links": [
815
+ 606
816
+ ],
817
+ "shape": 3,
818
+ "slot_index": 0
819
+ },
820
+ {
821
+ "name": "CLIP",
822
+ "type": "CLIP",
823
+ "links": null,
824
+ "shape": 3
825
+ },
826
+ {
827
+ "name": "VAE",
828
+ "type": "VAE",
829
+ "links": [],
830
+ "shape": 3,
831
+ "slot_index": 2
832
+ }
833
+ ],
834
+ "properties": {
835
+ "Node name for S&R": "CheckpointLoaderSimple"
836
+ },
837
+ "widgets_values": [
838
+ "sd3.5_medium.safetensors"
839
+ ]
840
+ },
841
+ {
842
+ "id": 71,
843
+ "type": "CLIPTextEncode",
844
+ "pos": [
845
+ -378,
846
+ 1260
847
+ ],
848
+ "size": {
849
+ "0": 351.8130798339844,
850
+ "1": 195.57545471191406
851
+ },
852
+ "flags": {},
853
+ "order": 8,
854
+ "mode": 0,
855
+ "inputs": [
856
+ {
857
+ "name": "clip",
858
+ "type": "CLIP",
859
+ "link": 94
860
+ }
861
+ ],
862
+ "outputs": [
863
+ {
864
+ "name": "CONDITIONING",
865
+ "type": "CONDITIONING",
866
+ "links": [
867
+ 93,
868
+ 597
869
+ ],
870
+ "shape": 3,
871
+ "slot_index": 0
872
+ }
873
+ ],
874
+ "properties": {
875
+ "Node name for S&R": "CLIPTextEncode"
876
+ },
877
+ "widgets_values": [
878
+ ""
879
+ ],
880
+ "color": "#322",
881
+ "bgcolor": "#533"
882
+ },
883
+ {
884
+ "id": 6,
885
+ "type": "CLIPTextEncode",
886
+ "pos": [
887
+ -378,
888
+ 882
889
+ ],
890
+ "size": [
891
+ 342.21509258248534,
892
+ 195.87930444715585
893
+ ],
894
+ "flags": {},
895
+ "order": 7,
896
+ "mode": 0,
897
+ "inputs": [
898
+ {
899
+ "name": "clip",
900
+ "type": "CLIP",
901
+ "link": 5
902
+ }
903
+ ],
904
+ "outputs": [
905
+ {
906
+ "name": "CONDITIONING",
907
+ "type": "CONDITIONING",
908
+ "links": [
909
+ 569
910
+ ],
911
+ "shape": 3,
912
+ "slot_index": 0
913
+ }
914
+ ],
915
+ "properties": {
916
+ "Node name for S&R": "CLIPTextEncode"
917
+ },
918
+ "widgets_values": [
919
+ "cinematic film still, epic, photo of a woman wearing sunglasses"
920
+ ],
921
+ "color": "#232",
922
+ "bgcolor": "#353"
923
+ },
924
+ {
925
+ "id": 324,
926
+ "type": "CLIPTextEncode",
927
+ "pos": [
928
+ -378,
929
+ 1134
930
+ ],
931
+ "size": [
932
+ 346.27611650227504,
933
+ 80.0318642466309
934
+ ],
935
+ "flags": {},
936
+ "order": 9,
937
+ "mode": 0,
938
+ "inputs": [
939
+ {
940
+ "name": "clip",
941
+ "type": "CLIP",
942
+ "link": 662
943
+ }
944
+ ],
945
+ "outputs": [
946
+ {
947
+ "name": "CONDITIONING",
948
+ "type": "CONDITIONING",
949
+ "links": [
950
+ 665
951
+ ],
952
+ "shape": 3,
953
+ "slot_index": 0
954
+ }
955
+ ],
956
+ "properties": {
957
+ "Node name for S&R": "CLIPTextEncode"
958
+ },
959
+ "widgets_values": [
960
+ "cinematic film still, epic, photo of a woman wearing sunglasses"
961
+ ],
962
+ "color": "#232",
963
+ "bgcolor": "#353"
964
+ },
965
+ {
966
+ "id": 329,
967
+ "type": "Note",
968
+ "pos": [
969
+ -630,
970
+ 1134
971
+ ],
972
+ "size": [
973
+ 222.24755928435616,
974
+ 69.25623726364165
975
+ ],
976
+ "flags": {},
977
+ "order": 6,
978
+ "mode": 0,
979
+ "properties": {
980
+ "text": ""
981
+ },
982
+ "widgets_values": [
983
+ "Medium has a token limit on T5. Use a shorter version of the prompt limited to ~70 words or truncate"
984
+ ],
985
+ "color": "#432",
986
+ "bgcolor": "#653"
987
+ }
988
+ ],
989
+ "links": [
990
+ [
991
+ 5,
992
+ 11,
993
+ 0,
994
+ 6,
995
+ 0,
996
+ "CLIP"
997
+ ],
998
+ [
999
+ 90,
1000
+ 67,
1001
+ 0,
1002
+ 68,
1003
+ 0,
1004
+ "CONDITIONING"
1005
+ ],
1006
+ [
1007
+ 91,
1008
+ 68,
1009
+ 0,
1010
+ 69,
1011
+ 0,
1012
+ "CONDITIONING"
1013
+ ],
1014
+ [
1015
+ 92,
1016
+ 70,
1017
+ 0,
1018
+ 69,
1019
+ 1,
1020
+ "CONDITIONING"
1021
+ ],
1022
+ [
1023
+ 93,
1024
+ 71,
1025
+ 0,
1026
+ 70,
1027
+ 0,
1028
+ "CONDITIONING"
1029
+ ],
1030
+ [
1031
+ 94,
1032
+ 11,
1033
+ 0,
1034
+ 71,
1035
+ 0,
1036
+ "CLIP"
1037
+ ],
1038
+ [
1039
+ 274,
1040
+ 8,
1041
+ 0,
1042
+ 50,
1043
+ 0,
1044
+ "IMAGE"
1045
+ ],
1046
+ [
1047
+ 445,
1048
+ 4,
1049
+ 0,
1050
+ 13,
1051
+ 0,
1052
+ "MODEL"
1053
+ ],
1054
+ [
1055
+ 568,
1056
+ 13,
1057
+ 0,
1058
+ 294,
1059
+ 0,
1060
+ "MODEL"
1061
+ ],
1062
+ [
1063
+ 569,
1064
+ 6,
1065
+ 0,
1066
+ 294,
1067
+ 1,
1068
+ "CONDITIONING"
1069
+ ],
1070
+ [
1071
+ 572,
1072
+ 294,
1073
+ 0,
1074
+ 8,
1075
+ 0,
1076
+ "LATENT"
1077
+ ],
1078
+ [
1079
+ 597,
1080
+ 71,
1081
+ 0,
1082
+ 67,
1083
+ 0,
1084
+ "CONDITIONING"
1085
+ ],
1086
+ [
1087
+ 598,
1088
+ 135,
1089
+ 0,
1090
+ 294,
1091
+ 3,
1092
+ "LATENT"
1093
+ ],
1094
+ [
1095
+ 604,
1096
+ 69,
1097
+ 0,
1098
+ 294,
1099
+ 2,
1100
+ "CONDITIONING"
1101
+ ],
1102
+ [
1103
+ 605,
1104
+ 4,
1105
+ 2,
1106
+ 8,
1107
+ 1,
1108
+ "VAE"
1109
+ ],
1110
+ [
1111
+ 606,
1112
+ 301,
1113
+ 0,
1114
+ 302,
1115
+ 0,
1116
+ "MODEL"
1117
+ ],
1118
+ [
1119
+ 616,
1120
+ 4,
1121
+ 2,
1122
+ 308,
1123
+ 1,
1124
+ "VAE"
1125
+ ],
1126
+ [
1127
+ 617,
1128
+ 4,
1129
+ 2,
1130
+ 305,
1131
+ 1,
1132
+ "VAE"
1133
+ ],
1134
+ [
1135
+ 619,
1136
+ 307,
1137
+ 0,
1138
+ 309,
1139
+ 0,
1140
+ "IMAGE"
1141
+ ],
1142
+ [
1143
+ 620,
1144
+ 302,
1145
+ 0,
1146
+ 310,
1147
+ 0,
1148
+ "MODEL"
1149
+ ],
1150
+ [
1151
+ 622,
1152
+ 69,
1153
+ 0,
1154
+ 310,
1155
+ 2,
1156
+ "CONDITIONING"
1157
+ ],
1158
+ [
1159
+ 623,
1160
+ 308,
1161
+ 0,
1162
+ 310,
1163
+ 3,
1164
+ "LATENT"
1165
+ ],
1166
+ [
1167
+ 624,
1168
+ 310,
1169
+ 0,
1170
+ 305,
1171
+ 0,
1172
+ "LATENT"
1173
+ ],
1174
+ [
1175
+ 660,
1176
+ 8,
1177
+ 0,
1178
+ 307,
1179
+ 0,
1180
+ "IMAGE"
1181
+ ],
1182
+ [
1183
+ 662,
1184
+ 11,
1185
+ 0,
1186
+ 324,
1187
+ 0,
1188
+ "CLIP"
1189
+ ],
1190
+ [
1191
+ 665,
1192
+ 324,
1193
+ 0,
1194
+ 310,
1195
+ 1,
1196
+ "CONDITIONING"
1197
+ ],
1198
+ [
1199
+ 670,
1200
+ 305,
1201
+ 0,
1202
+ 306,
1203
+ 0,
1204
+ "IMAGE"
1205
+ ],
1206
+ [
1207
+ 671,
1208
+ 307,
1209
+ 0,
1210
+ 308,
1211
+ 0,
1212
+ "IMAGE"
1213
+ ],
1214
+ [
1215
+ 672,
1216
+ 330,
1217
+ 0,
1218
+ 310,
1219
+ 4,
1220
+ "INT"
1221
+ ]
1222
+ ],
1223
+ "groups": [],
1224
+ "config": {},
1225
+ "extra": {
1226
+ "ds": {
1227
+ "scale": 0.3797498335833178,
1228
+ "offset": [
1229
+ 2577.2791383634726,
1230
+ 94.5657992857425
1231
+ ]
1232
+ }
1233
+ },
1234
+ "version": 0.4
1235
+ }
SD3.5M_SLG_example_workflow.json ADDED
@@ -0,0 +1,1006 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "last_node_id": 305,
3
+ "last_link_id": 627,
4
+ "nodes": [
5
+ {
6
+ "id": 11,
7
+ "type": "TripleCLIPLoader",
8
+ "pos": {
9
+ "0": -2016,
10
+ "1": -252
11
+ },
12
+ "size": {
13
+ "0": 315,
14
+ "1": 106
15
+ },
16
+ "flags": {},
17
+ "order": 0,
18
+ "mode": 0,
19
+ "inputs": [],
20
+ "outputs": [
21
+ {
22
+ "name": "CLIP",
23
+ "type": "CLIP",
24
+ "links": [
25
+ 5,
26
+ 94
27
+ ],
28
+ "slot_index": 0,
29
+ "shape": 3
30
+ }
31
+ ],
32
+ "properties": {
33
+ "Node name for S&R": "TripleCLIPLoader"
34
+ },
35
+ "widgets_values": [
36
+ "sdv3/clip_g.safetensors",
37
+ "sdv3/clip_l.safetensors",
38
+ "sdv3/t5xxl_fp16.safetensors"
39
+ ]
40
+ },
41
+ {
42
+ "id": 303,
43
+ "type": "VAEDecode",
44
+ "pos": {
45
+ "0": 1381,
46
+ "1": 233
47
+ },
48
+ "size": {
49
+ "0": 210,
50
+ "1": 46
51
+ },
52
+ "flags": {},
53
+ "order": 15,
54
+ "mode": 0,
55
+ "inputs": [
56
+ {
57
+ "name": "samples",
58
+ "type": "LATENT",
59
+ "link": 612
60
+ },
61
+ {
62
+ "name": "vae",
63
+ "type": "VAE",
64
+ "link": 614
65
+ }
66
+ ],
67
+ "outputs": [
68
+ {
69
+ "name": "IMAGE",
70
+ "type": "IMAGE",
71
+ "links": [
72
+ 613
73
+ ],
74
+ "slot_index": 0,
75
+ "shape": 3
76
+ }
77
+ ],
78
+ "properties": {
79
+ "Node name for S&R": "VAEDecode"
80
+ },
81
+ "widgets_values": []
82
+ },
83
+ {
84
+ "id": 105,
85
+ "type": "Note",
86
+ "pos": {
87
+ "0": -1484,
88
+ "1": -249
89
+ },
90
+ "size": {
91
+ "0": 210,
92
+ "1": 110.18948364257812
93
+ },
94
+ "flags": {},
95
+ "order": 1,
96
+ "mode": 0,
97
+ "inputs": [],
98
+ "outputs": [],
99
+ "properties": {
100
+ "text": ""
101
+ },
102
+ "widgets_values": [
103
+ "Make sure the resolution is multiple of 64 pixels and adds up to around 1 megapixel. "
104
+ ],
105
+ "color": "#432",
106
+ "bgcolor": "#653"
107
+ },
108
+ {
109
+ "id": 304,
110
+ "type": "PreviewImage",
111
+ "pos": {
112
+ "0": 1758,
113
+ "1": 150
114
+ },
115
+ "size": {
116
+ "0": 616.689697265625,
117
+ "1": 613.84130859375
118
+ },
119
+ "flags": {},
120
+ "order": 17,
121
+ "mode": 0,
122
+ "inputs": [
123
+ {
124
+ "name": "images",
125
+ "type": "IMAGE",
126
+ "link": 613
127
+ }
128
+ ],
129
+ "outputs": [],
130
+ "properties": {
131
+ "Node name for S&R": "PreviewImage"
132
+ },
133
+ "widgets_values": []
134
+ },
135
+ {
136
+ "id": 50,
137
+ "type": "PreviewImage",
138
+ "pos": {
139
+ "0": 1764,
140
+ "1": -504
141
+ },
142
+ "size": {
143
+ "0": 616.689697265625,
144
+ "1": 613.84130859375
145
+ },
146
+ "flags": {},
147
+ "order": 18,
148
+ "mode": 0,
149
+ "inputs": [
150
+ {
151
+ "name": "images",
152
+ "type": "IMAGE",
153
+ "link": 274
154
+ }
155
+ ],
156
+ "outputs": [],
157
+ "properties": {
158
+ "Node name for S&R": "PreviewImage"
159
+ },
160
+ "widgets_values": []
161
+ },
162
+ {
163
+ "id": 67,
164
+ "type": "ConditioningZeroOut",
165
+ "pos": {
166
+ "0": -1103,
167
+ "1": 454
168
+ },
169
+ "size": {
170
+ "0": 211.60000610351562,
171
+ "1": 26
172
+ },
173
+ "flags": {},
174
+ "order": 8,
175
+ "mode": 0,
176
+ "inputs": [
177
+ {
178
+ "name": "conditioning",
179
+ "type": "CONDITIONING",
180
+ "link": 597
181
+ }
182
+ ],
183
+ "outputs": [
184
+ {
185
+ "name": "CONDITIONING",
186
+ "type": "CONDITIONING",
187
+ "links": [
188
+ 90
189
+ ],
190
+ "slot_index": 0,
191
+ "shape": 3
192
+ }
193
+ ],
194
+ "properties": {
195
+ "Node name for S&R": "ConditioningZeroOut"
196
+ },
197
+ "widgets_values": []
198
+ },
199
+ {
200
+ "id": 68,
201
+ "type": "ConditioningSetTimestepRange",
202
+ "pos": {
203
+ "0": -839,
204
+ "1": 442
205
+ },
206
+ "size": {
207
+ "0": 317.4000244140625,
208
+ "1": 82
209
+ },
210
+ "flags": {},
211
+ "order": 11,
212
+ "mode": 0,
213
+ "inputs": [
214
+ {
215
+ "name": "conditioning",
216
+ "type": "CONDITIONING",
217
+ "link": 90
218
+ }
219
+ ],
220
+ "outputs": [
221
+ {
222
+ "name": "CONDITIONING",
223
+ "type": "CONDITIONING",
224
+ "links": [
225
+ 91
226
+ ],
227
+ "slot_index": 0,
228
+ "shape": 3
229
+ }
230
+ ],
231
+ "properties": {
232
+ "Node name for S&R": "ConditioningSetTimestepRange"
233
+ },
234
+ "widgets_values": [
235
+ 0.1,
236
+ 1
237
+ ]
238
+ },
239
+ {
240
+ "id": 69,
241
+ "type": "ConditioningCombine",
242
+ "pos": {
243
+ "0": -129,
244
+ "1": 290
245
+ },
246
+ "size": {
247
+ "0": 228.39999389648438,
248
+ "1": 46
249
+ },
250
+ "flags": {},
251
+ "order": 12,
252
+ "mode": 0,
253
+ "inputs": [
254
+ {
255
+ "name": "conditioning_1",
256
+ "type": "CONDITIONING",
257
+ "link": 91
258
+ },
259
+ {
260
+ "name": "conditioning_2",
261
+ "type": "CONDITIONING",
262
+ "link": 92
263
+ }
264
+ ],
265
+ "outputs": [
266
+ {
267
+ "name": "CONDITIONING",
268
+ "type": "CONDITIONING",
269
+ "links": [
270
+ 621,
271
+ 625
272
+ ],
273
+ "slot_index": 0,
274
+ "shape": 3
275
+ }
276
+ ],
277
+ "properties": {
278
+ "Node name for S&R": "ConditioningCombine"
279
+ },
280
+ "widgets_values": []
281
+ },
282
+ {
283
+ "id": 13,
284
+ "type": "ModelSamplingSD3",
285
+ "pos": {
286
+ "0": -424,
287
+ "1": -516
288
+ },
289
+ "size": {
290
+ "0": 315,
291
+ "1": 58
292
+ },
293
+ "flags": {
294
+ "collapsed": false
295
+ },
296
+ "order": 7,
297
+ "mode": 0,
298
+ "inputs": [
299
+ {
300
+ "name": "model",
301
+ "type": "MODEL",
302
+ "link": 445
303
+ }
304
+ ],
305
+ "outputs": [
306
+ {
307
+ "name": "MODEL",
308
+ "type": "MODEL",
309
+ "links": [
310
+ 606,
311
+ 618
312
+ ],
313
+ "slot_index": 0,
314
+ "shape": 3
315
+ }
316
+ ],
317
+ "properties": {
318
+ "Node name for S&R": "ModelSamplingSD3"
319
+ },
320
+ "widgets_values": [
321
+ 3
322
+ ]
323
+ },
324
+ {
325
+ "id": 135,
326
+ "type": "EmptySD3LatentImage",
327
+ "pos": {
328
+ "0": -1195,
329
+ "1": -251
330
+ },
331
+ "size": {
332
+ "0": 315,
333
+ "1": 106
334
+ },
335
+ "flags": {},
336
+ "order": 2,
337
+ "mode": 0,
338
+ "inputs": [],
339
+ "outputs": [
340
+ {
341
+ "name": "LATENT",
342
+ "type": "LATENT",
343
+ "links": [
344
+ 598,
345
+ 611
346
+ ],
347
+ "slot_index": 0,
348
+ "shape": 3
349
+ }
350
+ ],
351
+ "properties": {
352
+ "Node name for S&R": "EmptySD3LatentImage"
353
+ },
354
+ "widgets_values": [
355
+ 1280,
356
+ 768,
357
+ 1
358
+ ]
359
+ },
360
+ {
361
+ "id": 8,
362
+ "type": "VAEDecode",
363
+ "pos": {
364
+ "0": 1387,
365
+ "1": -415
366
+ },
367
+ "size": {
368
+ "0": 210,
369
+ "1": 46
370
+ },
371
+ "flags": {},
372
+ "order": 16,
373
+ "mode": 0,
374
+ "inputs": [
375
+ {
376
+ "name": "samples",
377
+ "type": "LATENT",
378
+ "link": 572
379
+ },
380
+ {
381
+ "name": "vae",
382
+ "type": "VAE",
383
+ "link": 605
384
+ }
385
+ ],
386
+ "outputs": [
387
+ {
388
+ "name": "IMAGE",
389
+ "type": "IMAGE",
390
+ "links": [
391
+ 274
392
+ ],
393
+ "slot_index": 0,
394
+ "shape": 3
395
+ }
396
+ ],
397
+ "properties": {
398
+ "Node name for S&R": "VAEDecode"
399
+ },
400
+ "widgets_values": []
401
+ },
402
+ {
403
+ "id": 4,
404
+ "type": "CheckpointLoaderSimple",
405
+ "pos": {
406
+ "0": -2016,
407
+ "1": -504
408
+ },
409
+ "size": [
410
+ 311.9781150464221,
411
+ 99.19846549382407
412
+ ],
413
+ "flags": {},
414
+ "order": 3,
415
+ "mode": 0,
416
+ "inputs": [],
417
+ "outputs": [
418
+ {
419
+ "name": "MODEL",
420
+ "type": "MODEL",
421
+ "links": [
422
+ 445
423
+ ],
424
+ "slot_index": 0,
425
+ "shape": 3
426
+ },
427
+ {
428
+ "name": "CLIP",
429
+ "type": "CLIP",
430
+ "links": null,
431
+ "shape": 3
432
+ },
433
+ {
434
+ "name": "VAE",
435
+ "type": "VAE",
436
+ "links": [
437
+ 605,
438
+ 614
439
+ ],
440
+ "slot_index": 2,
441
+ "shape": 3
442
+ }
443
+ ],
444
+ "properties": {
445
+ "Node name for S&R": "CheckpointLoaderSimple"
446
+ },
447
+ "widgets_values": [
448
+ "sd3.5_medium.safetensors"
449
+ ]
450
+ },
451
+ {
452
+ "id": 302,
453
+ "type": "KSampler",
454
+ "pos": {
455
+ "0": 962,
456
+ "1": 236
457
+ },
458
+ "size": {
459
+ "0": 378,
460
+ "1": 504
461
+ },
462
+ "flags": {},
463
+ "order": 13,
464
+ "mode": 0,
465
+ "inputs": [
466
+ {
467
+ "name": "model",
468
+ "type": "MODEL",
469
+ "link": 618
470
+ },
471
+ {
472
+ "name": "positive",
473
+ "type": "CONDITIONING",
474
+ "link": 610
475
+ },
476
+ {
477
+ "name": "negative",
478
+ "type": "CONDITIONING",
479
+ "link": 621
480
+ },
481
+ {
482
+ "name": "latent_image",
483
+ "type": "LATENT",
484
+ "link": 611
485
+ },
486
+ {
487
+ "name": "seed",
488
+ "type": "INT",
489
+ "link": 617,
490
+ "widget": {
491
+ "name": "seed"
492
+ }
493
+ }
494
+ ],
495
+ "outputs": [
496
+ {
497
+ "name": "LATENT",
498
+ "type": "LATENT",
499
+ "links": [
500
+ 612
501
+ ],
502
+ "slot_index": 0,
503
+ "shape": 3
504
+ }
505
+ ],
506
+ "properties": {
507
+ "Node name for S&R": "KSampler"
508
+ },
509
+ "widgets_values": [
510
+ 42,
511
+ "randomize",
512
+ 50,
513
+ 5,
514
+ "dpmpp_2m",
515
+ "sgm_uniform",
516
+ 1
517
+ ]
518
+ },
519
+ {
520
+ "id": 301,
521
+ "type": "SkipLayerGuidanceSD3",
522
+ "pos": {
523
+ "0": 234,
524
+ "1": -513
525
+ },
526
+ "size": {
527
+ "0": 315,
528
+ "1": 130
529
+ },
530
+ "flags": {},
531
+ "order": 10,
532
+ "mode": 0,
533
+ "inputs": [
534
+ {
535
+ "name": "model",
536
+ "type": "MODEL",
537
+ "link": 606
538
+ }
539
+ ],
540
+ "outputs": [
541
+ {
542
+ "name": "MODEL",
543
+ "type": "MODEL",
544
+ "links": [
545
+ 607
546
+ ],
547
+ "slot_index": 0
548
+ }
549
+ ],
550
+ "properties": {
551
+ "Node name for S&R": "SkipLayerGuidanceSD3"
552
+ },
553
+ "widgets_values": [
554
+ "7,8,9",
555
+ 2,
556
+ 0.01,
557
+ 0.15
558
+ ]
559
+ },
560
+ {
561
+ "id": 70,
562
+ "type": "ConditioningSetTimestepRange",
563
+ "pos": {
564
+ "0": -851,
565
+ "1": 274
566
+ },
567
+ "size": {
568
+ "0": 317.4000244140625,
569
+ "1": 82
570
+ },
571
+ "flags": {},
572
+ "order": 9,
573
+ "mode": 0,
574
+ "inputs": [
575
+ {
576
+ "name": "conditioning",
577
+ "type": "CONDITIONING",
578
+ "link": 627,
579
+ "slot_index": 0
580
+ }
581
+ ],
582
+ "outputs": [
583
+ {
584
+ "name": "CONDITIONING",
585
+ "type": "CONDITIONING",
586
+ "links": [
587
+ 92
588
+ ],
589
+ "slot_index": 0,
590
+ "shape": 3
591
+ }
592
+ ],
593
+ "properties": {
594
+ "Node name for S&R": "ConditioningSetTimestepRange"
595
+ },
596
+ "widgets_values": [
597
+ 0,
598
+ 0.1
599
+ ]
600
+ },
601
+ {
602
+ "id": 71,
603
+ "type": "CLIPTextEncode",
604
+ "pos": {
605
+ "0": -1547,
606
+ "1": 348
607
+ },
608
+ "size": {
609
+ "0": 351.8130798339844,
610
+ "1": 195.57545471191406
611
+ },
612
+ "flags": {},
613
+ "order": 6,
614
+ "mode": 0,
615
+ "inputs": [
616
+ {
617
+ "name": "clip",
618
+ "type": "CLIP",
619
+ "link": 94
620
+ }
621
+ ],
622
+ "outputs": [
623
+ {
624
+ "name": "CONDITIONING",
625
+ "type": "CONDITIONING",
626
+ "links": [
627
+ 597,
628
+ 627
629
+ ],
630
+ "slot_index": 0,
631
+ "shape": 3
632
+ }
633
+ ],
634
+ "properties": {
635
+ "Node name for S&R": "CLIPTextEncode"
636
+ },
637
+ "widgets_values": [
638
+ ""
639
+ ],
640
+ "color": "#322",
641
+ "bgcolor": "#533"
642
+ },
643
+ {
644
+ "id": 294,
645
+ "type": "KSampler",
646
+ "pos": {
647
+ "0": 969,
648
+ "1": -417
649
+ },
650
+ "size": {
651
+ "0": 378,
652
+ "1": 504
653
+ },
654
+ "flags": {},
655
+ "order": 14,
656
+ "mode": 0,
657
+ "inputs": [
658
+ {
659
+ "name": "model",
660
+ "type": "MODEL",
661
+ "link": 607
662
+ },
663
+ {
664
+ "name": "positive",
665
+ "type": "CONDITIONING",
666
+ "link": 626
667
+ },
668
+ {
669
+ "name": "negative",
670
+ "type": "CONDITIONING",
671
+ "link": 625
672
+ },
673
+ {
674
+ "name": "latent_image",
675
+ "type": "LATENT",
676
+ "link": 598
677
+ },
678
+ {
679
+ "name": "seed",
680
+ "type": "INT",
681
+ "link": 616,
682
+ "widget": {
683
+ "name": "seed"
684
+ }
685
+ }
686
+ ],
687
+ "outputs": [
688
+ {
689
+ "name": "LATENT",
690
+ "type": "LATENT",
691
+ "links": [
692
+ 572
693
+ ],
694
+ "slot_index": 0,
695
+ "shape": 3
696
+ }
697
+ ],
698
+ "properties": {
699
+ "Node name for S&R": "KSampler"
700
+ },
701
+ "widgets_values": [
702
+ 42,
703
+ "randomize",
704
+ 50,
705
+ 4,
706
+ "dpmpp_2m",
707
+ "sgm_uniform",
708
+ 1
709
+ ]
710
+ },
711
+ {
712
+ "id": 305,
713
+ "type": "PrimitiveNode",
714
+ "pos": {
715
+ "0": -155,
716
+ "1": -674
717
+ },
718
+ "size": {
719
+ "0": 285.3897399902344,
720
+ "1": 86.61906433105469
721
+ },
722
+ "flags": {},
723
+ "order": 4,
724
+ "mode": 0,
725
+ "inputs": [],
726
+ "outputs": [
727
+ {
728
+ "name": "INT",
729
+ "type": "INT",
730
+ "links": [
731
+ 616,
732
+ 617
733
+ ],
734
+ "slot_index": 0,
735
+ "widget": {
736
+ "name": "seed"
737
+ }
738
+ }
739
+ ],
740
+ "title": "seed",
741
+ "properties": {
742
+ "Run widget replace on values": false
743
+ },
744
+ "widgets_values": [
745
+ 42,
746
+ "fixed"
747
+ ]
748
+ },
749
+ {
750
+ "id": 6,
751
+ "type": "CLIPTextEncode",
752
+ "pos": {
753
+ "0": -1547,
754
+ "1": 123
755
+ },
756
+ "size": {
757
+ "0": 342.8335266113281,
758
+ "1": 177.20867919921875
759
+ },
760
+ "flags": {},
761
+ "order": 5,
762
+ "mode": 0,
763
+ "inputs": [
764
+ {
765
+ "name": "clip",
766
+ "type": "CLIP",
767
+ "link": 5
768
+ }
769
+ ],
770
+ "outputs": [
771
+ {
772
+ "name": "CONDITIONING",
773
+ "type": "CONDITIONING",
774
+ "links": [
775
+ 610,
776
+ 626
777
+ ],
778
+ "slot_index": 0,
779
+ "shape": 3
780
+ }
781
+ ],
782
+ "properties": {
783
+ "Node name for S&R": "CLIPTextEncode"
784
+ },
785
+ "widgets_values": [
786
+ "photorealistic photography girl floating in air in white dress\n"
787
+ ],
788
+ "color": "#232",
789
+ "bgcolor": "#353"
790
+ }
791
+ ],
792
+ "links": [
793
+ [
794
+ 5,
795
+ 11,
796
+ 0,
797
+ 6,
798
+ 0,
799
+ "CLIP"
800
+ ],
801
+ [
802
+ 90,
803
+ 67,
804
+ 0,
805
+ 68,
806
+ 0,
807
+ "CONDITIONING"
808
+ ],
809
+ [
810
+ 91,
811
+ 68,
812
+ 0,
813
+ 69,
814
+ 0,
815
+ "CONDITIONING"
816
+ ],
817
+ [
818
+ 92,
819
+ 70,
820
+ 0,
821
+ 69,
822
+ 1,
823
+ "CONDITIONING"
824
+ ],
825
+ [
826
+ 94,
827
+ 11,
828
+ 0,
829
+ 71,
830
+ 0,
831
+ "CLIP"
832
+ ],
833
+ [
834
+ 274,
835
+ 8,
836
+ 0,
837
+ 50,
838
+ 0,
839
+ "IMAGE"
840
+ ],
841
+ [
842
+ 445,
843
+ 4,
844
+ 0,
845
+ 13,
846
+ 0,
847
+ "MODEL"
848
+ ],
849
+ [
850
+ 572,
851
+ 294,
852
+ 0,
853
+ 8,
854
+ 0,
855
+ "LATENT"
856
+ ],
857
+ [
858
+ 597,
859
+ 71,
860
+ 0,
861
+ 67,
862
+ 0,
863
+ "CONDITIONING"
864
+ ],
865
+ [
866
+ 598,
867
+ 135,
868
+ 0,
869
+ 294,
870
+ 3,
871
+ "LATENT"
872
+ ],
873
+ [
874
+ 605,
875
+ 4,
876
+ 2,
877
+ 8,
878
+ 1,
879
+ "VAE"
880
+ ],
881
+ [
882
+ 606,
883
+ 13,
884
+ 0,
885
+ 301,
886
+ 0,
887
+ "MODEL"
888
+ ],
889
+ [
890
+ 607,
891
+ 301,
892
+ 0,
893
+ 294,
894
+ 0,
895
+ "MODEL"
896
+ ],
897
+ [
898
+ 610,
899
+ 6,
900
+ 0,
901
+ 302,
902
+ 1,
903
+ "CONDITIONING"
904
+ ],
905
+ [
906
+ 611,
907
+ 135,
908
+ 0,
909
+ 302,
910
+ 3,
911
+ "LATENT"
912
+ ],
913
+ [
914
+ 612,
915
+ 302,
916
+ 0,
917
+ 303,
918
+ 0,
919
+ "LATENT"
920
+ ],
921
+ [
922
+ 613,
923
+ 303,
924
+ 0,
925
+ 304,
926
+ 0,
927
+ "IMAGE"
928
+ ],
929
+ [
930
+ 614,
931
+ 4,
932
+ 2,
933
+ 303,
934
+ 1,
935
+ "VAE"
936
+ ],
937
+ [
938
+ 616,
939
+ 305,
940
+ 0,
941
+ 294,
942
+ 4,
943
+ "INT"
944
+ ],
945
+ [
946
+ 617,
947
+ 305,
948
+ 0,
949
+ 302,
950
+ 4,
951
+ "INT"
952
+ ],
953
+ [
954
+ 618,
955
+ 13,
956
+ 0,
957
+ 302,
958
+ 0,
959
+ "MODEL"
960
+ ],
961
+ [
962
+ 621,
963
+ 69,
964
+ 0,
965
+ 302,
966
+ 2,
967
+ "CONDITIONING"
968
+ ],
969
+ [
970
+ 625,
971
+ 69,
972
+ 0,
973
+ 294,
974
+ 2,
975
+ "CONDITIONING"
976
+ ],
977
+ [
978
+ 626,
979
+ 6,
980
+ 0,
981
+ 294,
982
+ 1,
983
+ "CONDITIONING"
984
+ ],
985
+ [
986
+ 627,
987
+ 71,
988
+ 0,
989
+ 70,
990
+ 0,
991
+ "CONDITIONING"
992
+ ]
993
+ ],
994
+ "groups": [],
995
+ "config": {},
996
+ "extra": {
997
+ "ds": {
998
+ "scale": 1.0834705943388945,
999
+ "offset": [
1000
+ 2786.463291970421,
1001
+ 276.88316957958125
1002
+ ]
1003
+ }
1004
+ },
1005
+ "version": 0.4
1006
+ }
SD3.5M_example_workflow.json ADDED
@@ -0,0 +1,697 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "last_node_id": 300,
3
+ "last_link_id": 605,
4
+ "nodes": [
5
+ {
6
+ "id": 67,
7
+ "type": "ConditioningZeroOut",
8
+ "pos": {
9
+ "0": -126,
10
+ "1": 126
11
+ },
12
+ "size": {
13
+ "0": 211.60000610351562,
14
+ "1": 26
15
+ },
16
+ "flags": {},
17
+ "order": 8,
18
+ "mode": 0,
19
+ "inputs": [
20
+ {
21
+ "name": "conditioning",
22
+ "type": "CONDITIONING",
23
+ "link": 597
24
+ }
25
+ ],
26
+ "outputs": [
27
+ {
28
+ "name": "CONDITIONING",
29
+ "type": "CONDITIONING",
30
+ "links": [
31
+ 90
32
+ ],
33
+ "slot_index": 0,
34
+ "shape": 3
35
+ }
36
+ ],
37
+ "properties": {
38
+ "Node name for S&R": "ConditioningZeroOut"
39
+ },
40
+ "widgets_values": []
41
+ },
42
+ {
43
+ "id": 71,
44
+ "type": "CLIPTextEncode",
45
+ "pos": {
46
+ "0": -1010,
47
+ "1": 252
48
+ },
49
+ "size": {
50
+ "0": 351.8130798339844,
51
+ "1": 195.57545471191406
52
+ },
53
+ "flags": {},
54
+ "order": 6,
55
+ "mode": 0,
56
+ "inputs": [
57
+ {
58
+ "name": "clip",
59
+ "type": "CLIP",
60
+ "link": 94
61
+ }
62
+ ],
63
+ "outputs": [
64
+ {
65
+ "name": "CONDITIONING",
66
+ "type": "CONDITIONING",
67
+ "links": [
68
+ 93,
69
+ 597
70
+ ],
71
+ "slot_index": 0,
72
+ "shape": 3
73
+ }
74
+ ],
75
+ "properties": {
76
+ "Node name for S&R": "CLIPTextEncode"
77
+ },
78
+ "widgets_values": [
79
+ ""
80
+ ],
81
+ "color": "#322",
82
+ "bgcolor": "#533"
83
+ },
84
+ {
85
+ "id": 6,
86
+ "type": "CLIPTextEncode",
87
+ "pos": {
88
+ "0": -1008,
89
+ "1": 2
90
+ },
91
+ "size": {
92
+ "0": 342.8335266113281,
93
+ "1": 177.20867919921875
94
+ },
95
+ "flags": {},
96
+ "order": 5,
97
+ "mode": 0,
98
+ "inputs": [
99
+ {
100
+ "name": "clip",
101
+ "type": "CLIP",
102
+ "link": 5
103
+ }
104
+ ],
105
+ "outputs": [
106
+ {
107
+ "name": "CONDITIONING",
108
+ "type": "CONDITIONING",
109
+ "links": [
110
+ 569
111
+ ],
112
+ "slot_index": 0,
113
+ "shape": 3
114
+ }
115
+ ],
116
+ "properties": {
117
+ "Node name for S&R": "CLIPTextEncode"
118
+ },
119
+ "widgets_values": [
120
+ "beautiful scenery nature glass bottle landscape, purple galaxy bottle,"
121
+ ],
122
+ "color": "#232",
123
+ "bgcolor": "#353"
124
+ },
125
+ {
126
+ "id": 69,
127
+ "type": "ConditioningCombine",
128
+ "pos": {
129
+ "0": 504,
130
+ "1": 126
131
+ },
132
+ "size": {
133
+ "0": 228.39999389648438,
134
+ "1": 46
135
+ },
136
+ "flags": {},
137
+ "order": 10,
138
+ "mode": 0,
139
+ "inputs": [
140
+ {
141
+ "name": "conditioning_1",
142
+ "type": "CONDITIONING",
143
+ "link": 91
144
+ },
145
+ {
146
+ "name": "conditioning_2",
147
+ "type": "CONDITIONING",
148
+ "link": 92
149
+ }
150
+ ],
151
+ "outputs": [
152
+ {
153
+ "name": "CONDITIONING",
154
+ "type": "CONDITIONING",
155
+ "links": [
156
+ 604
157
+ ],
158
+ "slot_index": 0,
159
+ "shape": 3
160
+ }
161
+ ],
162
+ "properties": {
163
+ "Node name for S&R": "ConditioningCombine"
164
+ },
165
+ "widgets_values": []
166
+ },
167
+ {
168
+ "id": 8,
169
+ "type": "VAEDecode",
170
+ "pos": {
171
+ "0": 1386,
172
+ "1": -504
173
+ },
174
+ "size": {
175
+ "0": 210,
176
+ "1": 46
177
+ },
178
+ "flags": {},
179
+ "order": 12,
180
+ "mode": 0,
181
+ "inputs": [
182
+ {
183
+ "name": "samples",
184
+ "type": "LATENT",
185
+ "link": 572
186
+ },
187
+ {
188
+ "name": "vae",
189
+ "type": "VAE",
190
+ "link": 605
191
+ }
192
+ ],
193
+ "outputs": [
194
+ {
195
+ "name": "IMAGE",
196
+ "type": "IMAGE",
197
+ "links": [
198
+ 274
199
+ ],
200
+ "slot_index": 0,
201
+ "shape": 3
202
+ }
203
+ ],
204
+ "properties": {
205
+ "Node name for S&R": "VAEDecode"
206
+ },
207
+ "widgets_values": []
208
+ },
209
+ {
210
+ "id": 50,
211
+ "type": "PreviewImage",
212
+ "pos": {
213
+ "0": 1764,
214
+ "1": -504
215
+ },
216
+ "size": {
217
+ "0": 616.689697265625,
218
+ "1": 613.84130859375
219
+ },
220
+ "flags": {},
221
+ "order": 13,
222
+ "mode": 0,
223
+ "inputs": [
224
+ {
225
+ "name": "images",
226
+ "type": "IMAGE",
227
+ "link": 274
228
+ }
229
+ ],
230
+ "outputs": [],
231
+ "properties": {
232
+ "Node name for S&R": "PreviewImage"
233
+ },
234
+ "widgets_values": []
235
+ },
236
+ {
237
+ "id": 68,
238
+ "type": "ConditioningSetTimestepRange",
239
+ "pos": {
240
+ "0": 126,
241
+ "1": 126
242
+ },
243
+ "size": {
244
+ "0": 317.4000244140625,
245
+ "1": 82
246
+ },
247
+ "flags": {},
248
+ "order": 9,
249
+ "mode": 0,
250
+ "inputs": [
251
+ {
252
+ "name": "conditioning",
253
+ "type": "CONDITIONING",
254
+ "link": 90
255
+ }
256
+ ],
257
+ "outputs": [
258
+ {
259
+ "name": "CONDITIONING",
260
+ "type": "CONDITIONING",
261
+ "links": [
262
+ 91
263
+ ],
264
+ "slot_index": 0,
265
+ "shape": 3
266
+ }
267
+ ],
268
+ "properties": {
269
+ "Node name for S&R": "ConditioningSetTimestepRange"
270
+ },
271
+ "widgets_values": [
272
+ 0.2,
273
+ 1
274
+ ]
275
+ },
276
+ {
277
+ "id": 70,
278
+ "type": "ConditioningSetTimestepRange",
279
+ "pos": {
280
+ "0": 126,
281
+ "1": 252
282
+ },
283
+ "size": {
284
+ "0": 317.4000244140625,
285
+ "1": 82
286
+ },
287
+ "flags": {},
288
+ "order": 7,
289
+ "mode": 0,
290
+ "inputs": [
291
+ {
292
+ "name": "conditioning",
293
+ "type": "CONDITIONING",
294
+ "link": 93,
295
+ "slot_index": 0
296
+ }
297
+ ],
298
+ "outputs": [
299
+ {
300
+ "name": "CONDITIONING",
301
+ "type": "CONDITIONING",
302
+ "links": [
303
+ 92
304
+ ],
305
+ "slot_index": 0,
306
+ "shape": 3
307
+ }
308
+ ],
309
+ "properties": {
310
+ "Node name for S&R": "ConditioningSetTimestepRange"
311
+ },
312
+ "widgets_values": [
313
+ 0,
314
+ 0.2
315
+ ]
316
+ },
317
+ {
318
+ "id": 4,
319
+ "type": "CheckpointLoaderSimple",
320
+ "pos": {
321
+ "0": -2016,
322
+ "1": -504
323
+ },
324
+ "size": {
325
+ "0": 632.6060180664062,
326
+ "1": 98
327
+ },
328
+ "flags": {},
329
+ "order": 0,
330
+ "mode": 0,
331
+ "inputs": [],
332
+ "outputs": [
333
+ {
334
+ "name": "MODEL",
335
+ "type": "MODEL",
336
+ "links": [
337
+ 445
338
+ ],
339
+ "slot_index": 0,
340
+ "shape": 3
341
+ },
342
+ {
343
+ "name": "CLIP",
344
+ "type": "CLIP",
345
+ "links": null,
346
+ "shape": 3
347
+ },
348
+ {
349
+ "name": "VAE",
350
+ "type": "VAE",
351
+ "links": [
352
+ 605
353
+ ],
354
+ "slot_index": 2,
355
+ "shape": 3
356
+ }
357
+ ],
358
+ "properties": {
359
+ "Node name for S&R": "CheckpointLoaderSimple"
360
+ },
361
+ "widgets_values": [
362
+ "sd3.5_medium.safetensors"
363
+ ]
364
+ },
365
+ {
366
+ "id": 11,
367
+ "type": "TripleCLIPLoader",
368
+ "pos": {
369
+ "0": -2016,
370
+ "1": -252
371
+ },
372
+ "size": {
373
+ "0": 315,
374
+ "1": 106
375
+ },
376
+ "flags": {},
377
+ "order": 1,
378
+ "mode": 0,
379
+ "inputs": [],
380
+ "outputs": [
381
+ {
382
+ "name": "CLIP",
383
+ "type": "CLIP",
384
+ "links": [
385
+ 5,
386
+ 94
387
+ ],
388
+ "slot_index": 0,
389
+ "shape": 3
390
+ }
391
+ ],
392
+ "properties": {
393
+ "Node name for S&R": "TripleCLIPLoader"
394
+ },
395
+ "widgets_values": [
396
+ "sdv3/clip_g.safetensors",
397
+ "sdv3/clip_l.safetensors",
398
+ "sdv3/t5xxl_fp16.safetensors"
399
+ ]
400
+ },
401
+ {
402
+ "id": 105,
403
+ "type": "Note",
404
+ "pos": {
405
+ "0": -1260,
406
+ "1": -252
407
+ },
408
+ "size": {
409
+ "0": 210,
410
+ "1": 110.18948364257812
411
+ },
412
+ "flags": {},
413
+ "order": 2,
414
+ "mode": 0,
415
+ "inputs": [],
416
+ "outputs": [],
417
+ "properties": {
418
+ "text": ""
419
+ },
420
+ "widgets_values": [
421
+ "Make sure the resolution is multiple of 64 pixels and adds up to around 1 megapixel. "
422
+ ],
423
+ "color": "#432",
424
+ "bgcolor": "#653"
425
+ },
426
+ {
427
+ "id": 135,
428
+ "type": "EmptySD3LatentImage",
429
+ "pos": {
430
+ "0": -1008,
431
+ "1": -252
432
+ },
433
+ "size": {
434
+ "0": 315,
435
+ "1": 106
436
+ },
437
+ "flags": {},
438
+ "order": 3,
439
+ "mode": 0,
440
+ "inputs": [],
441
+ "outputs": [
442
+ {
443
+ "name": "LATENT",
444
+ "type": "LATENT",
445
+ "links": [
446
+ 598
447
+ ],
448
+ "slot_index": 0,
449
+ "shape": 3
450
+ }
451
+ ],
452
+ "properties": {
453
+ "Node name for S&R": "EmptySD3LatentImage"
454
+ },
455
+ "widgets_values": [
456
+ 1280,
457
+ 768,
458
+ 1
459
+ ]
460
+ },
461
+ {
462
+ "id": 294,
463
+ "type": "KSampler",
464
+ "pos": {
465
+ "0": 882,
466
+ "1": -504
467
+ },
468
+ "size": {
469
+ "0": 378,
470
+ "1": 504
471
+ },
472
+ "flags": {},
473
+ "order": 11,
474
+ "mode": 0,
475
+ "inputs": [
476
+ {
477
+ "name": "model",
478
+ "type": "MODEL",
479
+ "link": 568
480
+ },
481
+ {
482
+ "name": "positive",
483
+ "type": "CONDITIONING",
484
+ "link": 569
485
+ },
486
+ {
487
+ "name": "negative",
488
+ "type": "CONDITIONING",
489
+ "link": 604
490
+ },
491
+ {
492
+ "name": "latent_image",
493
+ "type": "LATENT",
494
+ "link": 598
495
+ }
496
+ ],
497
+ "outputs": [
498
+ {
499
+ "name": "LATENT",
500
+ "type": "LATENT",
501
+ "links": [
502
+ 572
503
+ ],
504
+ "slot_index": 0,
505
+ "shape": 3
506
+ }
507
+ ],
508
+ "properties": {
509
+ "Node name for S&R": "KSampler"
510
+ },
511
+ "widgets_values": [
512
+ 193277626003815,
513
+ "randomize",
514
+ 40,
515
+ 5.5,
516
+ "dpmpp_2m",
517
+ "sgm_uniform",
518
+ 1
519
+ ]
520
+ },
521
+ {
522
+ "id": 13,
523
+ "type": "ModelSamplingSD3",
524
+ "pos": {
525
+ "0": -192,
526
+ "1": -507
527
+ },
528
+ "size": {
529
+ "0": 315,
530
+ "1": 58
531
+ },
532
+ "flags": {
533
+ "collapsed": false
534
+ },
535
+ "order": 4,
536
+ "mode": 0,
537
+ "inputs": [
538
+ {
539
+ "name": "model",
540
+ "type": "MODEL",
541
+ "link": 445
542
+ }
543
+ ],
544
+ "outputs": [
545
+ {
546
+ "name": "MODEL",
547
+ "type": "MODEL",
548
+ "links": [
549
+ 568
550
+ ],
551
+ "slot_index": 0,
552
+ "shape": 3
553
+ }
554
+ ],
555
+ "properties": {
556
+ "Node name for S&R": "ModelSamplingSD3"
557
+ },
558
+ "widgets_values": [
559
+ 3
560
+ ]
561
+ }
562
+ ],
563
+ "links": [
564
+ [
565
+ 5,
566
+ 11,
567
+ 0,
568
+ 6,
569
+ 0,
570
+ "CLIP"
571
+ ],
572
+ [
573
+ 90,
574
+ 67,
575
+ 0,
576
+ 68,
577
+ 0,
578
+ "CONDITIONING"
579
+ ],
580
+ [
581
+ 91,
582
+ 68,
583
+ 0,
584
+ 69,
585
+ 0,
586
+ "CONDITIONING"
587
+ ],
588
+ [
589
+ 92,
590
+ 70,
591
+ 0,
592
+ 69,
593
+ 1,
594
+ "CONDITIONING"
595
+ ],
596
+ [
597
+ 93,
598
+ 71,
599
+ 0,
600
+ 70,
601
+ 0,
602
+ "CONDITIONING"
603
+ ],
604
+ [
605
+ 94,
606
+ 11,
607
+ 0,
608
+ 71,
609
+ 0,
610
+ "CLIP"
611
+ ],
612
+ [
613
+ 274,
614
+ 8,
615
+ 0,
616
+ 50,
617
+ 0,
618
+ "IMAGE"
619
+ ],
620
+ [
621
+ 445,
622
+ 4,
623
+ 0,
624
+ 13,
625
+ 0,
626
+ "MODEL"
627
+ ],
628
+ [
629
+ 568,
630
+ 13,
631
+ 0,
632
+ 294,
633
+ 0,
634
+ "MODEL"
635
+ ],
636
+ [
637
+ 569,
638
+ 6,
639
+ 0,
640
+ 294,
641
+ 1,
642
+ "CONDITIONING"
643
+ ],
644
+ [
645
+ 572,
646
+ 294,
647
+ 0,
648
+ 8,
649
+ 0,
650
+ "LATENT"
651
+ ],
652
+ [
653
+ 597,
654
+ 71,
655
+ 0,
656
+ 67,
657
+ 0,
658
+ "CONDITIONING"
659
+ ],
660
+ [
661
+ 598,
662
+ 135,
663
+ 0,
664
+ 294,
665
+ 3,
666
+ "LATENT"
667
+ ],
668
+ [
669
+ 604,
670
+ 69,
671
+ 0,
672
+ 294,
673
+ 2,
674
+ "CONDITIONING"
675
+ ],
676
+ [
677
+ 605,
678
+ 4,
679
+ 2,
680
+ 8,
681
+ 1,
682
+ "VAE"
683
+ ]
684
+ ],
685
+ "groups": [],
686
+ "config": {},
687
+ "extra": {
688
+ "ds": {
689
+ "scale": 0.6727499949325626,
690
+ "offset": [
691
+ 2163.0604070128397,
692
+ 1105.036283731024
693
+ ]
694
+ }
695
+ },
696
+ "version": 0.4
697
+ }
mmdit-x.png ADDED
model_index.json ADDED
@@ -0,0 +1,40 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_class_name": "StableDiffusion3Pipeline",
3
+ "_diffusers_version": "0.30.3.dev0",
4
+ "scheduler": [
5
+ "diffusers",
6
+ "FlowMatchEulerDiscreteScheduler"
7
+ ],
8
+ "text_encoder": [
9
+ "transformers",
10
+ "CLIPTextModelWithProjection"
11
+ ],
12
+ "text_encoder_2": [
13
+ "transformers",
14
+ "CLIPTextModelWithProjection"
15
+ ],
16
+ "text_encoder_3": [
17
+ "transformers",
18
+ "T5EncoderModel"
19
+ ],
20
+ "tokenizer": [
21
+ "transformers",
22
+ "CLIPTokenizer"
23
+ ],
24
+ "tokenizer_2": [
25
+ "transformers",
26
+ "CLIPTokenizer"
27
+ ],
28
+ "tokenizer_3": [
29
+ "transformers",
30
+ "T5TokenizerFast"
31
+ ],
32
+ "transformer": [
33
+ "diffusers",
34
+ "SD3Transformer2DModel"
35
+ ],
36
+ "vae": [
37
+ "diffusers",
38
+ "AutoencoderKL"
39
+ ]
40
+ }
scheduler/scheduler_config.json ADDED
@@ -0,0 +1,6 @@
 
 
 
 
 
 
 
1
+ {
2
+ "_class_name": "FlowMatchEulerDiscreteScheduler",
3
+ "_diffusers_version": "0.29.0.dev0",
4
+ "num_train_timesteps": 1000,
5
+ "shift": 3.0
6
+ }
sd3.5_medium.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:11fe06e22364b823dfeedc275912336b932b32a293a0b2f35ffac071990cc4de
3
+ size 5107104286
sd3.5_medium_demo.jpg ADDED
text_encoder/config.json ADDED
@@ -0,0 +1,24 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "architectures": [
3
+ "CLIPTextModelWithProjection"
4
+ ],
5
+ "attention_dropout": 0.0,
6
+ "bos_token_id": 0,
7
+ "dropout": 0.0,
8
+ "eos_token_id": 2,
9
+ "hidden_act": "quick_gelu",
10
+ "hidden_size": 768,
11
+ "initializer_factor": 1.0,
12
+ "initializer_range": 0.02,
13
+ "intermediate_size": 3072,
14
+ "layer_norm_eps": 1e-05,
15
+ "max_position_embeddings": 77,
16
+ "model_type": "clip_text_model",
17
+ "num_attention_heads": 12,
18
+ "num_hidden_layers": 12,
19
+ "pad_token_id": 1,
20
+ "projection_dim": 768,
21
+ "torch_dtype": "float16",
22
+ "transformers_version": "4.41.2",
23
+ "vocab_size": 49408
24
+ }
text_encoder/model.fp16.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:71e183d11db0c6b6282a4d9e0abb74125edc8692393e89ed8ee5571005f35cb1
3
+ size 247323896
text_encoder/model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:71e183d11db0c6b6282a4d9e0abb74125edc8692393e89ed8ee5571005f35cb1
3
+ size 247323896
text_encoder_2/config.json ADDED
@@ -0,0 +1,24 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "architectures": [
3
+ "CLIPTextModelWithProjection"
4
+ ],
5
+ "attention_dropout": 0.0,
6
+ "bos_token_id": 0,
7
+ "dropout": 0.0,
8
+ "eos_token_id": 2,
9
+ "hidden_act": "gelu",
10
+ "hidden_size": 1280,
11
+ "initializer_factor": 1.0,
12
+ "initializer_range": 0.02,
13
+ "intermediate_size": 5120,
14
+ "layer_norm_eps": 1e-05,
15
+ "max_position_embeddings": 77,
16
+ "model_type": "clip_text_model",
17
+ "num_attention_heads": 20,
18
+ "num_hidden_layers": 32,
19
+ "pad_token_id": 1,
20
+ "projection_dim": 1280,
21
+ "torch_dtype": "float16",
22
+ "transformers_version": "4.41.2",
23
+ "vocab_size": 49408
24
+ }
text_encoder_2/model.fp16.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ec310df2af79c318e24d20511b601a591ca8cd4f1fce1d8dff822a356bcdb1f4
3
+ size 1389382176
text_encoder_2/model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ec310df2af79c318e24d20511b601a591ca8cd4f1fce1d8dff822a356bcdb1f4
3
+ size 1389382176
text_encoder_3/config.json ADDED
@@ -0,0 +1,31 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "architectures": [
3
+ "T5EncoderModel"
4
+ ],
5
+ "classifier_dropout": 0.0,
6
+ "d_ff": 10240,
7
+ "d_kv": 64,
8
+ "d_model": 4096,
9
+ "decoder_start_token_id": 0,
10
+ "dense_act_fn": "gelu_new",
11
+ "dropout_rate": 0.1,
12
+ "eos_token_id": 1,
13
+ "feed_forward_proj": "gated-gelu",
14
+ "initializer_factor": 1.0,
15
+ "is_encoder_decoder": true,
16
+ "is_gated_act": true,
17
+ "layer_norm_epsilon": 1e-06,
18
+ "model_type": "t5",
19
+ "num_decoder_layers": 24,
20
+ "num_heads": 64,
21
+ "num_layers": 24,
22
+ "output_past": true,
23
+ "pad_token_id": 0,
24
+ "relative_attention_max_distance": 128,
25
+ "relative_attention_num_buckets": 32,
26
+ "tie_word_embeddings": false,
27
+ "torch_dtype": "float16",
28
+ "transformers_version": "4.41.2",
29
+ "use_cache": true,
30
+ "vocab_size": 32128
31
+ }
text_encoder_3/model-00001-of-00002.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4f2751ceeb2a96edd693e539dc5d6bba0b8d3814f49a9b3798403a0cec4b2e3d
3
+ size 4994582104
text_encoder_3/model-00002-of-00002.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f63154532130422309532ff56f11945fbea8266c958e3133e8e5aef85c6293c7
3
+ size 4530066248
text_encoder_3/model.fp16-00001-of-00002.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4f2751ceeb2a96edd693e539dc5d6bba0b8d3814f49a9b3798403a0cec4b2e3d
3
+ size 4994582104
text_encoder_3/model.fp16-00002-of-00002.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f63154532130422309532ff56f11945fbea8266c958e3133e8e5aef85c6293c7
3
+ size 4530066248
text_encoder_3/model.safetensors.index.fp16.json ADDED
@@ -0,0 +1,226 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "metadata": {
3
+ "total_size": 9524621312
4
+ },
5
+ "weight_map": {
6
+ "encoder.block.0.layer.0.SelfAttention.k.weight": "model.fp16-00001-of-00002.safetensors",
7
+ "encoder.block.0.layer.0.SelfAttention.o.weight": "model.fp16-00001-of-00002.safetensors",
8
+ "encoder.block.0.layer.0.SelfAttention.q.weight": "model.fp16-00001-of-00002.safetensors",
9
+ "encoder.block.0.layer.0.SelfAttention.relative_attention_bias.weight": "model.fp16-00001-of-00002.safetensors",
10
+ "encoder.block.0.layer.0.SelfAttention.v.weight": "model.fp16-00001-of-00002.safetensors",
11
+ "encoder.block.0.layer.0.layer_norm.weight": "model.fp16-00001-of-00002.safetensors",
12
+ "encoder.block.0.layer.1.DenseReluDense.wi_0.weight": "model.fp16-00001-of-00002.safetensors",
13
+ "encoder.block.0.layer.1.DenseReluDense.wi_1.weight": "model.fp16-00001-of-00002.safetensors",
14
+ "encoder.block.0.layer.1.DenseReluDense.wo.weight": "model.fp16-00001-of-00002.safetensors",
15
+ "encoder.block.0.layer.1.layer_norm.weight": "model.fp16-00001-of-00002.safetensors",
16
+ "encoder.block.1.layer.0.SelfAttention.k.weight": "model.fp16-00001-of-00002.safetensors",
17
+ "encoder.block.1.layer.0.SelfAttention.o.weight": "model.fp16-00001-of-00002.safetensors",
18
+ "encoder.block.1.layer.0.SelfAttention.q.weight": "model.fp16-00001-of-00002.safetensors",
19
+ "encoder.block.1.layer.0.SelfAttention.v.weight": "model.fp16-00001-of-00002.safetensors",
20
+ "encoder.block.1.layer.0.layer_norm.weight": "model.fp16-00001-of-00002.safetensors",
21
+ "encoder.block.1.layer.1.DenseReluDense.wi_0.weight": "model.fp16-00001-of-00002.safetensors",
22
+ "encoder.block.1.layer.1.DenseReluDense.wi_1.weight": "model.fp16-00001-of-00002.safetensors",
23
+ "encoder.block.1.layer.1.DenseReluDense.wo.weight": "model.fp16-00001-of-00002.safetensors",
24
+ "encoder.block.1.layer.1.layer_norm.weight": "model.fp16-00001-of-00002.safetensors",
25
+ "encoder.block.10.layer.0.SelfAttention.k.weight": "model.fp16-00001-of-00002.safetensors",
26
+ "encoder.block.10.layer.0.SelfAttention.o.weight": "model.fp16-00001-of-00002.safetensors",
27
+ "encoder.block.10.layer.0.SelfAttention.q.weight": "model.fp16-00001-of-00002.safetensors",
28
+ "encoder.block.10.layer.0.SelfAttention.v.weight": "model.fp16-00001-of-00002.safetensors",
29
+ "encoder.block.10.layer.0.layer_norm.weight": "model.fp16-00001-of-00002.safetensors",
30
+ "encoder.block.10.layer.1.DenseReluDense.wi_0.weight": "model.fp16-00001-of-00002.safetensors",
31
+ "encoder.block.10.layer.1.DenseReluDense.wi_1.weight": "model.fp16-00001-of-00002.safetensors",
32
+ "encoder.block.10.layer.1.DenseReluDense.wo.weight": "model.fp16-00001-of-00002.safetensors",
33
+ "encoder.block.10.layer.1.layer_norm.weight": "model.fp16-00001-of-00002.safetensors",
34
+ "encoder.block.11.layer.0.SelfAttention.k.weight": "model.fp16-00001-of-00002.safetensors",
35
+ "encoder.block.11.layer.0.SelfAttention.o.weight": "model.fp16-00001-of-00002.safetensors",
36
+ "encoder.block.11.layer.0.SelfAttention.q.weight": "model.fp16-00001-of-00002.safetensors",
37
+ "encoder.block.11.layer.0.SelfAttention.v.weight": "model.fp16-00001-of-00002.safetensors",
38
+ "encoder.block.11.layer.0.layer_norm.weight": "model.fp16-00001-of-00002.safetensors",
39
+ "encoder.block.11.layer.1.DenseReluDense.wi_0.weight": "model.fp16-00001-of-00002.safetensors",
40
+ "encoder.block.11.layer.1.DenseReluDense.wi_1.weight": "model.fp16-00001-of-00002.safetensors",
41
+ "encoder.block.11.layer.1.DenseReluDense.wo.weight": "model.fp16-00001-of-00002.safetensors",
42
+ "encoder.block.11.layer.1.layer_norm.weight": "model.fp16-00001-of-00002.safetensors",
43
+ "encoder.block.12.layer.0.SelfAttention.k.weight": "model.fp16-00001-of-00002.safetensors",
44
+ "encoder.block.12.layer.0.SelfAttention.o.weight": "model.fp16-00002-of-00002.safetensors",
45
+ "encoder.block.12.layer.0.SelfAttention.q.weight": "model.fp16-00001-of-00002.safetensors",
46
+ "encoder.block.12.layer.0.SelfAttention.v.weight": "model.fp16-00001-of-00002.safetensors",
47
+ "encoder.block.12.layer.0.layer_norm.weight": "model.fp16-00002-of-00002.safetensors",
48
+ "encoder.block.12.layer.1.DenseReluDense.wi_0.weight": "model.fp16-00002-of-00002.safetensors",
49
+ "encoder.block.12.layer.1.DenseReluDense.wi_1.weight": "model.fp16-00002-of-00002.safetensors",
50
+ "encoder.block.12.layer.1.DenseReluDense.wo.weight": "model.fp16-00002-of-00002.safetensors",
51
+ "encoder.block.12.layer.1.layer_norm.weight": "model.fp16-00002-of-00002.safetensors",
52
+ "encoder.block.13.layer.0.SelfAttention.k.weight": "model.fp16-00002-of-00002.safetensors",
53
+ "encoder.block.13.layer.0.SelfAttention.o.weight": "model.fp16-00002-of-00002.safetensors",
54
+ "encoder.block.13.layer.0.SelfAttention.q.weight": "model.fp16-00002-of-00002.safetensors",
55
+ "encoder.block.13.layer.0.SelfAttention.v.weight": "model.fp16-00002-of-00002.safetensors",
56
+ "encoder.block.13.layer.0.layer_norm.weight": "model.fp16-00002-of-00002.safetensors",
57
+ "encoder.block.13.layer.1.DenseReluDense.wi_0.weight": "model.fp16-00002-of-00002.safetensors",
58
+ "encoder.block.13.layer.1.DenseReluDense.wi_1.weight": "model.fp16-00002-of-00002.safetensors",
59
+ "encoder.block.13.layer.1.DenseReluDense.wo.weight": "model.fp16-00002-of-00002.safetensors",
60
+ "encoder.block.13.layer.1.layer_norm.weight": "model.fp16-00002-of-00002.safetensors",
61
+ "encoder.block.14.layer.0.SelfAttention.k.weight": "model.fp16-00002-of-00002.safetensors",
62
+ "encoder.block.14.layer.0.SelfAttention.o.weight": "model.fp16-00002-of-00002.safetensors",
63
+ "encoder.block.14.layer.0.SelfAttention.q.weight": "model.fp16-00002-of-00002.safetensors",
64
+ "encoder.block.14.layer.0.SelfAttention.v.weight": "model.fp16-00002-of-00002.safetensors",
65
+ "encoder.block.14.layer.0.layer_norm.weight": "model.fp16-00002-of-00002.safetensors",
66
+ "encoder.block.14.layer.1.DenseReluDense.wi_0.weight": "model.fp16-00002-of-00002.safetensors",
67
+ "encoder.block.14.layer.1.DenseReluDense.wi_1.weight": "model.fp16-00002-of-00002.safetensors",
68
+ "encoder.block.14.layer.1.DenseReluDense.wo.weight": "model.fp16-00002-of-00002.safetensors",
69
+ "encoder.block.14.layer.1.layer_norm.weight": "model.fp16-00002-of-00002.safetensors",
70
+ "encoder.block.15.layer.0.SelfAttention.k.weight": "model.fp16-00002-of-00002.safetensors",
71
+ "encoder.block.15.layer.0.SelfAttention.o.weight": "model.fp16-00002-of-00002.safetensors",
72
+ "encoder.block.15.layer.0.SelfAttention.q.weight": "model.fp16-00002-of-00002.safetensors",
73
+ "encoder.block.15.layer.0.SelfAttention.v.weight": "model.fp16-00002-of-00002.safetensors",
74
+ "encoder.block.15.layer.0.layer_norm.weight": "model.fp16-00002-of-00002.safetensors",
75
+ "encoder.block.15.layer.1.DenseReluDense.wi_0.weight": "model.fp16-00002-of-00002.safetensors",
76
+ "encoder.block.15.layer.1.DenseReluDense.wi_1.weight": "model.fp16-00002-of-00002.safetensors",
77
+ "encoder.block.15.layer.1.DenseReluDense.wo.weight": "model.fp16-00002-of-00002.safetensors",
78
+ "encoder.block.15.layer.1.layer_norm.weight": "model.fp16-00002-of-00002.safetensors",
79
+ "encoder.block.16.layer.0.SelfAttention.k.weight": "model.fp16-00002-of-00002.safetensors",
80
+ "encoder.block.16.layer.0.SelfAttention.o.weight": "model.fp16-00002-of-00002.safetensors",
81
+ "encoder.block.16.layer.0.SelfAttention.q.weight": "model.fp16-00002-of-00002.safetensors",
82
+ "encoder.block.16.layer.0.SelfAttention.v.weight": "model.fp16-00002-of-00002.safetensors",
83
+ "encoder.block.16.layer.0.layer_norm.weight": "model.fp16-00002-of-00002.safetensors",
84
+ "encoder.block.16.layer.1.DenseReluDense.wi_0.weight": "model.fp16-00002-of-00002.safetensors",
85
+ "encoder.block.16.layer.1.DenseReluDense.wi_1.weight": "model.fp16-00002-of-00002.safetensors",
86
+ "encoder.block.16.layer.1.DenseReluDense.wo.weight": "model.fp16-00002-of-00002.safetensors",
87
+ "encoder.block.16.layer.1.layer_norm.weight": "model.fp16-00002-of-00002.safetensors",
88
+ "encoder.block.17.layer.0.SelfAttention.k.weight": "model.fp16-00002-of-00002.safetensors",
89
+ "encoder.block.17.layer.0.SelfAttention.o.weight": "model.fp16-00002-of-00002.safetensors",
90
+ "encoder.block.17.layer.0.SelfAttention.q.weight": "model.fp16-00002-of-00002.safetensors",
91
+ "encoder.block.17.layer.0.SelfAttention.v.weight": "model.fp16-00002-of-00002.safetensors",
92
+ "encoder.block.17.layer.0.layer_norm.weight": "model.fp16-00002-of-00002.safetensors",
93
+ "encoder.block.17.layer.1.DenseReluDense.wi_0.weight": "model.fp16-00002-of-00002.safetensors",
94
+ "encoder.block.17.layer.1.DenseReluDense.wi_1.weight": "model.fp16-00002-of-00002.safetensors",
95
+ "encoder.block.17.layer.1.DenseReluDense.wo.weight": "model.fp16-00002-of-00002.safetensors",
96
+ "encoder.block.17.layer.1.layer_norm.weight": "model.fp16-00002-of-00002.safetensors",
97
+ "encoder.block.18.layer.0.SelfAttention.k.weight": "model.fp16-00002-of-00002.safetensors",
98
+ "encoder.block.18.layer.0.SelfAttention.o.weight": "model.fp16-00002-of-00002.safetensors",
99
+ "encoder.block.18.layer.0.SelfAttention.q.weight": "model.fp16-00002-of-00002.safetensors",
100
+ "encoder.block.18.layer.0.SelfAttention.v.weight": "model.fp16-00002-of-00002.safetensors",
101
+ "encoder.block.18.layer.0.layer_norm.weight": "model.fp16-00002-of-00002.safetensors",
102
+ "encoder.block.18.layer.1.DenseReluDense.wi_0.weight": "model.fp16-00002-of-00002.safetensors",
103
+ "encoder.block.18.layer.1.DenseReluDense.wi_1.weight": "model.fp16-00002-of-00002.safetensors",
104
+ "encoder.block.18.layer.1.DenseReluDense.wo.weight": "model.fp16-00002-of-00002.safetensors",
105
+ "encoder.block.18.layer.1.layer_norm.weight": "model.fp16-00002-of-00002.safetensors",
106
+ "encoder.block.19.layer.0.SelfAttention.k.weight": "model.fp16-00002-of-00002.safetensors",
107
+ "encoder.block.19.layer.0.SelfAttention.o.weight": "model.fp16-00002-of-00002.safetensors",
108
+ "encoder.block.19.layer.0.SelfAttention.q.weight": "model.fp16-00002-of-00002.safetensors",
109
+ "encoder.block.19.layer.0.SelfAttention.v.weight": "model.fp16-00002-of-00002.safetensors",
110
+ "encoder.block.19.layer.0.layer_norm.weight": "model.fp16-00002-of-00002.safetensors",
111
+ "encoder.block.19.layer.1.DenseReluDense.wi_0.weight": "model.fp16-00002-of-00002.safetensors",
112
+ "encoder.block.19.layer.1.DenseReluDense.wi_1.weight": "model.fp16-00002-of-00002.safetensors",
113
+ "encoder.block.19.layer.1.DenseReluDense.wo.weight": "model.fp16-00002-of-00002.safetensors",
114
+ "encoder.block.19.layer.1.layer_norm.weight": "model.fp16-00002-of-00002.safetensors",
115
+ "encoder.block.2.layer.0.SelfAttention.k.weight": "model.fp16-00001-of-00002.safetensors",
116
+ "encoder.block.2.layer.0.SelfAttention.o.weight": "model.fp16-00001-of-00002.safetensors",
117
+ "encoder.block.2.layer.0.SelfAttention.q.weight": "model.fp16-00001-of-00002.safetensors",
118
+ "encoder.block.2.layer.0.SelfAttention.v.weight": "model.fp16-00001-of-00002.safetensors",
119
+ "encoder.block.2.layer.0.layer_norm.weight": "model.fp16-00001-of-00002.safetensors",
120
+ "encoder.block.2.layer.1.DenseReluDense.wi_0.weight": "model.fp16-00001-of-00002.safetensors",
121
+ "encoder.block.2.layer.1.DenseReluDense.wi_1.weight": "model.fp16-00001-of-00002.safetensors",
122
+ "encoder.block.2.layer.1.DenseReluDense.wo.weight": "model.fp16-00001-of-00002.safetensors",
123
+ "encoder.block.2.layer.1.layer_norm.weight": "model.fp16-00001-of-00002.safetensors",
124
+ "encoder.block.20.layer.0.SelfAttention.k.weight": "model.fp16-00002-of-00002.safetensors",
125
+ "encoder.block.20.layer.0.SelfAttention.o.weight": "model.fp16-00002-of-00002.safetensors",
126
+ "encoder.block.20.layer.0.SelfAttention.q.weight": "model.fp16-00002-of-00002.safetensors",
127
+ "encoder.block.20.layer.0.SelfAttention.v.weight": "model.fp16-00002-of-00002.safetensors",
128
+ "encoder.block.20.layer.0.layer_norm.weight": "model.fp16-00002-of-00002.safetensors",
129
+ "encoder.block.20.layer.1.DenseReluDense.wi_0.weight": "model.fp16-00002-of-00002.safetensors",
130
+ "encoder.block.20.layer.1.DenseReluDense.wi_1.weight": "model.fp16-00002-of-00002.safetensors",
131
+ "encoder.block.20.layer.1.DenseReluDense.wo.weight": "model.fp16-00002-of-00002.safetensors",
132
+ "encoder.block.20.layer.1.layer_norm.weight": "model.fp16-00002-of-00002.safetensors",
133
+ "encoder.block.21.layer.0.SelfAttention.k.weight": "model.fp16-00002-of-00002.safetensors",
134
+ "encoder.block.21.layer.0.SelfAttention.o.weight": "model.fp16-00002-of-00002.safetensors",
135
+ "encoder.block.21.layer.0.SelfAttention.q.weight": "model.fp16-00002-of-00002.safetensors",
136
+ "encoder.block.21.layer.0.SelfAttention.v.weight": "model.fp16-00002-of-00002.safetensors",
137
+ "encoder.block.21.layer.0.layer_norm.weight": "model.fp16-00002-of-00002.safetensors",
138
+ "encoder.block.21.layer.1.DenseReluDense.wi_0.weight": "model.fp16-00002-of-00002.safetensors",
139
+ "encoder.block.21.layer.1.DenseReluDense.wi_1.weight": "model.fp16-00002-of-00002.safetensors",
140
+ "encoder.block.21.layer.1.DenseReluDense.wo.weight": "model.fp16-00002-of-00002.safetensors",
141
+ "encoder.block.21.layer.1.layer_norm.weight": "model.fp16-00002-of-00002.safetensors",
142
+ "encoder.block.22.layer.0.SelfAttention.k.weight": "model.fp16-00002-of-00002.safetensors",
143
+ "encoder.block.22.layer.0.SelfAttention.o.weight": "model.fp16-00002-of-00002.safetensors",
144
+ "encoder.block.22.layer.0.SelfAttention.q.weight": "model.fp16-00002-of-00002.safetensors",
145
+ "encoder.block.22.layer.0.SelfAttention.v.weight": "model.fp16-00002-of-00002.safetensors",
146
+ "encoder.block.22.layer.0.layer_norm.weight": "model.fp16-00002-of-00002.safetensors",
147
+ "encoder.block.22.layer.1.DenseReluDense.wi_0.weight": "model.fp16-00002-of-00002.safetensors",
148
+ "encoder.block.22.layer.1.DenseReluDense.wi_1.weight": "model.fp16-00002-of-00002.safetensors",
149
+ "encoder.block.22.layer.1.DenseReluDense.wo.weight": "model.fp16-00002-of-00002.safetensors",
150
+ "encoder.block.22.layer.1.layer_norm.weight": "model.fp16-00002-of-00002.safetensors",
151
+ "encoder.block.23.layer.0.SelfAttention.k.weight": "model.fp16-00002-of-00002.safetensors",
152
+ "encoder.block.23.layer.0.SelfAttention.o.weight": "model.fp16-00002-of-00002.safetensors",
153
+ "encoder.block.23.layer.0.SelfAttention.q.weight": "model.fp16-00002-of-00002.safetensors",
154
+ "encoder.block.23.layer.0.SelfAttention.v.weight": "model.fp16-00002-of-00002.safetensors",
155
+ "encoder.block.23.layer.0.layer_norm.weight": "model.fp16-00002-of-00002.safetensors",
156
+ "encoder.block.23.layer.1.DenseReluDense.wi_0.weight": "model.fp16-00002-of-00002.safetensors",
157
+ "encoder.block.23.layer.1.DenseReluDense.wi_1.weight": "model.fp16-00002-of-00002.safetensors",
158
+ "encoder.block.23.layer.1.DenseReluDense.wo.weight": "model.fp16-00002-of-00002.safetensors",
159
+ "encoder.block.23.layer.1.layer_norm.weight": "model.fp16-00002-of-00002.safetensors",
160
+ "encoder.block.3.layer.0.SelfAttention.k.weight": "model.fp16-00001-of-00002.safetensors",
161
+ "encoder.block.3.layer.0.SelfAttention.o.weight": "model.fp16-00001-of-00002.safetensors",
162
+ "encoder.block.3.layer.0.SelfAttention.q.weight": "model.fp16-00001-of-00002.safetensors",
163
+ "encoder.block.3.layer.0.SelfAttention.v.weight": "model.fp16-00001-of-00002.safetensors",
164
+ "encoder.block.3.layer.0.layer_norm.weight": "model.fp16-00001-of-00002.safetensors",
165
+ "encoder.block.3.layer.1.DenseReluDense.wi_0.weight": "model.fp16-00001-of-00002.safetensors",
166
+ "encoder.block.3.layer.1.DenseReluDense.wi_1.weight": "model.fp16-00001-of-00002.safetensors",
167
+ "encoder.block.3.layer.1.DenseReluDense.wo.weight": "model.fp16-00001-of-00002.safetensors",
168
+ "encoder.block.3.layer.1.layer_norm.weight": "model.fp16-00001-of-00002.safetensors",
169
+ "encoder.block.4.layer.0.SelfAttention.k.weight": "model.fp16-00001-of-00002.safetensors",
170
+ "encoder.block.4.layer.0.SelfAttention.o.weight": "model.fp16-00001-of-00002.safetensors",
171
+ "encoder.block.4.layer.0.SelfAttention.q.weight": "model.fp16-00001-of-00002.safetensors",
172
+ "encoder.block.4.layer.0.SelfAttention.v.weight": "model.fp16-00001-of-00002.safetensors",
173
+ "encoder.block.4.layer.0.layer_norm.weight": "model.fp16-00001-of-00002.safetensors",
174
+ "encoder.block.4.layer.1.DenseReluDense.wi_0.weight": "model.fp16-00001-of-00002.safetensors",
175
+ "encoder.block.4.layer.1.DenseReluDense.wi_1.weight": "model.fp16-00001-of-00002.safetensors",
176
+ "encoder.block.4.layer.1.DenseReluDense.wo.weight": "model.fp16-00001-of-00002.safetensors",
177
+ "encoder.block.4.layer.1.layer_norm.weight": "model.fp16-00001-of-00002.safetensors",
178
+ "encoder.block.5.layer.0.SelfAttention.k.weight": "model.fp16-00001-of-00002.safetensors",
179
+ "encoder.block.5.layer.0.SelfAttention.o.weight": "model.fp16-00001-of-00002.safetensors",
180
+ "encoder.block.5.layer.0.SelfAttention.q.weight": "model.fp16-00001-of-00002.safetensors",
181
+ "encoder.block.5.layer.0.SelfAttention.v.weight": "model.fp16-00001-of-00002.safetensors",
182
+ "encoder.block.5.layer.0.layer_norm.weight": "model.fp16-00001-of-00002.safetensors",
183
+ "encoder.block.5.layer.1.DenseReluDense.wi_0.weight": "model.fp16-00001-of-00002.safetensors",
184
+ "encoder.block.5.layer.1.DenseReluDense.wi_1.weight": "model.fp16-00001-of-00002.safetensors",
185
+ "encoder.block.5.layer.1.DenseReluDense.wo.weight": "model.fp16-00001-of-00002.safetensors",
186
+ "encoder.block.5.layer.1.layer_norm.weight": "model.fp16-00001-of-00002.safetensors",
187
+ "encoder.block.6.layer.0.SelfAttention.k.weight": "model.fp16-00001-of-00002.safetensors",
188
+ "encoder.block.6.layer.0.SelfAttention.o.weight": "model.fp16-00001-of-00002.safetensors",
189
+ "encoder.block.6.layer.0.SelfAttention.q.weight": "model.fp16-00001-of-00002.safetensors",
190
+ "encoder.block.6.layer.0.SelfAttention.v.weight": "model.fp16-00001-of-00002.safetensors",
191
+ "encoder.block.6.layer.0.layer_norm.weight": "model.fp16-00001-of-00002.safetensors",
192
+ "encoder.block.6.layer.1.DenseReluDense.wi_0.weight": "model.fp16-00001-of-00002.safetensors",
193
+ "encoder.block.6.layer.1.DenseReluDense.wi_1.weight": "model.fp16-00001-of-00002.safetensors",
194
+ "encoder.block.6.layer.1.DenseReluDense.wo.weight": "model.fp16-00001-of-00002.safetensors",
195
+ "encoder.block.6.layer.1.layer_norm.weight": "model.fp16-00001-of-00002.safetensors",
196
+ "encoder.block.7.layer.0.SelfAttention.k.weight": "model.fp16-00001-of-00002.safetensors",
197
+ "encoder.block.7.layer.0.SelfAttention.o.weight": "model.fp16-00001-of-00002.safetensors",
198
+ "encoder.block.7.layer.0.SelfAttention.q.weight": "model.fp16-00001-of-00002.safetensors",
199
+ "encoder.block.7.layer.0.SelfAttention.v.weight": "model.fp16-00001-of-00002.safetensors",
200
+ "encoder.block.7.layer.0.layer_norm.weight": "model.fp16-00001-of-00002.safetensors",
201
+ "encoder.block.7.layer.1.DenseReluDense.wi_0.weight": "model.fp16-00001-of-00002.safetensors",
202
+ "encoder.block.7.layer.1.DenseReluDense.wi_1.weight": "model.fp16-00001-of-00002.safetensors",
203
+ "encoder.block.7.layer.1.DenseReluDense.wo.weight": "model.fp16-00001-of-00002.safetensors",
204
+ "encoder.block.7.layer.1.layer_norm.weight": "model.fp16-00001-of-00002.safetensors",
205
+ "encoder.block.8.layer.0.SelfAttention.k.weight": "model.fp16-00001-of-00002.safetensors",
206
+ "encoder.block.8.layer.0.SelfAttention.o.weight": "model.fp16-00001-of-00002.safetensors",
207
+ "encoder.block.8.layer.0.SelfAttention.q.weight": "model.fp16-00001-of-00002.safetensors",
208
+ "encoder.block.8.layer.0.SelfAttention.v.weight": "model.fp16-00001-of-00002.safetensors",
209
+ "encoder.block.8.layer.0.layer_norm.weight": "model.fp16-00001-of-00002.safetensors",
210
+ "encoder.block.8.layer.1.DenseReluDense.wi_0.weight": "model.fp16-00001-of-00002.safetensors",
211
+ "encoder.block.8.layer.1.DenseReluDense.wi_1.weight": "model.fp16-00001-of-00002.safetensors",
212
+ "encoder.block.8.layer.1.DenseReluDense.wo.weight": "model.fp16-00001-of-00002.safetensors",
213
+ "encoder.block.8.layer.1.layer_norm.weight": "model.fp16-00001-of-00002.safetensors",
214
+ "encoder.block.9.layer.0.SelfAttention.k.weight": "model.fp16-00001-of-00002.safetensors",
215
+ "encoder.block.9.layer.0.SelfAttention.o.weight": "model.fp16-00001-of-00002.safetensors",
216
+ "encoder.block.9.layer.0.SelfAttention.q.weight": "model.fp16-00001-of-00002.safetensors",
217
+ "encoder.block.9.layer.0.SelfAttention.v.weight": "model.fp16-00001-of-00002.safetensors",
218
+ "encoder.block.9.layer.0.layer_norm.weight": "model.fp16-00001-of-00002.safetensors",
219
+ "encoder.block.9.layer.1.DenseReluDense.wi_0.weight": "model.fp16-00001-of-00002.safetensors",
220
+ "encoder.block.9.layer.1.DenseReluDense.wi_1.weight": "model.fp16-00001-of-00002.safetensors",
221
+ "encoder.block.9.layer.1.DenseReluDense.wo.weight": "model.fp16-00001-of-00002.safetensors",
222
+ "encoder.block.9.layer.1.layer_norm.weight": "model.fp16-00001-of-00002.safetensors",
223
+ "encoder.final_layer_norm.weight": "model.fp16-00002-of-00002.safetensors",
224
+ "shared.weight": "model.fp16-00001-of-00002.safetensors"
225
+ }
226
+ }
text_encoder_3/model.safetensors.index.json ADDED
@@ -0,0 +1,226 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "metadata": {
3
+ "total_size": 9524621312
4
+ },
5
+ "weight_map": {
6
+ "encoder.block.0.layer.0.SelfAttention.k.weight": "model-00001-of-00002.safetensors",
7
+ "encoder.block.0.layer.0.SelfAttention.o.weight": "model-00001-of-00002.safetensors",
8
+ "encoder.block.0.layer.0.SelfAttention.q.weight": "model-00001-of-00002.safetensors",
9
+ "encoder.block.0.layer.0.SelfAttention.relative_attention_bias.weight": "model-00001-of-00002.safetensors",
10
+ "encoder.block.0.layer.0.SelfAttention.v.weight": "model-00001-of-00002.safetensors",
11
+ "encoder.block.0.layer.0.layer_norm.weight": "model-00001-of-00002.safetensors",
12
+ "encoder.block.0.layer.1.DenseReluDense.wi_0.weight": "model-00001-of-00002.safetensors",
13
+ "encoder.block.0.layer.1.DenseReluDense.wi_1.weight": "model-00001-of-00002.safetensors",
14
+ "encoder.block.0.layer.1.DenseReluDense.wo.weight": "model-00001-of-00002.safetensors",
15
+ "encoder.block.0.layer.1.layer_norm.weight": "model-00001-of-00002.safetensors",
16
+ "encoder.block.1.layer.0.SelfAttention.k.weight": "model-00001-of-00002.safetensors",
17
+ "encoder.block.1.layer.0.SelfAttention.o.weight": "model-00001-of-00002.safetensors",
18
+ "encoder.block.1.layer.0.SelfAttention.q.weight": "model-00001-of-00002.safetensors",
19
+ "encoder.block.1.layer.0.SelfAttention.v.weight": "model-00001-of-00002.safetensors",
20
+ "encoder.block.1.layer.0.layer_norm.weight": "model-00001-of-00002.safetensors",
21
+ "encoder.block.1.layer.1.DenseReluDense.wi_0.weight": "model-00001-of-00002.safetensors",
22
+ "encoder.block.1.layer.1.DenseReluDense.wi_1.weight": "model-00001-of-00002.safetensors",
23
+ "encoder.block.1.layer.1.DenseReluDense.wo.weight": "model-00001-of-00002.safetensors",
24
+ "encoder.block.1.layer.1.layer_norm.weight": "model-00001-of-00002.safetensors",
25
+ "encoder.block.10.layer.0.SelfAttention.k.weight": "model-00001-of-00002.safetensors",
26
+ "encoder.block.10.layer.0.SelfAttention.o.weight": "model-00001-of-00002.safetensors",
27
+ "encoder.block.10.layer.0.SelfAttention.q.weight": "model-00001-of-00002.safetensors",
28
+ "encoder.block.10.layer.0.SelfAttention.v.weight": "model-00001-of-00002.safetensors",
29
+ "encoder.block.10.layer.0.layer_norm.weight": "model-00001-of-00002.safetensors",
30
+ "encoder.block.10.layer.1.DenseReluDense.wi_0.weight": "model-00001-of-00002.safetensors",
31
+ "encoder.block.10.layer.1.DenseReluDense.wi_1.weight": "model-00001-of-00002.safetensors",
32
+ "encoder.block.10.layer.1.DenseReluDense.wo.weight": "model-00001-of-00002.safetensors",
33
+ "encoder.block.10.layer.1.layer_norm.weight": "model-00001-of-00002.safetensors",
34
+ "encoder.block.11.layer.0.SelfAttention.k.weight": "model-00001-of-00002.safetensors",
35
+ "encoder.block.11.layer.0.SelfAttention.o.weight": "model-00001-of-00002.safetensors",
36
+ "encoder.block.11.layer.0.SelfAttention.q.weight": "model-00001-of-00002.safetensors",
37
+ "encoder.block.11.layer.0.SelfAttention.v.weight": "model-00001-of-00002.safetensors",
38
+ "encoder.block.11.layer.0.layer_norm.weight": "model-00001-of-00002.safetensors",
39
+ "encoder.block.11.layer.1.DenseReluDense.wi_0.weight": "model-00001-of-00002.safetensors",
40
+ "encoder.block.11.layer.1.DenseReluDense.wi_1.weight": "model-00001-of-00002.safetensors",
41
+ "encoder.block.11.layer.1.DenseReluDense.wo.weight": "model-00001-of-00002.safetensors",
42
+ "encoder.block.11.layer.1.layer_norm.weight": "model-00001-of-00002.safetensors",
43
+ "encoder.block.12.layer.0.SelfAttention.k.weight": "model-00001-of-00002.safetensors",
44
+ "encoder.block.12.layer.0.SelfAttention.o.weight": "model-00002-of-00002.safetensors",
45
+ "encoder.block.12.layer.0.SelfAttention.q.weight": "model-00001-of-00002.safetensors",
46
+ "encoder.block.12.layer.0.SelfAttention.v.weight": "model-00001-of-00002.safetensors",
47
+ "encoder.block.12.layer.0.layer_norm.weight": "model-00002-of-00002.safetensors",
48
+ "encoder.block.12.layer.1.DenseReluDense.wi_0.weight": "model-00002-of-00002.safetensors",
49
+ "encoder.block.12.layer.1.DenseReluDense.wi_1.weight": "model-00002-of-00002.safetensors",
50
+ "encoder.block.12.layer.1.DenseReluDense.wo.weight": "model-00002-of-00002.safetensors",
51
+ "encoder.block.12.layer.1.layer_norm.weight": "model-00002-of-00002.safetensors",
52
+ "encoder.block.13.layer.0.SelfAttention.k.weight": "model-00002-of-00002.safetensors",
53
+ "encoder.block.13.layer.0.SelfAttention.o.weight": "model-00002-of-00002.safetensors",
54
+ "encoder.block.13.layer.0.SelfAttention.q.weight": "model-00002-of-00002.safetensors",
55
+ "encoder.block.13.layer.0.SelfAttention.v.weight": "model-00002-of-00002.safetensors",
56
+ "encoder.block.13.layer.0.layer_norm.weight": "model-00002-of-00002.safetensors",
57
+ "encoder.block.13.layer.1.DenseReluDense.wi_0.weight": "model-00002-of-00002.safetensors",
58
+ "encoder.block.13.layer.1.DenseReluDense.wi_1.weight": "model-00002-of-00002.safetensors",
59
+ "encoder.block.13.layer.1.DenseReluDense.wo.weight": "model-00002-of-00002.safetensors",
60
+ "encoder.block.13.layer.1.layer_norm.weight": "model-00002-of-00002.safetensors",
61
+ "encoder.block.14.layer.0.SelfAttention.k.weight": "model-00002-of-00002.safetensors",
62
+ "encoder.block.14.layer.0.SelfAttention.o.weight": "model-00002-of-00002.safetensors",
63
+ "encoder.block.14.layer.0.SelfAttention.q.weight": "model-00002-of-00002.safetensors",
64
+ "encoder.block.14.layer.0.SelfAttention.v.weight": "model-00002-of-00002.safetensors",
65
+ "encoder.block.14.layer.0.layer_norm.weight": "model-00002-of-00002.safetensors",
66
+ "encoder.block.14.layer.1.DenseReluDense.wi_0.weight": "model-00002-of-00002.safetensors",
67
+ "encoder.block.14.layer.1.DenseReluDense.wi_1.weight": "model-00002-of-00002.safetensors",
68
+ "encoder.block.14.layer.1.DenseReluDense.wo.weight": "model-00002-of-00002.safetensors",
69
+ "encoder.block.14.layer.1.layer_norm.weight": "model-00002-of-00002.safetensors",
70
+ "encoder.block.15.layer.0.SelfAttention.k.weight": "model-00002-of-00002.safetensors",
71
+ "encoder.block.15.layer.0.SelfAttention.o.weight": "model-00002-of-00002.safetensors",
72
+ "encoder.block.15.layer.0.SelfAttention.q.weight": "model-00002-of-00002.safetensors",
73
+ "encoder.block.15.layer.0.SelfAttention.v.weight": "model-00002-of-00002.safetensors",
74
+ "encoder.block.15.layer.0.layer_norm.weight": "model-00002-of-00002.safetensors",
75
+ "encoder.block.15.layer.1.DenseReluDense.wi_0.weight": "model-00002-of-00002.safetensors",
76
+ "encoder.block.15.layer.1.DenseReluDense.wi_1.weight": "model-00002-of-00002.safetensors",
77
+ "encoder.block.15.layer.1.DenseReluDense.wo.weight": "model-00002-of-00002.safetensors",
78
+ "encoder.block.15.layer.1.layer_norm.weight": "model-00002-of-00002.safetensors",
79
+ "encoder.block.16.layer.0.SelfAttention.k.weight": "model-00002-of-00002.safetensors",
80
+ "encoder.block.16.layer.0.SelfAttention.o.weight": "model-00002-of-00002.safetensors",
81
+ "encoder.block.16.layer.0.SelfAttention.q.weight": "model-00002-of-00002.safetensors",
82
+ "encoder.block.16.layer.0.SelfAttention.v.weight": "model-00002-of-00002.safetensors",
83
+ "encoder.block.16.layer.0.layer_norm.weight": "model-00002-of-00002.safetensors",
84
+ "encoder.block.16.layer.1.DenseReluDense.wi_0.weight": "model-00002-of-00002.safetensors",
85
+ "encoder.block.16.layer.1.DenseReluDense.wi_1.weight": "model-00002-of-00002.safetensors",
86
+ "encoder.block.16.layer.1.DenseReluDense.wo.weight": "model-00002-of-00002.safetensors",
87
+ "encoder.block.16.layer.1.layer_norm.weight": "model-00002-of-00002.safetensors",
88
+ "encoder.block.17.layer.0.SelfAttention.k.weight": "model-00002-of-00002.safetensors",
89
+ "encoder.block.17.layer.0.SelfAttention.o.weight": "model-00002-of-00002.safetensors",
90
+ "encoder.block.17.layer.0.SelfAttention.q.weight": "model-00002-of-00002.safetensors",
91
+ "encoder.block.17.layer.0.SelfAttention.v.weight": "model-00002-of-00002.safetensors",
92
+ "encoder.block.17.layer.0.layer_norm.weight": "model-00002-of-00002.safetensors",
93
+ "encoder.block.17.layer.1.DenseReluDense.wi_0.weight": "model-00002-of-00002.safetensors",
94
+ "encoder.block.17.layer.1.DenseReluDense.wi_1.weight": "model-00002-of-00002.safetensors",
95
+ "encoder.block.17.layer.1.DenseReluDense.wo.weight": "model-00002-of-00002.safetensors",
96
+ "encoder.block.17.layer.1.layer_norm.weight": "model-00002-of-00002.safetensors",
97
+ "encoder.block.18.layer.0.SelfAttention.k.weight": "model-00002-of-00002.safetensors",
98
+ "encoder.block.18.layer.0.SelfAttention.o.weight": "model-00002-of-00002.safetensors",
99
+ "encoder.block.18.layer.0.SelfAttention.q.weight": "model-00002-of-00002.safetensors",
100
+ "encoder.block.18.layer.0.SelfAttention.v.weight": "model-00002-of-00002.safetensors",
101
+ "encoder.block.18.layer.0.layer_norm.weight": "model-00002-of-00002.safetensors",
102
+ "encoder.block.18.layer.1.DenseReluDense.wi_0.weight": "model-00002-of-00002.safetensors",
103
+ "encoder.block.18.layer.1.DenseReluDense.wi_1.weight": "model-00002-of-00002.safetensors",
104
+ "encoder.block.18.layer.1.DenseReluDense.wo.weight": "model-00002-of-00002.safetensors",
105
+ "encoder.block.18.layer.1.layer_norm.weight": "model-00002-of-00002.safetensors",
106
+ "encoder.block.19.layer.0.SelfAttention.k.weight": "model-00002-of-00002.safetensors",
107
+ "encoder.block.19.layer.0.SelfAttention.o.weight": "model-00002-of-00002.safetensors",
108
+ "encoder.block.19.layer.0.SelfAttention.q.weight": "model-00002-of-00002.safetensors",
109
+ "encoder.block.19.layer.0.SelfAttention.v.weight": "model-00002-of-00002.safetensors",
110
+ "encoder.block.19.layer.0.layer_norm.weight": "model-00002-of-00002.safetensors",
111
+ "encoder.block.19.layer.1.DenseReluDense.wi_0.weight": "model-00002-of-00002.safetensors",
112
+ "encoder.block.19.layer.1.DenseReluDense.wi_1.weight": "model-00002-of-00002.safetensors",
113
+ "encoder.block.19.layer.1.DenseReluDense.wo.weight": "model-00002-of-00002.safetensors",
114
+ "encoder.block.19.layer.1.layer_norm.weight": "model-00002-of-00002.safetensors",
115
+ "encoder.block.2.layer.0.SelfAttention.k.weight": "model-00001-of-00002.safetensors",
116
+ "encoder.block.2.layer.0.SelfAttention.o.weight": "model-00001-of-00002.safetensors",
117
+ "encoder.block.2.layer.0.SelfAttention.q.weight": "model-00001-of-00002.safetensors",
118
+ "encoder.block.2.layer.0.SelfAttention.v.weight": "model-00001-of-00002.safetensors",
119
+ "encoder.block.2.layer.0.layer_norm.weight": "model-00001-of-00002.safetensors",
120
+ "encoder.block.2.layer.1.DenseReluDense.wi_0.weight": "model-00001-of-00002.safetensors",
121
+ "encoder.block.2.layer.1.DenseReluDense.wi_1.weight": "model-00001-of-00002.safetensors",
122
+ "encoder.block.2.layer.1.DenseReluDense.wo.weight": "model-00001-of-00002.safetensors",
123
+ "encoder.block.2.layer.1.layer_norm.weight": "model-00001-of-00002.safetensors",
124
+ "encoder.block.20.layer.0.SelfAttention.k.weight": "model-00002-of-00002.safetensors",
125
+ "encoder.block.20.layer.0.SelfAttention.o.weight": "model-00002-of-00002.safetensors",
126
+ "encoder.block.20.layer.0.SelfAttention.q.weight": "model-00002-of-00002.safetensors",
127
+ "encoder.block.20.layer.0.SelfAttention.v.weight": "model-00002-of-00002.safetensors",
128
+ "encoder.block.20.layer.0.layer_norm.weight": "model-00002-of-00002.safetensors",
129
+ "encoder.block.20.layer.1.DenseReluDense.wi_0.weight": "model-00002-of-00002.safetensors",
130
+ "encoder.block.20.layer.1.DenseReluDense.wi_1.weight": "model-00002-of-00002.safetensors",
131
+ "encoder.block.20.layer.1.DenseReluDense.wo.weight": "model-00002-of-00002.safetensors",
132
+ "encoder.block.20.layer.1.layer_norm.weight": "model-00002-of-00002.safetensors",
133
+ "encoder.block.21.layer.0.SelfAttention.k.weight": "model-00002-of-00002.safetensors",
134
+ "encoder.block.21.layer.0.SelfAttention.o.weight": "model-00002-of-00002.safetensors",
135
+ "encoder.block.21.layer.0.SelfAttention.q.weight": "model-00002-of-00002.safetensors",
136
+ "encoder.block.21.layer.0.SelfAttention.v.weight": "model-00002-of-00002.safetensors",
137
+ "encoder.block.21.layer.0.layer_norm.weight": "model-00002-of-00002.safetensors",
138
+ "encoder.block.21.layer.1.DenseReluDense.wi_0.weight": "model-00002-of-00002.safetensors",
139
+ "encoder.block.21.layer.1.DenseReluDense.wi_1.weight": "model-00002-of-00002.safetensors",
140
+ "encoder.block.21.layer.1.DenseReluDense.wo.weight": "model-00002-of-00002.safetensors",
141
+ "encoder.block.21.layer.1.layer_norm.weight": "model-00002-of-00002.safetensors",
142
+ "encoder.block.22.layer.0.SelfAttention.k.weight": "model-00002-of-00002.safetensors",
143
+ "encoder.block.22.layer.0.SelfAttention.o.weight": "model-00002-of-00002.safetensors",
144
+ "encoder.block.22.layer.0.SelfAttention.q.weight": "model-00002-of-00002.safetensors",
145
+ "encoder.block.22.layer.0.SelfAttention.v.weight": "model-00002-of-00002.safetensors",
146
+ "encoder.block.22.layer.0.layer_norm.weight": "model-00002-of-00002.safetensors",
147
+ "encoder.block.22.layer.1.DenseReluDense.wi_0.weight": "model-00002-of-00002.safetensors",
148
+ "encoder.block.22.layer.1.DenseReluDense.wi_1.weight": "model-00002-of-00002.safetensors",
149
+ "encoder.block.22.layer.1.DenseReluDense.wo.weight": "model-00002-of-00002.safetensors",
150
+ "encoder.block.22.layer.1.layer_norm.weight": "model-00002-of-00002.safetensors",
151
+ "encoder.block.23.layer.0.SelfAttention.k.weight": "model-00002-of-00002.safetensors",
152
+ "encoder.block.23.layer.0.SelfAttention.o.weight": "model-00002-of-00002.safetensors",
153
+ "encoder.block.23.layer.0.SelfAttention.q.weight": "model-00002-of-00002.safetensors",
154
+ "encoder.block.23.layer.0.SelfAttention.v.weight": "model-00002-of-00002.safetensors",
155
+ "encoder.block.23.layer.0.layer_norm.weight": "model-00002-of-00002.safetensors",
156
+ "encoder.block.23.layer.1.DenseReluDense.wi_0.weight": "model-00002-of-00002.safetensors",
157
+ "encoder.block.23.layer.1.DenseReluDense.wi_1.weight": "model-00002-of-00002.safetensors",
158
+ "encoder.block.23.layer.1.DenseReluDense.wo.weight": "model-00002-of-00002.safetensors",
159
+ "encoder.block.23.layer.1.layer_norm.weight": "model-00002-of-00002.safetensors",
160
+ "encoder.block.3.layer.0.SelfAttention.k.weight": "model-00001-of-00002.safetensors",
161
+ "encoder.block.3.layer.0.SelfAttention.o.weight": "model-00001-of-00002.safetensors",
162
+ "encoder.block.3.layer.0.SelfAttention.q.weight": "model-00001-of-00002.safetensors",
163
+ "encoder.block.3.layer.0.SelfAttention.v.weight": "model-00001-of-00002.safetensors",
164
+ "encoder.block.3.layer.0.layer_norm.weight": "model-00001-of-00002.safetensors",
165
+ "encoder.block.3.layer.1.DenseReluDense.wi_0.weight": "model-00001-of-00002.safetensors",
166
+ "encoder.block.3.layer.1.DenseReluDense.wi_1.weight": "model-00001-of-00002.safetensors",
167
+ "encoder.block.3.layer.1.DenseReluDense.wo.weight": "model-00001-of-00002.safetensors",
168
+ "encoder.block.3.layer.1.layer_norm.weight": "model-00001-of-00002.safetensors",
169
+ "encoder.block.4.layer.0.SelfAttention.k.weight": "model-00001-of-00002.safetensors",
170
+ "encoder.block.4.layer.0.SelfAttention.o.weight": "model-00001-of-00002.safetensors",
171
+ "encoder.block.4.layer.0.SelfAttention.q.weight": "model-00001-of-00002.safetensors",
172
+ "encoder.block.4.layer.0.SelfAttention.v.weight": "model-00001-of-00002.safetensors",
173
+ "encoder.block.4.layer.0.layer_norm.weight": "model-00001-of-00002.safetensors",
174
+ "encoder.block.4.layer.1.DenseReluDense.wi_0.weight": "model-00001-of-00002.safetensors",
175
+ "encoder.block.4.layer.1.DenseReluDense.wi_1.weight": "model-00001-of-00002.safetensors",
176
+ "encoder.block.4.layer.1.DenseReluDense.wo.weight": "model-00001-of-00002.safetensors",
177
+ "encoder.block.4.layer.1.layer_norm.weight": "model-00001-of-00002.safetensors",
178
+ "encoder.block.5.layer.0.SelfAttention.k.weight": "model-00001-of-00002.safetensors",
179
+ "encoder.block.5.layer.0.SelfAttention.o.weight": "model-00001-of-00002.safetensors",
180
+ "encoder.block.5.layer.0.SelfAttention.q.weight": "model-00001-of-00002.safetensors",
181
+ "encoder.block.5.layer.0.SelfAttention.v.weight": "model-00001-of-00002.safetensors",
182
+ "encoder.block.5.layer.0.layer_norm.weight": "model-00001-of-00002.safetensors",
183
+ "encoder.block.5.layer.1.DenseReluDense.wi_0.weight": "model-00001-of-00002.safetensors",
184
+ "encoder.block.5.layer.1.DenseReluDense.wi_1.weight": "model-00001-of-00002.safetensors",
185
+ "encoder.block.5.layer.1.DenseReluDense.wo.weight": "model-00001-of-00002.safetensors",
186
+ "encoder.block.5.layer.1.layer_norm.weight": "model-00001-of-00002.safetensors",
187
+ "encoder.block.6.layer.0.SelfAttention.k.weight": "model-00001-of-00002.safetensors",
188
+ "encoder.block.6.layer.0.SelfAttention.o.weight": "model-00001-of-00002.safetensors",
189
+ "encoder.block.6.layer.0.SelfAttention.q.weight": "model-00001-of-00002.safetensors",
190
+ "encoder.block.6.layer.0.SelfAttention.v.weight": "model-00001-of-00002.safetensors",
191
+ "encoder.block.6.layer.0.layer_norm.weight": "model-00001-of-00002.safetensors",
192
+ "encoder.block.6.layer.1.DenseReluDense.wi_0.weight": "model-00001-of-00002.safetensors",
193
+ "encoder.block.6.layer.1.DenseReluDense.wi_1.weight": "model-00001-of-00002.safetensors",
194
+ "encoder.block.6.layer.1.DenseReluDense.wo.weight": "model-00001-of-00002.safetensors",
195
+ "encoder.block.6.layer.1.layer_norm.weight": "model-00001-of-00002.safetensors",
196
+ "encoder.block.7.layer.0.SelfAttention.k.weight": "model-00001-of-00002.safetensors",
197
+ "encoder.block.7.layer.0.SelfAttention.o.weight": "model-00001-of-00002.safetensors",
198
+ "encoder.block.7.layer.0.SelfAttention.q.weight": "model-00001-of-00002.safetensors",
199
+ "encoder.block.7.layer.0.SelfAttention.v.weight": "model-00001-of-00002.safetensors",
200
+ "encoder.block.7.layer.0.layer_norm.weight": "model-00001-of-00002.safetensors",
201
+ "encoder.block.7.layer.1.DenseReluDense.wi_0.weight": "model-00001-of-00002.safetensors",
202
+ "encoder.block.7.layer.1.DenseReluDense.wi_1.weight": "model-00001-of-00002.safetensors",
203
+ "encoder.block.7.layer.1.DenseReluDense.wo.weight": "model-00001-of-00002.safetensors",
204
+ "encoder.block.7.layer.1.layer_norm.weight": "model-00001-of-00002.safetensors",
205
+ "encoder.block.8.layer.0.SelfAttention.k.weight": "model-00001-of-00002.safetensors",
206
+ "encoder.block.8.layer.0.SelfAttention.o.weight": "model-00001-of-00002.safetensors",
207
+ "encoder.block.8.layer.0.SelfAttention.q.weight": "model-00001-of-00002.safetensors",
208
+ "encoder.block.8.layer.0.SelfAttention.v.weight": "model-00001-of-00002.safetensors",
209
+ "encoder.block.8.layer.0.layer_norm.weight": "model-00001-of-00002.safetensors",
210
+ "encoder.block.8.layer.1.DenseReluDense.wi_0.weight": "model-00001-of-00002.safetensors",
211
+ "encoder.block.8.layer.1.DenseReluDense.wi_1.weight": "model-00001-of-00002.safetensors",
212
+ "encoder.block.8.layer.1.DenseReluDense.wo.weight": "model-00001-of-00002.safetensors",
213
+ "encoder.block.8.layer.1.layer_norm.weight": "model-00001-of-00002.safetensors",
214
+ "encoder.block.9.layer.0.SelfAttention.k.weight": "model-00001-of-00002.safetensors",
215
+ "encoder.block.9.layer.0.SelfAttention.o.weight": "model-00001-of-00002.safetensors",
216
+ "encoder.block.9.layer.0.SelfAttention.q.weight": "model-00001-of-00002.safetensors",
217
+ "encoder.block.9.layer.0.SelfAttention.v.weight": "model-00001-of-00002.safetensors",
218
+ "encoder.block.9.layer.0.layer_norm.weight": "model-00001-of-00002.safetensors",
219
+ "encoder.block.9.layer.1.DenseReluDense.wi_0.weight": "model-00001-of-00002.safetensors",
220
+ "encoder.block.9.layer.1.DenseReluDense.wi_1.weight": "model-00001-of-00002.safetensors",
221
+ "encoder.block.9.layer.1.DenseReluDense.wo.weight": "model-00001-of-00002.safetensors",
222
+ "encoder.block.9.layer.1.layer_norm.weight": "model-00001-of-00002.safetensors",
223
+ "encoder.final_layer_norm.weight": "model-00002-of-00002.safetensors",
224
+ "shared.weight": "model-00001-of-00002.safetensors"
225
+ }
226
+ }
tokenizer/merges.txt ADDED
The diff for this file is too large to render. See raw diff
 
tokenizer/special_tokens_map.json ADDED
@@ -0,0 +1,30 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "bos_token": {
3
+ "content": "<|startoftext|>",
4
+ "lstrip": false,
5
+ "normalized": true,
6
+ "rstrip": false,
7
+ "single_word": false
8
+ },
9
+ "eos_token": {
10
+ "content": "<|endoftext|>",
11
+ "lstrip": false,
12
+ "normalized": false,
13
+ "rstrip": false,
14
+ "single_word": false
15
+ },
16
+ "pad_token": {
17
+ "content": "<|endoftext|>",
18
+ "lstrip": false,
19
+ "normalized": false,
20
+ "rstrip": false,
21
+ "single_word": false
22
+ },
23
+ "unk_token": {
24
+ "content": "<|endoftext|>",
25
+ "lstrip": false,
26
+ "normalized": false,
27
+ "rstrip": false,
28
+ "single_word": false
29
+ }
30
+ }
tokenizer/tokenizer_config.json ADDED
@@ -0,0 +1,30 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "add_prefix_space": false,
3
+ "added_tokens_decoder": {
4
+ "49406": {
5
+ "content": "<|startoftext|>",
6
+ "lstrip": false,
7
+ "normalized": true,
8
+ "rstrip": false,
9
+ "single_word": false,
10
+ "special": true
11
+ },
12
+ "49407": {
13
+ "content": "<|endoftext|>",
14
+ "lstrip": false,
15
+ "normalized": false,
16
+ "rstrip": false,
17
+ "single_word": false,
18
+ "special": true
19
+ }
20
+ },
21
+ "bos_token": "<|startoftext|>",
22
+ "clean_up_tokenization_spaces": true,
23
+ "do_lower_case": true,
24
+ "eos_token": "<|endoftext|>",
25
+ "errors": "replace",
26
+ "model_max_length": 77,
27
+ "pad_token": "<|endoftext|>",
28
+ "tokenizer_class": "CLIPTokenizer",
29
+ "unk_token": "<|endoftext|>"
30
+ }
tokenizer/vocab.json ADDED
The diff for this file is too large to render. See raw diff
 
tokenizer_2/merges.txt ADDED
The diff for this file is too large to render. See raw diff
 
tokenizer_2/special_tokens_map.json ADDED
@@ -0,0 +1,30 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "bos_token": {
3
+ "content": "<|startoftext|>",
4
+ "lstrip": false,
5
+ "normalized": true,
6
+ "rstrip": false,
7
+ "single_word": false
8
+ },
9
+ "eos_token": {
10
+ "content": "<|endoftext|>",
11
+ "lstrip": false,
12
+ "normalized": false,
13
+ "rstrip": false,
14
+ "single_word": false
15
+ },
16
+ "pad_token": {
17
+ "content": "!",
18
+ "lstrip": false,
19
+ "normalized": false,
20
+ "rstrip": false,
21
+ "single_word": false
22
+ },
23
+ "unk_token": {
24
+ "content": "<|endoftext|>",
25
+ "lstrip": false,
26
+ "normalized": false,
27
+ "rstrip": false,
28
+ "single_word": false
29
+ }
30
+ }
tokenizer_2/tokenizer_config.json ADDED
@@ -0,0 +1,38 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "add_prefix_space": false,
3
+ "added_tokens_decoder": {
4
+ "0": {
5
+ "content": "!",
6
+ "lstrip": false,
7
+ "normalized": false,
8
+ "rstrip": false,
9
+ "single_word": false,
10
+ "special": true
11
+ },
12
+ "49406": {
13
+ "content": "<|startoftext|>",
14
+ "lstrip": false,
15
+ "normalized": true,
16
+ "rstrip": false,
17
+ "single_word": false,
18
+ "special": true
19
+ },
20
+ "49407": {
21
+ "content": "<|endoftext|>",
22
+ "lstrip": false,
23
+ "normalized": false,
24
+ "rstrip": false,
25
+ "single_word": false,
26
+ "special": true
27
+ }
28
+ },
29
+ "bos_token": "<|startoftext|>",
30
+ "clean_up_tokenization_spaces": true,
31
+ "do_lower_case": true,
32
+ "eos_token": "<|endoftext|>",
33
+ "errors": "replace",
34
+ "model_max_length": 77,
35
+ "pad_token": "!",
36
+ "tokenizer_class": "CLIPTokenizer",
37
+ "unk_token": "<|endoftext|>"
38
+ }
tokenizer_2/vocab.json ADDED
The diff for this file is too large to render. See raw diff
 
tokenizer_3/special_tokens_map.json ADDED
@@ -0,0 +1,125 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "additional_special_tokens": [
3
+ "<extra_id_0>",
4
+ "<extra_id_1>",
5
+ "<extra_id_2>",
6
+ "<extra_id_3>",
7
+ "<extra_id_4>",
8
+ "<extra_id_5>",
9
+ "<extra_id_6>",
10
+ "<extra_id_7>",
11
+ "<extra_id_8>",
12
+ "<extra_id_9>",
13
+ "<extra_id_10>",
14
+ "<extra_id_11>",
15
+ "<extra_id_12>",
16
+ "<extra_id_13>",
17
+ "<extra_id_14>",
18
+ "<extra_id_15>",
19
+ "<extra_id_16>",
20
+ "<extra_id_17>",
21
+ "<extra_id_18>",
22
+ "<extra_id_19>",
23
+ "<extra_id_20>",
24
+ "<extra_id_21>",
25
+ "<extra_id_22>",
26
+ "<extra_id_23>",
27
+ "<extra_id_24>",
28
+ "<extra_id_25>",
29
+ "<extra_id_26>",
30
+ "<extra_id_27>",
31
+ "<extra_id_28>",
32
+ "<extra_id_29>",
33
+ "<extra_id_30>",
34
+ "<extra_id_31>",
35
+ "<extra_id_32>",
36
+ "<extra_id_33>",
37
+ "<extra_id_34>",
38
+ "<extra_id_35>",
39
+ "<extra_id_36>",
40
+ "<extra_id_37>",
41
+ "<extra_id_38>",
42
+ "<extra_id_39>",
43
+ "<extra_id_40>",
44
+ "<extra_id_41>",
45
+ "<extra_id_42>",
46
+ "<extra_id_43>",
47
+ "<extra_id_44>",
48
+ "<extra_id_45>",
49
+ "<extra_id_46>",
50
+ "<extra_id_47>",
51
+ "<extra_id_48>",
52
+ "<extra_id_49>",
53
+ "<extra_id_50>",
54
+ "<extra_id_51>",
55
+ "<extra_id_52>",
56
+ "<extra_id_53>",
57
+ "<extra_id_54>",
58
+ "<extra_id_55>",
59
+ "<extra_id_56>",
60
+ "<extra_id_57>",
61
+ "<extra_id_58>",
62
+ "<extra_id_59>",
63
+ "<extra_id_60>",
64
+ "<extra_id_61>",
65
+ "<extra_id_62>",
66
+ "<extra_id_63>",
67
+ "<extra_id_64>",
68
+ "<extra_id_65>",
69
+ "<extra_id_66>",
70
+ "<extra_id_67>",
71
+ "<extra_id_68>",
72
+ "<extra_id_69>",
73
+ "<extra_id_70>",
74
+ "<extra_id_71>",
75
+ "<extra_id_72>",
76
+ "<extra_id_73>",
77
+ "<extra_id_74>",
78
+ "<extra_id_75>",
79
+ "<extra_id_76>",
80
+ "<extra_id_77>",
81
+ "<extra_id_78>",
82
+ "<extra_id_79>",
83
+ "<extra_id_80>",
84
+ "<extra_id_81>",
85
+ "<extra_id_82>",
86
+ "<extra_id_83>",
87
+ "<extra_id_84>",
88
+ "<extra_id_85>",
89
+ "<extra_id_86>",
90
+ "<extra_id_87>",
91
+ "<extra_id_88>",
92
+ "<extra_id_89>",
93
+ "<extra_id_90>",
94
+ "<extra_id_91>",
95
+ "<extra_id_92>",
96
+ "<extra_id_93>",
97
+ "<extra_id_94>",
98
+ "<extra_id_95>",
99
+ "<extra_id_96>",
100
+ "<extra_id_97>",
101
+ "<extra_id_98>",
102
+ "<extra_id_99>"
103
+ ],
104
+ "eos_token": {
105
+ "content": "</s>",
106
+ "lstrip": false,
107
+ "normalized": false,
108
+ "rstrip": false,
109
+ "single_word": false
110
+ },
111
+ "pad_token": {
112
+ "content": "<pad>",
113
+ "lstrip": false,
114
+ "normalized": false,
115
+ "rstrip": false,
116
+ "single_word": false
117
+ },
118
+ "unk_token": {
119
+ "content": "<unk>",
120
+ "lstrip": false,
121
+ "normalized": false,
122
+ "rstrip": false,
123
+ "single_word": false
124
+ }
125
+ }
tokenizer_3/spiece.model ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d60acb128cf7b7f2536e8f38a5b18a05535c9e14c7a355904270e15b0945ea86
3
+ size 791656
tokenizer_3/tokenizer.json ADDED
The diff for this file is too large to render. See raw diff
 
tokenizer_3/tokenizer_config.json ADDED
@@ -0,0 +1,940 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "add_prefix_space": true,
3
+ "added_tokens_decoder": {
4
+ "0": {
5
+ "content": "<pad>",
6
+ "lstrip": false,
7
+ "normalized": false,
8
+ "rstrip": false,
9
+ "single_word": false,
10
+ "special": true
11
+ },
12
+ "1": {
13
+ "content": "</s>",
14
+ "lstrip": false,
15
+ "normalized": false,
16
+ "rstrip": false,
17
+ "single_word": false,
18
+ "special": true
19
+ },
20
+ "2": {
21
+ "content": "<unk>",
22
+ "lstrip": false,
23
+ "normalized": false,
24
+ "rstrip": false,
25
+ "single_word": false,
26
+ "special": true
27
+ },
28
+ "32000": {
29
+ "content": "<extra_id_99>",
30
+ "lstrip": true,
31
+ "normalized": false,
32
+ "rstrip": true,
33
+ "single_word": false,
34
+ "special": true
35
+ },
36
+ "32001": {
37
+ "content": "<extra_id_98>",
38
+ "lstrip": true,
39
+ "normalized": false,
40
+ "rstrip": true,
41
+ "single_word": false,
42
+ "special": true
43
+ },
44
+ "32002": {
45
+ "content": "<extra_id_97>",
46
+ "lstrip": true,
47
+ "normalized": false,
48
+ "rstrip": true,
49
+ "single_word": false,
50
+ "special": true
51
+ },
52
+ "32003": {
53
+ "content": "<extra_id_96>",
54
+ "lstrip": true,
55
+ "normalized": false,
56
+ "rstrip": true,
57
+ "single_word": false,
58
+ "special": true
59
+ },
60
+ "32004": {
61
+ "content": "<extra_id_95>",
62
+ "lstrip": true,
63
+ "normalized": false,
64
+ "rstrip": true,
65
+ "single_word": false,
66
+ "special": true
67
+ },
68
+ "32005": {
69
+ "content": "<extra_id_94>",
70
+ "lstrip": true,
71
+ "normalized": false,
72
+ "rstrip": true,
73
+ "single_word": false,
74
+ "special": true
75
+ },
76
+ "32006": {
77
+ "content": "<extra_id_93>",
78
+ "lstrip": true,
79
+ "normalized": false,
80
+ "rstrip": true,
81
+ "single_word": false,
82
+ "special": true
83
+ },
84
+ "32007": {
85
+ "content": "<extra_id_92>",
86
+ "lstrip": true,
87
+ "normalized": false,
88
+ "rstrip": true,
89
+ "single_word": false,
90
+ "special": true
91
+ },
92
+ "32008": {
93
+ "content": "<extra_id_91>",
94
+ "lstrip": true,
95
+ "normalized": false,
96
+ "rstrip": true,
97
+ "single_word": false,
98
+ "special": true
99
+ },
100
+ "32009": {
101
+ "content": "<extra_id_90>",
102
+ "lstrip": true,
103
+ "normalized": false,
104
+ "rstrip": true,
105
+ "single_word": false,
106
+ "special": true
107
+ },
108
+ "32010": {
109
+ "content": "<extra_id_89>",
110
+ "lstrip": true,
111
+ "normalized": false,
112
+ "rstrip": true,
113
+ "single_word": false,
114
+ "special": true
115
+ },
116
+ "32011": {
117
+ "content": "<extra_id_88>",
118
+ "lstrip": true,
119
+ "normalized": false,
120
+ "rstrip": true,
121
+ "single_word": false,
122
+ "special": true
123
+ },
124
+ "32012": {
125
+ "content": "<extra_id_87>",
126
+ "lstrip": true,
127
+ "normalized": false,
128
+ "rstrip": true,
129
+ "single_word": false,
130
+ "special": true
131
+ },
132
+ "32013": {
133
+ "content": "<extra_id_86>",
134
+ "lstrip": true,
135
+ "normalized": false,
136
+ "rstrip": true,
137
+ "single_word": false,
138
+ "special": true
139
+ },
140
+ "32014": {
141
+ "content": "<extra_id_85>",
142
+ "lstrip": true,
143
+ "normalized": false,
144
+ "rstrip": true,
145
+ "single_word": false,
146
+ "special": true
147
+ },
148
+ "32015": {
149
+ "content": "<extra_id_84>",
150
+ "lstrip": true,
151
+ "normalized": false,
152
+ "rstrip": true,
153
+ "single_word": false,
154
+ "special": true
155
+ },
156
+ "32016": {
157
+ "content": "<extra_id_83>",
158
+ "lstrip": true,
159
+ "normalized": false,
160
+ "rstrip": true,
161
+ "single_word": false,
162
+ "special": true
163
+ },
164
+ "32017": {
165
+ "content": "<extra_id_82>",
166
+ "lstrip": true,
167
+ "normalized": false,
168
+ "rstrip": true,
169
+ "single_word": false,
170
+ "special": true
171
+ },
172
+ "32018": {
173
+ "content": "<extra_id_81>",
174
+ "lstrip": true,
175
+ "normalized": false,
176
+ "rstrip": true,
177
+ "single_word": false,
178
+ "special": true
179
+ },
180
+ "32019": {
181
+ "content": "<extra_id_80>",
182
+ "lstrip": true,
183
+ "normalized": false,
184
+ "rstrip": true,
185
+ "single_word": false,
186
+ "special": true
187
+ },
188
+ "32020": {
189
+ "content": "<extra_id_79>",
190
+ "lstrip": true,
191
+ "normalized": false,
192
+ "rstrip": true,
193
+ "single_word": false,
194
+ "special": true
195
+ },
196
+ "32021": {
197
+ "content": "<extra_id_78>",
198
+ "lstrip": true,
199
+ "normalized": false,
200
+ "rstrip": true,
201
+ "single_word": false,
202
+ "special": true
203
+ },
204
+ "32022": {
205
+ "content": "<extra_id_77>",
206
+ "lstrip": true,
207
+ "normalized": false,
208
+ "rstrip": true,
209
+ "single_word": false,
210
+ "special": true
211
+ },
212
+ "32023": {
213
+ "content": "<extra_id_76>",
214
+ "lstrip": true,
215
+ "normalized": false,
216
+ "rstrip": true,
217
+ "single_word": false,
218
+ "special": true
219
+ },
220
+ "32024": {
221
+ "content": "<extra_id_75>",
222
+ "lstrip": true,
223
+ "normalized": false,
224
+ "rstrip": true,
225
+ "single_word": false,
226
+ "special": true
227
+ },
228
+ "32025": {
229
+ "content": "<extra_id_74>",
230
+ "lstrip": true,
231
+ "normalized": false,
232
+ "rstrip": true,
233
+ "single_word": false,
234
+ "special": true
235
+ },
236
+ "32026": {
237
+ "content": "<extra_id_73>",
238
+ "lstrip": true,
239
+ "normalized": false,
240
+ "rstrip": true,
241
+ "single_word": false,
242
+ "special": true
243
+ },
244
+ "32027": {
245
+ "content": "<extra_id_72>",
246
+ "lstrip": true,
247
+ "normalized": false,
248
+ "rstrip": true,
249
+ "single_word": false,
250
+ "special": true
251
+ },
252
+ "32028": {
253
+ "content": "<extra_id_71>",
254
+ "lstrip": true,
255
+ "normalized": false,
256
+ "rstrip": true,
257
+ "single_word": false,
258
+ "special": true
259
+ },
260
+ "32029": {
261
+ "content": "<extra_id_70>",
262
+ "lstrip": true,
263
+ "normalized": false,
264
+ "rstrip": true,
265
+ "single_word": false,
266
+ "special": true
267
+ },
268
+ "32030": {
269
+ "content": "<extra_id_69>",
270
+ "lstrip": true,
271
+ "normalized": false,
272
+ "rstrip": true,
273
+ "single_word": false,
274
+ "special": true
275
+ },
276
+ "32031": {
277
+ "content": "<extra_id_68>",
278
+ "lstrip": true,
279
+ "normalized": false,
280
+ "rstrip": true,
281
+ "single_word": false,
282
+ "special": true
283
+ },
284
+ "32032": {
285
+ "content": "<extra_id_67>",
286
+ "lstrip": true,
287
+ "normalized": false,
288
+ "rstrip": true,
289
+ "single_word": false,
290
+ "special": true
291
+ },
292
+ "32033": {
293
+ "content": "<extra_id_66>",
294
+ "lstrip": true,
295
+ "normalized": false,
296
+ "rstrip": true,
297
+ "single_word": false,
298
+ "special": true
299
+ },
300
+ "32034": {
301
+ "content": "<extra_id_65>",
302
+ "lstrip": true,
303
+ "normalized": false,
304
+ "rstrip": true,
305
+ "single_word": false,
306
+ "special": true
307
+ },
308
+ "32035": {
309
+ "content": "<extra_id_64>",
310
+ "lstrip": true,
311
+ "normalized": false,
312
+ "rstrip": true,
313
+ "single_word": false,
314
+ "special": true
315
+ },
316
+ "32036": {
317
+ "content": "<extra_id_63>",
318
+ "lstrip": true,
319
+ "normalized": false,
320
+ "rstrip": true,
321
+ "single_word": false,
322
+ "special": true
323
+ },
324
+ "32037": {
325
+ "content": "<extra_id_62>",
326
+ "lstrip": true,
327
+ "normalized": false,
328
+ "rstrip": true,
329
+ "single_word": false,
330
+ "special": true
331
+ },
332
+ "32038": {
333
+ "content": "<extra_id_61>",
334
+ "lstrip": true,
335
+ "normalized": false,
336
+ "rstrip": true,
337
+ "single_word": false,
338
+ "special": true
339
+ },
340
+ "32039": {
341
+ "content": "<extra_id_60>",
342
+ "lstrip": true,
343
+ "normalized": false,
344
+ "rstrip": true,
345
+ "single_word": false,
346
+ "special": true
347
+ },
348
+ "32040": {
349
+ "content": "<extra_id_59>",
350
+ "lstrip": true,
351
+ "normalized": false,
352
+ "rstrip": true,
353
+ "single_word": false,
354
+ "special": true
355
+ },
356
+ "32041": {
357
+ "content": "<extra_id_58>",
358
+ "lstrip": true,
359
+ "normalized": false,
360
+ "rstrip": true,
361
+ "single_word": false,
362
+ "special": true
363
+ },
364
+ "32042": {
365
+ "content": "<extra_id_57>",
366
+ "lstrip": true,
367
+ "normalized": false,
368
+ "rstrip": true,
369
+ "single_word": false,
370
+ "special": true
371
+ },
372
+ "32043": {
373
+ "content": "<extra_id_56>",
374
+ "lstrip": true,
375
+ "normalized": false,
376
+ "rstrip": true,
377
+ "single_word": false,
378
+ "special": true
379
+ },
380
+ "32044": {
381
+ "content": "<extra_id_55>",
382
+ "lstrip": true,
383
+ "normalized": false,
384
+ "rstrip": true,
385
+ "single_word": false,
386
+ "special": true
387
+ },
388
+ "32045": {
389
+ "content": "<extra_id_54>",
390
+ "lstrip": true,
391
+ "normalized": false,
392
+ "rstrip": true,
393
+ "single_word": false,
394
+ "special": true
395
+ },
396
+ "32046": {
397
+ "content": "<extra_id_53>",
398
+ "lstrip": true,
399
+ "normalized": false,
400
+ "rstrip": true,
401
+ "single_word": false,
402
+ "special": true
403
+ },
404
+ "32047": {
405
+ "content": "<extra_id_52>",
406
+ "lstrip": true,
407
+ "normalized": false,
408
+ "rstrip": true,
409
+ "single_word": false,
410
+ "special": true
411
+ },
412
+ "32048": {
413
+ "content": "<extra_id_51>",
414
+ "lstrip": true,
415
+ "normalized": false,
416
+ "rstrip": true,
417
+ "single_word": false,
418
+ "special": true
419
+ },
420
+ "32049": {
421
+ "content": "<extra_id_50>",
422
+ "lstrip": true,
423
+ "normalized": false,
424
+ "rstrip": true,
425
+ "single_word": false,
426
+ "special": true
427
+ },
428
+ "32050": {
429
+ "content": "<extra_id_49>",
430
+ "lstrip": true,
431
+ "normalized": false,
432
+ "rstrip": true,
433
+ "single_word": false,
434
+ "special": true
435
+ },
436
+ "32051": {
437
+ "content": "<extra_id_48>",
438
+ "lstrip": true,
439
+ "normalized": false,
440
+ "rstrip": true,
441
+ "single_word": false,
442
+ "special": true
443
+ },
444
+ "32052": {
445
+ "content": "<extra_id_47>",
446
+ "lstrip": true,
447
+ "normalized": false,
448
+ "rstrip": true,
449
+ "single_word": false,
450
+ "special": true
451
+ },
452
+ "32053": {
453
+ "content": "<extra_id_46>",
454
+ "lstrip": true,
455
+ "normalized": false,
456
+ "rstrip": true,
457
+ "single_word": false,
458
+ "special": true
459
+ },
460
+ "32054": {
461
+ "content": "<extra_id_45>",
462
+ "lstrip": true,
463
+ "normalized": false,
464
+ "rstrip": true,
465
+ "single_word": false,
466
+ "special": true
467
+ },
468
+ "32055": {
469
+ "content": "<extra_id_44>",
470
+ "lstrip": true,
471
+ "normalized": false,
472
+ "rstrip": true,
473
+ "single_word": false,
474
+ "special": true
475
+ },
476
+ "32056": {
477
+ "content": "<extra_id_43>",
478
+ "lstrip": true,
479
+ "normalized": false,
480
+ "rstrip": true,
481
+ "single_word": false,
482
+ "special": true
483
+ },
484
+ "32057": {
485
+ "content": "<extra_id_42>",
486
+ "lstrip": true,
487
+ "normalized": false,
488
+ "rstrip": true,
489
+ "single_word": false,
490
+ "special": true
491
+ },
492
+ "32058": {
493
+ "content": "<extra_id_41>",
494
+ "lstrip": true,
495
+ "normalized": false,
496
+ "rstrip": true,
497
+ "single_word": false,
498
+ "special": true
499
+ },
500
+ "32059": {
501
+ "content": "<extra_id_40>",
502
+ "lstrip": true,
503
+ "normalized": false,
504
+ "rstrip": true,
505
+ "single_word": false,
506
+ "special": true
507
+ },
508
+ "32060": {
509
+ "content": "<extra_id_39>",
510
+ "lstrip": true,
511
+ "normalized": false,
512
+ "rstrip": true,
513
+ "single_word": false,
514
+ "special": true
515
+ },
516
+ "32061": {
517
+ "content": "<extra_id_38>",
518
+ "lstrip": true,
519
+ "normalized": false,
520
+ "rstrip": true,
521
+ "single_word": false,
522
+ "special": true
523
+ },
524
+ "32062": {
525
+ "content": "<extra_id_37>",
526
+ "lstrip": true,
527
+ "normalized": false,
528
+ "rstrip": true,
529
+ "single_word": false,
530
+ "special": true
531
+ },
532
+ "32063": {
533
+ "content": "<extra_id_36>",
534
+ "lstrip": true,
535
+ "normalized": false,
536
+ "rstrip": true,
537
+ "single_word": false,
538
+ "special": true
539
+ },
540
+ "32064": {
541
+ "content": "<extra_id_35>",
542
+ "lstrip": true,
543
+ "normalized": false,
544
+ "rstrip": true,
545
+ "single_word": false,
546
+ "special": true
547
+ },
548
+ "32065": {
549
+ "content": "<extra_id_34>",
550
+ "lstrip": true,
551
+ "normalized": false,
552
+ "rstrip": true,
553
+ "single_word": false,
554
+ "special": true
555
+ },
556
+ "32066": {
557
+ "content": "<extra_id_33>",
558
+ "lstrip": true,
559
+ "normalized": false,
560
+ "rstrip": true,
561
+ "single_word": false,
562
+ "special": true
563
+ },
564
+ "32067": {
565
+ "content": "<extra_id_32>",
566
+ "lstrip": true,
567
+ "normalized": false,
568
+ "rstrip": true,
569
+ "single_word": false,
570
+ "special": true
571
+ },
572
+ "32068": {
573
+ "content": "<extra_id_31>",
574
+ "lstrip": true,
575
+ "normalized": false,
576
+ "rstrip": true,
577
+ "single_word": false,
578
+ "special": true
579
+ },
580
+ "32069": {
581
+ "content": "<extra_id_30>",
582
+ "lstrip": true,
583
+ "normalized": false,
584
+ "rstrip": true,
585
+ "single_word": false,
586
+ "special": true
587
+ },
588
+ "32070": {
589
+ "content": "<extra_id_29>",
590
+ "lstrip": true,
591
+ "normalized": false,
592
+ "rstrip": true,
593
+ "single_word": false,
594
+ "special": true
595
+ },
596
+ "32071": {
597
+ "content": "<extra_id_28>",
598
+ "lstrip": true,
599
+ "normalized": false,
600
+ "rstrip": true,
601
+ "single_word": false,
602
+ "special": true
603
+ },
604
+ "32072": {
605
+ "content": "<extra_id_27>",
606
+ "lstrip": true,
607
+ "normalized": false,
608
+ "rstrip": true,
609
+ "single_word": false,
610
+ "special": true
611
+ },
612
+ "32073": {
613
+ "content": "<extra_id_26>",
614
+ "lstrip": true,
615
+ "normalized": false,
616
+ "rstrip": true,
617
+ "single_word": false,
618
+ "special": true
619
+ },
620
+ "32074": {
621
+ "content": "<extra_id_25>",
622
+ "lstrip": true,
623
+ "normalized": false,
624
+ "rstrip": true,
625
+ "single_word": false,
626
+ "special": true
627
+ },
628
+ "32075": {
629
+ "content": "<extra_id_24>",
630
+ "lstrip": true,
631
+ "normalized": false,
632
+ "rstrip": true,
633
+ "single_word": false,
634
+ "special": true
635
+ },
636
+ "32076": {
637
+ "content": "<extra_id_23>",
638
+ "lstrip": true,
639
+ "normalized": false,
640
+ "rstrip": true,
641
+ "single_word": false,
642
+ "special": true
643
+ },
644
+ "32077": {
645
+ "content": "<extra_id_22>",
646
+ "lstrip": true,
647
+ "normalized": false,
648
+ "rstrip": true,
649
+ "single_word": false,
650
+ "special": true
651
+ },
652
+ "32078": {
653
+ "content": "<extra_id_21>",
654
+ "lstrip": true,
655
+ "normalized": false,
656
+ "rstrip": true,
657
+ "single_word": false,
658
+ "special": true
659
+ },
660
+ "32079": {
661
+ "content": "<extra_id_20>",
662
+ "lstrip": true,
663
+ "normalized": false,
664
+ "rstrip": true,
665
+ "single_word": false,
666
+ "special": true
667
+ },
668
+ "32080": {
669
+ "content": "<extra_id_19>",
670
+ "lstrip": true,
671
+ "normalized": false,
672
+ "rstrip": true,
673
+ "single_word": false,
674
+ "special": true
675
+ },
676
+ "32081": {
677
+ "content": "<extra_id_18>",
678
+ "lstrip": true,
679
+ "normalized": false,
680
+ "rstrip": true,
681
+ "single_word": false,
682
+ "special": true
683
+ },
684
+ "32082": {
685
+ "content": "<extra_id_17>",
686
+ "lstrip": true,
687
+ "normalized": false,
688
+ "rstrip": true,
689
+ "single_word": false,
690
+ "special": true
691
+ },
692
+ "32083": {
693
+ "content": "<extra_id_16>",
694
+ "lstrip": true,
695
+ "normalized": false,
696
+ "rstrip": true,
697
+ "single_word": false,
698
+ "special": true
699
+ },
700
+ "32084": {
701
+ "content": "<extra_id_15>",
702
+ "lstrip": true,
703
+ "normalized": false,
704
+ "rstrip": true,
705
+ "single_word": false,
706
+ "special": true
707
+ },
708
+ "32085": {
709
+ "content": "<extra_id_14>",
710
+ "lstrip": true,
711
+ "normalized": false,
712
+ "rstrip": true,
713
+ "single_word": false,
714
+ "special": true
715
+ },
716
+ "32086": {
717
+ "content": "<extra_id_13>",
718
+ "lstrip": true,
719
+ "normalized": false,
720
+ "rstrip": true,
721
+ "single_word": false,
722
+ "special": true
723
+ },
724
+ "32087": {
725
+ "content": "<extra_id_12>",
726
+ "lstrip": true,
727
+ "normalized": false,
728
+ "rstrip": true,
729
+ "single_word": false,
730
+ "special": true
731
+ },
732
+ "32088": {
733
+ "content": "<extra_id_11>",
734
+ "lstrip": true,
735
+ "normalized": false,
736
+ "rstrip": true,
737
+ "single_word": false,
738
+ "special": true
739
+ },
740
+ "32089": {
741
+ "content": "<extra_id_10>",
742
+ "lstrip": true,
743
+ "normalized": false,
744
+ "rstrip": true,
745
+ "single_word": false,
746
+ "special": true
747
+ },
748
+ "32090": {
749
+ "content": "<extra_id_9>",
750
+ "lstrip": true,
751
+ "normalized": false,
752
+ "rstrip": true,
753
+ "single_word": false,
754
+ "special": true
755
+ },
756
+ "32091": {
757
+ "content": "<extra_id_8>",
758
+ "lstrip": true,
759
+ "normalized": false,
760
+ "rstrip": true,
761
+ "single_word": false,
762
+ "special": true
763
+ },
764
+ "32092": {
765
+ "content": "<extra_id_7>",
766
+ "lstrip": true,
767
+ "normalized": false,
768
+ "rstrip": true,
769
+ "single_word": false,
770
+ "special": true
771
+ },
772
+ "32093": {
773
+ "content": "<extra_id_6>",
774
+ "lstrip": true,
775
+ "normalized": false,
776
+ "rstrip": true,
777
+ "single_word": false,
778
+ "special": true
779
+ },
780
+ "32094": {
781
+ "content": "<extra_id_5>",
782
+ "lstrip": true,
783
+ "normalized": false,
784
+ "rstrip": true,
785
+ "single_word": false,
786
+ "special": true
787
+ },
788
+ "32095": {
789
+ "content": "<extra_id_4>",
790
+ "lstrip": true,
791
+ "normalized": false,
792
+ "rstrip": true,
793
+ "single_word": false,
794
+ "special": true
795
+ },
796
+ "32096": {
797
+ "content": "<extra_id_3>",
798
+ "lstrip": true,
799
+ "normalized": false,
800
+ "rstrip": true,
801
+ "single_word": false,
802
+ "special": true
803
+ },
804
+ "32097": {
805
+ "content": "<extra_id_2>",
806
+ "lstrip": true,
807
+ "normalized": false,
808
+ "rstrip": true,
809
+ "single_word": false,
810
+ "special": true
811
+ },
812
+ "32098": {
813
+ "content": "<extra_id_1>",
814
+ "lstrip": true,
815
+ "normalized": false,
816
+ "rstrip": true,
817
+ "single_word": false,
818
+ "special": true
819
+ },
820
+ "32099": {
821
+ "content": "<extra_id_0>",
822
+ "lstrip": true,
823
+ "normalized": false,
824
+ "rstrip": true,
825
+ "single_word": false,
826
+ "special": true
827
+ }
828
+ },
829
+ "additional_special_tokens": [
830
+ "<extra_id_0>",
831
+ "<extra_id_1>",
832
+ "<extra_id_2>",
833
+ "<extra_id_3>",
834
+ "<extra_id_4>",
835
+ "<extra_id_5>",
836
+ "<extra_id_6>",
837
+ "<extra_id_7>",
838
+ "<extra_id_8>",
839
+ "<extra_id_9>",
840
+ "<extra_id_10>",
841
+ "<extra_id_11>",
842
+ "<extra_id_12>",
843
+ "<extra_id_13>",
844
+ "<extra_id_14>",
845
+ "<extra_id_15>",
846
+ "<extra_id_16>",
847
+ "<extra_id_17>",
848
+ "<extra_id_18>",
849
+ "<extra_id_19>",
850
+ "<extra_id_20>",
851
+ "<extra_id_21>",
852
+ "<extra_id_22>",
853
+ "<extra_id_23>",
854
+ "<extra_id_24>",
855
+ "<extra_id_25>",
856
+ "<extra_id_26>",
857
+ "<extra_id_27>",
858
+ "<extra_id_28>",
859
+ "<extra_id_29>",
860
+ "<extra_id_30>",
861
+ "<extra_id_31>",
862
+ "<extra_id_32>",
863
+ "<extra_id_33>",
864
+ "<extra_id_34>",
865
+ "<extra_id_35>",
866
+ "<extra_id_36>",
867
+ "<extra_id_37>",
868
+ "<extra_id_38>",
869
+ "<extra_id_39>",
870
+ "<extra_id_40>",
871
+ "<extra_id_41>",
872
+ "<extra_id_42>",
873
+ "<extra_id_43>",
874
+ "<extra_id_44>",
875
+ "<extra_id_45>",
876
+ "<extra_id_46>",
877
+ "<extra_id_47>",
878
+ "<extra_id_48>",
879
+ "<extra_id_49>",
880
+ "<extra_id_50>",
881
+ "<extra_id_51>",
882
+ "<extra_id_52>",
883
+ "<extra_id_53>",
884
+ "<extra_id_54>",
885
+ "<extra_id_55>",
886
+ "<extra_id_56>",
887
+ "<extra_id_57>",
888
+ "<extra_id_58>",
889
+ "<extra_id_59>",
890
+ "<extra_id_60>",
891
+ "<extra_id_61>",
892
+ "<extra_id_62>",
893
+ "<extra_id_63>",
894
+ "<extra_id_64>",
895
+ "<extra_id_65>",
896
+ "<extra_id_66>",
897
+ "<extra_id_67>",
898
+ "<extra_id_68>",
899
+ "<extra_id_69>",
900
+ "<extra_id_70>",
901
+ "<extra_id_71>",
902
+ "<extra_id_72>",
903
+ "<extra_id_73>",
904
+ "<extra_id_74>",
905
+ "<extra_id_75>",
906
+ "<extra_id_76>",
907
+ "<extra_id_77>",
908
+ "<extra_id_78>",
909
+ "<extra_id_79>",
910
+ "<extra_id_80>",
911
+ "<extra_id_81>",
912
+ "<extra_id_82>",
913
+ "<extra_id_83>",
914
+ "<extra_id_84>",
915
+ "<extra_id_85>",
916
+ "<extra_id_86>",
917
+ "<extra_id_87>",
918
+ "<extra_id_88>",
919
+ "<extra_id_89>",
920
+ "<extra_id_90>",
921
+ "<extra_id_91>",
922
+ "<extra_id_92>",
923
+ "<extra_id_93>",
924
+ "<extra_id_94>",
925
+ "<extra_id_95>",
926
+ "<extra_id_96>",
927
+ "<extra_id_97>",
928
+ "<extra_id_98>",
929
+ "<extra_id_99>"
930
+ ],
931
+ "clean_up_tokenization_spaces": true,
932
+ "eos_token": "</s>",
933
+ "extra_ids": 100,
934
+ "legacy": true,
935
+ "model_max_length": 512,
936
+ "pad_token": "<pad>",
937
+ "sp_model_kwargs": {},
938
+ "tokenizer_class": "T5Tokenizer",
939
+ "unk_token": "<unk>"
940
+ }
transformer/config.json ADDED
@@ -0,0 +1,31 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_class_name": "SD3Transformer2DModel",
3
+ "_diffusers_version": "0.31.0.dev0",
4
+ "dual_attention_layers": [
5
+ 0,
6
+ 1,
7
+ 2,
8
+ 3,
9
+ 4,
10
+ 5,
11
+ 6,
12
+ 7,
13
+ 8,
14
+ 9,
15
+ 10,
16
+ 11,
17
+ 12
18
+ ],
19
+ "attention_head_dim": 64,
20
+ "caption_projection_dim": 1536,
21
+ "in_channels": 16,
22
+ "joint_attention_dim": 4096,
23
+ "num_attention_heads": 24,
24
+ "num_layers": 24,
25
+ "out_channels": 16,
26
+ "patch_size": 2,
27
+ "pooled_projection_dim": 2048,
28
+ "pos_embed_max_size": 384,
29
+ "qk_norm": "rms_norm",
30
+ "sample_size": 128
31
+ }
transformer/diffusion_pytorch_model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f81eb93a348be218af757dd095cbda45090380d9bbda91049442e0e40bb4cc95
3
+ size 4939433672
vae copy/config.json ADDED
@@ -0,0 +1,38 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_class_name": "AutoencoderKL",
3
+ "_diffusers_version": "0.31.0.dev0",
4
+ "_name_or_path": "../sdxl-vae/",
5
+ "act_fn": "silu",
6
+ "block_out_channels": [
7
+ 128,
8
+ 256,
9
+ 512,
10
+ 512
11
+ ],
12
+ "down_block_types": [
13
+ "DownEncoderBlock2D",
14
+ "DownEncoderBlock2D",
15
+ "DownEncoderBlock2D",
16
+ "DownEncoderBlock2D"
17
+ ],
18
+ "force_upcast": true,
19
+ "in_channels": 3,
20
+ "latent_channels": 16,
21
+ "latents_mean": null,
22
+ "latents_std": null,
23
+ "layers_per_block": 2,
24
+ "mid_block_add_attention": true,
25
+ "norm_num_groups": 32,
26
+ "out_channels": 3,
27
+ "sample_size": 1024,
28
+ "scaling_factor": 1.5305,
29
+ "shift_factor": 0.0609,
30
+ "up_block_types": [
31
+ "UpDecoderBlock2D",
32
+ "UpDecoderBlock2D",
33
+ "UpDecoderBlock2D",
34
+ "UpDecoderBlock2D"
35
+ ],
36
+ "use_post_quant_conv": false,
37
+ "use_quant_conv": false
38
+ }
vae copy/diffusion_pytorch_model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8f53304a79335b55e13ec50f63e5157fee4deb2f30d5fae0654e2b2653c109dc
3
+ size 167666902
vae/config.json ADDED
@@ -0,0 +1,38 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_class_name": "AutoencoderKL",
3
+ "_diffusers_version": "0.31.0.dev0",
4
+ "_name_or_path": "../sdxl-vae/",
5
+ "act_fn": "silu",
6
+ "block_out_channels": [
7
+ 128,
8
+ 256,
9
+ 512,
10
+ 512
11
+ ],
12
+ "down_block_types": [
13
+ "DownEncoderBlock2D",
14
+ "DownEncoderBlock2D",
15
+ "DownEncoderBlock2D",
16
+ "DownEncoderBlock2D"
17
+ ],
18
+ "force_upcast": true,
19
+ "in_channels": 3,
20
+ "latent_channels": 16,
21
+ "latents_mean": null,
22
+ "latents_std": null,
23
+ "layers_per_block": 2,
24
+ "mid_block_add_attention": true,
25
+ "norm_num_groups": 32,
26
+ "out_channels": 3,
27
+ "sample_size": 1024,
28
+ "scaling_factor": 1.5305,
29
+ "shift_factor": 0.0609,
30
+ "up_block_types": [
31
+ "UpDecoderBlock2D",
32
+ "UpDecoderBlock2D",
33
+ "UpDecoderBlock2D",
34
+ "UpDecoderBlock2D"
35
+ ],
36
+ "use_post_quant_conv": false,
37
+ "use_quant_conv": false
38
+ }
vae/diffusion_pytorch_model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8f53304a79335b55e13ec50f63e5157fee4deb2f30d5fae0654e2b2653c109dc
3
+ size 167666902