Upload PixArtSigmaPipeline
Browse files
- README.md +3 -0
- transformer/config.json +8 -3
- transformer/diffusion_pytorch_model.safetensors +2 -2
- vae/config.json +7 -7
- vae/diffusion_pytorch_model.safetensors +2 -2
README.md
CHANGED
@@ -1 +1,4 @@
|
|
|
|
|
|
|
|
1 |
This model is not trained yet; it is an attempt at attaching a 16-channel VAE to a PixArt-Sigma pipeline.
|
|
|
1 |
+
---
|
2 |
+
library_name: diffusers
|
3 |
+
---
|
4 |
This model is not trained yet; it is an attempt at attaching a 16-channel VAE to a PixArt-Sigma pipeline.
|
transformer/config.json
CHANGED
@@ -1,14 +1,16 @@
|
|
1 |
{
|
2 |
"_class_name": "PixArtTransformer2DModel",
|
3 |
"_diffusers_version": "0.30.2",
|
|
|
4 |
"activation_fn": "gelu-approximate",
|
5 |
"attention_bias": true,
|
6 |
"attention_head_dim": 72,
|
7 |
"attention_type": "default",
|
8 |
"caption_channels": 4096,
|
9 |
"cross_attention_dim": 1152,
|
|
|
10 |
"dropout": 0.0,
|
11 |
-
"in_channels":
|
12 |
"interpolation_scale": 1,
|
13 |
"norm_elementwise_affine": false,
|
14 |
"norm_eps": 1e-06,
|
@@ -17,9 +19,12 @@
|
|
17 |
"num_attention_heads": 16,
|
18 |
"num_embeds_ada_norm": 1000,
|
19 |
"num_layers": 28,
|
20 |
-
"
|
|
|
|
|
21 |
"patch_size": 2,
|
22 |
"sample_size": 64,
|
23 |
"upcast_attention": false,
|
24 |
-
"use_additional_conditions":
|
|
|
25 |
}
|
|
|
1 |
{
|
2 |
"_class_name": "PixArtTransformer2DModel",
|
3 |
"_diffusers_version": "0.30.2",
|
4 |
+
"_name_or_path": "frutiemax/TwistedReality-pixart-512ms",
|
5 |
"activation_fn": "gelu-approximate",
|
6 |
"attention_bias": true,
|
7 |
"attention_head_dim": 72,
|
8 |
"attention_type": "default",
|
9 |
"caption_channels": 4096,
|
10 |
"cross_attention_dim": 1152,
|
11 |
+
"double_self_attention": false,
|
12 |
"dropout": 0.0,
|
13 |
+
"in_channels": 4,
|
14 |
"interpolation_scale": 1,
|
15 |
"norm_elementwise_affine": false,
|
16 |
"norm_eps": 1e-06,
|
|
|
19 |
"num_attention_heads": 16,
|
20 |
"num_embeds_ada_norm": 1000,
|
21 |
"num_layers": 28,
|
22 |
+
"num_vector_embeds": null,
|
23 |
+
"only_cross_attention": false,
|
24 |
+
"out_channels": 8,
|
25 |
"patch_size": 2,
|
26 |
"sample_size": 64,
|
27 |
"upcast_attention": false,
|
28 |
+
"use_additional_conditions": null,
|
29 |
+
"use_linear_projection": false
|
30 |
}
|
transformer/diffusion_pytorch_model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a92c9ace52b60fe1da0c5997859c8ecc6ad1da55a68d5519110c89b66b59ee61
|
3 |
+
size 2443492488
|
vae/config.json
CHANGED
@@ -1,12 +1,12 @@
|
|
1 |
{
|
2 |
"_class_name": "AutoencoderKL",
|
3 |
"_diffusers_version": "0.30.2",
|
4 |
-
"_name_or_path": "
|
5 |
"act_fn": "silu",
|
6 |
"block_out_channels": [
|
|
|
7 |
128,
|
8 |
256,
|
9 |
-
512,
|
10 |
512
|
11 |
],
|
12 |
"down_block_types": [
|
@@ -15,18 +15,18 @@
|
|
15 |
"DownEncoderBlock2D",
|
16 |
"DownEncoderBlock2D"
|
17 |
],
|
18 |
-
"force_upcast":
|
19 |
"in_channels": 3,
|
20 |
"latent_channels": 16,
|
21 |
"latents_mean": null,
|
22 |
"latents_std": null,
|
23 |
"layers_per_block": 2,
|
24 |
-
"mid_block_add_attention":
|
25 |
"norm_num_groups": 32,
|
26 |
"out_channels": 3,
|
27 |
-
"sample_size":
|
28 |
-
"scaling_factor": 0.
|
29 |
-
"shift_factor":
|
30 |
"up_block_types": [
|
31 |
"UpDecoderBlock2D",
|
32 |
"UpDecoderBlock2D",
|
|
|
1 |
{
|
2 |
"_class_name": "AutoencoderKL",
|
3 |
"_diffusers_version": "0.30.2",
|
4 |
+
"_name_or_path": "ostris/vae-kl-f8-d16",
|
5 |
"act_fn": "silu",
|
6 |
"block_out_channels": [
|
7 |
+
128,
|
8 |
128,
|
9 |
256,
|
|
|
10 |
512
|
11 |
],
|
12 |
"down_block_types": [
|
|
|
15 |
"DownEncoderBlock2D",
|
16 |
"DownEncoderBlock2D"
|
17 |
],
|
18 |
+
"force_upcast": true,
|
19 |
"in_channels": 3,
|
20 |
"latent_channels": 16,
|
21 |
"latents_mean": null,
|
22 |
"latents_std": null,
|
23 |
"layers_per_block": 2,
|
24 |
+
"mid_block_add_attention": true,
|
25 |
"norm_num_groups": 32,
|
26 |
"out_channels": 3,
|
27 |
+
"sample_size": 512,
|
28 |
+
"scaling_factor": 0.2614,
|
29 |
+
"shift_factor": null,
|
30 |
"up_block_types": [
|
31 |
"UpDecoderBlock2D",
|
32 |
"UpDecoderBlock2D",
|
vae/diffusion_pytorch_model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b6468f242218bc72981284b6fda570cc7c07ce043e84979cc1bb7d99d39a64a2
|
3 |
+
size 229094420
|