File size: 766 Bytes
e6d2ce0 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 |
num_frames = 1
fps = 1
image_size = (2560, 1536)
# image_size = (2048, 2048)
model = dict(
type="PixArt-XL/2",
from_pretrained="PixArt-Sigma-XL-2-2K-MS.pth",
space_scale=4,
no_temporal_pos_emb=True,
enable_flash_attn=True,
enable_layernorm_kernel=True,
base_size=2048 // 8,
)
vae = dict(
type="VideoAutoencoderKL",
from_pretrained="PixArt-alpha/pixart_sigma_sdxlvae_T5_diffusers",
subfolder="vae",
)
text_encoder = dict(
type="t5",
from_pretrained="DeepFloyd/t5-v1_1-xxl",
model_max_length=300,
)
scheduler = dict(
type="dpm-solver",
num_sampling_steps=14,
cfg_scale=4.5,
)
dtype = "bf16"
# Others
batch_size = 1
seed = 42
prompt_path = "./assets/texts/t2i_sigma.txt"
save_dir = "./samples/samples/"
|