{
  "architectures": [
    "AsymmetricMagVitV2Pipline"
  ],
  "decoder": {
    "ch": 128,
    "ch_mult": [
      1,
      2,
      4,
      4
    ],
    "double_z": true,
    "in_channels": 3,
    "num_res_blocks": 2,
    "out_ch": 3,
    "temporal_up_layers": [
      2,
      3
    ],
    "type": "VideoDecoder",
    "video_frame_num": 17,
    "z_channels": 16
  },
  "encoder": {
    "ch": 128,
    "ch_mult": [
      1,
      2,
      4,
      4
    ],
    "double_z": true,
    "down_sampling_layer": [
      1,
      2
    ],
    "in_channels": 3,
    "num_res_blocks": 2,
    "out_ch": 3,
    "type": "VideoEncoder",
    "video_frame_num": 17,
    "z_channels": 16
  },
  "model_type": "AsymmetricMagVitV2Pipline",
  "regularizer": {
    "type": "DiagonalGaussianRegularizer"
  },
  "torch_dtype": "bfloat16",
  "transformers_version": "4.19.1"
}