Yuxiao319 committed on
Commit
bf8d480
1 Parent(s): 930259b

add_mv_enhance

Browse files
mvdiffusion/config.json ADDED
@@ -0,0 +1,71 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_class_name": "UNetMV2DConditionModel",
3
+ "_diffusers_version": "0.19.3",
4
+ "_name_or_path": "/mvfs/workspace/code/mv_proj/outputs-v6/from_crop_17500step_single_obj/unet-50000",
5
+ "act_fn": "silu",
6
+ "addition_embed_type": null,
7
+ "addition_embed_type_num_heads": 64,
8
+ "addition_time_embed_dim": null,
9
+ "attention_head_dim": 8,
10
+ "block_out_channels": [
11
+ 320,
12
+ 640,
13
+ 1280,
14
+ 1280
15
+ ],
16
+ "cd_attention_last": false,
17
+ "cd_attention_mid": true,
18
+ "center_input_sample": false,
19
+ "class_embed_type": "projection",
20
+ "class_embeddings_concat": false,
21
+ "conv_in_kernel": 3,
22
+ "conv_out_kernel": 3,
23
+ "cross_attention_dim": 768,
24
+ "cross_attention_norm": null,
25
+ "down_block_types": [
26
+ "CrossAttnDownBlockMV2D",
27
+ "CrossAttnDownBlockMV2D",
28
+ "CrossAttnDownBlockMV2D",
29
+ "DownBlock2D"
30
+ ],
31
+ "downsample_padding": 1,
32
+ "dual_cross_attention": false,
33
+ "encoder_hid_dim": null,
34
+ "encoder_hid_dim_type": null,
35
+ "flip_sin_to_cos": true,
36
+ "freq_shift": 0,
37
+ "in_channels": 8,
38
+ "layers_per_block": 2,
39
+ "mid_block_only_cross_attention": null,
40
+ "mid_block_scale_factor": 1,
41
+ "mid_block_type": "UNetMidBlockMV2DCrossAttn",
42
+ "multiview_attention": true,
43
+ "mvcd_attention": false,
44
+ "norm_eps": 1e-05,
45
+ "norm_num_groups": 32,
46
+ "num_attention_heads": null,
47
+ "num_class_embeds": null,
48
+ "num_views": 6,
49
+ "only_cross_attention": false,
50
+ "out_channels": 4,
51
+ "projection_class_embeddings_input_dim": 14,
52
+ "resnet_out_scale_factor": 1.0,
53
+ "resnet_skip_time_act": false,
54
+ "resnet_time_scale_shift": "default",
55
+ "sample_size": 32,
56
+ "sparse_mv_attention": false,
57
+ "time_cond_proj_dim": null,
58
+ "time_embedding_act_fn": null,
59
+ "time_embedding_dim": null,
60
+ "time_embedding_type": "positional",
61
+ "timestep_post_act": null,
62
+ "transformer_layers_per_block": 1,
63
+ "up_block_types": [
64
+ "UpBlock2D",
65
+ "CrossAttnUpBlockMV2D",
66
+ "CrossAttnUpBlockMV2D",
67
+ "CrossAttnUpBlockMV2D"
68
+ ],
69
+ "upcast_attention": false,
70
+ "use_linear_projection": false
71
+ }
mvdiffusion/diffusion_pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:25a338df9e3e913ac9de83fb6d1585ea01031dba03434e2adc32237127fddbab
3
+ size 3643509774