wushuang98 committed on
Commit
3fc5183
·
verified ·
1 Parent(s): 0ee10aa

Upload 5 files

Browse files
direct3d-s2-v-1-0/config.yaml ADDED
@@ -0,0 +1,161 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ dense_vae:
2
+ target: direct3d_s2.models.autoencoders.dense_vae.DenseShapeVAE
3
+ params:
4
+ use_checkpoint: true
5
+ embed_dim: 8
6
+ in_channels: 1
7
+ out_channels: 1
8
+ model_channels_encoder: [32, 128, 512]
9
+ num_res_blocks_encoder: 2
10
+ num_res_blocks_middle_encoder: 2
11
+ model_channels_decoder: [512, 128, 64]
12
+ num_res_blocks_decoder: 4
13
+ num_res_blocks_middle_decoder: 4
14
+ use_fp16: true
15
+ latents_scale: 1.0
16
+ latents_shift: 0.0
17
+
18
+ dense_dit:
19
+ target: direct3d_s2.models.transformers.dense_dit.DenseDiT
20
+ params:
21
+ resolution: 16
22
+ in_channels: 8
23
+ out_channels: 8
24
+ model_channels: 1024
25
+ cond_channels: 1024
26
+ num_blocks: 24
27
+ num_heads: 16
28
+ mlp_ratio: 4
29
+ patch_size: 1
30
+ pe_mode: ape
31
+ qk_rms_norm: true
32
+ use_checkpoint: true
33
+ use_fp16: true
34
+ latent_shape: [8, 16, 16, 16]
35
+
36
+ dense_image_encoder:
37
+ target: direct3d_s2.models.conditioner.DinoEncoder
38
+ params:
39
+ model: facebookresearch/dinov2
40
+ version: dinov2_vitl14_reg
41
+ size: 518
42
+
43
+ dense_scheduler:
44
+ target: diffusers.schedulers.FlowMatchEulerDiscreteScheduler
45
+ params:
46
+ num_train_timesteps: 1000
47
+ shift: 6.0
48
+
49
+ sparse_vae_512:
50
+ target: direct3d_s2.models.autoencoders.ss_vae.SparseSDFVAE
51
+ params:
52
+ use_checkpoint: true
53
+ embed_dim: 16
54
+ num_head_channels_encoder: 64
55
+ model_channels_encoder: 512
56
+ num_heads_encoder: 8
57
+ num_blocks_encoder: 4
58
+ num_head_channels_decoder: 64
59
+ model_channels_decoder: 512
60
+ num_heads_decoder: 8
61
+ num_blocks_decoder: 4
62
+ resolution: 64
63
+ out_channels: 1
64
+ use_fp16: true
65
+ latents_scale: 1.0
66
+ latents_shift: 0.0
67
+
68
+ sparse_dit_512:
69
+ target: direct3d_s2.models.transformers.sparse_dit.SparseDiT
70
+ params:
71
+ resolution: 64
72
+ in_channels: 16
73
+ out_channels: 16
74
+ model_channels: 1024
75
+ cond_channels: 1024
76
+ num_blocks: 24
77
+ num_heads: 32
78
+ num_kv_heads: 2
79
+ compression_block_size: 4
80
+ selection_block_size: 8
81
+ topk: 32
82
+ compression_version: v2
83
+ pe_mode: ape
84
+ factor: 1.0
85
+ sparse_conditions: true
86
+ qk_rms_norm: true
87
+ use_shift: true
88
+ use_checkpoint: true
89
+ use_fp16: true
90
+
91
+ sparse_scheduler_512:
92
+ target: diffusers.schedulers.FlowMatchEulerDiscreteScheduler
93
+ params:
94
+ num_train_timesteps: 1000
95
+ shift: 6.0
96
+
97
+ sparse_vae_1024:
98
+ target: direct3d_s2.models.autoencoders.ss_vae.SparseSDFVAE
99
+ params:
100
+ use_checkpoint: true
101
+ embed_dim: 16
102
+ num_head_channels_encoder: 64
103
+ model_channels_encoder: 512
104
+ num_heads_encoder: 8
105
+ num_blocks_encoder: 4
106
+ num_head_channels_decoder: 64
107
+ model_channels_decoder: 512
108
+ num_heads_decoder: 8
109
+ num_blocks_decoder: 4
110
+ resolution: 128
111
+ out_channels: 1
112
+ use_fp16: true
113
+ latents_scale: 1.0
114
+ latents_shift: 0.0
115
+ chunk_size: 4
116
+
117
+ sparse_dit_1024:
118
+ target: direct3d_s2.models.transformers.sparse_dit.SparseDiT
119
+ params:
120
+ resolution: 128
121
+ in_channels: 16
122
+ out_channels: 16
123
+ model_channels: 1024
124
+ cond_channels: 1024
125
+ num_blocks: 24
126
+ num_heads: 32
127
+ num_kv_heads: 2
128
+ compression_block_size: 4
129
+ selection_block_size: 8
130
+ topk: 8
131
+ compression_version: v2
132
+ pe_mode: ape
133
+ factor: 0.5
134
+ sparse_conditions: true
135
+ qk_rms_norm: true
136
+ use_shift: true
137
+ use_checkpoint: true
138
+ use_fp16: true
139
+
140
+ sparse_scheduler_1024:
141
+ target: diffusers.schedulers.FlowMatchEulerDiscreteScheduler
142
+ params:
143
+ num_train_timesteps: 1000
144
+ shift: 8.0
145
+
146
+ sparse_image_encoder:
147
+ target: direct3d_s2.models.conditioner.DinoEncoder
148
+ params:
149
+ model: facebookresearch/dinov2
150
+ version: dinov2_vitl14_reg
151
+ size: 518
152
+
153
+ refiner:
154
+ target: direct3d_s2.models.refiner.unet_refiner.Voxel_RefinerXL
155
+ params:
156
+ in_channels: 1
157
+ out_channels: 1
158
+ layers_per_block: 2
159
+ layers_mid_block: 2
160
+ patch_size: 192
161
+ use_fp16: true
direct3d-s2-v-1-0/model_dense.ckpt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5e6598155f907ca15eb9e4fb96905f9df4d10ebc319f9567ea947db8c684d8fd
3
+ size 1505767932
direct3d-s2-v-1-0/model_refiner.ckpt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2eb0f70d323a43d63ab37c91790c8a7c2b9ada1d7771ffe99ef7a647bdbc99e4
3
+ size 269562302
direct3d-s2-v-1-0/model_sparse_1024.ckpt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b2fe3f7daab2a07b99248665501ddb52ced65b632557688227921b79faf8b9a1
3
+ size 1116239946
direct3d-s2-v-1-0/model_sparse_512.ckpt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9cc7fe7d4978cf8ff96121ece226b5344c543486283f05d108b7acb3126f0c69
3
+ size 1116238952