Upload 5 files
Browse files
direct3d-s2-v-1-0/config.yaml
ADDED
@@ -0,0 +1,161 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
dense_vae:
|
2 |
+
target: direct3d_s2.models.autoencoders.dense_vae.DenseShapeVAE
|
3 |
+
params:
|
4 |
+
use_checkpoint: true
|
5 |
+
embed_dim: 8
|
6 |
+
in_channels: 1
|
7 |
+
out_channels: 1
|
8 |
+
model_channels_encoder: [32, 128, 512]
|
9 |
+
num_res_blocks_encoder: 2
|
10 |
+
num_res_blocks_middle_encoder: 2
|
11 |
+
model_channels_decoder: [512, 128, 64]
|
12 |
+
num_res_blocks_decoder: 4
|
13 |
+
num_res_blocks_middle_decoder: 4
|
14 |
+
use_fp16: true
|
15 |
+
latents_scale: 1.0
|
16 |
+
latents_shift: 0.0
|
17 |
+
|
18 |
+
dense_dit:
|
19 |
+
target: direct3d_s2.models.transformers.dense_dit.DenseDiT
|
20 |
+
params:
|
21 |
+
resolution: 16
|
22 |
+
in_channels: 8
|
23 |
+
out_channels: 8
|
24 |
+
model_channels: 1024
|
25 |
+
cond_channels: 1024
|
26 |
+
num_blocks: 24
|
27 |
+
num_heads: 16
|
28 |
+
mlp_ratio: 4
|
29 |
+
patch_size: 1
|
30 |
+
pe_mode: ape
|
31 |
+
qk_rms_norm: true
|
32 |
+
use_checkpoint: true
|
33 |
+
use_fp16: true
|
34 |
+
latent_shape: [8, 16, 16, 16]
|
35 |
+
|
36 |
+
dense_image_encoder:
|
37 |
+
target: direct3d_s2.models.conditioner.DinoEncoder
|
38 |
+
params:
|
39 |
+
model: facebookresearch/dinov2
|
40 |
+
version: dinov2_vitl14_reg
|
41 |
+
size: 518
|
42 |
+
|
43 |
+
dense_scheduler:
|
44 |
+
target: diffusers.schedulers.FlowMatchEulerDiscreteScheduler
|
45 |
+
params:
|
46 |
+
num_train_timesteps: 1000
|
47 |
+
shift: 6.0
|
48 |
+
|
49 |
+
sparse_vae_512:
|
50 |
+
target: direct3d_s2.models.autoencoders.ss_vae.SparseSDFVAE
|
51 |
+
params:
|
52 |
+
use_checkpoint: true
|
53 |
+
embed_dim: 16
|
54 |
+
num_head_channels_encoder: 64
|
55 |
+
model_channels_encoder: 512
|
56 |
+
num_heads_encoder: 8
|
57 |
+
num_blocks_encoder: 4
|
58 |
+
num_head_channels_decoder: 64
|
59 |
+
model_channels_decoder: 512
|
60 |
+
num_heads_decoder: 8
|
61 |
+
num_blocks_decoder: 4
|
62 |
+
resolution: 64
|
63 |
+
out_channels: 1
|
64 |
+
use_fp16: true
|
65 |
+
latents_scale: 1.0
|
66 |
+
latents_shift: 0.0
|
67 |
+
|
68 |
+
sparse_dit_512:
|
69 |
+
target: direct3d_s2.models.transformers.sparse_dit.SparseDiT
|
70 |
+
params:
|
71 |
+
resolution: 64
|
72 |
+
in_channels: 16
|
73 |
+
out_channels: 16
|
74 |
+
model_channels: 1024
|
75 |
+
cond_channels: 1024
|
76 |
+
num_blocks: 24
|
77 |
+
num_heads: 32
|
78 |
+
num_kv_heads: 2
|
79 |
+
compression_block_size: 4
|
80 |
+
selection_block_size: 8
|
81 |
+
topk: 32
|
82 |
+
compression_version: v2
|
83 |
+
pe_mode: ape
|
84 |
+
factor: 1.0
|
85 |
+
sparse_conditions: true
|
86 |
+
qk_rms_norm: true
|
87 |
+
use_shift: true
|
88 |
+
use_checkpoint: true
|
89 |
+
use_fp16: true
|
90 |
+
|
91 |
+
sparse_scheduler_512:
|
92 |
+
target: diffusers.schedulers.FlowMatchEulerDiscreteScheduler
|
93 |
+
params:
|
94 |
+
num_train_timesteps: 1000
|
95 |
+
shift: 6.0
|
96 |
+
|
97 |
+
sparse_vae_1024:
|
98 |
+
target: direct3d_s2.models.autoencoders.ss_vae.SparseSDFVAE
|
99 |
+
params:
|
100 |
+
use_checkpoint: true
|
101 |
+
embed_dim: 16
|
102 |
+
num_head_channels_encoder: 64
|
103 |
+
model_channels_encoder: 512
|
104 |
+
num_heads_encoder: 8
|
105 |
+
num_blocks_encoder: 4
|
106 |
+
num_head_channels_decoder: 64
|
107 |
+
model_channels_decoder: 512
|
108 |
+
num_heads_decoder: 8
|
109 |
+
num_blocks_decoder: 4
|
110 |
+
resolution: 128
|
111 |
+
out_channels: 1
|
112 |
+
use_fp16: true
|
113 |
+
latents_scale: 1.0
|
114 |
+
latents_shift: 0.0
|
115 |
+
chunk_size: 4
|
116 |
+
|
117 |
+
sparse_dit_1024:
|
118 |
+
target: direct3d_s2.models.transformers.sparse_dit.SparseDiT
|
119 |
+
params:
|
120 |
+
resolution: 128
|
121 |
+
in_channels: 16
|
122 |
+
out_channels: 16
|
123 |
+
model_channels: 1024
|
124 |
+
cond_channels: 1024
|
125 |
+
num_blocks: 24
|
126 |
+
num_heads: 32
|
127 |
+
num_kv_heads: 2
|
128 |
+
compression_block_size: 4
|
129 |
+
selection_block_size: 8
|
130 |
+
topk: 8
|
131 |
+
compression_version: v2
|
132 |
+
pe_mode: ape
|
133 |
+
factor: 0.5
|
134 |
+
sparse_conditions: true
|
135 |
+
qk_rms_norm: true
|
136 |
+
use_shift: true
|
137 |
+
use_checkpoint: true
|
138 |
+
use_fp16: true
|
139 |
+
|
140 |
+
sparse_scheduler_1024:
|
141 |
+
target: diffusers.schedulers.FlowMatchEulerDiscreteScheduler
|
142 |
+
params:
|
143 |
+
num_train_timesteps: 1000
|
144 |
+
shift: 8.0
|
145 |
+
|
146 |
+
sparse_image_encoder:
|
147 |
+
target: direct3d_s2.models.conditioner.DinoEncoder
|
148 |
+
params:
|
149 |
+
model: facebookresearch/dinov2
|
150 |
+
version: dinov2_vitl14_reg
|
151 |
+
size: 518
|
152 |
+
|
153 |
+
refiner:
|
154 |
+
target: direct3d_s2.models.refiner.unet_refiner.Voxel_RefinerXL
|
155 |
+
params:
|
156 |
+
in_channels: 1
|
157 |
+
out_channels: 1
|
158 |
+
layers_per_block: 2
|
159 |
+
layers_mid_block: 2
|
160 |
+
patch_size: 192
|
161 |
+
use_fp16: true
|
direct3d-s2-v-1-0/model_dense.ckpt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5e6598155f907ca15eb9e4fb96905f9df4d10ebc319f9567ea947db8c684d8fd
|
3 |
+
size 1505767932
|
direct3d-s2-v-1-0/model_refiner.ckpt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2eb0f70d323a43d63ab37c91790c8a7c2b9ada1d7771ffe99ef7a647bdbc99e4
|
3 |
+
size 269562302
|
direct3d-s2-v-1-0/model_sparse_1024.ckpt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b2fe3f7daab2a07b99248665501ddb52ced65b632557688227921b79faf8b9a1
|
3 |
+
size 1116239946
|
direct3d-s2-v-1-0/model_sparse_512.ckpt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9cc7fe7d4978cf8ff96121ece226b5344c543486283f05d108b7acb3126f0c69
|
3 |
+
size 1116238952
|