Mariam-Elz committed on
Commit
d1c6df5
·
verified ·
1 Parent(s): 5dc17ed

Upload imagedream/configs/sd_v2_base_ipmv.yaml with huggingface_hub

Browse files
imagedream/configs/sd_v2_base_ipmv.yaml CHANGED
@@ -1,61 +1,61 @@
1
- model:
2
- target: imagedream.ldm.interface.LatentDiffusionInterface
3
- params:
4
- linear_start: 0.00085
5
- linear_end: 0.0120
6
- timesteps: 1000
7
- scale_factor: 0.18215
8
- parameterization: "eps"
9
-
10
- unet_config:
11
- target: imagedream.ldm.modules.diffusionmodules.openaimodel.MultiViewUNetModel
12
- params:
13
- image_size: 32 # unused
14
- in_channels: 4
15
- out_channels: 4
16
- model_channels: 320
17
- attention_resolutions: [ 4, 2, 1 ]
18
- num_res_blocks: 2
19
- channel_mult: [ 1, 2, 4, 4 ]
20
- num_head_channels: 64 # need to fix for flash-attn
21
- use_spatial_transformer: True
22
- use_linear_in_transformer: True
23
- transformer_depth: 1
24
- context_dim: 1024
25
- use_checkpoint: False
26
- legacy: False
27
- camera_dim: 16
28
- with_ip: True
29
- ip_dim: 16 # ip token length
30
- ip_mode: "local_resample"
31
-
32
- vae_config:
33
- target: imagedream.ldm.models.autoencoder.AutoencoderKL
34
- params:
35
- embed_dim: 4
36
- monitor: val/rec_loss
37
- ddconfig:
38
- #attn_type: "vanilla-xformers"
39
- double_z: true
40
- z_channels: 4
41
- resolution: 256
42
- in_channels: 3
43
- out_ch: 3
44
- ch: 128
45
- ch_mult:
46
- - 1
47
- - 2
48
- - 4
49
- - 4
50
- num_res_blocks: 2
51
- attn_resolutions: []
52
- dropout: 0.0
53
- lossconfig:
54
- target: torch.nn.Identity
55
-
56
- clip_config:
57
- target: imagedream.ldm.modules.encoders.modules.FrozenOpenCLIPEmbedder
58
- params:
59
- freeze: True
60
- layer: "penultimate"
61
- ip_mode: "local_resample"
 
1
+ model:
2
+ target: imagedream.ldm.interface.LatentDiffusionInterface
3
+ params:
4
+ linear_start: 0.00085
5
+ linear_end: 0.0120
6
+ timesteps: 1000
7
+ scale_factor: 0.18215
8
+ parameterization: "eps"
9
+
10
+ unet_config:
11
+ target: imagedream.ldm.modules.diffusionmodules.openaimodel.MultiViewUNetModel
12
+ params:
13
+ image_size: 32 # unused
14
+ in_channels: 4
15
+ out_channels: 4
16
+ model_channels: 320
17
+ attention_resolutions: [ 4, 2, 1 ]
18
+ num_res_blocks: 2
19
+ channel_mult: [ 1, 2, 4, 4 ]
20
+ num_head_channels: 64 # need to fix for flash-attn
21
+ use_spatial_transformer: True
22
+ use_linear_in_transformer: True
23
+ transformer_depth: 1
24
+ context_dim: 1024
25
+ use_checkpoint: False
26
+ legacy: False
27
+ camera_dim: 16
28
+ with_ip: True
29
+ ip_dim: 16 # ip token length
30
+ ip_mode: "local_resample"
31
+
32
+ vae_config:
33
+ target: imagedream.ldm.models.autoencoder.AutoencoderKL
34
+ params:
35
+ embed_dim: 4
36
+ monitor: val/rec_loss
37
+ ddconfig:
38
+ #attn_type: "vanilla-xformers"
39
+ double_z: true
40
+ z_channels: 4
41
+ resolution: 256
42
+ in_channels: 3
43
+ out_ch: 3
44
+ ch: 128
45
+ ch_mult:
46
+ - 1
47
+ - 2
48
+ - 4
49
+ - 4
50
+ num_res_blocks: 2
51
+ attn_resolutions: []
52
+ dropout: 0.0
53
+ lossconfig:
54
+ target: torch.nn.Identity
55
+
56
+ clip_config:
57
+ target: imagedream.ldm.modules.encoders.modules.FrozenOpenCLIPEmbedder
58
+ params:
59
+ freeze: True
60
+ layer: "penultimate"
61
+ ip_mode: "local_resample"