Mariam-Elz committed on
Commit
1eaea84
·
verified ·
1 Parent(s): e6d9a90

Upload imagedream/configs/sd_v2_base_ipmv.yaml with huggingface_hub

Browse files
imagedream/configs/sd_v2_base_ipmv.yaml ADDED
@@ -0,0 +1,61 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ model:
2
+ target: imagedream.ldm.interface.LatentDiffusionInterface
3
+ params:
4
+ linear_start: 0.00085
5
+ linear_end: 0.0120
6
+ timesteps: 1000
7
+ scale_factor: 0.18215
8
+ parameterization: "eps"
9
+
10
+ unet_config:
11
+ target: imagedream.ldm.modules.diffusionmodules.openaimodel.MultiViewUNetModel
12
+ params:
13
+ image_size: 32 # unused
14
+ in_channels: 4
15
+ out_channels: 4
16
+ model_channels: 320
17
+ attention_resolutions: [ 4, 2, 1 ]
18
+ num_res_blocks: 2
19
+ channel_mult: [ 1, 2, 4, 4 ]
20
+ num_head_channels: 64 # need to fix for flash-attn
21
+ use_spatial_transformer: True
22
+ use_linear_in_transformer: True
23
+ transformer_depth: 1
24
+ context_dim: 1024
25
+ use_checkpoint: False
26
+ legacy: False
27
+ camera_dim: 16
28
+ with_ip: True
29
+ ip_dim: 16 # ip token length
30
+ ip_mode: "local_resample"
31
+
32
+ vae_config:
33
+ target: imagedream.ldm.models.autoencoder.AutoencoderKL
34
+ params:
35
+ embed_dim: 4
36
+ monitor: val/rec_loss
37
+ ddconfig:
38
+ #attn_type: "vanilla-xformers"
39
+ double_z: true
40
+ z_channels: 4
41
+ resolution: 256
42
+ in_channels: 3
43
+ out_ch: 3
44
+ ch: 128
45
+ ch_mult:
46
+ - 1
47
+ - 2
48
+ - 4
49
+ - 4
50
+ num_res_blocks: 2
51
+ attn_resolutions: []
52
+ dropout: 0.0
53
+ lossconfig:
54
+ target: torch.nn.Identity
55
+
56
+ clip_config:
57
+ target: imagedream.ldm.modules.encoders.modules.FrozenOpenCLIPEmbedder
58
+ params:
59
+ freeze: True
60
+ layer: "penultimate"
61
+ ip_mode: "local_resample"