Qwen_Image / qwen_image_depth_controlnet.json
svjack's picture
Upload qwen_image_depth_controlnet.json
1502bf1 verified
{
"id": "91f6bbe2-ed41-4fd6-bac7-71d5b5864ecb",
"revision": 0,
"last_node_id": 84,
"last_link_id": 173,
"nodes": [
{
"id": 8,
"type": "VAEDecode",
"pos": [
1210,
190
],
"size": [
210,
46
],
"flags": {},
"order": 19,
"mode": 0,
"inputs": [
{
"name": "samples",
"type": "LATENT",
"link": 128
},
{
"name": "vae",
"type": "VAE",
"link": 76
}
],
"outputs": [
{
"name": "IMAGE",
"type": "IMAGE",
"slot_index": 0,
"links": [
110
]
}
],
"properties": {
"cnr_id": "comfy-core",
"ver": "0.3.48",
"Node name for S&R": "VAEDecode"
},
"widgets_values": []
},
{
"id": 7,
"type": "CLIPTextEncode",
"pos": [
413,
389
],
"size": [
425.27801513671875,
180.6060791015625
],
"flags": {},
"order": 6,
"mode": 0,
"inputs": [
{
"name": "clip",
"type": "CLIP",
"link": 75
}
],
"outputs": [
{
"name": "CONDITIONING",
"type": "CONDITIONING",
"slot_index": 0,
"links": [
52
]
}
],
"title": "CLIP Text Encode (Negative Prompt)",
"properties": {
"cnr_id": "comfy-core",
"ver": "0.3.48",
"Node name for S&R": "CLIPTextEncode"
},
"widgets_values": [
" "
],
"color": "#322",
"bgcolor": "#533"
},
{
"id": 66,
"type": "ModelSamplingAuraFlow",
"pos": [
469.15350341796875,
39.34361267089844
],
"size": [
270,
58
],
"flags": {},
"order": 17,
"mode": 0,
"inputs": [
{
"name": "model",
"type": "MODEL",
"link": 157
}
],
"outputs": [
{
"name": "MODEL",
"type": "MODEL",
"links": [
125
]
}
],
"properties": {
"cnr_id": "comfy-core",
"ver": "0.3.48",
"Node name for S&R": "ModelSamplingAuraFlow"
},
"widgets_values": [
3.500000000000001
]
},
{
"id": 37,
"type": "UNETLoader",
"pos": [
20,
60
],
"size": [
346.7470703125,
82
],
"flags": {},
"order": 0,
"mode": 0,
"inputs": [],
"outputs": [
{
"name": "MODEL",
"type": "MODEL",
"slot_index": 0,
"links": [
129
]
}
],
"properties": {
"cnr_id": "comfy-core",
"ver": "0.3.48",
"Node name for S&R": "UNETLoader"
},
"widgets_values": [
"qwen_image_fp8_e4m3fn.safetensors",
"default"
],
"color": "#223",
"bgcolor": "#335"
},
{
"id": 38,
"type": "CLIPLoader",
"pos": [
20,
190
],
"size": [
380,
106
],
"flags": {},
"order": 1,
"mode": 0,
"inputs": [],
"outputs": [
{
"name": "CLIP",
"type": "CLIP",
"slot_index": 0,
"links": [
75,
131
]
}
],
"properties": {
"cnr_id": "comfy-core",
"ver": "0.3.48",
"Node name for S&R": "CLIPLoader"
},
"widgets_values": [
"qwen_2.5_vl_7b_fp8_scaled.safetensors",
"qwen_image",
"default"
],
"color": "#223",
"bgcolor": "#335"
},
{
"id": 39,
"type": "VAELoader",
"pos": [
20,
340
],
"size": [
330,
60
],
"flags": {},
"order": 2,
"mode": 0,
"inputs": [],
"outputs": [
{
"name": "VAE",
"type": "VAE",
"slot_index": 0,
"links": [
76,
158
]
}
],
"properties": {
"cnr_id": "comfy-core",
"ver": "0.3.48",
"Node name for S&R": "VAELoader"
},
"widgets_values": [
"qwen_image_vae.safetensors"
],
"color": "#223",
"bgcolor": "#335"
},
{
"id": 76,
"type": "ModelPatchLoader",
"pos": [
754.4307861328125,
-356.5053405761719
],
"size": [
270,
58
],
"flags": {},
"order": 3,
"mode": 0,
"inputs": [],
"outputs": [
{
"name": "MODEL_PATCH",
"type": "MODEL_PATCH",
"links": [
159
]
}
],
"properties": {
"cnr_id": "comfy-core",
"ver": "0.3.51",
"Node name for S&R": "ModelPatchLoader"
},
"widgets_values": [
"qwen_image_depth_diffsynth_controlnet.safetensors"
]
},
{
"id": 79,
"type": "DownloadAndLoadDepthAnythingV2Model",
"pos": [
-648.7250366210938,
225.08016967773438
],
"size": [
365.3121032714844,
82
],
"flags": {},
"order": 4,
"mode": 0,
"inputs": [],
"outputs": [
{
"name": "da_v2_model",
"type": "DAMODEL",
"links": [
161
]
}
],
"properties": {
"cnr_id": "comfyui-depthanythingv2",
"ver": "d505cbca99803fc63327b8305618a23e59a18b42",
"Node name for S&R": "DownloadAndLoadDepthAnythingV2Model"
},
"widgets_values": [
"depth_anything_v2_vitl_fp32.safetensors",
"auto"
]
},
{
"id": 78,
"type": "DepthAnything_V2",
"pos": [
-195.6370849609375,
294.94244384765625
],
"size": [
156.64413452148438,
46
],
"flags": {},
"order": 10,
"mode": 0,
"inputs": [
{
"name": "da_model",
"type": "DAMODEL",
"link": 161
},
{
"name": "images",
"type": "IMAGE",
"link": 172
}
],
"outputs": [
{
"name": "image",
"type": "IMAGE",
"links": [
165
]
}
],
"properties": {
"cnr_id": "comfyui-depthanythingv2",
"ver": "d505cbca99803fc63327b8305618a23e59a18b42",
"Node name for S&R": "DepthAnything_V2"
},
"widgets_values": []
},
{
"id": 82,
"type": "PreviewImage",
"pos": [
88.48049926757812,
462.6634521484375
],
"size": [
140,
246
],
"flags": {},
"order": 15,
"mode": 0,
"inputs": [
{
"name": "images",
"type": "IMAGE",
"link": 166
}
],
"outputs": [],
"properties": {
"cnr_id": "comfy-core",
"ver": "0.3.51",
"Node name for S&R": "PreviewImage"
},
"widgets_values": []
},
{
"id": 58,
"type": "EmptySD3LatentImage",
"pos": [
426.35382080078125,
653.2474975585938
],
"size": [
270,
106
],
"flags": {},
"order": 14,
"mode": 0,
"inputs": [
{
"name": "width",
"type": "INT",
"widget": {
"name": "width"
},
"link": 169
},
{
"name": "height",
"type": "INT",
"widget": {
"name": "height"
},
"link": 170
}
],
"outputs": [
{
"name": "LATENT",
"type": "LATENT",
"links": [
107
]
}
],
"properties": {
"cnr_id": "comfy-core",
"ver": "0.3.48",
"Node name for S&R": "EmptySD3LatentImage"
},
"widgets_values": [
768,
768,
1
]
},
{
"id": 73,
"type": "QwenImageDiffsynthControlnet",
"pos": [
923.51220703125,
-167.88821411132812
],
"size": [
294.1841735839844,
138
],
"flags": {},
"order": 16,
"mode": 0,
"inputs": [
{
"name": "model",
"type": "MODEL",
"link": 156
},
{
"name": "model_patch",
"type": "MODEL_PATCH",
"link": 159
},
{
"name": "vae",
"type": "VAE",
"link": 158
},
{
"name": "image",
"type": "IMAGE",
"link": 167
},
{
"name": "mask",
"shape": 7,
"type": "MASK",
"link": null
}
],
"outputs": [
{
"name": "MODEL",
"type": "MODEL",
"links": [
157
]
}
],
"properties": {
"cnr_id": "comfy-core",
"ver": "0.3.51",
"Node name for S&R": "QwenImageDiffsynthControlnet"
},
"widgets_values": [
1
]
},
{
"id": 3,
"type": "KSampler",
"pos": [
863,
187
],
"size": [
315,
262
],
"flags": {},
"order": 18,
"mode": 0,
"inputs": [
{
"name": "model",
"type": "MODEL",
"link": 125
},
{
"name": "positive",
"type": "CONDITIONING",
"link": 46
},
{
"name": "negative",
"type": "CONDITIONING",
"link": 52
},
{
"name": "latent_image",
"type": "LATENT",
"link": 107
}
],
"outputs": [
{
"name": "LATENT",
"type": "LATENT",
"slot_index": 0,
"links": [
128
]
}
],
"properties": {
"cnr_id": "comfy-core",
"ver": "0.3.48",
"Node name for S&R": "KSampler"
},
"widgets_values": [
43096239287214,
"randomize",
15,
4,
"euler",
"simple",
1
]
},
{
"id": 81,
"type": "ImageBlur",
"pos": [
-583.8450927734375,
-2.699789047241211
],
"size": [
270,
82
],
"flags": {},
"order": 13,
"mode": 0,
"inputs": [
{
"name": "image",
"type": "IMAGE",
"link": 165
}
],
"outputs": [
{
"name": "IMAGE",
"type": "IMAGE",
"links": [
166,
167
]
}
],
"properties": {
"cnr_id": "comfy-core",
"ver": "0.3.51",
"Node name for S&R": "ImageBlur"
},
"widgets_values": [
2,
2
]
},
{
"id": 83,
"type": "GetImageSize",
"pos": [
122.48853302001953,
868.90380859375
],
"size": [
140,
124
],
"flags": {},
"order": 11,
"mode": 0,
"inputs": [
{
"name": "image",
"type": "IMAGE",
"link": 173
}
],
"outputs": [
{
"name": "width",
"type": "INT",
"links": [
169
]
},
{
"name": "height",
"type": "INT",
"links": [
170
]
},
{
"name": "batch_size",
"type": "INT",
"links": null
}
],
"properties": {
"cnr_id": "comfy-core",
"ver": "0.3.51",
"Node name for S&R": "GetImageSize"
},
"widgets_values": [
"width: 636, height: 1135\n batch size: 1"
]
},
{
"id": 68,
"type": "LoraLoader",
"pos": [
66.83535766601562,
-205.47305297851562
],
"size": [
270,
126
],
"flags": {},
"order": 7,
"mode": 0,
"inputs": [
{
"name": "model",
"type": "MODEL",
"link": 129
},
{
"name": "clip",
"type": "CLIP",
"link": 131
}
],
"outputs": [
{
"name": "MODEL",
"type": "MODEL",
"links": [
141
]
},
{
"name": "CLIP",
"type": "CLIP",
"links": [
139
]
}
],
"properties": {
"cnr_id": "comfy-core",
"ver": "0.3.49",
"Node name for S&R": "LoraLoader"
},
"widgets_values": [
"qwen_image_anime_landscape_lora_v1_000002000.safetensors",
1,
1
]
},
{
"id": 60,
"type": "SaveImage",
"pos": [
1239.4698486328125,
337.7687072753906
],
"size": [
821.0496215820312,
871.7067260742188
],
"flags": {},
"order": 20,
"mode": 0,
"inputs": [
{
"name": "images",
"type": "IMAGE",
"link": 110
}
],
"outputs": [],
"properties": {
"cnr_id": "comfy-core",
"ver": "0.3.48"
},
"widgets_values": [
"ComfyUI"
]
},
{
"id": 6,
"type": "CLIPTextEncode",
"pos": [
415,
186
],
"size": [
422.84503173828125,
164.31304931640625
],
"flags": {},
"order": 12,
"mode": 0,
"inputs": [
{
"name": "clip",
"type": "CLIP",
"link": 154
}
],
"outputs": [
{
"name": "CONDITIONING",
"type": "CONDITIONING",
"slot_index": 0,
"links": [
46
]
}
],
"title": "CLIP Text Encode (Positive Prompt)",
"properties": {
"cnr_id": "comfy-core",
"ver": "0.3.48",
"Node name for S&R": "CLIPTextEncode"
},
"widgets_values": [
"anime style,\nIn the style of Infinite future landscape , This is a digitally created, hyper-realistic CGI image depicting a fantastical aerial view of a sprawling cityscape. The image showcases a massive, ancient stone arch bridge stretching across the foreground, with intricate, gothic-style spires and towers along its edges. Below the bridge, a vast, turquoise ocean with visible coral reefs and islands can be seen. The city itself is densely packed with tall, dark buildings and spires, creating a labyrinthine effect. The background features a vibrant blue sky filled with fluffy white clouds, with the sun shining brightly in the top right corner, casting dramatic shadows. The overall color palette is dominated by rich blues and greens, with contrasting dark stone textures."
],
"color": "#232",
"bgcolor": "#353"
},
{
"id": 70,
"type": "LoraLoader",
"pos": [
480.5247497558594,
-205.89479064941406
],
"size": [
270,
126
],
"flags": {},
"order": 9,
"mode": 4,
"inputs": [
{
"name": "model",
"type": "MODEL",
"link": 141
},
{
"name": "clip",
"type": "CLIP",
"link": 139
}
],
"outputs": [
{
"name": "MODEL",
"type": "MODEL",
"links": [
156
]
},
{
"name": "CLIP",
"type": "CLIP",
"links": [
154
]
}
],
"properties": {
"cnr_id": "comfy-core",
"ver": "0.3.49",
"Node name for S&R": "LoraLoader"
},
"widgets_values": [
"qwen_image_infinite_future_lora_v1_000002750.safetensors",
1,
1
]
},
{
"id": 77,
"type": "LoadImage",
"pos": [
-779.0413208007812,
460.957275390625
],
"size": [
270,
314.0000305175781
],
"flags": {},
"order": 5,
"mode": 0,
"inputs": [],
"outputs": [
{
"name": "IMAGE",
"type": "IMAGE",
"links": [
171
]
},
{
"name": "MASK",
"type": "MASK",
"links": null
}
],
"properties": {
"cnr_id": "comfy-core",
"ver": "0.3.51",
"Node name for S&R": "LoadImage"
},
"widgets_values": [
"image - 2025-08-21T194913.118.jpg",
"image"
]
},
{
"id": 84,
"type": "ImageScaleBy",
"pos": [
-386.33404541015625,
503.70269775390625
],
"size": [
270,
82
],
"flags": {},
"order": 8,
"mode": 0,
"inputs": [
{
"name": "image",
"type": "IMAGE",
"link": 171
}
],
"outputs": [
{
"name": "IMAGE",
"type": "IMAGE",
"links": [
172,
173
]
}
],
"properties": {
"cnr_id": "comfy-core",
"ver": "0.3.51",
"Node name for S&R": "ImageScaleBy"
},
"widgets_values": [
"nearest-exact",
0.3
]
}
],
"links": [
[
46,
6,
0,
3,
1,
"CONDITIONING"
],
[
52,
7,
0,
3,
2,
"CONDITIONING"
],
[
75,
38,
0,
7,
0,
"CLIP"
],
[
76,
39,
0,
8,
1,
"VAE"
],
[
107,
58,
0,
3,
3,
"LATENT"
],
[
110,
8,
0,
60,
0,
"IMAGE"
],
[
125,
66,
0,
3,
0,
"MODEL"
],
[
128,
3,
0,
8,
0,
"LATENT"
],
[
129,
37,
0,
68,
0,
"MODEL"
],
[
131,
38,
0,
68,
1,
"CLIP"
],
[
139,
68,
1,
70,
1,
"CLIP"
],
[
141,
68,
0,
70,
0,
"MODEL"
],
[
154,
70,
1,
6,
0,
"CLIP"
],
[
156,
70,
0,
73,
0,
"MODEL"
],
[
157,
73,
0,
66,
0,
"MODEL"
],
[
158,
39,
0,
73,
2,
"VAE"
],
[
159,
76,
0,
73,
1,
"MODEL_PATCH"
],
[
161,
79,
0,
78,
0,
"DAMODEL"
],
[
165,
78,
0,
81,
0,
"IMAGE"
],
[
166,
81,
0,
82,
0,
"IMAGE"
],
[
167,
81,
0,
73,
3,
"IMAGE"
],
[
169,
83,
0,
58,
0,
"INT"
],
[
170,
83,
1,
58,
1,
"INT"
],
[
171,
77,
0,
84,
0,
"IMAGE"
],
[
172,
84,
0,
78,
1,
"IMAGE"
],
[
173,
84,
0,
83,
0,
"IMAGE"
]
],
"groups": [],
"config": {},
"extra": {
"ds": {
"scale": 0.6934334949441455,
"offset": [
1336.7112849425441,
2.432450082515594
]
},
"frontendVersion": "1.25.9",
"VHS_latentpreview": false,
"VHS_latentpreviewrate": 0,
"VHS_MetadataImage": true,
"VHS_KeepIntermediate": true
},
"version": 0.4
}