File size: 9,304 Bytes
886f105
7d40369
d7e3825
226c832
6bcec5f
9461fdc
 
 
 
 
 
 
 
e8ea8da
9461fdc
7d40369
9dab390
 
f8ad000
 
 
6c007e9
9dab390
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
0de6d5a
9dab390
0de6d5a
 
9dab390
 
 
 
 
 
0de6d5a
9dab390
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
7d40369
9461fdc
7d40369
9461fdc
072be42
 
 
 
40e3650
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
9461fdc
 
40e3650
 
 
 
 
 
 
 
 
 
 
9461fdc
 
 
 
40e3650
a0e45a8
9461fdc
8f2de47
0de6d5a
7d40369
 
7054a36
9461fdc
 
e8ea8da
9461fdc
7054a36
99d1063
 
7054a36
920ac22
cdd3493
 
 
 
 
 
 
 
920ac22
7d40369
 
 
072be42
7d40369
99d1063
7d40369
cdd3493
920ac22
e8ea8da
 
 
 
072be42
48b54d6
 
e8ea8da
cdd3493
 
7d40369
 
 
 
cdd3493
e8ea8da
cdd3493
920ac22
e8ea8da
 
 
072be42
6c007e9
 
7d40369
9461fdc
7d40369
 
886f105
499951f
71c5d37
fbcf80b
71c5d37
 
 
b4bf7d7
71c5d37
6e85f96
56d288b
 
 
 
 
 
 
 
 
3718c59
6c007e9
56d288b
6e85f96
56d288b
cdd3493
71c5d37
0de6d5a
71c5d37
 
9461fdc
 
7d40369
9461fdc
7d40369
 
 
d7e3825
 
 
 
 
 
 
 
 
 
 
499951f
d7e3825
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
9461fdc
 
 
 
 
7d40369
499951f
 
 
 
 
 
 
7d40369
 
 
9461fdc
7d40369
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
import spaces
import torch
import random
import numpy as np
from inspect import signature
from diffusers import (
    FluxPipeline,
    StableDiffusion3Pipeline,
    PixArtSigmaPipeline,
    SanaPipeline,
    AuraFlowPipeline,
    Kandinsky3Pipeline,
    HunyuanDiTPipeline,
    LuminaText2ImgPipeline,AutoPipelineForText2Image
)
import gradio as gr
from diffusers.pipelines.pipeline_utils import DiffusionPipeline

# Upper bound of the seed slider: the largest signed 32-bit integer
# (the same value as np.iinfo(np.int32).max).
MAX_SEED = 2**31 - 1
# Upper bound, in pixels, of the width and height sliders.
MAX_IMAGE_SIZE = 1024

class ProgressPipeline(DiffusionPipeline):
    """Wrapper that reports per-step progress for another pipeline.

    In this file it is used for pipelines whose call signature has no
    ``callback_on_step_end`` parameter. While the wrapped pipeline runs, the
    ``step`` method of its scheduler is temporarily replaced by a counting
    wrapper, and each counted step can be relayed to a caller-supplied
    callback.
    """

    def __init__(self, original_pipeline):
        """Keep a reference to ``original_pipeline`` and mirror its attributes."""
        super().__init__()
        self.original_pipeline = original_pipeline
        # Copy every instance attribute of the wrapped pipeline onto this
        # object so attribute lookups on the wrapper resolve the same way.
        for name, value in vars(original_pipeline).items():
            setattr(self, name, value)

    @torch.no_grad()
    def __call__(
        self,
        prompt,
        num_inference_steps=30,
        generator=None,
        guidance_scale=7.5,
        callback=None,
        callback_steps=1,
        **kwargs
    ):
        """Run the wrapped pipeline while counting scheduler steps.

        Args:
            prompt: Forwarded to the wrapped pipeline as ``prompt``.
            num_inference_steps: Forwarded to the wrapped pipeline; also
                stored on ``self._num_inference_steps``.
            generator: Forwarded to the wrapped pipeline.
            guidance_scale: Forwarded to the wrapped pipeline.
            callback: Optional callable invoked as
                ``callback(self, step, None, {})`` where ``step`` is the
                1-based count of scheduler ``step`` calls so far.
            callback_steps: The callback fires only when the step count is a
                multiple of this value.
            **kwargs: Extra keyword arguments forwarded unchanged.

        Returns:
            Whatever the wrapped pipeline returns.
        """
        self._num_inference_steps = num_inference_steps
        self._step = 0

        # Remember the real step method so it can be put back afterwards.
        unpatched_step = self.original_pipeline.scheduler.step

        def counting_step(*step_args, **step_kwargs):
            # Count first, notify the callback, then run the real step.
            self._step += 1
            current = self._step
            if callback and current % callback_steps == 0:
                # The wrapper itself is handed to the callback as the pipeline;
                # no timestep or callback kwargs are available at this point.
                callback(self, current, None, {})
            return unpatched_step(*step_args, **step_kwargs)

        self.original_pipeline.scheduler.step = counting_step

        try:
            return self.original_pipeline(
                prompt=prompt,
                num_inference_steps=num_inference_steps,
                generator=generator,
                guidance_scale=guidance_scale,
                **kwargs
            )
        finally:
            # Always undo the monkey patch, even if generation raised.
            self.original_pipeline.scheduler.step = unpatched_step

# NOTE(review): presumably the Hugging Face download cache; nothing in the
# visible code reads this variable - confirm before removing.
cache_dir = "/workspace/hf_cache"

# One entry per UI tab: display name -> Hub repository id and the diffusers
# pipeline class associated with that model.
MODEL_CONFIGS = {
    "FLUX": {
        "repo_id": "black-forest-labs/FLUX.1-dev",
        "pipeline_class": FluxPipeline,
    },
    "Stable Diffusion 3.5": {
        "repo_id": "stabilityai/stable-diffusion-3.5-large",
        "pipeline_class": StableDiffusion3Pipeline,
    },
    "PixArt": {
        "repo_id": "PixArt-alpha/PixArt-Sigma-XL-2-1024-MS",
        "pipeline_class": PixArtSigmaPipeline,
    },
    "SANA": {
        "repo_id": "Efficient-Large-Model/Sana_1600M_1024px_BF16_diffusers",
        "pipeline_class": SanaPipeline,
    },
    "AuraFlow": {
        "repo_id": "fal/AuraFlow",
        "pipeline_class": AuraFlowPipeline,
    },
    "Kandinsky": {
        "repo_id": "kandinsky-community/kandinsky-3",
        "pipeline_class": Kandinsky3Pipeline,
    },
    "Hunyuan": {
        "repo_id": "Tencent-Hunyuan/HunyuanDiT-Diffusers",
        "pipeline_class": HunyuanDiTPipeline,
    },
    "Lumina": {
        "repo_id": "Alpha-VLLM/Lumina-Next-SFT-diffusers",
        "pipeline_class": LuminaText2ImgPipeline,
    },
}

def generate_image_with_progress(
    model_name,
    pipe,
    prompt,
    num_steps,
    guidance_scale=None,
    seed=None,
    progress=gr.Progress(track_tqdm=True),
):
    """Run ``pipe`` on ``prompt`` and report each step to ``progress``.

    The keyword arguments passed to ``pipe`` are chosen from its call
    signature: ``guidance_scale`` is sent only if the pipeline declares it,
    and the progress hook is installed through ``callback_on_step_end`` when
    available, otherwise through ``callback`` with ``callback_steps=1``.

    Args:
        model_name: Not used by this function.
        pipe: Callable pipeline; its result must expose ``.images``.
        prompt: Passed to ``pipe`` as the first positional argument.
        num_steps: Passed as ``num_inference_steps``; also the denominator of
            the reported progress fraction.
        guidance_scale: Forwarded when the pipeline accepts it.
        seed: If not ``None``, seeds a CUDA ``torch.Generator``.
        progress: Callable receiving ``(fraction, desc=...)`` per step.

    Returns:
        The first element of the pipeline result's ``images``.
    """

    def callback(pipe, step_index, timestep, callback_kwargs):
        print(f" callback => {step_index}, {timestep}")
        shown_step = 0 if step_index is None else step_index
        progress(shown_step / num_steps, desc=f"Step {shown_step}/{num_steps}")
        # The dict is handed back unchanged.
        return callback_kwargs

    generator = None if seed is None else torch.Generator("cuda").manual_seed(seed)

    print("START GENR ")
    accepted = signature(pipe).parameters
    has_guidance_scale = "guidance_scale" in accepted
    has_callback_on_step_end = "callback_on_step_end" in accepted

    # Log line keyed by (has_callback_on_step_end, has_guidance_scale).
    branch_labels = {
        (True, True): "has callback_on_step_end and has guidance_scale",
        (False, True): "NO callback_on_step_end and has guidance_scale",
        (True, False): "has callback_on_step_end and NO guidance_scale",
        (False, False): "NO callback_on_step_end and NO guidance_scale",
    }
    print(branch_labels[(has_callback_on_step_end, has_guidance_scale)])

    call_kwargs = {"num_inference_steps": num_steps, "generator": generator}
    if has_guidance_scale:
        call_kwargs["guidance_scale"] = guidance_scale
    if has_callback_on_step_end:
        call_kwargs["callback_on_step_end"] = callback
    else:
        # No step-end hook in the signature: use callback/callback_steps.
        call_kwargs["callback"] = callback
        call_kwargs["callback_steps"] = 1

    return pipe(prompt, **call_kwargs).images[0]

@spaces.GPU(duration=170)
def create_pipeline_logic(
    prompt_text,
    model_name,
    negative_prompt="",
    seed=42,
    randomize_seed=False,
    width=1024,
    height=1024,
    guidance_scale=4.5,
    num_inference_steps=40,
):
    """Load the pipeline for ``model_name`` and generate one image.

    Args:
        prompt_text: Text prompt for the image.
        model_name: Key into ``MODEL_CONFIGS``; an unknown key raises
            ``KeyError``.
        negative_prompt: Accepted for UI compatibility; not forwarded yet.
        seed: Seed for the generator, used unless ``randomize_seed`` is set.
        randomize_seed: When true (or when ``seed`` is ``None``), a random
            seed in ``[0, MAX_SEED]`` is drawn instead.
        width: Accepted for UI compatibility; not forwarded yet.
        height: Accepted for UI compatibility; not forwarded yet.
        guidance_scale: Guidance scale passed on to the generation helper.
        num_inference_steps: Number of denoising steps (at least 1).

    Returns:
        A ``(status, image)`` tuple where ``status`` is ``"Seed: <seed>"``
        with the seed that was actually used.
    """
    print(f"starting {model_name}")
    progress = gr.Progress(track_tqdm=True)

    # Honour the caller's settings; previously these were overwritten with
    # hard-coded values (30 steps, guidance 7.5, seed 42), which made the UI
    # sliders and the "Randomize seed" checkbox ineffective.
    if randomize_seed or seed is None:
        seed = random.randint(0, MAX_SEED)
    seed = int(seed)  # sliders may deliver floats; manual_seed needs an int
    # At least one step: the progress callback divides by the step count.
    num_steps = max(1, int(num_inference_steps))
    guidance_scale = float(guidance_scale)

    # NOTE: negative_prompt, width and height are not forwarded because
    # generate_image_with_progress has no parameters for them.

    config = MODEL_CONFIGS[model_name]
    # NOTE: the configured "pipeline_class" is not used here; loading goes
    # through AutoPipelineForText2Image.
    b_pipe = AutoPipelineForText2Image.from_pretrained(
        config["repo_id"],
        torch_dtype=torch.bfloat16,
    ).to("cuda")

    # Pipelines without a callback_on_step_end parameter are wrapped so that
    # progress can still be reported.
    has_callback_on_step_end = "callback_on_step_end" in signature(b_pipe).parameters
    if has_callback_on_step_end:
        pipe = b_pipe
    else:
        pipe = ProgressPipeline(b_pipe)
        print("ProgressPipeline specal")

    image = generate_image_with_progress(
        model_name,
        pipe,
        prompt_text,
        num_steps=num_steps,
        guidance_scale=guidance_scale,
        seed=seed,
        progress=progress,
    )
    return f"Seed: {seed}", image

def main():
    """Build the Gradio interface and launch it.

    The page has one shared prompt box, an "Advanced Settings" accordion, and
    one tab per entry in ``MODEL_CONFIGS``. Each tab's button calls
    ``create_pipeline_logic`` with the shared inputs plus the tab's model
    name, and shows the returned status text and image.
    """
    with gr.Blocks() as app:
        gr.Markdown("# Dynamic Multiple Model Image Generation")

        prompt_text = gr.Textbox(label="Enter prompt")

        with gr.Accordion("Advanced Settings", open=False):
            negative_prompt = gr.Text(
                label="Negative prompt",
                max_lines=1,
                placeholder="Enter a negative prompt",
            )
            seed = gr.Slider(label="Seed", minimum=0, maximum=MAX_SEED, step=100, value=0)
            randomize_seed = gr.Checkbox(label="Randomize seed", value=True)

            # Width and height share every setting except the label.
            size_settings = dict(minimum=512, maximum=MAX_IMAGE_SIZE, step=32, value=1024)
            with gr.Row():
                width = gr.Slider(label="Width", **size_settings)
                height = gr.Slider(label="Height", **size_settings)

            with gr.Row():
                guidance_scale = gr.Slider(
                    label="Guidance scale", minimum=0.0, maximum=7.5, step=0.1, value=4.5
                )
                num_inference_steps = gr.Slider(
                    label="Number of inference steps", minimum=1, maximum=50, step=1, value=40
                )

        # Inputs common to every tab, in the order create_pipeline_logic
        # expects them after the prompt and the model name.
        advanced_inputs = [
            negative_prompt,
            seed,
            randomize_seed,
            width,
            height,
            guidance_scale,
            num_inference_steps,
        ]

        for model_name in MODEL_CONFIGS:
            with gr.Tab(model_name):
                button = gr.Button(f"Run {model_name}")
                output = gr.Textbox(label="Status")
                img = gr.Image(label=model_name, height=300)
                # Hidden text component carrying this tab's model name.
                model_name_input = gr.Text(value=model_name, visible=False)

                button.click(
                    fn=create_pipeline_logic,
                    inputs=[prompt_text, model_name_input, *advanced_inputs],
                    outputs=[output, img],
                )

    app.launch()


# Build and launch the app only when this file is run as a script,
# not when it is imported as a module.
if __name__ == "__main__":
    main()