cleanup
server/pipelines/pix2pix/pix2pix_turbo.py
CHANGED
@@ -153,6 +153,7 @@ class Pix2Pix_Turbo(torch.nn.Module):
         self.caption_enc = None
         self.device = "cuda"
 
+    @torch.no_grad()
     def forward(self, c_t, prompt, deterministic=True, r=1.0, noise_map=1.0):
         # encode the text prompt
         if prompt != self.last_prompt:
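The only change here wraps inference in `torch.no_grad()`: PyTorch stops recording a computation graph for the one-step forward pass, which trims memory use and per-frame latency in a real-time pipeline. A minimal, self-contained sketch of the effect (toy module, not from this repo):

```python
import torch

class Toy(torch.nn.Module):
    def __init__(self):
        super().__init__()
        self.linear = torch.nn.Linear(4, 4)

    @torch.no_grad()
    def forward(self, x):
        # Autograd is disabled for everything inside this call.
        return self.linear(x)

out = Toy()(torch.randn(1, 4))
print(out.requires_grad)  # False: no graph was built, so no backward is possible
```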
server/pipelines/pix2pixTurbo.py
CHANGED
@@ -5,7 +5,7 @@ from config import Args
 from pydantic import BaseModel, Field
 from PIL import Image
 from pipelines.pix2pix.pix2pix_turbo import Pix2Pix_Turbo
-from pipelines.utils.canny_gpu import
+from pipelines.utils.canny_gpu import ScharrOperator
 
 default_prompt = "close-up photo of the joker"
 page_content = """
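The edge detector swapped in here, `ScharrOperator`, lives in `pipelines/utils/canny_gpu.py` and its body is not part of this diff. Purely as illustration, a GPU Scharr filter with the call shape used later in this file could look like the sketch below; the class body, normalization, and thresholding are all assumptions, not the repo's implementation:

```python
import torch
import torch.nn.functional as F

class ScharrSketch(torch.nn.Module):
    """Hypothetical stand-in for pipelines.utils.canny_gpu.ScharrOperator."""

    def __init__(self, device: str = "cuda"):
        super().__init__()
        # 3x3 Scharr kernels for horizontal/vertical gradients.
        kx = torch.tensor([[-3.0, 0.0, 3.0],
                           [-10.0, 0.0, 10.0],
                           [-3.0, 0.0, 3.0]], device=device)
        self.kx = kx.view(1, 1, 3, 3)
        self.ky = kx.t().contiguous().view(1, 1, 3, 3)

    @torch.no_grad()
    def forward(self, gray: torch.Tensor, low: float, high: float) -> torch.Tensor:
        # gray: (B, 1, H, W) in [0, 1]; returns a band-thresholded edge map.
        gx = F.conv2d(gray, self.kx, padding=1)
        gy = F.conv2d(gray, self.ky, padding=1)
        mag = torch.sqrt(gx * gx + gy * gy)
        mag = mag / mag.amax().clamp(min=1e-8)  # normalize to [0, 1]
        return ((mag >= low) & (mag <= high)).float()
```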
@@ -19,6 +19,11 @@ page_content = """
     class="text-blue-500 underline hover:no-underline">One-Step Image Translation with Text-to-Image Models
     </a>
     </p>
+    <p class="text-sm text-gray-500">
+    Web app <a href="https://github.com/radames/Real-Time-Latent-Consistency-Model" target="_blank" class="text-blue-500 underline hover:no-underline">
+    Real-Time Latent Consistency Models
+    </a>
+    </p>
 """
 
 
@@ -62,7 +67,7 @@ class Pipeline:
             id="deterministic",
         )
         canny_low_threshold: float = Field(
-            0.
+            0.0,
             min=0,
             max=1.0,
             step=0.001,
@@ -72,7 +77,7 @@ class Pipeline:
             id="canny_low_threshold",
         )
         canny_high_threshold: float = Field(
-            0
+            1.0,
             min=0,
             max=1.0,
             step=0.001,
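Both threshold fields now pass their default as the first positional argument to pydantic's `Field`. The `min`/`max`/`step` keys are not standard validation arguments; under pydantic v1 (assumed here) unknown `Field` kwargs are carried through as extra schema metadata, which is how the front end can render sliders. A small sketch of that behavior:

```python
from pydantic import BaseModel, Field

class Params(BaseModel):
    # First positional Field argument is the default; min/max/step ride
    # along as extra schema metadata (pydantic v1 behavior, assumed).
    canny_high_threshold: float = Field(1.0, min=0, max=1.0, step=0.001)

print(Params().canny_high_threshold)  # 1.0
print(Params.schema()["properties"]["canny_high_threshold"])
# The extra min/max/step keys appear alongside "default" and "type".
```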
@@ -91,30 +96,25 @@ class Pipeline:
 
     def __init__(self, args: Args, device: torch.device, torch_dtype: torch.dtype):
         self.model = Pix2Pix_Turbo("edge_to_image")
-        self.canny_torch =
+        self.canny_torch = ScharrOperator(device=device)
         self.device = device
         self.last_time = 0.0
 
     def predict(self, params: "Pipeline.InputParams") -> Image.Image:
-        # generator = torch.manual_seed(params.seed)
-        # pipe = self.pipes[params.base_model_id]
-
         canny_pil, canny_tensor = self.canny_torch(
             params.image,
             params.canny_low_threshold,
             params.canny_high_threshold,
             output_type="pil,tensor",
         )
-
-
-        canny_tensor
-
-
-
-
-
-        )
-        output_pil = transforms.ToPILImage()(output_image[0].cpu() * 0.5 + 0.5)
+        canny_tensor = torch.cat((canny_tensor, canny_tensor, canny_tensor), dim=1)
+        output_image = self.model(
+            canny_tensor,
+            params.prompt,
+            params.deterministic,
+            params.strength,
+        )
+        output_pil = transforms.ToPILImage()(output_image[0].cpu() * 0.5 + 0.5)
 
         result_image = output_pil
         if params.debug_canny:
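Two things happen in the rewritten tail of `predict`: the single-channel Scharr map is repeated along the channel axis so the edge-to-image model receives a 3-channel input, and the model output, which lives in [-1, 1], is mapped back to [0, 1] before `ToPILImage`. A standalone sketch of both steps (shapes and value ranges are assumptions):

```python
import torch
from torchvision import transforms

edges = torch.rand(1, 1, 512, 512)             # (B, 1, H, W) edge map in [0, 1]
rgb_like = torch.cat((edges, edges, edges), dim=1)
print(rgb_like.shape)                           # torch.Size([1, 3, 512, 512])

fake_out = torch.rand(1, 3, 512, 512) * 2 - 1   # stand-in model output in [-1, 1]
pil = transforms.ToPILImage()(fake_out[0].cpu() * 0.5 + 0.5)  # rescale to [0, 1]
print(pil.size)                                 # (512, 512)
```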