Spaces: Running on Zero
nick_93 committed
Commit f493b13 • Parent: 8df3de7
init
app.py CHANGED
@@ -19,6 +19,34 @@ device = "cuda"
 dtype = torch.float16
 
 
+controlnet_depth= ControlNetModel.from_pretrained(
+    "controlnet_depth", torch_dtype=dtype, use_safetensors=True)
+controlnet_seg = ControlNetModel.from_pretrained(
+    "own_controlnet", torch_dtype=dtype, use_safetensors=True)
+
+pipe = StableDiffusionControlNetInpaintPipeline.from_pretrained(
+    "SG161222/Realistic_Vision_V5.1_noVAE",
+    #"models/runwayml--stable-diffusion-inpainting",
+    controlnet=[controlnet_depth, controlnet_seg],
+    safety_checker=None,
+    torch_dtype=dtype
+)
+
+pipe.load_ip_adapter("h94/IP-Adapter", subfolder="models",
+                     weight_name="ip-adapter_sd15.bin")
+pipe.set_ip_adapter_scale(0.4)
+pipe.scheduler = UniPCMultistepScheduler.from_config(pipe.scheduler.config)
+pipe = pipe.to(device)
+guide_pipe = StableDiffusionXLPipeline.from_pretrained("segmind/SSD-1B",
+                                                       torch_dtype=dtype, use_safetensors=True, variant="fp16")
+guide_pipe = guide_pipe.to(device)
+
+seg_image_processor, image_segmentor = get_segmentation_pipeline()
+depth_feature_extractor, depth_estimator = get_depth_pipeline()
+depth_estimator = depth_estimator.to(device)
+
+
+
 css = """
 #img-display-container {
     max-height: 50vh;
@@ -78,8 +106,8 @@ def get_segmentation_pipeline(
 @spaces.GPU
 def segment_image(
     image: Image,
-    image_processor: AutoImageProcessor,
-    image_segmentor: UperNetForSemanticSegmentation
+    #image_processor: AutoImageProcessor,
+    #image_segmentor: UperNetForSemanticSegmentation
 ) -> Image:
     """
     Segments an image using a semantic segmentation model.
@@ -182,38 +210,12 @@ class ControlNetDepthDesignModelMulti:
     def __init__(self):
         """ Initialize your model(s) here """
         #os.environ['HF_HUB_OFFLINE'] = "True"
-        controlnet_depth= ControlNetModel.from_pretrained(
-            "controlnet_depth", torch_dtype=dtype, use_safetensors=True)
-        controlnet_seg = ControlNetModel.from_pretrained(
-            "own_controlnet", torch_dtype=dtype, use_safetensors=True)
-
-        self.pipe = StableDiffusionControlNetInpaintPipeline.from_pretrained(
-            "SG161222/Realistic_Vision_V5.1_noVAE",
-            #"models/runwayml--stable-diffusion-inpainting",
-            controlnet=[controlnet_depth, controlnet_seg],
-            safety_checker=None,
-            torch_dtype=dtype
-        )
-
-        self.pipe.load_ip_adapter("h94/IP-Adapter", subfolder="models",
-                                  weight_name="ip-adapter_sd15.bin")
-        self.pipe.set_ip_adapter_scale(0.4)
-        self.pipe.scheduler = UniPCMultistepScheduler.from_config(self.pipe.scheduler.config)
-        self.pipe = self.pipe.to(device)
-        self.guide_pipe = StableDiffusionXLPipeline.from_pretrained("segmind/SSD-1B",
-                                                                    torch_dtype=dtype, use_safetensors=True, variant="fp16")
-        self.guide_pipe = self.guide_pipe.to(device)
-
+
         self.seed = 323*111
         self.neg_prompt = "window, door, low resolution, banner, logo, watermark, text, deformed, blurry, out of focus, surreal, ugly, beginner"
         self.control_items = ["windowpane;window", "door;double;door"]
         self.additional_quality_suffix = "interior design, 4K, high resolution, photorealistic"
 
-        self.seg_image_processor, self.image_segmentor = get_segmentation_pipeline()
-        self.depth_feature_extractor, self.depth_estimator = get_depth_pipeline()
-        self.depth_estimator = self.depth_estimator.to(device)
-
-
     @spaces.GPU
     def generate_design(self, empty_room_image: Image, prompt: str, guidance_scale: int = 10, num_steps: int = 50, strength: float =0.9, img_size: int = 640) -> Image:
         """
@@ -235,9 +237,9 @@ class ControlNetDepthDesignModelMulti:
         orig_w, orig_h = empty_room_image.size
         new_width, new_height = resize_dimensions(empty_room_image.size, img_size)
         input_image = empty_room_image.resize((new_width, new_height))
-        real_seg = np.array(segment_image(input_image,
-                                          self.seg_image_processor,
-                                          self.image_segmentor))
+        real_seg = np.array(segment_image(input_image))#,
+                                          #seg_image_processor,
+                                          #image_segmentor))
         unique_colors = np.unique(real_seg.reshape(-1, real_seg.shape[2]), axis=0)
         unique_colors = [tuple(color) for color in unique_colors]
         segment_items = [map_colors_rgb(i) for i in unique_colors]
@@ -256,13 +258,13 @@ class ControlNetDepthDesignModelMulti:
         mask_image = Image.fromarray((mask * 255).astype(np.uint8)).convert("RGB")
         segmentation_cond_image = Image.fromarray(real_seg).convert("RGB")
 
-        image_depth = get_depth_image(image, self.depth_feature_extractor, self.depth_estimator)
+        image_depth = get_depth_image(image, depth_feature_extractor, depth_estimator)
 
         # generate image that would be used as IP-adapter
         flush()
         new_width_ip = int(new_width / 8) * 8
         new_height_ip = int(new_height / 8) * 8
-        ip_image = self.guide_pipe(pos_prompt,
+        ip_image = guide_pipe(pos_prompt,
                               num_inference_steps=num_steps,
                               negative_prompt=self.neg_prompt,
                               height=new_height_ip,
@@ -270,7 +272,7 @@ class ControlNetDepthDesignModelMulti:
                               generator=[self.generator]).images[0]
 
         flush()
-        generated_image = self.pipe(
+        generated_image = pipe(
             prompt=pos_prompt,
             negative_prompt=self.neg_prompt,
             num_inference_steps=num_steps,