Spaces:

John6666
/

StableDesign

Runtime error

App Files Files Community

John6666 committed on Apr 14

Commit

af4b6de

verified ·

1 Parent(s): be39db2

Upload folder using huggingface_hub

Browse files

Files changed (16) hide show

.gitattributes +5 -0
README.md +5 -4
app.py +377 -0
colors.py +344 -0
controlnet_depth/config.json +52 -0
imgs/bedroom_1.jpg +3 -0
imgs/bedroom_2.jpg +3 -0
imgs/dinning_room_1.jpg +3 -0
imgs/dinning_room_3.jpg +3 -0
imgs/image_1.jpg +0 -0
imgs/image_2.jpg +0 -0
imgs/living_room_1.jpg +3 -0
own_controlnet/config.json +53 -0
palette.py +37 -0
requirements.txt +10 -0
utils.py +83 -0

.gitattributes CHANGED Viewed

@@ -33,3 +33,8 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
 *.zip filter=lfs diff=lfs merge=lfs -text
 *.zst filter=lfs diff=lfs merge=lfs -text
 *tfevents* filter=lfs diff=lfs merge=lfs -text

 *.zip filter=lfs diff=lfs merge=lfs -text
 *.zst filter=lfs diff=lfs merge=lfs -text
 *tfevents* filter=lfs diff=lfs merge=lfs -text
+imgs/bedroom_1.jpg filter=lfs diff=lfs merge=lfs -text
+imgs/bedroom_2.jpg filter=lfs diff=lfs merge=lfs -text
+imgs/dinning_room_1.jpg filter=lfs diff=lfs merge=lfs -text
+imgs/dinning_room_3.jpg filter=lfs diff=lfs merge=lfs -text
+imgs/living_room_1.jpg filter=lfs diff=lfs merge=lfs -text

README.md CHANGED Viewed

@@ -1,12 +1,13 @@
 ---
 title: StableDesign
-emoji: 🌖
-colorFrom: gray
-colorTo: purple
 sdk: gradio
-sdk_version: 5.25.0
 app_file: app.py
 pinned: false
 ---
 Check out the configuration reference at https://huggingface.co/docs/hub/spaces-config-reference

 ---
 title: StableDesign
+emoji: 🏆
+colorFrom: yellow
+colorTo: gray
 sdk: gradio
+sdk_version: 4.26.0
 app_file: app.py
 pinned: false
+license: mit
 ---
 Check out the configuration reference at https://huggingface.co/docs/hub/spaces-config-reference

app.py ADDED Viewed

	@@ -0,0 +1,377 @@

+import spaces
+from typing import Tuple, Union, List
+import os
+import numpy as np
+from PIL import Image
+import torch
+from diffusers.pipelines.controlnet import StableDiffusionControlNetInpaintPipeline
+from diffusers import ControlNetModel, UniPCMultistepScheduler, AutoPipelineForText2Image
+from transformers import AutoImageProcessor, UperNetForSemanticSegmentation, AutoModelForDepthEstimation
+from colors import ade_palette
+from utils import map_colors_rgb
+from diffusers import StableDiffusionXLPipeline
+import gradio as gr
+import gc
+# Device string used for every `.to(device)` call and for the torch.Generator.
+device = "cuda"
+# Precision requested when loading the ControlNets, both diffusion pipelines
+# and the depth model.
+dtype = torch.float16
+# Stylesheet for the demo page; the #img-display-input / #img-display-output
+# selectors correspond to the elem_id values given to the image widgets.
+css = """
+#img-display-container {
+    max-height: 50vh;
+    }
+#img-display-input {
+    max-height: 40vh;
+    }
+#img-display-output {
+    max-height: 40vh;
+    }
+"""
+def filter_items(
+    colors_list: Union[List, np.ndarray],
+    items_list: Union[List, np.ndarray],
+    items_to_remove: Union[List, np.ndarray]
+) -> Tuple[Union[List, np.ndarray], Union[List, np.ndarray]]:
+    """
+    Drop unwanted items together with the colors paired with them.
+    The two input sequences are walked in lockstep; a (color, item) pair
+    survives only when the item is not listed in ``items_to_remove``.
+    Args:
+        colors_list: Colors, one per entry of ``items_list``.
+        items_list: Item labels, aligned with ``colors_list``.
+        items_to_remove: Labels that must be excluded from the result.
+    Returns:
+        A ``(colors, items)`` tuple of two new lists holding the surviving
+        pairs in their original order.
+    """
+    surviving_pairs = [
+        (color, item)
+        for color, item in zip(colors_list, items_list)
+        if item not in items_to_remove
+    ]
+    kept_colors = [color for color, _ in surviving_pairs]
+    kept_items = [item for _, item in surviving_pairs]
+    return kept_colors, kept_items
+def get_segmentation_pipeline(
+) -> Tuple[AutoImageProcessor, UperNetForSemanticSegmentation]:
+    """Load the image processor and model used for semantic segmentation.
+    Both objects are created from the same pretrained checkpoint.
+    Returns:
+        Tuple[AutoImageProcessor, UperNetForSemanticSegmentation]: the
+            processor followed by the segmentation model.
+    """
+    checkpoint = "openmmlab/upernet-convnext-small"
+    processor = AutoImageProcessor.from_pretrained(checkpoint)
+    segmentor = UperNetForSemanticSegmentation.from_pretrained(checkpoint)
+    return processor, segmentor
+@torch.inference_mode()
+@spaces.GPU
+def segment_image(
+        image: Image,
+        image_processor: AutoImageProcessor,
+        image_segmentor: UperNetForSemanticSegmentation
+) -> Image:
+    """
+    Run semantic segmentation and paint each pixel with its class color.
+    Args:
+        image (Image): Picture to segment.
+        image_processor (AutoImageProcessor): Prepares the model input and
+            post-processes the model output.
+        image_segmentor (UperNetForSemanticSegmentation): Segmentation model.
+    Returns:
+        Image: RGB image of the same size as the input in which every pixel
+            carries the ``ade_palette()`` color of its predicted label.
+    """
+    model_inputs = image_processor(image, return_tensors="pt")
+    with torch.no_grad():
+        outputs = image_segmentor(model_inputs.pixel_values)
+    # PIL reports (width, height); the post-processor is given the reverse.
+    target_size = image.size[::-1]
+    seg = image_processor.post_process_semantic_segmentation(
+        outputs, target_sizes=[target_size])[0]
+    rows, cols = seg.shape[0], seg.shape[1]
+    color_seg = np.zeros((rows, cols, 3), dtype=np.uint8)
+    # Palette row i is the color assigned to label i.
+    for label, color in enumerate(np.array(ade_palette())):
+        color_seg[seg == label, :] = color
+    return Image.fromarray(color_seg.astype(np.uint8)).convert('RGB')
+def get_depth_pipeline():
+    """Load the image processor and model used for depth estimation.
+    Both are created from the same checkpoint and are requested with the
+    module-level ``dtype``.
+    Returns:
+        A ``(feature_extractor, depth_estimator)`` tuple.
+    """
+    checkpoint = "LiheYoung/depth-anything-large-hf"
+    processor = AutoImageProcessor.from_pretrained(checkpoint,
+                                                   torch_dtype=dtype)
+    estimator = AutoModelForDepthEstimation.from_pretrained(checkpoint,
+                                                            torch_dtype=dtype)
+    return processor, estimator
+@torch.inference_mode()
+@spaces.GPU
+def get_depth_image(
+        image: Image,
+        feature_extractor: AutoImageProcessor,
+        depth_estimator: AutoModelForDepthEstimation
+) -> Image:
+    """
+    Predict a depth map for an image and return it as a grayscale RGB picture.
+    The prediction is resized to the input resolution, min-max normalised to
+    [0, 1] and replicated over three channels.
+    Args:
+        image (Image): Picture to estimate depth for.
+        feature_extractor (AutoImageProcessor): Builds the model input.
+        depth_estimator (AutoModelForDepthEstimation): Depth model.
+    Returns:
+        Image: 8-bit, 3-channel depth image with the same width and height
+            as the input.
+    """
+    image_to_depth = feature_extractor(images=image, return_tensors="pt").to(device)
+    with torch.no_grad():
+        depth_map = depth_estimator(**image_to_depth).predicted_depth
+    width, height = image.size
+    # Bring the prediction back to the input resolution (float32 for bicubic).
+    depth_map = torch.nn.functional.interpolate(
+        depth_map.unsqueeze(1).float(),
+        size=(height, width),
+        mode="bicubic",
+        align_corners=False,
+    )
+    depth_min = torch.amin(depth_map, dim=[1, 2, 3], keepdim=True)
+    depth_max = torch.amax(depth_map, dim=[1, 2, 3], keepdim=True)
+    # A completely flat prediction has zero range; clamp the denominator so
+    # the normalisation yields zeros instead of NaNs.
+    depth_range = (depth_max - depth_min).clamp_min(
+        torch.finfo(depth_map.dtype).eps)
+    depth_map = (depth_map - depth_min) / depth_range
+    # Replicate the single depth channel so the result is a 3-channel image.
+    image = torch.cat([depth_map] * 3, dim=1)
+    image = image.permute(0, 2, 3, 1).cpu().numpy()[0]
+    image = Image.fromarray((image * 255.0).clip(0, 255).astype(np.uint8))
+    return image
+def resize_dimensions(dimensions, target_size):
+    """
+    Compute a size whose longer side equals target_size, keeping aspect ratio.
+    If both sides are already smaller than target_size the input is returned
+    unchanged (no upscaling).
+    Args:
+        dimensions: ``(width, height)`` pair.
+        target_size: Desired length of the longer side.
+    Returns:
+        ``(width, height)`` tuple. The shorter side is truncated to an
+        integer and is never smaller than 1, so the result is always a
+        usable image size even for extreme aspect ratios.
+    """
+    width, height = dimensions
+    # Nothing to do when the picture already fits inside the target square.
+    if width < target_size and height < target_size:
+        return dimensions
+    if width > height:
+        # Landscape: width becomes target_size, height follows the ratio.
+        scaled_height = int(target_size * (height / width))
+        return (target_size, max(1, scaled_height))
+    # Portrait or square: height becomes target_size, width follows the ratio.
+    scaled_width = int(target_size * (width / height))
+    return (max(1, scaled_width), target_size)
+def flush():
+    """Run the garbage collector, then empty PyTorch's CUDA cache."""
+    gc.collect()
+    torch.cuda.empty_cache()
+class ControlNetDepthDesignModelMulti:
+    """
+    Furnishes a photo of an empty room according to a text prompt.
+    The class only holds prompt and seed settings; the segmentation, depth
+    and diffusion models it calls are module-level objects.
+    """
+    def __init__(self):
+        """ Set the default seed, prompts and the labels that must be preserved """
+        #os.environ['HF_HUB_OFFLINE'] = "True"
+        self.seed = 323*111
+        self.neg_prompt = "window, door, low resolution, banner, logo, watermark, text, deformed, blurry, out of focus, surreal, ugly, beginner"
+        # Segmentation labels that are left out of the inpainting mask.
+        self.control_items = ["windowpane;window", "door;double;door"]
+        # Text appended to every user prompt.
+        self.additional_quality_suffix = "interior design, 4K, high resolution, photorealistic"
+    @spaces.GPU
+    def generate_design(self, empty_room_image: Image, prompt: str, guidance_scale: int = 10, num_steps: int = 50, strength: float =0.9, img_size: int = 640) -> Image:
+        """
+        Given an image of an empty room and a prompt
+        generate the designed room according to the prompt
+        Inputs -
+            empty_room_image - An RGB PIL Image of the empty room
+            prompt - Text describing the target design elements of the room
+            guidance_scale - forwarded to the inpainting pipeline
+            num_steps - inference steps, used for both diffusion pipelines
+            strength - forwarded to the inpainting pipeline
+            img_size - passed to resize_dimensions as the target size of the
+                       working image
+        Returns -
+            design_image - PIL Image of the same size as the empty room image
+                           If the size is not the same the submission will fail.
+        """
+        print(prompt)
+        flush()
+        # A fresh generator per call, seeded from self.seed.
+        self.generator = torch.Generator(device=device).manual_seed(self.seed)
+        pos_prompt = prompt + f', {self.additional_quality_suffix}'
+        orig_w, orig_h = empty_room_image.size
+        new_width, new_height = resize_dimensions(empty_room_image.size, img_size)
+        input_image = empty_room_image.resize((new_width, new_height))
+        real_seg = np.array(segment_image(input_image,
+                                          seg_image_processor,
+                                          image_segmentor))
+        # Collect the distinct colors present in the segmentation and map
+        # each one to its label.
+        unique_colors = np.unique(real_seg.reshape(-1, real_seg.shape[2]), axis=0)
+        unique_colors = [tuple(color) for color in unique_colors]
+        segment_items = [map_colors_rgb(i) for i in unique_colors]
+        # Keep every color except those of the control items (windows, doors).
+        chosen_colors, segment_items = filter_items(
+            colors_list=unique_colors,
+            items_list=segment_items,
+            items_to_remove=self.control_items
+        )
+        # Mask is 1 on every pixel whose color was kept, 0 on window/door
+        # pixels. NOTE(review): presumably the non-zero region is what the
+        # inpainting pipeline repaints - confirm against the diffusers docs.
+        mask = np.zeros_like(real_seg)
+        for color in chosen_colors:
+            color_matches = (real_seg == color).all(axis=2)
+            mask[color_matches] = 1
+        image_np = np.array(input_image)
+        image = Image.fromarray(image_np).convert("RGB")
+        mask_image = Image.fromarray((mask * 255).astype(np.uint8)).convert("RGB")
+        segmentation_cond_image = Image.fromarray(real_seg).convert("RGB")
+        image_depth = get_depth_image(image, depth_feature_extractor, depth_estimator)
+        # generate image that would be used as IP-adapter
+        flush()
+        # Round the guide image size down to a multiple of 8.
+        new_width_ip = int(new_width / 8) * 8
+        new_height_ip = int(new_height / 8) * 8
+        ip_image = guide_pipe(pos_prompt,
+                                   num_inference_steps=num_steps,
+                                   negative_prompt=self.neg_prompt,
+                                   height=new_height_ip,
+                                   width=new_width_ip,
+                                   generator=[self.generator]).images[0]
+        flush()
+        # Inpaint with two control images (depth, segmentation), equally
+        # weighted, and the guide image as IP-Adapter input.
+        generated_image = pipe(
+            prompt=pos_prompt,
+            negative_prompt=self.neg_prompt,
+            num_inference_steps=num_steps,
+            strength=strength,
+            guidance_scale=guidance_scale,
+            generator=[self.generator],
+            image=image,
+            mask_image=mask_image,
+            ip_adapter_image=ip_image,
+            control_image=[image_depth, segmentation_cond_image],
+            controlnet_conditioning_scale=[0.5, 0.5]
+        ).images[0]
+        flush()
+        # Scale the result back to the size of the uploaded picture.
+        design_image = generated_image.resize(
+            (orig_w, orig_h), Image.Resampling.LANCZOS
+        )
+        return design_image
+def create_demo(model):
+    """
+    Build the demo widgets inside the currently open gr.Blocks context.
+    Creates the input column (image, prompt, advanced options, submit
+    button), the output image, the click handler and the example gallery.
+    Args:
+        model: Object exposing ``seed``, ``neg_prompt``,
+            ``additional_quality_suffix`` and ``generate_design``; the click
+            handler writes the three attributes and calls the method.
+    """
+    gr.Markdown("### Stable Design demo")
+    with gr.Row():
+        with gr.Column():
+            input_image = gr.Image(label="Input Image", type='pil', elem_id='img-display-input')
+            input_text = gr.Textbox(label='Prompt', placeholder='Please upload your image first', lines=2)
+            with gr.Accordion('Advanced options', open=False):
+                num_steps = gr.Slider(label='Steps',
+                                      minimum=1,
+                                      maximum=50,
+                                      value=50,
+                                      step=1)
+                img_size = gr.Slider(label='Image size',
+                                     minimum=256,
+                                     maximum=768,
+                                     value=768,
+                                     step=64)
+                guidance_scale = gr.Slider(label='Guidance Scale',
+                                           minimum=0.1,
+                                           maximum=30.0,
+                                           value=10.0,
+                                           step=0.1)
+                seed = gr.Slider(label='Seed',
+                                 minimum=-1,
+                                 maximum=2147483647,
+                                 value=323*111,
+                                 step=1,
+                                 randomize=True)
+                strength = gr.Slider(label='Strength',
+                                     minimum=0.1,
+                                     maximum=1.0,
+                                     value=0.9,
+                                     step=0.1)
+                a_prompt = gr.Textbox(
+                    label='Added Prompt',
+                    value="interior design, 4K, high resolution, photorealistic")
+                n_prompt = gr.Textbox(
+                    label='Negative Prompt',
+                    value="window, door, low resolution, banner, logo, watermark, text, deformed, blurry, out of focus, surreal, ugly, beginner")
+            submit = gr.Button("Submit")
+        with gr.Column():
+            # The widget shows the generated design, not a mask.
+            design_image = gr.Image(label="Output Image", elem_id='img-display-output')
+    def on_submit(image, text, num_steps, guidance_scale, seed, strength, a_prompt, n_prompt, img_size):
+        """Copy the UI settings onto the model and run one generation."""
+        # Sliders may deliver floats; the seed, step count and image size
+        # are consumed as integers downstream.
+        model.seed = int(seed)
+        model.neg_prompt = n_prompt
+        model.additional_quality_suffix = a_prompt
+        with torch.no_grad():
+            out_img = model.generate_design(image, text, guidance_scale=guidance_scale, num_steps=int(num_steps), strength=strength, img_size=int(img_size))
+        return out_img
+    submit.click(on_submit, inputs=[input_image, input_text, num_steps, guidance_scale, seed, strength, a_prompt, n_prompt, img_size], outputs=design_image)
+    # One [image path, prompt] pair per example shown under the form.
+    example_rows = [
+        ["imgs/bedroom_1.jpg", "An elegantly appointed bedroom in the Art Deco style, featuring a grand king-size bed with geometric bedding, a luxurious velvet armchair, and a mirrored nightstand that reflects the room's opulence. Art Deco-inspired artwork adds a touch of glamour"],
+        ["imgs/bedroom_2.jpg", "A bedroom that exudes French country charm with a soft upholstered bed, walls adorned with floral wallpaper, and a vintage wooden wardrobe. A crystal chandelier casts a warm, inviting glow over the space"],
+        ["imgs/dinning_room_1.jpg", "A cozy dining room that captures the essence of rustic charm with a solid wooden farmhouse table at its core, surrounded by an eclectic mix of mismatched chairs. An antique sideboard serves as a statement piece, and the ambiance is warmly lit by a series of quaint Edison bulbs dangling from the ceiling"],
+        ["imgs/dinning_room_3.jpg", "A dining room that epitomizes contemporary elegance, anchored by a sleek, minimalist dining table paired with stylish modern chairs. Artistic lighting fixtures create a focal point above, while the surrounding minimalist decor ensures the space feels open, airy, and utterly modern"],
+        ["imgs/image_1.jpg", "A glamorous master bedroom in Hollywood Regency style, boasting a plush tufted headboard, mirrored furniture reflecting elegance, luxurious fabrics in rich textures, and opulent gold accents for a touch of luxury."],
+        ["imgs/image_2.jpg", "A vibrant living room with a tropical theme, complete with comfortable rattan furniture, large leafy plants bringing the outdoors in, bright cushions adding pops of color, and bamboo blinds for natural light control."],
+        ["imgs/living_room_1.jpg", "A stylish living room embracing mid-century modern aesthetics, featuring a vintage teak coffee table at its center, complemented by a classic sunburst clock on the wall and a cozy shag rug underfoot, creating a warm and inviting atmosphere"],
+    ]
+    gr.Examples(examples=example_rows,
+                inputs=[input_image, input_text], cache_examples=False)
+# Everything below runs at import time and creates the module-level models
+# that generate_design relies on.
+# Two ControlNets loaded from folders inside this repository.
+controlnet_depth= ControlNetModel.from_pretrained(
+    "controlnet_depth", torch_dtype=dtype, use_safetensors=True)
+controlnet_seg = ControlNetModel.from_pretrained(
+    "own_controlnet", torch_dtype=dtype, use_safetensors=True)
+# Inpainting pipeline driven by both ControlNets; the safety checker is disabled.
+pipe = StableDiffusionControlNetInpaintPipeline.from_pretrained(
+    "SG161222/Realistic_Vision_V5.1_noVAE",
+    #"models/runwayml--stable-diffusion-inpainting",
+    controlnet=[controlnet_depth, controlnet_seg],
+    safety_checker=None,
+    torch_dtype=dtype
+)
+# IP-Adapter weights, so a reference image can be passed via ip_adapter_image.
+pipe.load_ip_adapter("h94/IP-Adapter", subfolder="models",
+                     weight_name="ip-adapter_sd15.bin")
+pipe.set_ip_adapter_scale(0.4)
+# Replace the default scheduler, reusing its configuration.
+pipe.scheduler = UniPCMultistepScheduler.from_config(pipe.scheduler.config)
+pipe = pipe.to(device)
+# Text-to-image pipeline that produces the IP-Adapter reference image.
+guide_pipe = StableDiffusionXLPipeline.from_pretrained("segmind/SSD-1B",
+                                                       torch_dtype=dtype, use_safetensors=True, variant="fp16")
+guide_pipe = guide_pipe.to(device)
+# Segmentation and depth models; only the depth estimator is moved to the
+# device here.
+seg_image_processor, image_segmentor = get_segmentation_pipeline()
+depth_feature_extractor, depth_estimator = get_depth_pipeline()
+depth_estimator = depth_estimator.to(device)
+def main():
+    """Assemble the Gradio page around the design model and launch it."""
+    model = ControlNetDepthDesignModelMulti()
+    print('Models uploaded successfully')
+    title = "# StableDesign"
+    description = """
+    <p style='font-size: 14px; margin-bottom: 10px;'><a href='https://www.linkedin.com/in/mykola-lavreniuk/'>Mykola Lavreniuk</a>, <a href='https://www.linkedin.com/in/bartosz-ludwiczuk-a677a760/'>Bartosz Ludwiczuk</a></p>
+    <p style='font-size: 16px; margin-bottom: 0px; margin-top: 0px;'>Official demo for <strong>StableDesign:</strong> 2nd place solution for the Generative Interior Design 2024 <a href='https://www.aicrowd.com/challenges/generative-interior-design-challenge-2024/leaderboards?challenge_round_id=1314'>competition</a>. StableDesign is a deep learning model designed to harness the power of AI, providing innovative and creative tools for designers. Using our algorithms, images of empty rooms can be transformed into fully furnished spaces based on text descriptions. Please refer to our <a href='https://github.com/Lavreniuk/generative-interior-design'>GitHub</a> for more details.</p>
+    """
+    # Hand the module-level stylesheet to Blocks; without it the elem_id
+    # height limits declared in `css` are never applied.
+    with gr.Blocks(css=css) as demo:
+        gr.Markdown(title)
+        gr.Markdown(description)
+        create_demo(model)
+        gr.HTML('''<br><br><br><center>You can duplicate this Space to skip the queue:<a href="https://huggingface.co/spaces/MykolaL/StableDesign?duplicate=true"><img src="https://bit.ly/3gLdBN6" alt="Duplicate Space"></a><br>
+                <p><img src="https://visitor-badge.glitch.me/badge?page_id=MykolaL/StableDesign" alt="visitors"></p></center>''')
+    # Requests are queued before the server starts; no public share link.
+    demo.queue().launch(share=False)
+if __name__ == '__main__':
+    main()

colors.py ADDED Viewed

	@@ -0,0 +1,344 @@

+"""Color mappings"""
+from typing import List
+TRIVIA = {
+    "#B47878": "building;edifice",
+    "#06E6E6": "sky",
+    "#04C803": "tree",
+    "#8C8C8C": "road;route",
+    "#04FA07": "grass",
+    "#96053D": "person;individual;someone;somebody;mortal;soul",
+    "#CCFF04": "plant;flora;plant;life",
+    "#787846": "earth;ground",
+    "#FF09E0": "house",
+    "#0066C8": "car;auto;automobile;machine;motorcar",
+    "#3DE6FA": "water",
+    "#FF3D06": "railing;rail",
+    "#FF5C00": "arcade;machine",
+    "#FFE000": "stairs;steps",
+    "#00F5FF": "fan",
+    "#FF008F": "step;stair",
+    "#1F00FF": "stairway;staircase",
+    "#FFD600": "radiator",
+}
+OBJECTS = {
+    "#CC05FF": "bed",
+    "#FF0633": "painting;picture",
+    "#DCDCDC": "mirror",
+    "#00FF14": "box",
+    "#FF0000": "flower",
+    "#FFA300": "book",
+    "#00FFC2": "television;television;receiver;television;set;tv;tv;set;idiot;box;boob;tube;telly;goggle;box",
+    "#F500FF": "pot;flowerpot",
+    "#00FFCC": "vase",
+    "#29FF00": "tray",
+    "#8FFF00": "poster;posting;placard;notice;bill;card",
+    "#5CFF00": "basket;handbasket",
+    "#00ADFF": "screen;door;screen",
+}
+SITTING = {
+    "#0B66FF": "sofa;couch;lounge",
+    "#CC4603": "chair",
+    "#07FFE0": "seat",
+    "#08FFD6": "armchair",
+    "#FFC207": "cushion",
+    "#00EBFF": "pillow",
+    "#00D6FF": "stool",
+    "#1400FF": "blanket;cover",
+    "#0A00FF": "swivel;chair",
+    "#FF9900": "ottoman;pouf;pouffe;puff;hassock",
+}
+LIGHTING = {
+    "#E0FF08": "lamp",
+    "#FFAD00": "light;light;source",
+    "#001FFF": "chandelier;pendant;pendent",
+}
+TABLES = {
+    "#FF0652": "table",
+    "#0AFF47": "desk",
+}
+CLOSETS = {
+    "#E005FF": "cabinet",
+    "#FF0747": "shelf",
+    "#07FFFF": "wardrobe;closet;press",
+    "#0633FF": "chest;of;drawers;chest;bureau;dresser",
+    "#0000FF": "case;display;case;showcase;vitrine",
+}
+BATHROOM = {
+    "#6608FF": "bathtub;bathing;tub;bath;tub",
+    "#00FF85": "toilet;can;commode;crapper;pot;potty;stool;throne",
+    "#0085FF": "shower",
+    "#FF0066": "towel",
+}
+WINDOWS = {
+    "#FF3307": "curtain;drape;drapery;mantle;pall",
+    "#E6E6E6": "windowpane;window",
+    "#00FF3D": "awning;sunshade;sunblind",
+    "#003DFF": "blind;screen",
+}
+FLOOR = {
+    "#FF095C": "rug;carpet;carpeting",
+    "#503232": "floor;flooring",
+}
+INTERIOR = {
+    "#787878": "wall",
+    "#787850": "ceiling",
+    "#08FF33": "door;double;door",
+}
+KITCHEN = {
+    "#00FF29": "kitchen;island",
+    "#14FF00": "refrigerator;icebox",
+    "#00A3FF": "sink",
+    "#EB0CFF": "counter",
+    "#D6FF00": "dishwasher;dish;washer;dishwashing;machine",
+    "#FF00EB": "microwave;microwave;oven",
+    "#47FF00": "oven",
+    "#66FF00": "clock",
+    "#00FFB8": "plate",
+    "#19C2C2": "glass;drinking;glass",
+    "#00FF99": "bar",
+    "#00FF0A": "bottle",
+    "#FF7000": "buffet;counter;sideboard",
+    "#B800FF": "washer;automatic;washer;washing;machine",
+    "#00FF70": "coffee;table;cocktail;table",
+    "#008FFF": "countertop",
+    "#33FF00": "stove;kitchen;stove;range;kitchen;range;cooking;stove",
+}
+LIVINGROOM = {
+    "#FA0A0F": "fireplace;hearth;open;fireplace",
+    "#FF4700": "pool;table;billiard;table;snooker;table",
+}
+OFFICE = {
+    "#00FFAD": "computer;computing;machine;computing;device;data;processor;electronic;computer;information;processing;system",
+    "#00FFF5": "bookcase",
+    "#0633FF": "chest;of;drawers;chest;bureau;dresser",
+    "#005CFF": "monitor;monitoring;device",
+}
+COLOR_MAPPING_CATEGORY_ = {
+ 'keep background': {'#FFFFFF': 'background'},
+ 'trivia': TRIVIA,
+ 'objects': OBJECTS,
+ 'sitting': SITTING,
+ 'lighting': LIGHTING,
+ 'tables': TABLES,
+ 'closets': CLOSETS,
+ 'bathroom': BATHROOM,
+ 'windows': WINDOWS,
+ 'floor': FLOOR,
+ 'interior': INTERIOR,
+ 'kitchen': KITCHEN,
+ 'livingroom': LIVINGROOM,
+ 'office': OFFICE}
+COLOR_MAPPING_ = {
+    '#FFFFFF': 'background',
+    "#787878": "wall",
+    "#B47878": "building;edifice",
+    "#06E6E6": "sky",
+    "#503232": "floor;flooring",
+    "#04C803": "tree",
+    "#787850": "ceiling",
+    "#8C8C8C": "road;route",
+    "#CC05FF": "bed",
+    "#E6E6E6": "windowpane;window",
+    "#04FA07": "grass",
+    "#E005FF": "cabinet",
+    "#EBFF07": "sidewalk;pavement",
+    "#96053D": "person;individual;someone;somebody;mortal;soul",
+    "#787846": "earth;ground",
+    "#08FF33": "door;double;door",
+    "#FF0652": "table",
+    "#8FFF8C": "mountain;mount",
+    "#CCFF04": "plant;flora;plant;life",
+    "#FF3307": "curtain;drape;drapery;mantle;pall",
+    "#CC4603": "chair",
+    "#0066C8": "car;auto;automobile;machine;motorcar",
+    "#3DE6FA": "water",
+    "#FF0633": "painting;picture",
+    "#0B66FF": "sofa;couch;lounge",
+    "#FF0747": "shelf",
+    "#FF09E0": "house",
+    "#0907E6": "sea",
+    "#DCDCDC": "mirror",
+    "#FF095C": "rug;carpet;carpeting",
+    "#7009FF": "field",
+    "#08FFD6": "armchair",
+    "#07FFE0": "seat",
+    "#FFB806": "fence;fencing",
+    "#0AFF47": "desk",
+    "#FF290A": "rock;stone",
+    "#07FFFF": "wardrobe;closet;press",
+    "#E0FF08": "lamp",
+    "#6608FF": "bathtub;bathing;tub;bath;tub",
+    "#FF3D06": "railing;rail",
+    "#FFC207": "cushion",
+    "#FF7A08": "base;pedestal;stand",
+    "#00FF14": "box",
+    "#FF0829": "column;pillar",
+    "#FF0599": "signboard;sign",
+    "#0633FF": "chest;of;drawers;chest;bureau;dresser",
+    "#EB0CFF": "counter",
+    "#A09614": "sand",
+    "#00A3FF": "sink",
+    "#8C8C8C": "skyscraper",
+    "#FA0A0F": "fireplace;hearth;open;fireplace",
+    "#14FF00": "refrigerator;icebox",
+    "#1FFF00": "grandstand;covered;stand",
+    "#FF1F00": "path",
+    "#FFE000": "stairs;steps",
+    "#99FF00": "runway",
+    "#0000FF": "case;display;case;showcase;vitrine",
+    "#FF4700": "pool;table;billiard;table;snooker;table",
+    "#00EBFF": "pillow",
+    "#00ADFF": "screen;door;screen",
+    "#1F00FF": "stairway;staircase",
+    "#0BC8C8": "river",
+    "#FF5200": "bridge;span",
+    "#00FFF5": "bookcase",
+    "#003DFF": "blind;screen",
+    "#00FF70": "coffee;table;cocktail;table",
+    "#00FF85": "toilet;can;commode;crapper;pot;potty;stool;throne",
+    "#FF0000": "flower",
+    "#FFA300": "book",
+    "#FF6600": "hill",
+    "#C2FF00": "bench",
+    "#008FFF": "countertop",
+    "#33FF00": "stove;kitchen;stove;range;kitchen;range;cooking;stove",
+    "#0052FF": "palm;palm;tree",
+    "#00FF29": "kitchen;island",
+    "#00FFAD": "computer;computing;machine;computing;device;data;processor;electronic;computer;information;processing;system",
+    "#0A00FF": "swivel;chair",
+    "#ADFF00": "boat",
+    "#00FF99": "bar",
+    "#FF5C00": "arcade;machine",
+    "#FF00FF": "hovel;hut;hutch;shack;shanty",
+    "#FF00F5": "bus;autobus;coach;charabanc;double-decker;jitney;motorbus;motorcoach;omnibus;passenger;vehicle",
+    "#FF0066": "towel",
+    "#FFAD00": "light;light;source",
+    "#FF0014": "truck;motortruck",
+    "#FFB8B8": "tower",
+    "#001FFF": "chandelier;pendant;pendent",
+    "#00FF3D": "awning;sunshade;sunblind",
+    "#0047FF": "streetlight;street;lamp",
+    "#FF00CC": "booth;cubicle;stall;kiosk",
+    "#00FFC2": "television;television;receiver;television;set;tv;tv;set;idiot;box;boob;tube;telly;goggle;box",
+    "#00FF52": "airplane;aeroplane;plane",
+    "#000AFF": "dirt;track",
+    "#0070FF": "apparel;wearing;apparel;dress;clothes",
+    "#3300FF": "pole",
+    "#00C2FF": "land;ground;soil",
+    "#007AFF": "bannister;banister;balustrade;balusters;handrail",
+    "#00FFA3": "escalator;moving;staircase;moving;stairway",
+    "#FF9900": "ottoman;pouf;pouffe;puff;hassock",
+    "#00FF0A": "bottle",
+    "#FF7000": "buffet;counter;sideboard",
+    "#8FFF00": "poster;posting;placard;notice;bill;card",
+    "#5200FF": "stage",
+    "#A3FF00": "van",
+    "#FFEB00": "ship",
+    "#08B8AA": "fountain",
+    "#8500FF": "conveyer;belt;conveyor;belt;conveyer;conveyor;transporter",
+    "#00FF5C": "canopy",
+    "#B800FF": "washer;automatic;washer;washing;machine",
+    "#FF001F": "plaything;toy",
+    "#00B8FF": "swimming;pool;swimming;bath;natatorium",
+    "#00D6FF": "stool",
+    "#FF0070": "barrel;cask",
+    "#5CFF00": "basket;handbasket",
+    "#00E0FF": "waterfall;falls",
+    "#70E0FF": "tent;collapsible;shelter",
+    "#46B8A0": "bag",
+    "#A300FF": "minibike;motorbike",
+    "#9900FF": "cradle",
+    "#47FF00": "oven",
+    "#FF00A3": "ball",
+    "#FFCC00": "food;solid;food",
+    "#FF008F": "step;stair",
+    "#00FFEB": "tank;storage;tank",
+    "#85FF00": "trade;name;brand;name;brand;marque",
+    "#FF00EB": "microwave;microwave;oven",
+    "#F500FF": "pot;flowerpot",
+    "#FF007A": "animal;animate;being;beast;brute;creature;fauna",
+    "#FFF500": "bicycle;bike;wheel;cycle",
+    "#0ABED4": "lake",
+    "#D6FF00": "dishwasher;dish;washer;dishwashing;machine",
+    "#00CCFF": "screen;silver;screen;projection;screen",
+    "#1400FF": "blanket;cover",
+    "#FFFF00": "sculpture",
+    "#0099FF": "hood;exhaust;hood",
+    "#0029FF": "sconce",
+    "#00FFCC": "vase",
+    "#2900FF": "traffic;light;traffic;signal;stoplight",
+    "#29FF00": "tray",
+    "#AD00FF": "ashcan;trash;can;garbage;can;wastebin;ash;bin;ash-bin;ashbin;dustbin;trash;barrel;trash;bin",
+    "#00F5FF": "fan",
+    "#4700FF": "pier;wharf;wharfage;dock",
+    "#7A00FF": "crt;screen",
+    "#00FFB8": "plate",
+    "#005CFF": "monitor;monitoring;device",
+    "#B8FF00": "bulletin;board;notice;board",
+    "#0085FF": "shower",
+    "#FFD600": "radiator",
+    "#19C2C2": "glass;drinking;glass",
+    "#66FF00": "clock",
+    "#5C00FF": "flag",
+}
+def ade_palette() -> List[List[int]]:
+    """Return the ADE20K palette as a list of 150 [R, G, B] triples.
+    Entry i is the color used for class label i. A new list is built on
+    every call. Note that [140, 140, 140] occurs twice (indices 6 and 48),
+    so those two labels cannot be told apart by color alone.
+    """
+    return [[120, 120, 120], [180, 120, 120], [6, 230, 230], [80, 50, 50],
+            [4, 200, 3], [120, 120, 80], [140, 140, 140], [204, 5, 255],
+            [230, 230, 230], [4, 250, 7], [224, 5, 255], [235, 255, 7],
+            [150, 5, 61], [120, 120, 70], [8, 255, 51], [255, 6, 82],
+            [143, 255, 140], [204, 255, 4], [255, 51, 7], [204, 70, 3],
+            [0, 102, 200], [61, 230, 250], [255, 6, 51], [11, 102, 255],
+            [255, 7, 71], [255, 9, 224], [9, 7, 230], [220, 220, 220],
+            [255, 9, 92], [112, 9, 255], [8, 255, 214], [7, 255, 224],
+            [255, 184, 6], [10, 255, 71], [255, 41, 10], [7, 255, 255],
+            [224, 255, 8], [102, 8, 255], [255, 61, 6], [255, 194, 7],
+            [255, 122, 8], [0, 255, 20], [255, 8, 41], [255, 5, 153],
+            [6, 51, 255], [235, 12, 255], [160, 150, 20], [0, 163, 255],
+            [140, 140, 140], [250, 10, 15], [20, 255, 0], [31, 255, 0],
+            [255, 31, 0], [255, 224, 0], [153, 255, 0], [0, 0, 255],
+            [255, 71, 0], [0, 235, 255], [0, 173, 255], [31, 0, 255],
+            [11, 200, 200], [255, 82, 0], [0, 255, 245], [0, 61, 255],
+            [0, 255, 112], [0, 255, 133], [255, 0, 0], [255, 163, 0],
+            [255, 102, 0], [194, 255, 0], [0, 143, 255], [51, 255, 0],
+            [0, 82, 255], [0, 255, 41], [0, 255, 173], [10, 0, 255],
+            [173, 255, 0], [0, 255, 153], [255, 92, 0], [255, 0, 255],
+            [255, 0, 245], [255, 0, 102], [255, 173, 0], [255, 0, 20],
+            [255, 184, 184], [0, 31, 255], [0, 255, 61], [0, 71, 255],
+            [255, 0, 204], [0, 255, 194], [0, 255, 82], [0, 10, 255],
+            [0, 112, 255], [51, 0, 255], [0, 194, 255], [0, 122, 255],
+            [0, 255, 163], [255, 153, 0], [0, 255, 10], [255, 112, 0],
+            [143, 255, 0], [82, 0, 255], [163, 255, 0], [255, 235, 0],
+            [8, 184, 170], [133, 0, 255], [0, 255, 92], [184, 0, 255],
+            [255, 0, 31], [0, 184, 255], [0, 214, 255], [255, 0, 112],
+            [92, 255, 0], [0, 224, 255], [112, 224, 255], [70, 184, 160],
+            [163, 0, 255], [153, 0, 255], [71, 255, 0], [255, 0, 163],
+            [255, 204, 0], [255, 0, 143], [0, 255, 235], [133, 255, 0],
+            [255, 0, 235], [245, 0, 255], [255, 0, 122], [255, 245, 0],
+            [10, 190, 212], [214, 255, 0], [0, 204, 255], [20, 0, 255],
+            [255, 255, 0], [0, 153, 255], [0, 41, 255], [0, 255, 204],
+            [41, 0, 255], [41, 255, 0], [173, 0, 255], [0, 245, 255],
+            [71, 0, 255], [122, 0, 255], [0, 255, 184], [0, 92, 255],
+            [184, 255, 0], [0, 133, 255], [255, 214, 0], [25, 194, 194],
+            [102, 255, 0], [92, 0, 255]]

controlnet_depth/config.json ADDED Viewed

	@@ -0,0 +1,52 @@

+{
+  "_class_name": "ControlNetModel",
+  "_diffusers_version": "0.28.0.dev0",
+  "_name_or_path": "lllyasviel/sd-controlnet-depth",
+  "act_fn": "silu",
+  "addition_embed_type": null,
+  "addition_embed_type_num_heads": 64,
+  "addition_time_embed_dim": null,
+  "attention_head_dim": 8,
+  "block_out_channels": [
+    320,
+    640,
+    1280,
+    1280
+  ],
+  "class_embed_type": null,
+  "conditioning_channels": 3,
+  "conditioning_embedding_out_channels": [
+    16,
+    32,
+    96,
+    256
+  ],
+  "controlnet_conditioning_channel_order": "rgb",
+  "cross_attention_dim": 768,
+  "down_block_types": [
+    "CrossAttnDownBlock2D",
+    "CrossAttnDownBlock2D",
+    "CrossAttnDownBlock2D",
+    "DownBlock2D"
+  ],
+  "downsample_padding": 1,
+  "encoder_hid_dim": null,
+  "encoder_hid_dim_type": null,
+  "flip_sin_to_cos": true,
+  "freq_shift": 0,
+  "global_pool_conditions": false,
+  "in_channels": 4,
+  "layers_per_block": 2,
+  "mid_block_scale_factor": 1,
+  "mid_block_type": "UNetMidBlock2DCrossAttn",
+  "norm_eps": 1e-05,
+  "norm_num_groups": 32,
+  "num_attention_heads": null,
+  "num_class_embeds": null,
+  "only_cross_attention": false,
+  "projection_class_embeddings_input_dim": null,
+  "resnet_time_scale_shift": "default",
+  "transformer_layers_per_block": 1,
+  "upcast_attention": false,
+  "use_linear_projection": false
+}

imgs/bedroom_1.jpg ADDED Viewed

Git LFS Details

SHA256: d08d2d4ccc42ba29a1482c38eb3a932ef69057d367c63e2280eb204a18cb5c97
Pointer size: 132 Bytes
Size of remote file: 2.36 MB

imgs/bedroom_2.jpg ADDED Viewed

Git LFS Details

SHA256: 1633f673dd5cc53a97b767e7c2a45ea9476ae7f3c72fa010e8d125bb4978ad87
Pointer size: 131 Bytes
Size of remote file: 432 kB

imgs/dinning_room_1.jpg ADDED Viewed

Git LFS Details

SHA256: 413d388107a7c0b5b54ab17b5a6526e6f63ee44dcf9348ec4ecee0744521cdf7
Pointer size: 131 Bytes
Size of remote file: 268 kB

imgs/dinning_room_3.jpg ADDED Viewed

Git LFS Details

SHA256: 9342f85cc9b7ff08e7a8ce113dbe7e16bde1c005d39228b020fa296bec054948
Pointer size: 131 Bytes
Size of remote file: 221 kB

imgs/image_1.jpg ADDED Viewed

imgs/image_2.jpg ADDED Viewed

imgs/living_room_1.jpg ADDED Viewed

Git LFS Details

SHA256: b58c299725c99e0671fd6dd86db1088e0d5d55059bb0845dee732d5b59af5c61
Pointer size: 131 Bytes
Size of remote file: 362 kB

own_controlnet/config.json ADDED Viewed

	@@ -0,0 +1,53 @@

+{
+  "_class_name": "ControlNetModel",
+  "_diffusers_version": "0.21.1",
+  "_name_or_path": "BertChristiaens/controlnet-seg-room",
+  "act_fn": "silu",
+  "addition_embed_type": null,
+  "addition_embed_type_num_heads": 64,
+  "addition_time_embed_dim": null,
+  "attention_head_dim": 8,
+  "block_out_channels": [
+    320,
+    640,
+    1280,
+    1280
+  ],
+  "class_embed_type": null,
+  "conditioning_channels": 3,
+  "conditioning_embedding_out_channels": [
+    16,
+    32,
+    96,
+    256
+  ],
+  "controlnet_conditioning_channel_order": "rgb",
+  "cross_attention_dim": 768,
+  "down_block_types": [
+    "CrossAttnDownBlock2D",
+    "CrossAttnDownBlock2D",
+    "CrossAttnDownBlock2D",
+    "DownBlock2D"
+  ],
+  "downsample_padding": 1,
+  "dropout": 0.0,
+  "encoder_hid_dim": null,
+  "encoder_hid_dim_type": null,
+  "flip_sin_to_cos": true,
+  "freq_shift": 0,
+  "global_pool_conditions": false,
+  "in_channels": 4,
+  "layers_per_block": 2,
+  "mid_block_scale_factor": 1,
+  "norm_eps": 1e-05,
+  "norm_num_groups": 32,
+  "num_attention_heads": null,
+  "num_class_embeds": null,
+  "only_cross_attention": false,
+  "projection_class_embeddings_input_dim": null,
+  "resnet_time_scale_shift": "default",
+  "sample_size": 32,
+  "transformer_layers_per_block": 1,
+  "upcast_attention": false,
+  "use_linear_projection": false
+}

palette.py ADDED Viewed

	@@ -0,0 +1,37 @@

+from typing import Dict
+from colors import COLOR_MAPPING_, COLOR_MAPPING_CATEGORY_
+def convert_hex_to_rgba(hex_code: str) -> str:
+    """Convert hex code to rgba.
+    Args:
+        hex_code (str): hex string
+    Returns:
+        str: rgba string
+    """
+    hex_code = hex_code.lstrip('#')
+    return "rgba(" + str(int(hex_code[0:2], 16)) + ", " + str(int(hex_code[2:4], 16)) + ", " + str(int(hex_code[4:6], 16)) + ", 1.0)"
+def convert_dict_to_rgba(color_dict: Dict) -> Dict:
+    """Convert hex code to rgba for all elements in a dictionary.
+    Args:
+        color_dict (Dict): color dictionary
+    Returns:
+        Dict: color dictionary with rgba values
+    """
+    updated_dict = {}
+    for k, v in color_dict.items():
+        updated_dict[convert_hex_to_rgba(k)] = v
+    return updated_dict
+def convert_nested_dict_to_rgba(nested_dict):
+    updated_dict = {}
+    for k, v in nested_dict.items():
+        updated_dict[k] = convert_dict_to_rgba(v)
+    return updated_dict
+# Flat palette from colors.COLOR_MAPPING_, re-keyed from hex codes to rgba strings.
+COLOR_MAPPING = convert_dict_to_rgba(COLOR_MAPPING_)
+# Nested palette from colors.COLOR_MAPPING_CATEGORY_: outer keys are kept,
+# each inner dictionary is re-keyed from hex codes to rgba strings.
+COLOR_MAPPING_CATEGORY = convert_nested_dict_to_rgba(COLOR_MAPPING_CATEGORY_)

requirements.txt ADDED Viewed

	@@ -0,0 +1,10 @@

+diffusers==0.25.0
+xformers==0.0.23.post1
+transformers==4.39.1
+torchvision
+accelerate==0.26.1
+opencv-python==4.9.0.80
+scipy==1.11.4
+triton==2.1.0
+altair==4.1.0
+pandas==2.1.4

utils.py ADDED Viewed

	@@ -0,0 +1,83 @@

+import gc
+import numpy as np
+from PIL import Image
+import torch
+from scipy.signal import fftconvolve
+from palette import COLOR_MAPPING, COLOR_MAPPING_
+def to_rgb(color: str) -> tuple:
+    """Convert hex color to rgb.
+    Args:
+        color (str): hex color
+    Returns:
+        tuple: rgb color
+    """
+    return tuple(int(color[i:i+2], 16) for i in (1, 3, 5))
+def map_colors(color: str) -> str:
+    """Look up the COLOR_MAPPING entry for a color key.
+    Args:
+        color (str): a key of COLOR_MAPPING; palette.py builds those keys as
+            ``"rgba(r, g, b, 1.0)"`` strings, not as color names
+    Returns:
+        str: the value stored for that key (presumably the name attached to
+            the color in colors.py -- confirm there)
+    Raises:
+        KeyError: if ``color`` is not a key of COLOR_MAPPING
+    """
+    return COLOR_MAPPING[color]
+def map_colors_rgb(color: tuple) -> str:
+    """Look up the COLOR_MAPPING_RGB entry for an RGB tuple.
+    Args:
+        color (tuple): a key of COLOR_MAPPING_RGB, i.e. an ``(r, g, b)``
+            tuple of the form produced by to_rgb
+    Returns:
+        str: the value stored for that tuple
+    Raises:
+        KeyError: if ``color`` is not a key of COLOR_MAPPING_RGB
+    """
+    return COLOR_MAPPING_RGB[color]
+def convolution(mask: Image.Image, size=9) -> Image:
+    """Method to blur the mask
+    Args:
+        mask (Image): masking image
+        size (int, optional): size of the blur. Defaults to 9.
+    Returns:
+        Image: blurred mask
+    """
+    mask = np.array(mask.convert("L"))
+    conv = np.ones((size, size)) / size**2
+    mask_blended = fftconvolve(mask, conv, 'same')
+    mask_blended = mask_blended.astype(np.uint8).copy()
+    border = size
+    # replace borders with original values
+    mask_blended[:border, :] = mask[:border, :]
+    mask_blended[-border:, :] = mask[-border:, :]
+    mask_blended[:, :border] = mask[:, :border]
+    mask_blended[:, -border:] = mask[:, -border:]
+    return Image.fromarray(mask_blended).convert("L")
+def flush():
+    """Run Python garbage collection, then empty PyTorch's CUDA cache."""
+    # Collect first so that memory owned by unreachable objects can be
+    # returned to the cache before the cache itself is emptied.
+    gc.collect()
+    torch.cuda.empty_cache()
+def postprocess_image_masking(inpainted: Image, image: Image,
+                              mask: Image) -> Image:
+    """Method to postprocess the inpainted image
+    Args:
+        inpainted (Image): inpainted image
+        image (Image): original image
+        mask (Image): mask
+    Returns:
+        Image: inpainted image
+    """
+    final_inpainted = Image.composite(inpainted.convert("RGBA"),
+                                      image.convert("RGBA"), mask)
+    return final_inpainted.convert("RGB")
+COLOR_NAMES = list(COLOR_MAPPING.keys())
+COLOR_RGB = [to_rgb(k) for k in COLOR_MAPPING_.keys()] + [(0, 0, 0),
+                                                          (255, 255, 255)]
+INVERSE_COLORS = {v: to_rgb(k) for k, v in COLOR_MAPPING_.items()}
+COLOR_MAPPING_RGB = {to_rgb(k): v for k, v in COLOR_MAPPING_.items()}