logo-in-context

Paused

App Files Files Community

multimodalart (HF staff) committed 5 days ago

Commit

70db990

•

1 Parent(s): daa5f41

Update app.py

Browse files

Files changed (1) hide show

app.py +53 -54

app.py CHANGED Viewed

@@ -118,63 +118,62 @@ with gr.Blocks() as demo:
             Note: The generation process might take a few moments.
             """)
-    with gr.Tab("🧨 diffusers"):
         gr.Markdown("The way this works is combining the [IC LoRA](https://github.com/ali-vilab/In-Context-LoRA) with image-to-image + inpainting. Where the image on the left (the logo) is uploaded by the user, and the image on the right is masked and applied on the product by the LoRA. Based on the [ComfyUI workflow by WizardWhitebeard/klinter](https://civitai.com/articles/8779). Below is a diffusers implementation of the idea")
-        gr.Code(language="python", value="""
-        import torch
-        from diffusers import FluxInpaintPipeline
-        pipe = FluxInpaintPipeline.from_pretrained("black-forest-labs/FLUX.1-dev", torch_dtype=torch.bfloat16)
-        pipe.to("cuda")
-        pipe.load_lora_weights("ali-vilab/In-Context-LoRA", weight_name="visual-identity-design.safetensors")
-        from PIL import Image
-        def square_center_crop(img, target_size=768):
-            if img.mode in ('RGBA', 'P'):
-                img = img.convert('RGB')
-            width, height = img.size
-            crop_size = min(width, height)
-            left = (width - crop_size) // 2
-            top = (height - crop_size) // 2
-            right = left + crop_size
-            bottom = top + crop_size
-            img_cropped = img.crop((left, top, right, bottom))
-            return img_cropped.resize((target_size, target_size), Image.Resampling.LANCZOS)
-        def duplicate_horizontally(img):
-            width, height = img.size
-            if width != height:
-                raise ValueError(f"Input image must be square, got {width}x{height}")
-            new_image = Image.new('RGB', (width * 2, height))
-            new_image.paste(img, (0, 0))
-            new_image.paste(img, (width, 0))
-            return new_image
-        mask = load_image("mask_square.png")
-        image = load_image("the_logo.png")
-        cropped_image = square_center_crop(image)
-        logo_dupli = duplicate_horizontally(cropped_image)
-        prompt_structure = "The two-panel image showcases the logo of a brand, [LEFT] the left panel is showing the logo [RIGHT] the right panel has this logo applied to "
-        prompt = prompt_structure + "an coconut, engraved logo on a green coconut"
-        out = pipe(
-            prompt=prompt,
-            image=logo_dupli,
-            mask_image=mask,
-            guidance_scale=6,
-            height=768,
-            width=1536,
-            num_inference_steps=28,
-            max_sequence_length=256,
-            strength=1
-        ).images[0]
-        out
-        """
         )
     # Set up the click event

             Note: The generation process might take a few moments.
             """)
+    with gr.Tab("🧨 diffusers implementation"):
         gr.Markdown("The way this works is combining the [IC LoRA](https://github.com/ali-vilab/In-Context-LoRA) with image-to-image + inpainting. Where the image on the left (the logo) is uploaded by the user, and the image on the right is masked and applied on the product by the LoRA. Based on the [ComfyUI workflow by WizardWhitebeard/klinter](https://civitai.com/articles/8779). Below is a diffusers implementation of the idea")
+        gr.Code(language="python", value="""# Support functions
+def square_center_crop(img, target_size=768):
+    if img.mode in ('RGBA', 'P'):
+        img = img.convert('RGB')
+    width, height = img.size
+    crop_size = min(width, height)
+    left = (width - crop_size) // 2
+    top = (height - crop_size) // 2
+    right = left + crop_size
+    bottom = top + crop_size
+    img_cropped = img.crop((left, top, right, bottom))
+    return img_cropped.resize((target_size, target_size), Image.Resampling.LANCZOS)
+def duplicate_horizontally(img):
+    width, height = img.size
+    if width != height:
+        raise ValueError(f"Input image must be square, got {width}x{height}")
+    new_image = Image.new('RGB', (width * 2, height))
+    new_image.paste(img, (0, 0))
+    new_image.paste(img, (width, 0))
+    return new_image"""
+        )
+        gr.Code(language="python", value="""import torch
+from diffusers import FluxInpaintPipeline
+from PIL import Image
+pipe = FluxInpaintPipeline.from_pretrained("black-forest-labs/FLUX.1-dev", torch_dtype=torch.bfloat16)
+pipe.to("cuda")
+pipe.load_lora_weights("ali-vilab/In-Context-LoRA", weight_name="visual-identity-design.safetensors")
+mask = load_image("mask_square.png")
+image = load_image("the_logo.png")
+cropped_image = square_center_crop(image) #crop the image you upload to square
+logo_dupli = duplicate_horizontally(cropped_image) #duplicate it so the right side can be masked
+prompt_structure = "The two-panel image showcases the logo of a brand, [LEFT] the left panel is showing the logo [RIGHT] the right panel has this logo applied to "
+prompt = prompt_structure + "an coconut, engraved logo on a green coconut"
+out = pipe(
+    prompt=prompt,
+    image=logo_dupli,
+    mask_image=mask,
+    guidance_scale=6,
+    height=768,
+    width=1536,
+    num_inference_steps=28,
+    max_sequence_length=256,
+    strength=1
+).images[0]"""
         )
     # Set up the click event