Spaces:

TencentARC
/

IC-Custom

Running on Zero

App Files Files Community

Yaowei222 committed 9 days ago

Commit

0da2326

1 Parent(s): 9bc4f8c

fix md and pipeline

Browse files

Files changed (4) hide show

app/business_logic.py +12 -12
app/ui_components.py +7 -7
ic_custom/pipelines/ic_custom_pipeline.py +14 -1
ic_custom/utils/model_utils.py +26 -4

app/business_logic.py CHANGED Viewed

@@ -412,8 +412,8 @@ def change_custmization_mode(custmization_mode, input_mask_mode):
                 gr.update(value="<s>Select a input mask mode</s>", visible=False),
                 gr.update(value="<s>Input target image & mask (Iterate clicking or brushing until the target is covered)</s>", visible=False),
                 gr.update(value="<s>View or modify the target mask</s>", visible=False),
-                gr.update(value="3. Input text prompt (necessary)"),
-                gr.update(value="4. Submit and view the output"),
                 gr.update(visible=False),
                 gr.update(visible=False),
@@ -426,11 +426,11 @@ def change_custmization_mode(custmization_mode, input_mask_mode):
                     gr.update(interactive=True, visible=True),
                     gr.update(interactive=True, visible=True),
                     gr.update(interactive=True, visible=True),
-                    gr.update(value="3. Select a input mask mode", visible=True),
-                    gr.update(value="4. Input target image & mask (Iterate clicking or brushing until the target is covered)", visible=True),
-                    gr.update(value="6. View or modify the target mask", visible=True),
-                    gr.update(value="5. Input text prompt (optional)", visible=True),
-                    gr.update(value="7. Submit and view the output", visible=True),
                     gr.update(visible=True, value="Precise mask"),
                     gr.update(visible=True),
                     )
@@ -441,11 +441,11 @@ def change_custmization_mode(custmization_mode, input_mask_mode):
                     gr.update(interactive=True, visible=True),
                     gr.update(interactive=True, visible=True),
                     gr.update(interactive=True, visible=True),
-                    gr.update(value="3. Select a input mask mode", visible=True),
-                    gr.update(value="4. Input target image & mask (Iterate clicking or brushing until the target is covered)", visible=True),
-                    gr.update(value="6. View or modify the target mask", visible=True),
-                    gr.update(value="5. Input text prompt (optional)", visible=True),
-                    gr.update(value="7. Submit and view the output", visible=True),
                     gr.update(visible=True, value="User-drawn mask"),
                     gr.update(visible=True),
                     )

                 gr.update(value="<s>Select a input mask mode</s>", visible=False),
                 gr.update(value="<s>Input target image & mask (Iterate clicking or brushing until the target is covered)</s>", visible=False),
                 gr.update(value="<s>View or modify the target mask</s>", visible=False),
+                gr.update(value="3\. Input text prompt (necessary)"),
+                gr.update(value="4\. Submit and view the output"),
                 gr.update(visible=False),
                 gr.update(visible=False),
                     gr.update(interactive=True, visible=True),
                     gr.update(interactive=True, visible=True),
                     gr.update(interactive=True, visible=True),
+                    gr.update(value="3\. Select a input mask mode", visible=True),
+                    gr.update(value="4\. Input target image & mask (Iterate clicking or brushing until the target is covered)", visible=True),
+                    gr.update(value="6\. View or modify the target mask", visible=True),
+                    gr.update(value="5\. Input text prompt (optional)", visible=True),
+                    gr.update(value="7\. Submit and view the output", visible=True),
                     gr.update(visible=True, value="Precise mask"),
                     gr.update(visible=True),
                     )
                     gr.update(interactive=True, visible=True),
                     gr.update(interactive=True, visible=True),
                     gr.update(interactive=True, visible=True),
+                    gr.update(value="3\. Select a input mask mode", visible=True),
+                    gr.update(value="4\. Input target image & mask (Iterate clicking or brushing until the target is covered)", visible=True),
+                    gr.update(value="6\. View or modify the target mask", visible=True),
+                    gr.update(value="5\. Input text prompt (optional)", visible=True),
+                    gr.update(value="7\. Submit and view the output", visible=True),
                     gr.update(visible=True, value="User-drawn mask"),
                     gr.update(visible=True),
                     )

app/ui_components.py CHANGED Viewed

@@ -44,7 +44,7 @@ def create_customization_section():
     with gr.Row():
         # Add a note to remind users to click Clear before starting
         md_custmization_mode = gr.Markdown(
-            "1. Select a Customization Mode\n\n*Tip: Please click the Clear button first to reset all states before starting a new task.*"
         )
     with gr.Row():
         custmization_mode = gr.Radio(
@@ -61,7 +61,7 @@ def create_customization_section():
 def create_image_input_section():
     """Create image input section optimized for left column layout."""
     # Reference image section
-    md_image_reference = gr.Markdown("2. Input reference image")
     with gr.Group():
         image_reference = gr.Image(
             label="Reference Image",
@@ -73,7 +73,7 @@ def create_image_input_section():
         )
     # Input mask mode selection
-    md_input_mask_mode = gr.Markdown("3. Select input mask mode")
     with gr.Group():
         input_mask_mode = gr.Radio(
             ["Precise mask", "User-drawn mask"],
@@ -84,7 +84,7 @@ def create_image_input_section():
         )
     # Target image section
-    md_target_image = gr.Markdown("4. Input target image & mask (Iterate clicking or brushing until the target is covered)")
     # Precise mask mode
     with gr.Group():
@@ -129,7 +129,7 @@ def create_image_input_section():
 def create_prompt_section():
     """Create the text prompt input section with improved layout."""
-    md_prompt = gr.Markdown("5. Input text prompt (optional)")
     with gr.Group():
         prompt = gr.Textbox(
             placeholder="Please input the description for the target scene.",
@@ -243,7 +243,7 @@ def create_advanced_options_section():
 def create_mask_operation_section():
     """Create mask operation section optimized for right column (outputs)."""
-    md_mask_operation = gr.Markdown("6. View or modify the target mask")
     with gr.Group():
         # Mask gallery with responsive layout
@@ -293,7 +293,7 @@ def create_mask_operation_section():
 def create_output_section():
     """Create the output section optimized for right column."""
-    md_submit = gr.Markdown("7. Submit and view the output")
     # Generation controls at top for better workflow
     with gr.Group():

     with gr.Row():
         # Add a note to remind users to click Clear before starting
         md_custmization_mode = gr.Markdown(
+            "1\. Select a Customization Mode\n\n*Tip: Please click the Clear button first to reset all states before starting a new task.*"
         )
     with gr.Row():
         custmization_mode = gr.Radio(
 def create_image_input_section():
     """Create image input section optimized for left column layout."""
     # Reference image section
+    md_image_reference = gr.Markdown("2\. Input reference image")
     with gr.Group():
         image_reference = gr.Image(
             label="Reference Image",
         )
     # Input mask mode selection
+    md_input_mask_mode = gr.Markdown("3\. Select input mask mode")
     with gr.Group():
         input_mask_mode = gr.Radio(
             ["Precise mask", "User-drawn mask"],
         )
     # Target image section
+    md_target_image = gr.Markdown("4\. Input target image & mask (Iterate clicking or brushing until the target is covered)")
     # Precise mask mode
     with gr.Group():
 def create_prompt_section():
     """Create the text prompt input section with improved layout."""
+    md_prompt = gr.Markdown("5\. Input text prompt (optional)")
     with gr.Group():
         prompt = gr.Textbox(
             placeholder="Please input the description for the target scene.",
 def create_mask_operation_section():
     """Create mask operation section optimized for right column (outputs)."""
+    md_mask_operation = gr.Markdown("6\. View or modify the target mask")
     with gr.Group():
         # Mask gallery with responsive layout
 def create_output_section():
     """Create the output section optimized for right column."""
+    md_submit = gr.Markdown("7\. Submit and view the output")
     # Generation controls at top for better workflow
     with gr.Group():

ic_custom/pipelines/ic_custom_pipeline.py CHANGED Viewed

@@ -1,4 +1,4 @@
 import re
 from typing import List, Optional, Union
@@ -128,6 +128,10 @@ class ICCustomPipeline:
         double_blocks_idx: str = None,
         single_blocks_idx: str = None,
         ):
         lora_path = resolve_model_path(
             name=lora_path,
             repo_id_field="repo_id",
@@ -181,6 +185,9 @@ class ICCustomPipeline:
         self.load_model_weights(weights, strict=False)
     def set_img_txt_in(self, img_txt_in_path: str):
         img_txt_in_path = resolve_model_path(
             name=img_txt_in_path,
             repo_id_field="repo_id",
@@ -192,6 +199,9 @@ class ICCustomPipeline:
         self.load_model_weights(weights, strict=False)
     def set_boundary_embeddings(self, boundary_embeddings_path: str):
         boundary_embeddings_path = resolve_model_path(
             name=boundary_embeddings_path,
             repo_id_field="repo_id",
@@ -203,6 +213,9 @@ class ICCustomPipeline:
         self.load_model_weights(weights, strict=False)
     def set_task_register_embeddings(self, task_register_embeddings_path: str):
         task_register_embeddings_path = resolve_model_path(
             name=task_register_embeddings_path,
             repo_id_field="repo_id",

+import os
 import re
 from typing import List, Optional, Union
         double_blocks_idx: str = None,
         single_blocks_idx: str = None,
         ):
+        if not os.path.exists(lora_path):
+            lora_path = "dit_lora_0x1561"
         lora_path = resolve_model_path(
             name=lora_path,
             repo_id_field="repo_id",
         self.load_model_weights(weights, strict=False)
     def set_img_txt_in(self, img_txt_in_path: str):
+        if not os.path.exists(img_txt_in_path):
+            img_txt_in_path = "dit_txt_img_in_0x1561"
         img_txt_in_path = resolve_model_path(
             name=img_txt_in_path,
             repo_id_field="repo_id",
         self.load_model_weights(weights, strict=False)
     def set_boundary_embeddings(self, boundary_embeddings_path: str):
+        if not os.path.exists(boundary_embeddings_path):
+            boundary_embeddings_path = "dit_boundary_embeddings_0x1561"
         boundary_embeddings_path = resolve_model_path(
             name=boundary_embeddings_path,
             repo_id_field="repo_id",
         self.load_model_weights(weights, strict=False)
     def set_task_register_embeddings(self, task_register_embeddings_path: str):
+        if not os.path.exists(task_register_embeddings_path):
+            task_register_embeddings_path = "dit_task_register_embeddings_0x1561"
         task_register_embeddings_path = resolve_model_path(
             name=task_register_embeddings_path,
             repo_id_field="repo_id",

ic_custom/utils/model_utils.py CHANGED Viewed

@@ -206,6 +206,9 @@ def load_dit(
         model: Loaded Flux model
     """
     # Loading Flux
     logger.info("Initializing Flux model")
     # Resolve checkpoint path
@@ -249,9 +252,11 @@ def load_ic_custom(
         model: Loaded IC_Custom model
     """
     logger.info("Initializing IC-Custom model")
     # Resolve checkpoint path
     ckpt_path = resolve_model_path(
         name=name,
         repo_id_field="repo_id",
@@ -312,8 +317,7 @@ def load_embedder(
         path,
         max_length=max_length,
         is_clip=is_clip,
-        torch_dtype=dtype,
-    ).to(device)
     return model
@@ -336,7 +340,11 @@ def load_t5(
     Returns:
         model: Loaded T5 model
     """
     logger.info(f"Loading T5 model: {name}")
     return load_embedder(
         name=name,
         is_clip=False,
@@ -362,7 +370,11 @@ def load_clip(
     Returns:
         model: Loaded CLIP model
     """
     logger.info(f"Loading CLIP model: {name}")
     return load_embedder(
         name=name,
         is_clip=True,
@@ -387,6 +399,10 @@ def load_ae(
     Returns:
         model: Loaded AutoEncoder model
     """
     logger.info(f"Loading AutoEncoder model: {name}")
     # Convert device string to torch.device if needed
@@ -429,6 +445,12 @@ def load_redux(
     Returns:
         model: Loaded Redux Image Encoder model
     """
     logger.info(f"Loading Redux Image Encoder: redux={redux_name}, siglip={siglip_name}")
     # Convert device string to torch.device if needed

         model: Loaded Flux model
     """
     # Loading Flux
+    if not os.path.exists(name):
+        name = "flux-fill-dev-dit"
     logger.info("Initializing Flux model")
     # Resolve checkpoint path
         model: Loaded IC_Custom model
     """
     logger.info("Initializing IC-Custom model")
     # Resolve checkpoint path
+    if not os.path.exists(name):
+        name = "flux-fill-dev-dit"
     ckpt_path = resolve_model_path(
         name=name,
         repo_id_field="repo_id",
         path,
         max_length=max_length,
         is_clip=is_clip,
+    ).to(device).to(dtype)
     return model
     Returns:
         model: Loaded T5 model
     """
+    if not os.path.exists(name):
+        name = "t5-v1_1-xxl"
     logger.info(f"Loading T5 model: {name}")
     return load_embedder(
         name=name,
         is_clip=False,
     Returns:
         model: Loaded CLIP model
     """
+    if not os.path.exists(name):
+        name = "clip-vit-large-patch14"
     logger.info(f"Loading CLIP model: {name}")
     return load_embedder(
         name=name,
         is_clip=True,
     Returns:
         model: Loaded AutoEncoder model
     """
+    if not os.path.exists(name):
+        name = "flux-fill-dev-ae"
     logger.info(f"Loading AutoEncoder model: {name}")
     # Convert device string to torch.device if needed
     Returns:
         model: Loaded Redux Image Encoder model
     """
+    if not os.path.exists(redux_name):
+        redux_name = "flux1-redux-dev"
+    if not os.path.exists(siglip_name):
+        siglip_name = "siglip-so400m-patch14-384"
     logger.info(f"Loading Redux Image Encoder: redux={redux_name}, siglip={siglip_name}")
     # Convert device string to torch.device if needed