Virtual-Try-On

Running on Zero

App Files Files Community

parokshsaxena committed on Jun 30

Commit

5ca0873

•

1 Parent(s): d3da15b

intensity transfer instead of color

Browse files

Files changed (2) hide show

app.py +5 -3
src/background_processor.py +52 -0

app.py CHANGED Viewed

@@ -153,9 +153,7 @@ def start_tryon(human_img_dict,garm_img,garment_des, background_img, is_checked,
     #human_img_orig = human_img_dict["background"].convert("RGB")   # ImageEditor
     human_img_orig = human_img_dict.convert("RGB")     # Image
-    if background_img:
-        human_img_orig = BackgroundProcessor.color_transfer(human_img_orig, background_img)
     """
     # Derive HEIGHT & WIDTH such that width is not more than 1000. This will cater to both Shein images (4160x6240) of 3:4 AR and model standard images ( 768x1024 ) of 2:3 AR
@@ -186,6 +184,10 @@ def start_tryon(human_img_dict,garm_img,garment_des, background_img, is_checked,
     else:
         human_img = human_img_orig.resize((WIDTH, HEIGHT))
     if is_checked:
         # internally openpose_model is resizing human_img to resolution 384 if not passed as input

     #human_img_orig = human_img_dict["background"].convert("RGB")   # ImageEditor
     human_img_orig = human_img_dict.convert("RGB")     # Image
     """
     # Derive HEIGHT & WIDTH such that width is not more than 1000. This will cater to both Shein images (4160x6240) of 3:4 AR and model standard images ( 768x1024 ) of 2:3 AR
     else:
         human_img = human_img_orig.resize((WIDTH, HEIGHT))
+    # Do intensity (lightness) transfer from background image for better image harmonization
+    if background_img:
+        human_img = BackgroundProcessor.intensity_transfer(human_img, background_img)
     if is_checked:
         # internally openpose_model is resizing human_img to resolution 384 if not passed as input

src/background_processor.py CHANGED Viewed

@@ -235,6 +235,11 @@ class BackgroundProcessor:
     @classmethod
     def color_transfer(cls, source_pil: Image, target_pil: Image) -> Image:
         source = ImageFormatConvertor.pil_to_cv2(source_pil)
         target = ImageFormatConvertor.pil_to_cv2(target_pil)
         source = cv2.cvtColor(source, cv2.COLOR_BGR2LAB)
         target = cv2.cvtColor(target, cv2.COLOR_BGR2LAB)
@@ -254,4 +259,51 @@ class BackgroundProcessor:
         res = cv2.cvtColor(result, cv2.COLOR_LAB2BGR)
         res_pil = ImageFormatConvertor.cv2_to_pil(res)
         return res_pil

     @classmethod
     def color_transfer(cls, source_pil: Image, target_pil: Image) -> Image:
         source = ImageFormatConvertor.pil_to_cv2(source_pil)
+        # Resize background image
+        width, height = source_pil.width, source_pil.height
+        target_pil = target_pil.convert("RGB")
+        target_pil = target_pil.resize((width, height))
         target = ImageFormatConvertor.pil_to_cv2(target_pil)
         source = cv2.cvtColor(source, cv2.COLOR_BGR2LAB)
         target = cv2.cvtColor(target, cv2.COLOR_BGR2LAB)
         res = cv2.cvtColor(result, cv2.COLOR_LAB2BGR)
         res_pil = ImageFormatConvertor.cv2_to_pil(res)
+        return res_pil
+    @classmethod
+    def intensity_transfer(cls, source_pil: Image, target_pil: Image, eps: float = 1e-6) -> Image:
+        """
+        Transfers the intensity distribution from the target image to the source image.
+
+        Both images are converted to LAB. The L channel of the source is shifted and
+        scaled so that its mean and standard deviation match those of the target's
+        L channel; the A and B channels of the source are kept unchanged.
+
+        Parameters:
+        source_pil (Image): The source image (foreground) to be harmonized.
+        target_pil (Image): The target image (background) whose intensity distribution is to be matched.
+            It is converted to RGB and resized to the source's width and height first.
+        eps (float): Lower bound applied to the source standard deviation to avoid division by zero
+            when the source L channel is constant.
+        Returns:
+        Image: The intensity-transferred source image.
+        """
+        source = ImageFormatConvertor.pil_to_cv2(source_pil)
+        # Resize background image to the source size
+        width, height = source_pil.width, source_pil.height
+        target_pil = target_pil.convert("RGB")
+        target_pil = target_pil.resize((width, height))
+        target = ImageFormatConvertor.pil_to_cv2(target_pil)
+        source_lab = cv2.cvtColor(source, cv2.COLOR_BGR2LAB)
+        target_lab = cv2.cvtColor(target, cv2.COLOR_BGR2LAB)
+        # Compute the mean and standard deviation of the L channel (intensity) of the source and target images
+        source_mean, source_std = cv2.meanStdDev(source_lab[:, :, 0])
+        target_mean, target_std = cv2.meanStdDev(target_lab[:, :, 0])
+        # Collapse the single-element statistics to plain floats so the arithmetic below stays 2-D
+        source_mean = source_mean.item()
+        target_mean = target_mean.item()
+        target_std = target_std.item()
+        # A flat source L channel has std == 0; clamp it so the scale factor stays finite
+        source_std = max(source_std.item(), eps)
+        # Transfer the intensity (L channel)
+        source_l = source_lab[:, :, 0].astype(np.float64)
+        result_l = (source_l - source_mean) * (target_std / source_std) + target_mean
+        result_l = np.clip(result_l, 0, 255).astype(np.uint8)
+        # Combine the transferred L channel with the original A and B channels
+        result_lab = np.copy(source_lab)
+        result_lab[:, :, 0] = result_l
+        res = cv2.cvtColor(result_lab, cv2.COLOR_LAB2BGR)
+        res_pil = ImageFormatConvertor.cv2_to_pil(res)
         return res_pil