From e3a400c9ac795cabb2a2cd72cbdcba134fe71371 Mon Sep 17 00:00:00 2001
From: semnisem <doldori102493@gmail.com>
Date: Sun, 24 Nov 2024 18:36:03 +0900
Subject: [PATCH 1/5] =?UTF-8?q?Fix:=20=ED=95=84=EA=B8=B0=20=EC=A0=9C?=
 =?UTF-8?q?=EA=B1=B0=20=EA=B8=B0=EB=8A=A5=20=EC=82=AC=EC=9A=A9=EC=84=B1=20?=
 =?UTF-8?q?=EA=B0=9C=EC=84=A0?=
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

---
 app/AIProcessor.py | 133 +++++++++++++++++++++++++--------------------
 1 file changed, 73 insertions(+), 60 deletions(-)

diff --git a/app/AIProcessor.py b/app/AIProcessor.py
index 7e9d391..eec3baa 100644
--- a/app/AIProcessor.py
+++ b/app/AIProcessor.py
@@ -62,32 +62,6 @@ def object_detection(self, img):
         logging.info(f'객체 탐지 - {self.indices} 박스에 동그라미 존재')
         return bbox
 
-    def segment_from_points(self, image, user_points, user_labels, bbox,  save_path=None):
-        '''input_point = np.array(user_points)
-        input_label = np.array(user_labels)
-
-        masks_points, scores, logits = self.predictor.predict(
-            point_coords=input_point,
-            point_labels=input_label,
-            multimask_output=False,
-        )'''
-        # filtered_points, filtered_labels = self.remove_points_in_bboxes(user_points, user_labels, bbox)
-        # logging.info(f'2차 마스킹 - 사용자 입력 필터링: from {len(user_points)}개 to {len(filtered_points)}개')
-
-        # results = self.sam_model.predict(source=image, points=filtered_points, labels=filtered_labels)
-        results = self.sam_model.predict(source=image, bboxes=[user_points])
-        mask_points = results[0].masks.data
-
-        masks_np = np.zeros(mask_points.shape[-2:], dtype=np.uint8)
-        for mask in mask_points:
-            mask_np = mask.cpu().numpy().astype(np.uint8) * 255
-            mask_np = mask_np.squeeze()
-            masks_np = cv2.bitwise_or(masks_np, mask_np)
-
-        # cv2.imwrite(save_path, mask_points_uint8)
-        logging.info(f'2차 마스킹 - 사용자 입력에 대해 {len(mask_points)}개 영역으로 세그먼트 완료.')
-        return masks_np
-
     def segment_from_boxes(self, image, bbox, save_path=None):
         '''
         input_boxes = torch.tensor(bbox, device=self.predictor.device)
@@ -117,20 +91,58 @@ def segment_from_boxes(self, image, bbox, save_path=None):
         logging.info(f'1차 마스킹 - 바운딩 박스 {len(mask_boxes)}개 세그먼트 완료.')
         return masks_np
 
+    def segment_from_points(self, image, user_points, user_labels, bbox,  save_path=None):
+        '''input_point = np.array(user_points)
+        input_label = np.array(user_labels)
+
+        masks_points, scores, logits = self.predictor.predict(
+            point_coords=input_point,
+            point_labels=input_label,
+            multimask_output=False,
+        )'''
+        # filtered_points, filtered_labels = self.remove_points_in_bboxes(user_points, user_labels, bbox)
+        # logging.info(f'2차 마스킹 - 사용자 입력 필터링: from {len(user_points)}개 to {len(filtered_points)}개')
+
+        # results = self.sam_model.predict(source=image, points=filtered_points, labels=filtered_labels)
+        results = self.sam_model.predict(source=image, bboxes=[user_points])
+        mask_points = results[0].masks.data
+
+        masks_np = np.zeros(mask_points.shape[-2:], dtype=np.uint8)
+        for mask in mask_points:
+            mask_np = mask.cpu().numpy().astype(np.uint8) * 255
+            mask_np = mask_np.squeeze()
+            masks_np = cv2.bitwise_or(masks_np, mask_np)
+
+        # cv2.imwrite(save_path, mask_points_uint8)
+        logging.info(f'2차 마스킹 - 사용자 입력에 대해 {len(mask_points)}개 영역으로 세그먼트 완료.')
+        return masks_np
+
     def inpainting(self, image, mask_total):
-        # inpainted_image = cv2.inpaint(image.copy(), mask_total, 10, cv2.INPAINT_TELEA)
-        print(mask_total.shape)  # (1893, 1577) with 0 or 255
-        # print(image.shape)  # (1893, 1577, 3)
+        inpainted_image = cv2.inpaint(image.copy(), mask_total, 15, cv2.INPAINT_TELEA)
 
-        inpainted_image = image.copy()
-        inpainted_image[mask_total == 255] = [255, 255, 255]
-        final_image = cv2.convertScaleAbs(inpainted_image, alpha=1.5, beta=10)
+        '''inpainted_image = image.copy()
+        inpainted_image[mask_total == 255] = [255, 255, 255]'''
+        final_image = cv2.convertScaleAbs(inpainted_image, alpha=1.6, beta=10)
         # cv2.imwrite('test_images/inpainted_init.png', inpainted_image)
         # cv2.imwrite('test_images/inpainted_final.png', final_image)
         logging.info('인페인팅 및 후보정 완료.')
 
         return final_image
 
+    def inpaint_from_points(self, image, user_boxes, save_path=None):
+        masks_np = np.zeros(image.shape[:2], dtype=np.uint8)
+        for b in user_boxes:  # 박스 내부 다 채우기(마스킹)
+            minx, miny, maxx, maxy = b
+            masks_np[miny:maxy, minx:maxx] = 255  # 박스 영역을 255로 채움
+
+        # cv2.imwrite(save_path, mask_points_uint8)
+        inpainted_image = image.copy()
+        inpainted_image[masks_np == 255] = [255, 255, 255]
+        # final_image = cv2.convertScaleAbs(inpainted_image, alpha=1.5, beta=10)
+
+        logging.info(f'2차 마스킹 & 인페인팅 - 사용자 입력 {len(user_boxes)}개 영역 인페인팅 완료.')
+        return masks_np, inpainted_image
+
     def combine_alpha(self, image_rgb):
         if self.alpha_channel is not None:  # RGBA
             image_rgba = cv2.merge([image_rgb, self.alpha_channel])
@@ -138,7 +150,7 @@ def combine_alpha(self, image_rgb):
         else:
             return image_rgb
 
-    def process(self, img_bytes, user_points, user_labels, extension='jpg'):
+    def process(self, img_bytes, user_inputs, user_labels, extension='jpg'):
         """ local test 용도 Vs. server test 용도 구분 """
         ### local 용도
         # img_path = img_bytes
@@ -147,6 +159,8 @@ def process(self, img_bytes, user_points, user_labels, extension='jpg'):
         ### server 용도
         buffer = np.frombuffer(img_bytes, dtype=np.uint8)
         image = cv2.imdecode(buffer, cv2.IMREAD_UNCHANGED)
+        image_output = image.copy()
+        logging.info(f"이미지 처리 시작 - 사이즈: {image.shape[:2]}")
 
         ### ready
         #self.load_sam_model()
@@ -156,42 +170,41 @@ def process(self, img_bytes, user_points, user_labels, extension='jpg'):
         ### 1차: Object Detection & Segment by Box
         bbox = self.object_detection(image)
         if len(bbox) > 0:
-            masks_by_box = self.segment_from_boxes(image, bbox, save_path=None)  # 'test_images/seg_box.png'
-            masks_total = cv2.bitwise_or(masks_total, masks_by_box)
+            logging.info("***** 객체 탐지 세그멘테이션 시작 ******")
+            masks_by_yolo = self.segment_from_boxes(image, bbox, save_path=None)  # 'test_images/seg_box.png'
+            masks_total = cv2.bitwise_or(masks_total, masks_by_yolo)
             #logging.info( f"1차 마스킹 후 shape 점검: YOLOv11 감지된 영역 shape: {masks_by_box.shape}, 이미지 영역 shape: {image.shape}")  # (1893, 1577, 3)  (1893, 1577)
         else:
-            masks_by_box = None
+            logging.info("***** 객체 탐지 세그멘테이션 스킵 ******")
+            masks_by_yolo = None
         ### 2차: points arguments by User & Segment by Points
-        if len(user_points) > 0:
-            mask_by_point = self.segment_from_points(image, user_points, user_labels, bbox, save_path=None)  # save_path='test_images/seg_points.png'
-            masks_total = cv2.bitwise_or(masks_total, mask_by_point)
+        if len(user_inputs) > 0:
+            logging.info("***** 사용자 입력 세그멘테이션 시작 ******")
+            # masks_by_user = self.segment_from_points(image, user_inputs, user_labels, bbox, save_path=None)  # save_path='test_images/seg_points.png'
+            # masks_total = cv2.bitwise_or(masks_total, masks_by_user)
+            masks_by_user, image_output = self.inpaint_from_points(image, user_inputs, save_path=None)
+            _, mask_bytes = cv2.imencode("." + extension, image_output)
         else:
-            mask_by_point = None
+            logging.info("***** 사용자 입력 세그멘테이션 스킵 ******")
+            masks_by_user = None
         # cv2.imwrite('test_images/mask_total.png', masks_total)
         if isinstance(masks_total, np.ndarray):
-            image_output = self.inpainting(image, masks_total)
-            logging.info('최종 마스킹 이미지 생성 완료')
+            image_output = self.inpainting(image_output, masks_total)
+            logging.info('***** 인페인팅 수행 완료 ******')
         else:
-            image_output = image
-            logging.info('최종 마스킹이 없거나, numpy 형식의 배열이 아님.')
+            logging.info('입력과 동일한 결과 이미지입니다.')
 
-        # image_input = self.combine_alpha(image_rgb)
-        # image_output = self.combine_alpha(image_output)
         _, input_bytes = cv2.imencode("." + extension, image)
-        _, mask_bytes = cv2.imencode("." + extension, masks_total.astype(np.uint8))
+        # _, mask_bytes = cv2.imencode("." + extension, masks_total.astype(np.uint8))
         _, result_bytes = cv2.imencode("." + extension, image_output)
 
-        if mask_by_point is not None and masks_by_box is not None:
-            _, mask_by_point_bytes = cv2.imencode("." + extension, mask_by_point.astype(np.uint8))
-            _, mask_by_box_bytes = cv2.imencode("." + extension, masks_by_box.astype(np.uint8))
-            return io.BytesIO(input_bytes), io.BytesIO(mask_bytes), io.BytesIO(result_bytes), io.BytesIO(mask_by_box_bytes), io.BytesIO(mask_by_point_bytes)
-        elif mask_by_point is not None:
-            _, mask_by_point_bytes = cv2.imencode("." + extension, mask_by_point.astype(np.uint8))
-            return io.BytesIO(input_bytes), io.BytesIO(mask_bytes), io.BytesIO(result_bytes), None, io.BytesIO(mask_by_point_bytes)
-        elif masks_by_box is not None:
-            _, mask_by_box_bytes = cv2.imencode("." + extension, masks_by_box.astype(np.uint8))
-            return io.BytesIO(input_bytes), io.BytesIO(mask_bytes), io.BytesIO(result_bytes), io.BytesIO(mask_by_box_bytes), None
+        if masks_by_yolo is not None:
+            _, mask_by_yolo_bytes = cv2.imencode("." + extension, masks_by_yolo.astype(np.uint8))
         else:
-            return io.BytesIO(input_bytes), io.BytesIO(mask_bytes), io.BytesIO(result_bytes), None, None
-
-
+            mask_by_yolo_bytes = None
+        if masks_by_user is not None:
+            _, mask_by_user_bytes = cv2.imencode("." + extension, masks_by_user.astype(np.uint8))
+        else:
+            mask_by_user_bytes = None
+        return (io.BytesIO(input_bytes), io.BytesIO(mask_bytes), io.BytesIO(result_bytes),
+                io.BytesIO(mask_by_yolo_bytes), io.BytesIO(mask_by_user_bytes))

From 6c071249e9fa63aea4ddcf0b1a6b2d4fd922c1dd Mon Sep 17 00:00:00 2001
From: semnisem <doldori102493@gmail.com>
Date: Sun, 24 Nov 2024 18:37:22 +0900
Subject: [PATCH 2/5] =?UTF-8?q?Fix:=20=ED=95=84=EA=B8=B0=20=EC=A0=9C?=
 =?UTF-8?q?=EA=B1=B0=20=EA=B8=B0=EB=8A=A5=20=EC=82=AC=EC=9A=A9=EC=84=B1=20?=
 =?UTF-8?q?=EA=B0=9C=EC=84=A0?=
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

---
 app/AIProcessor.py | 1 +
 1 file changed, 1 insertion(+)

diff --git a/app/AIProcessor.py b/app/AIProcessor.py
index eec3baa..5a59ccd 100644
--- a/app/AIProcessor.py
+++ b/app/AIProcessor.py
@@ -187,6 +187,7 @@ def process(self, img_bytes, user_inputs, user_labels, extension='jpg'):
         else:
             logging.info("***** 사용자 입력 세그멘테이션 스킵 ******")
             masks_by_user = None
+            mask_bytes = None
         # cv2.imwrite('test_images/mask_total.png', masks_total)
         if isinstance(masks_total, np.ndarray):
             image_output = self.inpainting(image_output, masks_total)

From c2826801fc249ba0448dd2a1b28baa772b4fdb6b Mon Sep 17 00:00:00 2001
From: semnisem <doldori102493@gmail.com>
Date: Sun, 24 Nov 2024 20:43:05 +0900
Subject: [PATCH 3/5] =?UTF-8?q?Hot-Fix:=20=EC=88=98=EC=A0=95=20process=20?=
 =?UTF-8?q?=ED=95=A8=EC=88=98=20=EC=A0=95=EC=9D=98=20=EB=B0=8F=20=ED=98=B8?=
 =?UTF-8?q?=EC=B6=9C?=
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

---
 app/AIProcessor.py | 2 +-
 app/main.py        | 3 +--
 2 files changed, 2 insertions(+), 3 deletions(-)

diff --git a/app/AIProcessor.py b/app/AIProcessor.py
index 5a59ccd..dfe6196 100644
--- a/app/AIProcessor.py
+++ b/app/AIProcessor.py
@@ -150,7 +150,7 @@ def combine_alpha(self, image_rgb):
         else:
             return image_rgb
 
-    def process(self, img_bytes, user_inputs, user_labels, extension='jpg'):
+    def process(self, img_bytes, user_inputs, extension='jpg'):
         """ local test 용도 Vs. server test 용도 구분 """
         ### local 용도
         # img_path = img_bytes
diff --git a/app/main.py b/app/main.py
index b89c5c0..3dfd2f9 100644
--- a/app/main.py
+++ b/app/main.py
@@ -126,8 +126,7 @@ async def processShape(request: Request):
         # aiProcessor = AIProcessor(yolo_path='/Users/semin/models/yolo11_best.pt', sam_path='/Users/semin/models/mobile_sam.pt')  # local
         aiProcessor = AIProcessor(yolo_path="../models/yolo11_best.pt", sam_path="../models/mobile_sam.pt")  # server
         img_input_bytes, img_mask_bytes, img_output_bytes, one, two = aiProcessor.process(img_bytes=corrected_img_bytes,
-                                                                                          user_points=point_list,
-                                                                                          user_labels=label_list)
+                                                                                          user_inputs=point_list)
         logger.info("AI 필기 제거 프로세스 완료")
 
         upload_image_to_s3(img_input_bytes, paths["input_path"])

From 6eeb3b23402bcbcccd8083643ea9e042a08405f9 Mon Sep 17 00:00:00 2001
From: semnisem <doldori102493@gmail.com>
Date: Sun, 24 Nov 2024 21:11:39 +0900
Subject: [PATCH 4/5] =?UTF-8?q?Feat:=20=EB=B3=80=EA=B2=BD=20=EA=B2=B9?=
 =?UTF-8?q?=EC=B9=9C=20=EB=A7=88=ED=82=B9=20=ED=83=90=EC=A7=80=20=EB=B0=8F?=
 =?UTF-8?q?=20=EC=9D=B8=ED=8E=98=EC=9D=B8=ED=8C=85?=
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

---
 app/AIProcessor.py | 108 ++++++++++++++++++++++++---------------------
 1 file changed, 57 insertions(+), 51 deletions(-)

diff --git a/app/AIProcessor.py b/app/AIProcessor.py
index dfe6196..9e0545d 100644
--- a/app/AIProcessor.py
+++ b/app/AIProcessor.py
@@ -62,17 +62,7 @@ def object_detection(self, img):
         logging.info(f'객체 탐지 - {self.indices} 박스에 동그라미 존재')
         return bbox
 
-    def segment_from_boxes(self, image, bbox, save_path=None):
-        '''
-        input_boxes = torch.tensor(bbox, device=self.predictor.device)
-        transformed_boxes = self.predictor.transform.apply_boxes_torch(input_boxes, image.shape[:2])
-        masks, _, _ = self.predictor.predict_torch(
-            point_coords=None,
-            point_labels=None,
-            boxes=transformed_boxes,
-            multimask_output=False,
-        )
-        '''
+    def segment_from_yolo(self, image, bbox, save_path=None):
         results = self.sam_model.predict(source=image, bboxes=bbox)
         mask_boxes = results[0].masks.data
 
@@ -80,10 +70,11 @@ def segment_from_boxes(self, image, bbox, save_path=None):
         for i, mask in enumerate(mask_boxes):
             mask_np = mask.cpu().numpy().astype(np.uint8) * 255  # True는 255, False는 0으로 변환
             mask_np = mask_np.squeeze()
-            if i in self.indices:
+            '''if i in self.indices:  # 원형 마킹이라면
+                mask_np = cv2.dilate(mask_np, np.ones((3, 3), np.uint8), iterations=1)
                 # kernel = cv2.getStructuringElement(cv2.MORPH_ELLIPSE, (15, 15))  # Adjust size as needed
-                kernel = np.ones((15, 15), np.uint8)
-                mask_np = cv2.morphologyEx(mask_np, cv2.MORPH_GRADIENT, kernel)
+                # kernel = np.ones((15, 15), np.uint8)
+                # mask_np = cv2.morphologyEx(mask_np, cv2.MORPH_GRADIENT, kernel)'''
             masks_np = cv2.bitwise_or(masks_np, mask_np)
             # cv2.imwrite(f'mask_box{i}.jpg', masks_np)
 
@@ -91,20 +82,12 @@ def segment_from_boxes(self, image, bbox, save_path=None):
         logging.info(f'1차 마스킹 - 바운딩 박스 {len(mask_boxes)}개 세그먼트 완료.')
         return masks_np
 
-    def segment_from_points(self, image, user_points, user_labels, bbox,  save_path=None):
-        '''input_point = np.array(user_points)
-        input_label = np.array(user_labels)
-
-        masks_points, scores, logits = self.predictor.predict(
-            point_coords=input_point,
-            point_labels=input_label,
-            multimask_output=False,
-        )'''
+    def segment_from_user(self, image, user_inputs, bbox,  save_path=None):
         # filtered_points, filtered_labels = self.remove_points_in_bboxes(user_points, user_labels, bbox)
         # logging.info(f'2차 마스킹 - 사용자 입력 필터링: from {len(user_points)}개 to {len(filtered_points)}개')
 
         # results = self.sam_model.predict(source=image, points=filtered_points, labels=filtered_labels)
-        results = self.sam_model.predict(source=image, bboxes=[user_points])
+        results = self.sam_model.predict(source=image, bboxes=user_inputs)
         mask_points = results[0].masks.data
 
         masks_np = np.zeros(mask_points.shape[-2:], dtype=np.uint8)
@@ -117,22 +100,38 @@ def segment_from_points(self, image, user_points, user_labels, bbox,  save_path=
         logging.info(f'2차 마스킹 - 사용자 입력에 대해 {len(mask_points)}개 영역으로 세그먼트 완료.')
         return masks_np
 
-    def inpainting(self, image, mask_total):
-        inpainted_image = cv2.inpaint(image.copy(), mask_total, 15, cv2.INPAINT_TELEA)
+    def inpainting(self, image, mask_total, bbox=None):
+
+        mask_total = np.zeros(image.shape[:2], dtype=np.uint8)
+        text_np = np.zeros(image.shape[:2], dtype=np.uint8)  # 전체 roi_mask 저장
+        for b in bbox:
+            minx, miny, maxx, maxy = map(int, b)
+            mask_total[miny:maxy, minx:maxx] = 255  # 박스 영역을 255로 채움
+            roi = image[miny:maxy, minx:maxx]  # 해당 이미지만 크롭
+            roi_mask = cv2.inRange(roi, (0, 0, 0), (45, 45, 45))  # roi 내에서 인쇄된 글씨는 255값
+            text_np[miny:maxy, minx:maxx] = roi_mask
+
+        text_np = cv2.dilate(text_np, np.ones((4, 4), np.uint8), iterations=1)
+        text_np = cv2.erode(text_np, np.ones((2, 2), np.uint8), iterations=2)
+        cv2.imwrite('text_np.jpg', text_np.astype(np.uint8))
+
+        inpainted_image = image.copy()
+        inpainted_image[mask_total == 255] = [255, 255, 255]
+        inpainted_image[text_np == 255] = [30, 30, 30]
+        final_image = cv2.convertScaleAbs(inpainted_image, alpha=1.5, beta=15)
+
 
-        '''inpainted_image = image.copy()
-        inpainted_image[mask_total == 255] = [255, 255, 255]'''
-        final_image = cv2.convertScaleAbs(inpainted_image, alpha=1.6, beta=10)
+        # inpainted_image = cv2.inpaint(image.copy(), mask_total, 15, cv2.INPAINT_TELEA)
         # cv2.imwrite('test_images/inpainted_init.png', inpainted_image)
         # cv2.imwrite('test_images/inpainted_final.png', final_image)
-        logging.info('인페인팅 및 후보정 완료.')
+        logging.info('Yolo 결과 인페인팅 및 후보정 완료.')
 
         return final_image
 
-    def inpaint_from_points(self, image, user_boxes, save_path=None):
+    def inpaint_from_user(self, image, user_boxes, save_path=None):
         masks_np = np.zeros(image.shape[:2], dtype=np.uint8)
         for b in user_boxes:  # 박스 내부 다 채우기(마스킹)
-            minx, miny, maxx, maxy = b
+            minx, miny, maxx, maxy = map(int, b)
             masks_np[miny:maxy, minx:maxx] = 255  # 박스 영역을 255로 채움
 
         # cv2.imwrite(save_path, mask_points_uint8)
@@ -167,45 +166,52 @@ def process(self, img_bytes, user_inputs, extension='jpg'):
         #self.predictor.set_image(image)
         masks_total = np.zeros(image.shape[:2], dtype=np.uint8)
 
-        ### 1차: Object Detection & Segment by Box
+        ### 1차: Segment by Object Detection
         bbox = self.object_detection(image)
         if len(bbox) > 0:
-            logging.info("***** 객체 탐지 세그멘테이션 시작 ******")
-            masks_by_yolo = self.segment_from_boxes(image, bbox, save_path=None)  # 'test_images/seg_box.png'
+            logging.info("***** 1차: 객체 탐지 세그멘테이션 시작 ******")
+            masks_by_yolo = self.segment_from_yolo(image, bbox, save_path=None)  # 'test_images/seg_box.png'
             masks_total = cv2.bitwise_or(masks_total, masks_by_yolo)
-            #logging.info( f"1차 마스킹 후 shape 점검: YOLOv11 감지된 영역 shape: {masks_by_box.shape}, 이미지 영역 shape: {image.shape}")  # (1893, 1577, 3)  (1893, 1577)
         else:
-            logging.info("***** 객체 탐지 세그멘테이션 스킵 ******")
+            logging.info("***** 1차: 객체 탐지 세그멘테이션 스킵 ******")
             masks_by_yolo = None
-        ### 2차: points arguments by User & Segment by Points
+
+
+        ### 2차: Segment by User Prompt
         if len(user_inputs) > 0:
-            logging.info("***** 사용자 입력 세그멘테이션 시작 ******")
-            # masks_by_user = self.segment_from_points(image, user_inputs, user_labels, bbox, save_path=None)  # save_path='test_images/seg_points.png'
-            # masks_total = cv2.bitwise_or(masks_total, masks_by_user)
-            masks_by_user, image_output = self.inpaint_from_points(image, user_inputs, save_path=None)
+            logging.info("***** 2차: 사용자 입력 세그멘테이션 시작 ******")
+            masks_by_user = self.segment_from_user(image, user_inputs, bbox, save_path=None)  # save_path='test_images/seg_points.png'
+            masks_total = cv2.bitwise_or(masks_total, masks_by_user)
+            masks_by_user, image_output = self.inpaint_from_user(image, user_inputs, save_path=None)
             _, mask_bytes = cv2.imencode("." + extension, image_output)
         else:
-            logging.info("***** 사용자 입력 세그멘테이션 스킵 ******")
+            logging.info("***** 2차: 사용자 입력 세그멘테이션 스킵 ******")
             masks_by_user = None
             mask_bytes = None
-        # cv2.imwrite('test_images/mask_total.png', masks_total)
-        if isinstance(masks_total, np.ndarray):
-            image_output = self.inpainting(image_output, masks_total)
+
+        if isinstance(masks_total, np.ndarray) and len(bbox) > 0:
+            image_output = self.inpainting(image_output, masks_total, bbox)
             logging.info('***** 인페인팅 수행 완료 ******')
-        else:
-            logging.info('입력과 동일한 결과 이미지입니다.')
 
         _, input_bytes = cv2.imencode("." + extension, image)
-        # _, mask_bytes = cv2.imencode("." + extension, masks_total.astype(np.uint8))
         _, result_bytes = cv2.imencode("." + extension, image_output)
 
         if masks_by_yolo is not None:
-            _, mask_by_yolo_bytes = cv2.imencode("." + extension, masks_by_yolo.astype(np.uint8))
+            mask_by_yolo_img = image.copy()
+            mask_by_yolo_img[masks_by_yolo == 255] = [0, 0, 0]
+            _, mask_by_yolo_bytes = cv2.imencode("." + extension, mask_by_yolo_img)
         else:
             mask_by_yolo_bytes = None
         if masks_by_user is not None:
-            _, mask_by_user_bytes = cv2.imencode("." + extension, masks_by_user.astype(np.uint8))
+            mask_by_user_img = image.copy()
+            mask_by_user_img[masks_by_user == 255] = [0, 0, 0]
+            _, mask_by_user_bytes = cv2.imencode("." + extension, mask_by_user_img)
         else:
             mask_by_user_bytes = None
+
+        mask_total_img = image.copy()
+        mask_total_img[masks_total == 255] = [0, 0, 0]
+        _, mask_bytes = cv2.imencode("." + extension, mask_total_img)
+
         return (io.BytesIO(input_bytes), io.BytesIO(mask_bytes), io.BytesIO(result_bytes),
                 io.BytesIO(mask_by_yolo_bytes), io.BytesIO(mask_by_user_bytes))

From 2ccb36c992dd0fc25465b8569fc546e124addbad Mon Sep 17 00:00:00 2001
From: semnisem <doldori102493@gmail.com>
Date: Sun, 24 Nov 2024 21:14:22 +0900
Subject: [PATCH 5/5] =?UTF-8?q?Hot-Fix:=20=EC=A0=9C=EA=B1=B0=20=EC=9D=B4?=
 =?UTF-8?q?=EB=AF=B8=EC=A7=80=20=EC=93=B0=EA=B8=B0=20imwrite?=
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

---
 app/AIProcessor.py | 3 +--
 1 file changed, 1 insertion(+), 2 deletions(-)

diff --git a/app/AIProcessor.py b/app/AIProcessor.py
index 9e0545d..f578f5b 100644
--- a/app/AIProcessor.py
+++ b/app/AIProcessor.py
@@ -113,14 +113,13 @@ def inpainting(self, image, mask_total, bbox=None):
 
         text_np = cv2.dilate(text_np, np.ones((4, 4), np.uint8), iterations=1)
         text_np = cv2.erode(text_np, np.ones((2, 2), np.uint8), iterations=2)
-        cv2.imwrite('text_np.jpg', text_np.astype(np.uint8))
+        # cv2.imwrite('text_np.jpg', text_np.astype(np.uint8))
 
         inpainted_image = image.copy()
         inpainted_image[mask_total == 255] = [255, 255, 255]
         inpainted_image[text_np == 255] = [30, 30, 30]
         final_image = cv2.convertScaleAbs(inpainted_image, alpha=1.5, beta=15)
 
-
         # inpainted_image = cv2.inpaint(image.copy(), mask_total, 15, cv2.INPAINT_TELEA)
         # cv2.imwrite('test_images/inpainted_init.png', inpainted_image)
         # cv2.imwrite('test_images/inpainted_final.png', final_image)