| | import cv2 |
| | import numpy as np |
| | from rembg import remove |
| | from ultralytics import YOLO |
| |
|
| | class ImageProcessor: |
| | def __init__(self, model_path): |
| | self.model = YOLO(model_path) |
| | self.class_names = {0: "upper_clothes", 1: "lower_clothes"} |
| |
|
| | def remove_background(self, image_bytes): |
| | return remove(image_bytes) |
| |
|
| | def process_image(self, image_bytes): |
| | |
| | bg_removed = self.remove_background(image_bytes) |
| | |
| | |
| | nparr = np.frombuffer(bg_removed, np.uint8) |
| | img = cv2.imdecode(nparr, cv2.IMREAD_COLOR) |
| | |
| | |
| | results = self.model.predict(img) |
| | return self._process_masks(results, img) |
| |
|
| | def _process_masks(self, results, img): |
| | segmented = {} |
| | if results[0].masks is not None: |
| | for mask, class_id in zip(results[0].masks.data, results[0].boxes.cls): |
| | class_id = int(class_id.item()) |
| | mask_np = mask.cpu().numpy() |
| | mask_resized = cv2.resize(mask_np, (img.shape[1], img.shape[0]), interpolation=cv2.INTER_NEAREST) |
| | _, binary_mask = cv2.threshold(mask_resized, 0.5, 255, cv2.THRESH_BINARY) |
| | binary_mask = binary_mask.astype(np.uint8) |
| | segmented[self.class_names[class_id]] = binary_mask |
| | return segmented |