# app/service/generate_image/utils/image_processing.py

import logging

import cv2
import mmcv
import numpy as np
import torch
import tritonclient.http as httpclient
import torch.nn.functional as F
from app.core.config import *
import cv2

logger = logging.getLogger()


def seg_preprocess(img_path):
    """Load an image and convert it into a normalized, channel-first batch.

    Args:
        img_path: Passed straight to ``mmcv.imread``.

    Returns:
        tuple: ``(batch, ori_shape)``. ``batch`` is the image resized to
        ``(224, 224)``, normalized with fixed per-channel mean/std (with
        ``to_rgb=True``), transposed from HWC to CHW and given a leading
        axis of length one. ``ori_shape`` is the first two entries of the
        loaded image's shape, taken before resizing.
    """
    source = mmcv.imread(img_path)
    ori_shape = source.shape[:2]

    # imresize also reports the two scale factors; nothing downstream uses them.
    resized, _w_scale, _h_scale = mmcv.imresize(source, (224, 224), return_scale=True)

    channel_mean = np.array([123.675, 116.28, 103.53])
    channel_std = np.array([58.395, 57.12, 57.375])
    normalized = mmcv.imnormalize(resized, mean=channel_mean, std=channel_std, to_rgb=True)

    channel_first = normalized.transpose(2, 0, 1)
    return np.expand_dims(channel_first, axis=0), ori_shape


def get_mask(image_obj):
    """Build a uint8 mask from the largest contour found in an image.

    A 2-D input is expanded to three channels first. For a four-channel
    input the fourth channel is split off and AND-ed into the final mask,
    and only the first three channels are kept as the image.

    Args:
        image_obj: Image array with 2 dimensions, or 3 dimensions whose last
            axis has 3 or 4 entries.

    Returns:
        tuple: ``(image, mask)`` where ``image`` is the three-channel image
        and ``mask`` has the image's height and width. The mask is 255
        inside the simplified largest contour and 0 elsewhere; when no
        contour is found it is 255 everywhere (before any fourth-channel
        AND).
    """
    fourth_channel = None
    if image_obj.ndim == 2:
        image_obj = cv2.cvtColor(image_obj, cv2.COLOR_GRAY2RGB)
    if image_obj.shape[2] == 4:  # four-channel input: split off the last channel
        fourth_channel = image_obj[:, :, 3]
        image_obj = image_obj[:, :, :3]

    plane_shape = image_obj.shape[:2]
    candidates = get_contours(image_obj)
    if len(candidates):
        # get_contours sorts by area descending, so the first entry is the largest.
        largest = candidates[0]
        tolerance = 0.001 * cv2.arcLength(largest, True)
        simplified = cv2.approxPolyDP(largest, tolerance, True)
        contour_mask = np.zeros(plane_shape, np.uint8)
        cv2.drawContours(contour_mask, [simplified], -1, 255, -1)
    else:
        contour_mask = np.full(plane_shape, 255, np.uint8)

    if fourth_channel is None:
        return image_obj, contour_mask
    return image_obj, cv2.bitwise_and(contour_mask, fourth_channel)


def get_contours(image):
    """Return the external contours of an image, largest area first.

    Args:
        image: Three-channel image; converted to grayscale with
            ``cv2.COLOR_BGR2GRAY``.

    Returns:
        list: Contours from ``cv2.findContours`` (``RETR_EXTERNAL``,
        ``CHAIN_APPROX_SIMPLE``) sorted by ``cv2.contourArea`` in
        descending order.
    """
    grayscale = cv2.cvtColor(image, cv2.COLOR_BGR2GRAY)
    edge_map = cv2.Canny(grayscale, 10, 150)

    # Dilate then erode with the same 5x5 kernel (a morphological close).
    structuring = np.ones((5, 5), np.uint8)
    thickened = cv2.dilate(edge_map, kernel=structuring, iterations=1)
    closed = cv2.erode(thickened, kernel=structuring, iterations=1)

    found, _hierarchy = cv2.findContours(closed, cv2.RETR_EXTERNAL, cv2.CHAIN_APPROX_SIMPLE)
    ordered = list(found)
    ordered.sort(key=cv2.contourArea, reverse=True)
    return ordered


def seg_infer_image(image_obj):
    """Run the segmentation model on an image through the Triton HTTP client.

    The image is preprocessed with ``seg_preprocess``, sent as an FP32
    tensor to the model described by ``SEGMENTATION`` at ``SEG_MODEL_URL``,
    and the returned output is passed through ``seg_postprocess``.

    Args:
        image_obj: Forwarded to ``seg_preprocess``.

    Returns:
        The value returned by ``seg_postprocess`` for the model output and
        the original image shape.
    """
    batch, ori_shape = seg_preprocess(image_obj)
    triton = httpclient.InferenceServerClient(url=f"{SEG_MODEL_URL}")
    payload = batch.astype(np.float32)

    # Input set
    model_input = httpclient.InferInput(SEGMENTATION['input'], payload.shape, datatype="FP32")
    model_input.set_data_from_numpy(payload, binary_data=True)

    # Output set
    requested_output = httpclient.InferRequestedOutput(SEGMENTATION['output'], binary_data=True)

    # Run inference
    response = triton.infer(
        model_name=SEGMENTATION['name'],
        inputs=[model_input],
        outputs=[requested_output],
    )

    # Fetch the result
    raw_output = torch.from_numpy(response.as_numpy(SEGMENTATION['output']))
    return seg_postprocess(raw_output, ori_shape)


def seg_postprocess(output, ori_shape):
    """Resize model output to the original size and pick a label per pixel.

    Args:
        output: Tensor accepted by ``F.interpolate`` in ``bilinear`` mode;
            dimension 1 is the one softmax/argmax are taken over.
        ori_shape: Target spatial size handed to ``F.interpolate``.

    Returns:
        numpy.ndarray: Index of the largest softmax value along dimension 1
        of the resized tensor (that dimension is removed by the argmax).
    """
    resized = F.interpolate(output, size=ori_shape, mode='bilinear', align_corners=False)
    probabilities = F.softmax(resized, dim=1)
    labels = torch.argmax(probabilities, dim=1)
    return labels.cpu().numpy()


def remove_background(image):
    """Replace everything outside the selected segmentation classes with white.

    The contour mask from ``get_mask`` is combined with the pixels that
    ``seg_infer_image`` labels 1 or 2; pixels outside that combined mask
    are set to 255 in every channel.

    Args:
        image: Forwarded to ``get_mask``.

    Returns:
        numpy.ndarray: The three-channel image returned by ``get_mask`` with
        unselected pixels replaced by 255.
    """
    image_obj, mask = get_mask(image)
    seg_result = seg_infer_image(image_obj)

    def _masked_label(label):
        # Keep contour-mask pixels whose predicted label matches; if the
        # product picked up a leading axis from seg_result, drop it.
        selected = mask * (seg_result == label).astype(np.uint8)
        return selected[0] if selected.ndim > 2 else selected

    # Labels 1 and 2 are the "front" and "back" classes in the original code.
    result_mask = _masked_label(1) + _masked_label(2)

    keep = result_mask[:, :, None].astype(bool)
    white_background = np.ones_like(image_obj) * 255
    return np.where(keep, image_obj, white_background)


def bounding_box(image):
    """Crop an image to the rectangle that encloses all detected contours.

    Edges are found with ``cv2.Canny(image, 50, 150)``, external contours
    are extracted, and the union of their bounding rectangles is used as
    the crop window.

    Args:
        image: Image array accepted by ``cv2.Canny``.

    Returns:
        numpy.ndarray: ``image[y_min:y_max, x_min:x_max]`` for the enclosing
        rectangle. If no contour is found, the input image is returned
        uncropped.
    """
    edges = cv2.Canny(image, 50, 150)
    # Find contours
    contours, _ = cv2.findContours(edges, cv2.RETR_EXTERNAL, cv2.CHAIN_APPROX_SIMPLE)

    # With no contours there is no rectangle to crop to. Previously the
    # bounds stayed at float('inf') and the slice below raised TypeError.
    if len(contours) == 0:
        return image

    # Grow one large rectangle that encloses every contour's bounding rectangle.
    rects = [cv2.boundingRect(contour) for contour in contours]
    x_min = min(x for x, _, _, _ in rects)
    y_min = min(y for _, y, _, _ in rects)
    x_max = max(x + w for x, _, w, _ in rects)
    y_max = max(y + h for _, y, _, h in rects)

    # Crop the original image to the enclosing rectangle.
    return image[y_min:y_max, x_min:x_max]


def stain_detection(image, spot_size=100):
    """Check that the two top corners of an image are entirely white.

    Args:
        image: Three-dimensional image array; each pixel is compared
            against ``[255, 255, 255]``.
        spot_size: Side length, in pixels, of the square corner regions.

    Returns:
        tuple: ``(False, None)`` as soon as a checked corner does not
        contain exactly ``spot_size * spot_size`` white pixels; otherwise
        ``(True, image)``. When ``DEBUG`` is truthy the returned image has
        red-channel-last ``(0, 0, 255)`` rectangles drawn on it in place.
    """
    height, width, _ = image.shape

    # Only the top two corners are inspected; the bottom corners are
    # intentionally not part of the check.
    corners = [
        image[0:spot_size, 0:spot_size],  # top left
        image[0:spot_size, width - spot_size:width],  # top right
    ]

    for index, corner in enumerate(corners):
        num_white_pixels = (corner == [255, 255, 255]).all(axis=2).sum()
        if num_white_pixels != spot_size * spot_size:
            logger.info(f"第{index + 1}发现了污点")
            return False, None

    if DEBUG:
        # Corner origins are listed as (row, col). cv2.rectangle expects
        # points as (x, y) == (col, row), so swap when drawing; passing
        # (row, col) directly misplaced the boxes on non-square images.
        corner_origins = [
            (0, 0),
            (0, width - spot_size),
            (height - spot_size, 0),
            (height - spot_size, width - spot_size),
        ]
        for row, col in corner_origins:
            cv2.rectangle(image, (col, row), (col + spot_size, row + spot_size), (0, 0, 255), 2)

    return True, image


def generate_category_recognition(image, gender):
    """Classify a garment image into a category via the Triton model.

    The image is resized to ``(224, 224)``, normalized, and sent to the
    ``attr_retrieve_category`` model at ``ATT_TRITON_URL``. The label is
    looked up in the ``labelName`` column of the CSV at ``CATEGORY_PATH``
    using the position of the highest score among the first five scores.

    Args:
        image: Passed to ``mmcv.imread``; also returned unchanged.
        gender: When equal to ``"Male"`` the label is collapsed into
            ``'Bottoms'``, ``'Tops'`` or ``'Outwear'``.

    Returns:
        tuple: ``(category, scores, image)`` where ``scores`` is the model
        output as a NumPy array.
    """

    def _to_model_input(raw):
        # Resize, normalize and reorder to a channel-first batch of one.
        loaded = mmcv.imread(raw)
        resized, _w_scale, _h_scale = mmcv.imresize(loaded, (224, 224), return_scale=True)
        normalized = mmcv.imnormalize(
            resized,
            mean=np.array([123.675, 116.28, 103.53]),
            std=np.array([58.395, 57.12, 57.375]),
            to_rgb=True,
        )
        return np.expand_dims(normalized.transpose(2, 0, 1), axis=0)

    preprocessed_img = _to_model_input(image)
    triton_client = httpclient.InferenceServerClient(url=ATT_TRITON_URL)

    model_input = httpclient.InferInput("input__0", preprocessed_img.shape, datatype="FP32")
    model_input.set_data_from_numpy(preprocessed_img, binary_data=True)
    results = triton_client.infer(model_name="attr_retrieve_category", inputs=[model_input])

    scores = torch.from_numpy(results.as_numpy('output__0')).detach().numpy()

    import pandas as pd

    attr_type = pd.read_csv(CATEGORY_PATH)
    label_names = list(attr_type['labelName'])

    # Value is not used; the lookup is retained so a CSV without a
    # 'taskName' column still fails here exactly as before.
    _unused_task = attr_type['taskName'][0]

    # Best score among the first five entries of row 0, then the column
    # index of the first position in `scores` holding that value.
    best_score = np.max(scores[0][:5])
    matching_columns = np.argwhere(scores == best_score)[:, 1]
    category = label_names[matching_columns[0]]

    if gender == "Male":
        male_groups = {
            'Trousers': 'Bottoms',
            'Skirt': 'Bottoms',
            'Blouse': 'Tops',
            'Dress': 'Tops',
        }
        category = male_groups.get(category, 'Outwear')
    return category, scores, image
feat 新增生成sketch时对图片清理背景，剔除带有污点的结果图 2024-04-23 14:59:47 +08:00			`import logging`

feat generate 迁移 2024-04-15 18:07:25 +08:00			`import cv2`
			`import mmcv`
			`import numpy as np`
			`import torch`
			`import tritonclient.http as httpclient`
			`import torch.nn.functional as F`
			`from app.core.config import *`
feat 新增生成sketch时对图片清理背景，剔除带有污点的结果图 2024-04-23 14:59:47 +08:00			`import cv2`

			`logger = logging.getLogger()`
feat generate 迁移 2024-04-15 18:07:25 +08:00

			`def seg_preprocess(img_path):`
			`img = mmcv.imread(img_path)`
			`ori_shape = img.shape[:2]`
			`img_scale = (224, 224)`
			`scale_factor = []`
			`img, x, y = mmcv.imresize(img, img_scale, return_scale=True)`
			`scale_factor.append(x)`
			`scale_factor.append(y)`
			`img = mmcv.imnormalize(img, mean=np.array([123.675, 116.28, 103.53]), std=np.array([58.395, 57.12, 57.375]), to_rgb=True)`
			`preprocessed_img = np.expand_dims(img.transpose(2, 0, 1), axis=0)`
			`return preprocessed_img, ori_shape`


			`def get_mask(image_obj):`
			`pre_mask = None`
			`if len(image_obj.shape) == 2:`
			`image_obj = cv2.cvtColor(image_obj, cv2.COLOR_GRAY2RGB)`
			`if image_obj.shape[2] == 4: # 如果是四通道 mask`
			`pre_mask = image_obj[:, :, 3]`
			`image_obj = image_obj[:, :, :3]`

			`Contour = get_contours(image_obj)`
			`Mask = np.zeros(image_obj.shape[:2], np.uint8)`
			`if len(Contour):`
			`Max_contour = Contour[0]`
			`Epsilon = 0.001 * cv2.arcLength(Max_contour, True)`
			`Approx = cv2.approxPolyDP(Max_contour, Epsilon, True)`
			`cv2.drawContours(Mask, [Approx], -1, 255, -1)`
			`else:`
			`Mask = np.ones(image_obj.shape[:2], np.uint8) * 255`

			`if pre_mask is None:`
			`mask = Mask`
			`else:`
			`mask = cv2.bitwise_and(Mask, pre_mask)`
			`return image_obj, mask`


			`def get_contours(image):`
			`gray = cv2.cvtColor(image, cv2.COLOR_BGR2GRAY)`
			`Edge = cv2.Canny(gray, 10, 150)`
			`kernel = np.ones((5, 5), np.uint8)`
			`Edge = cv2.dilate(Edge, kernel=kernel, iterations=1)`
			`Edge = cv2.erode(Edge, kernel=kernel, iterations=1)`
			`Contour, _ = cv2.findContours(Edge, cv2.RETR_EXTERNAL, cv2.CHAIN_APPROX_SIMPLE)`
			`Contour = sorted(Contour, key=cv2.contourArea, reverse=True)`
			`return Contour`


			`def seg_infer_image(image_obj):`
			`image, ori_shape = seg_preprocess(image_obj)`
			`client = httpclient.InferenceServerClient(url=f"{SEG_MODEL_URL}")`
			`transformed_img = image.astype(np.float32)`
			`# 输入集`
			`inputs = [`
			`httpclient.InferInput(SEGMENTATION['input'], transformed_img.shape, datatype="FP32")`
			`]`
			`inputs[0].set_data_from_numpy(transformed_img, binary_data=True)`
			`# 输出集`
			`outputs = [`
			`httpclient.InferRequestedOutput(SEGMENTATION['output'], binary_data=True),`
			`]`
			`results = client.infer(model_name=SEGMENTATION['name'], inputs=inputs, outputs=outputs)`
			`# 推理`
			`# 取结果`
			`inference_output1 = torch.from_numpy(results.as_numpy(SEGMENTATION['output']))`
			`seg_result = seg_postprocess(inference_output1, ori_shape)`
			`return seg_result`


			`def seg_postprocess(output, ori_shape):`
			`seg_logit = F.interpolate(output, size=ori_shape, scale_factor=None, mode='bilinear', align_corners=False)`
			`seg_logit = F.softmax(seg_logit, dim=1)`
			`seg_pred = seg_logit.argmax(dim=1)`
			`seg_pred = seg_pred.cpu().numpy()`
			`return seg_pred`


			`def remove_background(image):`
			`image_obj, mask = get_mask(image)`
			`seg_result = seg_infer_image(image_obj)`

			`temp_front = seg_result == 1`
			`front_mask = (mask * (temp_front + 0).astype(np.uint8))`
			`temp_back = seg_result == 2`
			`back_mask = (mask * (temp_back + 0).astype(np.uint8))`

			`if len(front_mask.shape) > 2:`
			`front_mask = front_mask[0]`
			`else:`
			`front_mask = front_mask`

			`if len(back_mask.shape) > 2:`
			`back_mask = back_mask[0]`
			`else:`
			`back_mask = back_mask`

			`result_mask = front_mask + back_mask`
			`white_background = np.ones_like(image_obj) * 255`
feat 新增生成sketch时对图片清理背景，剔除带有污点的结果图 2024-04-23 14:59:47 +08:00			`remove_bg_image = np.where(result_mask[:, :, None].astype(bool), image_obj, white_background)`
			`# cv2.imwrite("source_image", image)`
			`# cv2.imwrite("remove_bg_image", remove_bg_image)`
feat generate 迁移 2024-04-15 18:07:25 +08:00
feat 新增生成sketch时对图片清理背景，剔除带有污点的结果图 2024-04-23 14:59:47 +08:00			`return remove_bg_image`
feat generate 新增背景去除 bounding box 2024-04-23 08:32:14 +08:00
feat 新增生成sketch时对图片清理背景，剔除带有污点的结果图 2024-04-23 14:59:47 +08:00
			`def bounding_box(image):`
			`edges = cv2.Canny(image, 50, 150)`
feat generate 新增背景去除 bounding box 2024-04-23 08:32:14 +08:00			`# 查找轮廓`
			`contours, _ = cv2.findContours(edges, cv2.RETR_EXTERNAL, cv2.CHAIN_APPROX_SIMPLE)`
			`# 初始化包围所有外接矩形的大矩形的坐标`
			`x_min, y_min, x_max, y_max = float('inf'), float('inf'), -1, -1`
			`# 遍历所有外接矩形，更新大矩形的坐标`
			`for contour in contours:`
			`x, y, w, h = cv2.boundingRect(contour)`
			`x_min = min(x_min, x)`
			`y_min = min(y_min, y)`
			`x_max = max(x_max, x + w)`
			`y_max = max(y_max, y + h)`

			`# 根据大矩形的坐标来裁剪原始图像`
			`result_image = image[y_min:y_max, x_min:x_max]`
feat 新增生成sketch时对图片清理背景，剔除带有污点的结果图 2024-04-23 14:59:47 +08:00			`# cv2.imshow("result_image", result_image)`
feat generate 新增背景去除 bounding box 2024-04-23 08:32:14 +08:00			`# cv2.waitKey(0)`
			`return result_image`
feat 新增生成sketch时对图片清理背景，剔除带有污点的结果图 2024-04-23 14:59:47 +08:00

feat generate sketch 污点检测改为顶部两角 2024-04-25 12:33:51 +08:00			`def stain_detection(image, spot_size=100):`
feat 新增生成sketch时对图片清理背景，剔除带有污点的结果图 2024-04-23 14:59:47 +08:00			`height, width, _ = image.shape`

			`corners = [`
			`image[0:spot_size, 0:spot_size], # top left`
			`image[0:spot_size, width - spot_size:width], # top right`
feat generate sketch 污点检测改为顶部两角 2024-04-25 12:29:49 +08:00			`# image[height - spot_size:height, 0:spot_size], # bottom left`
			`# image[height - spot_size:height, width - spot_size:width] # bottom right`
feat 新增生成sketch时对图片清理背景，剔除带有污点的结果图 2024-04-23 14:59:47 +08:00			`]`

			`for index, corner in enumerate(corners):`
			`num_white_pixels = (corner == [255, 255, 255]).all(axis=2).sum()`
			`if num_white_pixels != spot_size * spot_size:`
			`logger.info(f"第{index + 1}发现了污点")`
			`return False, None`

			`if DEBUG:`
			`for corner_coords in [(0, 0), (0, width - spot_size), (height - spot_size, 0), (height - spot_size, width - spot_size)]:`
			`cv2.rectangle(image, corner_coords, (corner_coords[0] + spot_size, corner_coords[1] + spot_size), (0, 0, 255), 2)`

			`return True, image`
feat generate sketch 新增服装类别识别 2024-04-24 11:20:14 +08:00

feat generate sketch 新增服装类别识别 2024-04-24 13:25:17 +08:00			`def generate_category_recognition(image, gender):`
feat generate sketch 新增服装类别识别 2024-04-24 11:20:14 +08:00			`def preprocess(img):`
			`img = mmcv.imread(img)`
			`# ori_shape = img.shape[:2]`
			`img_scale = (224, 224)`
			`scale_factor = []`
			`img, x, y = mmcv.imresize(img, img_scale, return_scale=True)`
			`scale_factor.append(x)`
			`scale_factor.append(y)`
			`img = mmcv.imnormalize(img, mean=np.array([123.675, 116.28, 103.53]), std=np.array([58.395, 57.12, 57.375]), to_rgb=True)`
			`preprocessed_img = np.expand_dims(img.transpose(2, 0, 1), axis=0)`
			`return preprocessed_img`

			`preprocessed_img = preprocess(image)`
			`triton_client = httpclient.InferenceServerClient(url=ATT_TRITON_URL)`

			`inputs = [`
			`httpclient.InferInput("input__0", preprocessed_img.shape, datatype="FP32")`
			`]`
			`inputs[0].set_data_from_numpy(preprocessed_img, binary_data=True)`
			`results = triton_client.infer(model_name="attr_retrieve_category", inputs=inputs)`
			`inference_output = torch.from_numpy(results.as_numpy(f'output__0'))`

			`scores = inference_output.detach().numpy()`
			`import pandas as pd`

			`attr_type = pd.read_csv(CATEGORY_PATH)`
			`colattr = list(attr_type['labelName'])`

			`task = attr_type['taskName'][0]`

			`maxsc = np.max(scores[0][:5])`
			`indexs = np.argwhere(scores == maxsc)[:, 1]`
			`category = colattr[indexs[0]]`

feat generate sketch 新增服装类别识别 2024-04-24 13:25:17 +08:00			`if gender == "Male":`
			`if category == 'Trousers' or category == 'Skirt':`
			`category = 'Bottoms'`
			`elif category == 'Blouse' or category == 'Dress':`
			`category = 'Tops'`
			`else:`
			`category = 'Outwear'`
			`return category, scores, image`