attribute 字段名规范
This commit is contained in:
338
app/service/outfit_matcher/outfit_evaluator.py
Normal file
338
app/service/outfit_matcher/outfit_evaluator.py
Normal file
@@ -0,0 +1,338 @@
|
||||
import io
|
||||
from PIL import Image
|
||||
import cv2
|
||||
import numpy as np
|
||||
import tritonclient.http as httpclient
|
||||
import torch
|
||||
from matplotlib import pyplot as plt, image as mpimg
|
||||
from minio import Minio
|
||||
from torchvision import transforms
|
||||
|
||||
from app.core.config import *
|
||||
from app.service.outfit_matcher.foco import extract_main_colors
|
||||
from app.service.utils.decorator import RunTime
|
||||
|
||||
|
||||
class OutfitMatcher(object):
|
||||
def __init__(self):
|
||||
self.tritonclient = httpclient.InferenceServerClient(url=f"{OM_TRITON_IP}:{OM_TRITON_PORT}")
|
||||
self.minio_client = Minio(
|
||||
f"{MINIO_IP}:{MINIO_PORT}",
|
||||
access_key=MINIO_ACCESS,
|
||||
secret_key=MINIO_SECRET,
|
||||
secure=MINIO_SECURE)
|
||||
|
||||
@staticmethod
|
||||
def pad_array(input_value, value=0):
|
||||
"""pad List of Array into same batch size
|
||||
|
||||
Args:
|
||||
input_value: List of numpy arrary need to be padded
|
||||
|
||||
Returns:
|
||||
Tensor: [batch_dim, max_dim, original_tensor_size]
|
||||
"""
|
||||
max_dim = max([len(x) for x in input_value])
|
||||
mask = np.zeros((len(input_value), max_dim), dtype=np.float32)
|
||||
|
||||
# Pad each array
|
||||
padded_arrays = []
|
||||
for i, array in enumerate(input_value):
|
||||
# Compute padding amount along the pad dimension
|
||||
pad_dim = max_dim - array.shape[0]
|
||||
consistent_shape = array.shape[1:]
|
||||
pad_widths = [(0, pad_dim)] + [(0, 0)] * len(consistent_shape)
|
||||
padded_array = np.pad(array, pad_widths, mode='constant', constant_values=value)
|
||||
padded_arrays.append(padded_array)
|
||||
|
||||
mask[i, array.shape[0]:] = float("-inf")
|
||||
|
||||
# Stack the padded arrays and change the dimension
|
||||
batched_arrays = np.stack(padded_arrays, axis=0)
|
||||
return batched_arrays, mask
|
||||
|
||||
@staticmethod
|
||||
def imnormalize(img, mean, std, to_rgb=True):
|
||||
"""Normalize an image with mean and std.
|
||||
|
||||
Args:
|
||||
img (ndarray): Image to be normalized.
|
||||
mean (ndarray): The mean to be used for normalize.
|
||||
std (ndarray): The std to be used for normalize.
|
||||
to_rgb (bool): Whether to convert to rgb.
|
||||
|
||||
Returns:
|
||||
ndarray: The normalized image.
|
||||
"""
|
||||
img = img.copy().astype(np.float32)
|
||||
assert img.dtype != np.uint8
|
||||
mean = np.float64(mean.reshape(1, -1))
|
||||
stdinv = 1 / np.float64(std.reshape(1, -1))
|
||||
if to_rgb:
|
||||
cv2.cvtColor(img, cv2.COLOR_BGR2RGB, img) # inplace
|
||||
cv2.subtract(img, mean, img) # inplace
|
||||
cv2.multiply(img, stdinv, img) # inplace
|
||||
return img
|
||||
|
||||
@RunTime
|
||||
def visualize(self, outfits, scores, topk=5, best=True, output_path=None):
|
||||
# 将outfits和scores按照scores的值进行排序
|
||||
sorted_indices = np.argsort(-scores.flatten() if best else scores.flatten())[:topk] # 使用负号进行降序排序
|
||||
outfits = [outfits[i] for i in sorted_indices] # 最好或最差的五个
|
||||
scores = scores[sorted_indices] # 这五个的分数
|
||||
|
||||
# 是否画出来
|
||||
if output_path:
|
||||
# 设置子图的行列数
|
||||
num_rows = len(outfits)
|
||||
num_cols = max([len(x) for x in outfits]) + 1 # 一个是图片,一个是分数
|
||||
|
||||
# 创建一个新的图像,并指定子图的行列数
|
||||
fig, axes = plt.subplots(num_rows, num_cols, figsize=(8, 15))
|
||||
|
||||
title = f"Best {topk} Outfits" if best else f"Worst {topk} Outfits"
|
||||
fig.suptitle(title, fontsize=16)
|
||||
|
||||
# 遍历每套outfit并将其显示在对应的子图中
|
||||
for i, (outfit, score) in enumerate(zip(outfits, scores)):
|
||||
# 显示分数
|
||||
axes[i, 0].text(0.1, 0.5, f"Score: {score[0]:.4f}", fontsize=12)
|
||||
axes[i, 0].axis("off")
|
||||
# 显示图片
|
||||
for j, item in enumerate(outfit):
|
||||
img = mpimg.imread(item['image_path']) # 读取图片
|
||||
axes[i, j + 1].imshow(img) # 在对应的子图中显示图片
|
||||
axes[i, j + 1].axis('off') # 关闭坐标轴
|
||||
axes[i, j + 1].set_title(item["semantic_category"], fontsize=10)
|
||||
for j in range(len(outfit), num_cols):
|
||||
axes[i, j].axis("off")
|
||||
|
||||
# 在每一行的底部添加一条横线
|
||||
axes[i, 0].axhline(y=0, color='black', linewidth=1)
|
||||
# 隐藏最后一行的横线
|
||||
axes[-1, 0].axhline(y=0, color='white', linewidth=1)
|
||||
|
||||
# 调整布局
|
||||
plt.subplots_adjust(wspace=0.1, hspace=0.1)
|
||||
plt.tight_layout()
|
||||
|
||||
if output_path:
|
||||
plt.savefig(output_path)
|
||||
else:
|
||||
plt.show()
|
||||
else:
|
||||
return outfits, scores.numpy().flatten().tolist()
|
||||
|
||||
|
||||
class OutfitMatcherHon(OutfitMatcher):
|
||||
def __init__(self):
|
||||
super().__init__()
|
||||
|
||||
def load_image(self, img_path):
|
||||
try:
|
||||
# 从 MinIO 中获取对象(图像文件)
|
||||
image_data = self.minio_client.get_object(img_path.split("/", 1)[0], img_path.split("/", 1)[1])
|
||||
|
||||
# 读取图像数据并转换为 PIL 图像对象
|
||||
pil_image = Image.open(io.BytesIO(image_data.read()))
|
||||
|
||||
# 将 PIL 图像转换为 NumPy 数组
|
||||
image_array = np.array(pil_image)
|
||||
|
||||
return image_array
|
||||
except Exception as e:
|
||||
print(f"An error occurred: {e}")
|
||||
return None
|
||||
# if 'http' in img_path:
|
||||
# file = requests.get(img_path)
|
||||
# image = cv2.imdecode(np.fromstring(file.content, np.uint8), 1)
|
||||
# image = Image.fromarray(image.astype('uint8'), 'RGB')
|
||||
# else:
|
||||
# image = Image.open(img_path).convert('RGB')
|
||||
# return np.array(image)
|
||||
|
||||
@staticmethod
|
||||
def resize_image(img):
|
||||
"""
|
||||
Args:
|
||||
img: ndarray (height, width, channel)
|
||||
"""
|
||||
resized_img = cv2.resize(img, (224, 224), dst=None, interpolation=1)
|
||||
return resized_img
|
||||
|
||||
def preprocess(self, outfits):
|
||||
outfit_images = []
|
||||
outfit_colors = []
|
||||
for outfit in outfits:
|
||||
images = []
|
||||
colors = []
|
||||
for item in outfit:
|
||||
image = self.load_image(item["image_path"])
|
||||
image = self.resize_image(image)
|
||||
normalized_image = self.imnormalize(image,
|
||||
mean=np.array([208.32996145, 201.28227452, 198.47047691],
|
||||
dtype=np.float32),
|
||||
std=np.array([75.48939648, 80.47423057, 82.21144189],
|
||||
dtype=np.float32))
|
||||
images.append(normalized_image.transpose(2, 0, 1))
|
||||
color = extract_main_colors(image)
|
||||
colors.append(color)
|
||||
images = np.stack(images, axis=0)
|
||||
outfit_images.append(images) # List[(items, 3, 224, 224)]
|
||||
colors = np.stack(colors, axis=0)
|
||||
outfit_colors.append(colors)
|
||||
outfit_images, mask = self.pad_array(outfit_images)
|
||||
outfit_colors, _ = self.pad_array(outfit_colors)
|
||||
return outfit_images, outfit_colors, mask
|
||||
|
||||
def get_result(self, outfits):
|
||||
# start = time.time()
|
||||
image, color, mask = self.preprocess(outfits)
|
||||
# print(start - time.time())
|
||||
# transformed_img = image.astype(np.float32)
|
||||
# 输入集
|
||||
inputs = [
|
||||
httpclient.InferInput("input__0", image.shape, datatype="FP32"),
|
||||
httpclient.InferInput("input__1", color.shape, datatype="FP32"),
|
||||
httpclient.InferInput("input__2", mask.shape, datatype="FP32"),
|
||||
]
|
||||
inputs[0].set_data_from_numpy(image.astype(np.float32), binary_data=True)
|
||||
inputs[1].set_data_from_numpy(color.astype(np.float32), binary_data=True)
|
||||
inputs[2].set_data_from_numpy(mask.astype(np.float32), binary_data=True)
|
||||
# 输出集
|
||||
outputs = [
|
||||
httpclient.InferRequestedOutput("output__0", binary_data=True),
|
||||
]
|
||||
results = self.tritonclient.infer(model_name="outfit_matcher_hon", inputs=inputs, outputs=outputs)
|
||||
# 推理
|
||||
# 取结果
|
||||
inference_output1 = torch.from_numpy(results.as_numpy("output__0"))
|
||||
return inference_output1 # Shape (N, 1)
|
||||
|
||||
|
||||
class OutfitMaterTypeAware(OutfitMatcher):
|
||||
base_fashion_categories = [
|
||||
'accessories', 'all-body', 'bags', 'bottoms', 'hats', 'jewellery',
|
||||
'outerwear', 'scarves', 'shoes', 'sunglasses', 'tops'
|
||||
]
|
||||
|
||||
@RunTime
|
||||
def __init__(self):
|
||||
super().__init__()
|
||||
|
||||
@RunTime
|
||||
# TODO 用多线程读图片
|
||||
def load_image(self, img_path):
|
||||
try:
|
||||
# 从 MinIO 中获取对象(图像文件)
|
||||
image_data = self.minio_client.get_object(img_path.split("/", 1)[0], img_path.split("/", 1)[1])
|
||||
|
||||
# 读取图像数据并转换为 PIL 图像对象
|
||||
pil_image = Image.open(io.BytesIO(image_data.data)).convert("RGB")
|
||||
|
||||
# 将 PIL 图像转换为 NumPy 数组
|
||||
# image_array = np.array(pil_image)
|
||||
|
||||
return pil_image
|
||||
except Exception as e:
|
||||
print(f"An error occurred: {e}")
|
||||
return None
|
||||
# if 'http' in img_path:
|
||||
# file = requests.get(img_path)
|
||||
# image = cv2.imdecode(np.fromstring(file.content, np.uint8), 1)
|
||||
# image = Image.fromarray(image.astype('uint8'), 'RGB')
|
||||
# else:
|
||||
# image = Image.open(img_path).convert('RGB')
|
||||
# return np.array(image)
|
||||
|
||||
@staticmethod
|
||||
def resize_image(img):
|
||||
"""
|
||||
Args:
|
||||
img: ndarray (height, width, channel)
|
||||
"""
|
||||
image_transforms = transforms.Compose([
|
||||
transforms.Resize(112),
|
||||
transforms.CenterCrop(112),
|
||||
transforms.ToTensor(),
|
||||
transforms.Normalize(mean=[0.485, 0.456, 0.406],
|
||||
std=[0.229, 0.224, 0.225]),
|
||||
])
|
||||
resized_img = image_transforms(img).numpy()
|
||||
return resized_img
|
||||
|
||||
def preprocess(self, outfits):
|
||||
outfit_images = []
|
||||
outfit_categories = []
|
||||
for outfit in outfits:
|
||||
images = []
|
||||
categories = []
|
||||
for item in outfit:
|
||||
image = self.load_image(item["image_path"])
|
||||
image = self.resize_image(image)
|
||||
images.append(image)
|
||||
category = self.base_fashion_categories.index(item["mapped_cate"])
|
||||
categories.append(category)
|
||||
images = np.stack(images, axis=0)
|
||||
outfit_images.append(images) # List[(items, 3, 224, 224)]
|
||||
categories = np.array(categories)
|
||||
outfit_categories.append(categories) # List[(items)]
|
||||
outfit_images, mask = self.pad_array(outfit_images, value=0)
|
||||
outfit_categories, _ = self.pad_array(outfit_categories, value=len(self.base_fashion_categories))
|
||||
return outfit_images, outfit_categories, mask
|
||||
|
||||
@RunTime
|
||||
def get_result(self, outfits):
|
||||
"""Input outfits structure and output scores.
|
||||
Args:
|
||||
outfits: outfits to be evaluated.
|
||||
Example:
|
||||
[
|
||||
[
|
||||
{
|
||||
"item_name": "MSE_57987",
|
||||
"semantic_category": "BOTTOM/PANTS",
|
||||
"image_path": "D:\\PhD_Study\\MIXI\\mitu\\image\\2024 SS\\MSE_57987.jpg",
|
||||
"mapped_cate": "bottoms"
|
||||
},
|
||||
{
|
||||
"item_name": "MPO_SP7712",
|
||||
"semantic_category": "TOP/TANK",
|
||||
"image_path": "D:\\PhD_Study\\MIXI\\mitu\\image\\2024 SS\\MPO_SP7712.jpg",
|
||||
"mapped_cate": "tops"
|
||||
},
|
||||
{
|
||||
"item_name": "MWSS27195",
|
||||
"semantic_category": "OUTERWEAR/GILET",
|
||||
"image_path": "D:\\PhD_Study\\MIXI\\mitu\\image\\2024 SS\\MWSS27195.jpg",
|
||||
"mapped_cate": "outerwear"
|
||||
}
|
||||
],
|
||||
...
|
||||
]
|
||||
Returns:
|
||||
scores: List of float
|
||||
"""
|
||||
image, category, mask = self.preprocess(outfits)
|
||||
client = httpclient.InferenceServerClient(url=f"{OM_TRITON_IP}:{OM_TRITON_PORT}")
|
||||
# 输入集
|
||||
inputs = [
|
||||
httpclient.InferInput("input__0", image.shape, datatype="FP32"),
|
||||
httpclient.InferInput("input__1", category.shape, datatype="INT16"),
|
||||
httpclient.InferInput("input__2", mask.shape, datatype="FP32"),
|
||||
]
|
||||
inputs[0].set_data_from_numpy(image.astype(np.float32), binary_data=True)
|
||||
inputs[1].set_data_from_numpy(category.astype(np.int16), binary_data=True)
|
||||
inputs[2].set_data_from_numpy(mask.astype(np.float32), binary_data=True)
|
||||
# 输出集
|
||||
outputs = [
|
||||
httpclient.InferRequestedOutput("output__0", binary_data=True),
|
||||
httpclient.InferRequestedOutput("output__1", binary_data=True)
|
||||
]
|
||||
results = client.infer(model_name="outfit_matcher_type_aware", inputs=inputs, outputs=outputs)
|
||||
# 推理
|
||||
# 取结果
|
||||
scores = torch.from_numpy(results.as_numpy("output__0")) # Shape (N, 1)
|
||||
features = torch.from_numpy(results.as_numpy("output__1")) # Shape (N, 64)
|
||||
|
||||
return scores, features
|
||||
Reference in New Issue
Block a user