# Forecast4Muses / app.py
# Hanxiao Xiang
# change the title
# c9968b1
# raw
# history blame
# 14.1 kB
import subprocess
# Install the OpenMMLab packages at start-up through the `mim` CLI.
# Each requirement is installed with its own `mim install` invocation, in
# the order listed here.
_MIM_REQUIREMENTS = (
    "mmengine>=0.6.0",
    "mmcv>=2.0.0rc4,<2.1.0",
    "mmdet>=3.0.0,<4.0.0",
    "mmyolo",
    "mmpose",
    "mmpretrain",
)
for _requirement in _MIM_REQUIREMENTS:
    # The requirement is quoted so that the shell does not treat `>` / `<`
    # in the version specifier as redirections.
    _exit_code = subprocess.call(f"mim install '{_requirement}'", shell=True)
    if _exit_code != 0:
        # Installation stays best-effort (no exception), but a failure is
        # reported instead of being silently ignored.
        print(f"warning: `mim install '{_requirement}'` exited with code {_exit_code}")
import numpy as np
import gradio as gr
import requests
import base64
import pandas as pd
import cv2
from typing import Tuple
from PIL import Image
from io import BytesIO
import os
from Model.Model6.model6_inference import main as model6_inferencer
from mmyolo.utils import register_all_modules
# Called once at import time, ahead of any inference call made by the UI.
# NOTE(review): presumably registers mmyolo's components with the OpenMMLab
# registries used by the Model6 inference code - confirm against mmyolo docs.
register_all_modules()
def get_access_token(refatch=False) -> str:
    """Return an access token for the Baidu AI REST API.

    :param refatch: when true, request a fresh token from the Baidu OAuth
        endpoint; when false, return the token cached in this function.
    :return: the access token. If a refresh is requested but fails (network
        error, non-success status, malformed body), the cached token is
        returned so that callers always receive a string.
    """
    # Token cached from an earlier OAuth response; that response reported
    # "expires_in": 2592000 (seconds).
    cached_token = "24.becefee37aba38ea43c546fc154d3016.2592000.1695047067.282335-30479502"
    if not refatch:
        return cached_token

    # client_id is the API key (AK) and client_secret the secret key (SK)
    # issued on the Baidu console.
    # NOTE(review): these credentials are hard-coded in source; consider
    # loading them from configuration instead.
    client_id = '7OtH60uo01ZNYN4yPyahlRSx'
    client_secret = 'D5AxcUpyQyIA7KgPplp7dnz5tM0UIljy'
    query = {
        'grant_type': 'client_credentials',
        'client_id': client_id,
        'client_secret': client_secret,
    }
    try:
        # A timeout keeps a stalled connection from blocking the app forever.
        response = requests.get('https://aip.baidubce.com/oauth/2.0/token',
                                params=query, timeout=10)
        if response:
            fresh_token = response.json().get('access_token')
            if fresh_token:
                return fresh_token
    except (requests.RequestException, ValueError):
        # Network failure or a body that is not valid JSON: fall through to
        # the cached token below.
        pass
    return cached_token
def resize_image(img, max_length=2048, min_length=50) -> Tuple[np.ndarray, bool]:
    """Rescale an image so its sides fit the configured pixel limits.

    The longest side is brought down to ``max_length`` when it exceeds it,
    and the shortest side is brought up to ``min_length`` when it would
    otherwise fall below it. The aspect ratio is preserved, so for extremely
    elongated images both limits cannot hold at once; in that case the
    minimum-side limit takes priority.

    :param img: image from the front end (array with ``shape[0]`` rows and
        ``shape[1]`` columns)
    :param max_length: maximum number of pixels allowed on the longest side
    :param min_length: minimum number of pixels required on the shortest side
    :return: ``(image, resized)`` where ``resized`` tells whether the image
        was rescaled; the input object itself is returned when it was not
    :raises ValueError: if the image has a zero-sized side
    """
    height, width = img.shape[0], img.shape[1]
    longest, shortest = max(height, width), min(height, width)
    if shortest == 0:
        raise ValueError("cannot resize an image with a zero-sized side")

    # Work out ONE scale factor from the original dimensions, so the image
    # is resampled at most once and no check runs against stale sizes.
    scale = 1.0
    if longest > max_length:
        scale = max_length / longest
    # Test the short side as it would be AFTER the scale chosen above.
    if shortest * scale < min_length:
        scale = min_length / shortest
    if scale == 1.0:
        return img, False

    # round() rather than int(): truncation could land one pixel under
    # min_length; max(1, ...) keeps both target dimensions valid.
    new_size = (max(1, round(width * scale)), max(1, round(height * scale)))
    # cv2.resize takes the target size as (width, height).
    return cv2.resize(img, new_size), True
def model1_det(x):
    """Detect people in an image and outline each detected person.

    :param x: image from the front end as a numpy.ndarray.
        NOTE(review): treated as RGB, matching how the background-removal
        model in this file converts RGB to BGR before encoding - confirm.
    :return: ``(image, message)`` - the input image with a red box drawn
        around every detected person (drawn in place), and a status message
        stating how many people were detected
    :raises RuntimeError: if the image cannot be encoded, the HTTP request
        fails, or the API response lacks the detection fields
    """

    def _Baidu_det(img):
        """Call the Baidu body-attribute endpoint for one image.

        :param img: image as a numpy.ndarray
        :return: the decoded JSON response (a dict)
        """
        request_url = "https://aip.baidubce.com/rest/2.0/image-classify/v1/body_attr"
        # OpenCV encoders expect BGR channel order, so convert first;
        # otherwise red and blue are swapped in the uploaded picture.
        bgr_image = cv2.cvtColor(img, cv2.COLOR_RGB2BGR)
        # Encode in memory rather than through a shared 'test.jpg' file,
        # which leaked a file handle and could be overwritten by a
        # concurrent request.
        encoded_ok, jpeg_buffer = cv2.imencode('.jpg', bgr_image)
        if not encoded_ok:
            raise RuntimeError("failed to encode the image as JPEG")
        b64_image = base64.b64encode(jpeg_buffer.tobytes())
        # The image plus the twelve attributes requested from the API.
        params = {
            "image": b64_image,
            "type": "gender,age,upper_wear,lower_wear,upper_color,lower_color,"
                    "orientation,upper_cut,lower_cut,side_cut,occlusion,is_human"
        }
        access_token = get_access_token()
        request_url = request_url + "?access_token=" + access_token
        headers = {'content-type': 'application/x-www-form-urlencoded'}
        response = requests.post(request_url, data=params, headers=headers)
        if not response:
            raise RuntimeError(f"body_attr request failed with HTTP status {response.status_code}")
        payload = response.json()
        if 'person_num' not in payload or 'person_info' not in payload:
            # No detection fields in the body: report what came back.
            raise RuntimeError(f"body_attr returned no detection result: {payload}")
        return payload

    def _get_attributes_list(r) -> dict:
        """Build one attribute table per detected person.

        :param r: JSON dict returned by the body-attribute endpoint
        :return: dict mapping the person index to a DataFrame with the
            columns ``attribute``, ``attribute_value`` and ``accuracy``
        """
        columns = ['attribute', 'attribute_value', 'accuracy']
        print('person_num:', r['person_num'])
        tables = {}
        for human_idx, person in enumerate(r['person_info']):
            rows = [[key, value['name'], value['score']]
                    for key, value in person['attributes'].items()]
            tables[human_idx] = pd.DataFrame(rows, columns=columns)
        return tables

    def _show_img(img, bboxes):
        """Draw a red rectangle outline for every bounding box, in place.

        :param img: image to draw on
        :param bboxes: dicts with ``left``, ``top``, ``width``, ``height``
        :return: the same image object with the outlines drawn
        """
        img_h, img_w = img.shape[0], img.shape[1]
        # At least one pixel, so small images (< 400 px) still get a box.
        line_width = max(1, int(max(img_w, img_h) / 400))
        color = [255, 0, 0]
        for bbox in bboxes:
            # Clamp to the image so boxes touching or crossing the border
            # neither raise nor wrap around via negative indices.
            left = max(0, int(bbox['left']))
            top = max(0, int(bbox['top']))
            right = min(img_w, int(bbox['left'] + bbox['width']))
            bottom = min(img_h, int(bbox['top'] + bbox['height']))
            if right <= left or bottom <= top:
                continue
            img[top:top + line_width, left:right] = color                # top edge
            img[max(top, bottom - line_width):bottom, left:right] = color  # bottom edge
            img[top:bottom, left:left + line_width] = color              # left edge
            img[top:bottom, max(left, right - line_width):right] = color   # right edge
        return img

    result = _Baidu_det(x)
    # The per-person attribute tables are built but not displayed: the
    # DataFrame output for this tab is commented out in the UI definition.
    HAs_list = _get_attributes_list(result)
    locations = [person['location'] for person in result['person_info']]
    return _show_img(x, locations), f"模型检测到的人数为:{result['person_num']}人"
def model2_rem(x):
    """Remove the background of an image via the Baidu body-segmentation API.

    :param x: image from the front end (RGB numpy.ndarray; it is converted
        from RGB to BGR before being JPEG-encoded)
    :return: ``(image, message)`` - the foreground image returned by the API
        as a numpy.ndarray, and a status message saying whether the input
        had to be resized before upload
    :raises RuntimeError: if the image cannot be encoded, the HTTP request
        fails, or the response carries no foreground image
    """

    def _Baidu_rem(img):
        """Send one image to the body_seg endpoint and decode the foreground.

        :param img: RGB image as a numpy.ndarray
        :return: the decoded foreground image as a numpy.ndarray
        """
        request_url = "https://aip.baidubce.com/rest/2.0/image-classify/v1/body_seg"
        bgr_image = cv2.cvtColor(img, cv2.COLOR_RGB2BGR)
        # Encode in memory rather than through a shared 'test.jpg' file,
        # which leaked a file handle and could be overwritten by a
        # concurrent request.
        encoded_ok, jpeg_buffer = cv2.imencode('.jpg', bgr_image)
        if not encoded_ok:
            raise RuntimeError("failed to encode the image as JPEG")
        params = {"image": base64.b64encode(jpeg_buffer.tobytes())}
        access_token = get_access_token()
        request_url = request_url + "?access_token=" + access_token
        headers = {'content-type': 'application/x-www-form-urlencoded'}
        response = requests.post(request_url, data=params, headers=headers)
        if not response:
            raise RuntimeError(f"body_seg request failed with HTTP status {response.status_code}")
        payload = response.json()
        if "foreground" not in payload:
            # No foreground in the body: report what came back.
            raise RuntimeError(f"body_seg returned no foreground image: {payload}")
        decoded_image = base64.b64decode(payload["foreground"])
        with Image.open(BytesIO(decoded_image)) as image:
            return np.array(image)

    resized_x, was_resized = resize_image(x)
    new_img = _Baidu_rem(resized_x)
    message = "图片尺寸已被修改至合适大小" if was_resized else "图片尺寸无需修改"
    return new_img, message
def model3_ext(x: np.ndarray, num_clusters=12):
    """Extract the dominant colours of an image as a horizontal colour card.

    :param x: image from the front end; the UI supplies it in RGBA mode.
        Pixels whose alpha value is below 100 are ignored. A 3-channel image
        is also accepted, in which case every pixel is used.
    :param num_clusters: number of K-means clusters (dominant colours)
    :return: ``(card, message)`` - a 50-pixel-high image as wide as the
        (possibly resized) input, where each colour occupies a width
        proportional to its share of the pixels, and a status message saying
        whether the input had to be resized
    """
    # TODO: write the colour-name matching algorithm [most important]
    # TODO: change the colour card so it shows colour names and proportions [important]

    def _find_name(color):
        """Look up the name of a colour value (not implemented yet).

        :param color: colour value
        :return: colour name
        """
        pass

    def _cluster(img, NUM_CLUSTERS):
        """Cluster the visible pixels with K-means and draw the colour card.

        :param img: image array with 3 or 4 channels
        :param NUM_CLUSTERS: requested number of clusters
        :return: the colour card (all black if no pixel is visible)
        """
        width, channels = img.shape[1], img.shape[2]
        pixels = img.reshape(-1, channels)
        if channels == 4:
            # Keep only sufficiently opaque pixels (alpha >= 100).
            pixels = pixels[pixels[:, 3] >= 100]
        # cv2.kmeans needs float32 samples; drop any alpha column.
        samples = np.ascontiguousarray(pixels[:, :3], dtype=np.float32)

        card = np.zeros((50, width, 3), dtype=np.uint8)
        requested = int(NUM_CLUSTERS)
        # K-means cannot form more clusters than there are samples.
        k = min(requested, len(samples))
        if k < 1:
            return card

        criteria = (cv2.TERM_CRITERIA_EPS + cv2.TERM_CRITERIA_MAX_ITER, 10, 1.0)
        # The number of attempts equals the requested cluster count, as in
        # the original call.
        _, labels, centers = cv2.kmeans(samples, k, None, criteria,
                                        requested, cv2.KMEANS_RANDOM_CENTERS)
        # Share of the visible pixels assigned to each cluster.
        shares = np.float32(np.bincount(labels.ravel(), minlength=k)) / float(len(samples))
        centers = np.int32(centers)

        x_offset = 0
        # Largest cluster first, laid out left to right.
        for idx in np.argsort(shares)[::-1]:
            dx = int(shares[idx] * width)
            # Channel order follows the input image, so the card uses the
            # same colour space as the input.
            color = tuple(int(value) for value in centers[idx])
            cv2.rectangle(card, (x_offset, 0), (x_offset + dx, 50), color, -1)
            x_offset += dx
        return card

    resized_x, was_resized = resize_image(x)
    card = _cluster(resized_x, num_clusters)
    message = "图片尺寸已被修改至合适大小" if was_resized else "图片尺寸无需修改"
    return card, message
def model4_clo(x_path: str):
    """Run the Model6 inference on an image file and report its prediction.

    :param x_path: path of the uploaded image file
    :return: on success ``(visualization image, result DataFrame, message)``;
        when the inferencer returns a falsy result, the original path, an
        empty DataFrame and a "nothing detected" message
    """

    def _get_result(input_path: str, cls_results: dict) -> pd.DataFrame:
        """Turn the classification results into a one-row table for the web page.

        :param input_path: the (absolute) path of the image
        :param cls_results: results keyed by image file name; the first entry
            for the image supplies ``pred_class`` and ``pred_score``
        :return: a DataFrame holding file name, predicted class and the
            score rounded to two decimals
        """
        file_name = os.path.basename(input_path)
        predicted_class = cls_results[file_name][0]['pred_class']
        predicted_score = round(cls_results[file_name][0]['pred_score'], 2)
        return pd.DataFrame([[file_name, predicted_class, predicted_score]], columns=None)

    # Directory handed to the inferencer for its outputs.
    output_path_root = 'upload_to_web_tmp'
    if not os.path.exists(output_path_root):
        os.mkdir(output_path_root)

    cls_result = model6_inferencer(x_path, output_path_root)
    if not cls_result:
        # TODO: improve the handling of recognition failures (in model6_inference.py) [important]
        return x_path, pd.DataFrame(), "未检测到服装"

    # The rendered visualization is read back from the 'visualizations'
    # sub-directory under the same file name as the input.
    visualization_path = os.path.join(output_path_root, 'visualizations',
                                      os.path.basename(x_path))
    pred_x = np.array(Image.open(visualization_path))
    return pred_x, _get_result(x_path, cls_result), "识别成功!"
# Gradio front end: one tab per model plus a shared status area.
# NOTE(review): the nesting below is reconstructed; confirm the intended
# placement of the widgets inside each row against the deployed layout.
with gr.Blocks() as demo:
    gr.Markdown("# 服装图像识别模块——功能演示")
    # Tab 1: person detection.
    with gr.Tab("人体检测模型"):
        with gr.Row():
            model1_input = gr.Image(height=400)
            model1_output_img = gr.Image(height=400)
            # model1_output_df = gr.DataFrame()
        model1_button = gr.Button("开始检测")
    # Tab 2: background removal.
    with gr.Tab("背景消除模型"):
        with gr.Row():
            model2_input = gr.Image(height=400)
            model2_output_img = gr.Image(height=400)
        model2_button = gr.Button("开始消除")
    # Tab 3: dominant-colour extraction; the input is requested in RGBA mode.
    with gr.Tab('主色调提取'):
        with gr.Row():
            with gr.Column():
                # TODO: try reworking the front end along the lines of the "Mona Lisa" example [not important]
                # TODO: adjust the layout to make it look better [moderately important]
                model3_input = gr.Image(height=400, image_mode='RGBA')
                model3_slider = gr.Slider(minimum=1, maximum=20, step=1, value=12,
                                          min_width=400, label="聚类数量")
            model3_output_img = gr.Image(height=400)
        model3_button = gr.Button("开始提取")
    # Tab 4: silhouette recognition; the input is passed to the handler as a file path.
    with gr.Tab("廓形识别"):
        with gr.Row():
            model4_input = gr.Image(height=400, type="filepath")
            model4_output_img = gr.Image(height=400)
            model4_output_df = gr.DataFrame(headers=['img_name', 'pred_profile', 'pred_score'],
                                            datatype=['str', 'str', 'number'])
        model4_button = gr.Button("开始识别")
    # Collapsible section that shows the status message of the last run.
    with gr.Accordion("模型运行信息"):
        running_info = gr.Markdown("等待输入和运行...")
    # Wire each button to its handler; every handler also updates running_info.
    model1_button.click(model1_det, inputs=model1_input, outputs=[model1_output_img, running_info])
    model2_button.click(model2_rem, inputs=model2_input, outputs=[model2_output_img, running_info])
    model3_button.click(model3_ext, inputs=[model3_input, model3_slider], outputs=[model3_output_img, running_info])
    model4_button.click(model4_clo, inputs=model4_input, outputs=[model4_output_img, model4_output_df, running_info])
demo.launch()