4.人脸检测mtcnn+mobilenet戴口罩分类

2023-11-17

#from keras.models import Model,Sequential
import tensorflow as tf
import numpy as np
import cv2
import os
from functools import partial
#from keras.layers import ZeroPadding2D,Depthwise,Conv2D,Activation,BatchNormalization,Concatenate,MaxPool2D,Conv2D,Dense,Dropout,GlobalAveragePooling2D
#from keras.layers import Input,Lambda,MaxPooling2D,add,Reshape,Permute,PReLU,Flatten
from keras import backend as K
import sys
from operator import itemgetter
import math
import matplotlib.pyplot as plt
from keras.models import *
from keras.layers import *
import keras
from keras.callbacks import TensorBoard,ModelCheckpoint,ReduceLROnPlateau,EarlyStopping
from keras.applications.imagenet_utils import preprocess_input
from keras.utils import np_utils,get_file
from PIL import Image
from keras.optimizers import Adam
from matplotlib.colors import rgb_to_hsv, hsv_to_rgb

# 1. Write "<file name>;<class index>" lines (0 = mask, 1 = nomask) to train.txt.
classes = ['mask', 'nomask']
with open('./data/train.txt', 'w') as f:
    for image in os.listdir('./data/image/train'):
        if not image.endswith('jpg'):
            continue
        # The class name is the part of the file name before the first underscore.
        label = classes.index(image.split('_')[0])
        f.write('%s;%d\n' % (image, label))

# 2. Face detection with MTCNN
# 2.1 Build the scale list of the image pyramid
def calculateScales(img):
    """Return the resize factors that make up the image pyramid for ``img``.

    The image is first normalised so that its shorter side is 500 when both
    sides exceed 500, or its longer side is 500 when both sides are below 500.
    Further levels shrink by a factor of 0.709 each until the shorter side
    would fall below 12 pixels.

    Args:
        img: array-like with a three-element ``shape`` of (height, width, channels).

    Returns:
        A list of floats; each one is a scale relative to the original image.
        The list is empty for an image with no pixels.
    """
    # Only the shape is needed, so the image itself is not copied.
    h, w, _ = img.shape
    shorter, longer = min(h, w), max(h, w)
    if longer == 0:
        # A 0x0 input would otherwise divide by zero below.
        return []

    if shorter > 500:
        pr_scale = 500.0 / shorter
    elif longer < 500:
        pr_scale = 500.0 / longer
    else:
        pr_scale = 1.0

    minl = min(int(h * pr_scale), int(w * pr_scale))
    scales = []
    factor = 0.709
    factor_count = 0
    while minl >= 12:
        scales.append(pr_scale * pow(factor, factor_count))
        minl *= factor
        factor_count += 1
    return scales
# 2.2 P-Net: run on every pyramid level to get coarse face probabilities and box offsets
def create_Pnet(weight_path):
    """Build the P-Net model and load its weights from ``weight_path``.

    The network is fully convolutional (the input height and width are left
    unspecified), so it can be applied to images of any size.

    Args:
        weight_path: path of the weight file passed to ``load_weights``.

    Returns:
        A Keras ``Model`` with two outputs: a 2-channel softmax map and a
        4-channel box-regression map.
    """
    inp=Input(shape=[None,None,3])
    x=Conv2D(10,(3,3),strides=1,padding='valid',name='conv1')(inp)
    x=PReLU(shared_axes=[1,2],name='PReLU1')(x)
    x=MaxPool2D(pool_size=2)(x)
    x=Conv2D(16,(3,3),strides=1,padding='valid',name='conv2')(x)
    x=PReLU(shared_axes=[1,2],name='PReLU2')(x)
    x=Conv2D(32,(3,3),strides=1,padding='valid',name='conv3')(x)
    x=PReLU(shared_axes=[1,2],name='PReLU3')(x)
    classifier=Conv2D(2,(1,1),activation='softmax',name='conv4_1')(x)# class prediction per output location
    bbox_regress=Conv2D(4,(1,1),name='conv4_2')(x)# predicted face-box offsets per output location
    model=Model([inp],[classifier,bbox_regress])# both outputs keep their spatial dimensions
    # NOTE(review): weights are loaded with by_name=True, so layer names presumably
    # have to match the names stored in the weight file. 'conv4_1'/'conv4_2' use an
    # underscore while the other nets use hyphens ('conv5-1') - confirm against pnet.h5.
    model.load_weights(weight_path,by_name=True)
    return model# P-Net with the weights from weight_path loaded
# 2.3 Turn one P-Net output map into candidate boxes in original-image coordinates
def detect_face_12net(cls_prob,roi,out_side,scale,width,height,threshold):
    """Convert a P-Net probability map and offset map into face candidates.

    Args:
        cls_prob: 2-D map of face probabilities for one pyramid level.
        roi: 3-D map of box offsets for the same level (last axis has 4 values).
        out_side: longest side of the P-Net output map.
        scale: factor that maps pyramid-level coordinates back to the original image.
        width, height: size of the original image, used to clamp the boxes.
        threshold: minimum face probability for a location to be kept.

    Returns:
        The result of ``NMS(..., 0.3)`` over the clamped ``[x1, y1, x2, y2, score]`` boxes.
    """
    prob_map = np.swapaxes(cls_prob, 0, 1)
    offset_map = np.swapaxes(roi, 0, 2)

    # Step between neighbouring output cells measured in input pixels.
    stride = 0
    if out_side != 1:
        stride = float(2*out_side - 1) / (out_side - 1)

    # Output cells whose face probability passes the threshold.
    xs, ys = np.where(prob_map >= threshold)
    score = np.array([prob_map[xs, ys]]).T

    # Each cell corresponds to a window (presumably 12 px wide, hence +11) in the scaled image.
    cells = np.array([xs, ys]).T
    top_left = np.fix((stride*cells + 0) * scale)
    bottom_right = np.fix((stride*cells + 11) * scale)
    boxes = np.concatenate((top_left, bottom_right), axis=1)

    # Apply the four regressed offsets of the selected cells.
    offset = np.array([offset_map[k][xs, ys] for k in range(4)]).T
    boxes = boxes + offset*12.0*scale

    rectangles = rect2square(np.concatenate((boxes, score), axis=1))

    # Clamp to the image and drop boxes that became empty.
    pick = []
    for rect in rectangles:
        x1 = int(max(0, rect[0]))
        y1 = int(max(0, rect[1]))
        x2 = int(min(width, rect[2]))
        y2 = int(min(height, rect[3]))
        if x2 > x1 and y2 > y1:
            pick.append([x1, y1, x2, y2, rect[4]])
    return NMS(pick, 0.3)
# 2.4 R-Net: P-Net candidates are cropped, resized to 24x24x3 and refined here
def create_Rnet(weight_path):
    """Build the R-Net model (24x24x3 input) and load its weights from ``weight_path``.

    Args:
        weight_path: path of the weight file passed to ``load_weights``.

    Returns:
        A Keras ``Model`` with two outputs: a 2-way softmax and 4 box-regression values.
    """
    inp=Input(shape=[24,24,3])
    x=Conv2D(28,(3,3),strides=1,padding='valid',name='conv1')(inp)
    x=PReLU(shared_axes=[1,2],name='prelu1')(x)
    x=MaxPool2D(pool_size=3,strides=2,padding='same')(x)
    x=Conv2D(48,(3,3),strides=1,padding='valid',name='conv2')(x)
    x=PReLU(shared_axes=[1,2],name='prelu2')(x)
    x=MaxPool2D(pool_size=3,strides=2)(x)
    x=Conv2D(64,(2,2),strides=1,padding='valid',name='conv3')(x)
    x=PReLU(shared_axes=[1,2],name='prelu3')(x)
    # NOTE(review): the axes are reversed before flattening, presumably so the
    # flattened order matches the layout the dense weights were trained with - confirm.
    x=Permute((3,2,1))(x)
    x=Flatten()(x)
    x=Dense(128,name='conv4')(x)
    x=PReLU(name='prelu4')(x)
    classifier=Dense(2,activation='softmax',name='conv5-1')(x)
    bbox_regress=Dense(4,name='conv5-2')(x)# one flat vector of 4 values per input crop
    model=Model([inp],[classifier,bbox_regress])
    # Weights are looked up by layer name (by_name=True).
    model.load_weights(weight_path,by_name=True)
    return model
# 2.5 Post-process the R-Net output
def filter_face_24net(cls_prob,roi,rectangles,width,height,threshold):
    """Keep the R-Net candidates that pass ``threshold`` and refine their boxes.

    Args:
        cls_prob: array whose column 1 is the face probability of each candidate.
        roi: array with four regressed offsets per candidate.
        rectangles: the candidate boxes that were fed to R-Net (original-image coordinates).
        width, height: size of the original image, used to clamp the boxes.
        threshold: minimum face probability for a candidate to be kept.

    Returns:
        The result of ``NMS(..., 0.3)`` over the clamped ``[x1, y1, x2, y2, score]`` boxes.
    """
    prob = cls_prob[:, 1]
    keep = np.where(prob >= threshold)[0]
    scores = prob[keep]

    # Boxes and offsets of the surviving candidates only.
    boxes = np.array(rectangles)
    x1 = boxes[keep, 0]
    y1 = boxes[keep, 1]
    x2 = boxes[keep, 2]
    y2 = boxes[keep, 3]
    deltas = roi[keep]

    w = x2 - x1
    h = y2 - y1

    # Offsets are relative to the box size.
    refined = np.column_stack((
        x1 + deltas[:, 0]*w,
        y1 + deltas[:, 1]*h,
        x2 + deltas[:, 2]*w,
        y2 + deltas[:, 3]*h,
        scores,
    ))
    refined = rect2square(refined)

    # Clamp to the image and drop boxes that became empty.
    pick = []
    for rect in refined:
        left = int(max(0, rect[0]))
        top = int(max(0, rect[1]))
        right = int(min(width, rect[2]))
        bottom = int(min(height, rect[3]))
        if right > left and bottom > top:
            pick.append([left, top, right, bottom, rect[4]])
    return NMS(pick, 0.3)
# 2.6 O-Net: R-Net results are cropped, resized to 48x48 and fed to this network
def create_Onet(weight_path):
    """Build the O-Net model (48x48x3 input) and load its weights from ``weight_path``.

    Args:
        weight_path: path of the weight file passed to ``load_weights``.

    Returns:
        A Keras ``Model`` with three outputs: a 2-way softmax, 4 box-regression
        values and 10 landmark-regression values.
    """
    inp=Input(shape=[48,48,3])
    x=Conv2D(32,(3,3),strides=1,padding='valid',name='conv1')(inp)
    # NOTE(review): this layer is named 'prelu' while the following ones are
    # 'prelu2'..'prelu5'; with by_name=True a name that differs from the weight
    # file would presumably leave this layer unloaded - confirm against onet.h5.
    x=PReLU(shared_axes=[1,2],name='prelu')(x)
    x=MaxPool2D(pool_size=3,strides=2,padding='same')(x)
    x=Conv2D(64,(3,3),strides=1,padding='valid',name='conv2')(x)
    x=PReLU(shared_axes=[1,2],name='prelu2')(x)
    x=MaxPool2D(pool_size=3,strides=2)(x)
    x=Conv2D(64,(3,3),strides=1,padding='valid',name='conv3')(x)
    x=PReLU(shared_axes=[1,2],name='prelu3')(x)
    x=MaxPool2D(pool_size=2)(x)
    x=Conv2D(128,(2,2),strides=1,padding='valid',name='conv4')(x)
    x=PReLU(shared_axes=[1,2],name='prelu4')(x)
    x=Permute((3,2,1))(x)
    x=Flatten()(x)
    x=Dense(256,name='conv5')(x)
    x=PReLU(name='prelu5')(x)
    classifier=Dense(2,activation='softmax',name='conv6-1')(x)
    bbox_regress=Dense(4,name='conv6-2')(x)
    # NOTE(review): 'conv6_3' uses an underscore unlike 'conv6-1'/'conv6-2' - confirm
    # it matches the layer name stored in the weight file.
    landmark_regress=Dense(10,name='conv6_3')(x)# 10 regression values for five facial landmarks
    model=Model([inp],[classifier,bbox_regress,landmark_regress])
    model.load_weights(weight_path,by_name=True)
    return model
# 2.7 Post-process the O-Net output
def filter_face_48net(cls_prob,roi,pts,rectangles,width,height,threshold):
    """Keep the O-Net candidates that pass ``threshold``; refine boxes and landmarks.

    Args:
        cls_prob: array whose column 1 is the face probability of each candidate.
        roi: array with four regressed box offsets per candidate.
        pts: array with ten landmark values per candidate; columns 0-4 are scaled
            by the box width and columns 5-9 by the box height.
        rectangles: the candidate boxes that were fed to O-Net (original-image coordinates).
        width, height: size of the original image, used to clamp the boxes.
        threshold: minimum face probability for a candidate to be kept.

    Returns:
        The result of ``NMS(..., 0.3)`` over rows of
        ``[x1, y1, x2, y2, score, px0, py0, ..., px4, py4]``.
    """
    prob = cls_prob[:, 1]  # probability that the crop contains a face
    keep = np.where(prob >= threshold)[0]
    scores = prob[keep]

    boxes = np.array(rectangles)
    x1 = boxes[keep, 0]
    y1 = boxes[keep, 1]
    x2 = boxes[keep, 2]
    y2 = boxes[keep, 3]
    deltas = roi[keep]
    marks = pts[keep]

    w = x2 - x1
    h = y2 - y1

    # Refined box corners followed by the score.
    columns = [
        x1 + deltas[:, 0]*w,
        y1 + deltas[:, 1]*h,
        x2 + deltas[:, 2]*w,
        y2 + deltas[:, 3]*h,
        scores,
    ]
    # Landmarks mapped to original-image coordinates, interleaved as x, y pairs.
    for k in range(5):
        columns.append(w*marks[:, k] + x1)
        columns.append(h*marks[:, k + 5] + y1)
    candidates = np.column_stack(columns)

    # Clamp the box to the image and drop boxes that became empty.
    pick = []
    for row in candidates:
        left = int(max(0, row[0]))
        top = int(max(0, row[1]))
        right = int(min(width, row[2]))
        bottom = int(min(height, row[3]))
        if right > left and bottom > top:
            pick.append([left, top, right, bottom] + list(row[4:15]))
    return NMS(pick, 0.3)
# 2.8 Rectangle-to-square conversion and non-maximum suppression
def rect2square(rectangles):
    """Expand each box to a square around its centre, in place.

    Columns 0-3 of ``rectangles`` are read as x1, y1, x2, y2. The square side is
    the longer of the box's width and height. Other columns are left untouched.

    Args:
        rectangles: 2-D array with at least four columns; it is modified in place.

    Returns:
        The same array object that was passed in.
    """
    width = rectangles[:, 2] - rectangles[:, 0]
    height = rectangles[:, 3] - rectangles[:, 1]
    side = np.maximum(width, height)
    # Move the top-left corner so the centre stays where it was.
    rectangles[:, 0] = rectangles[:, 0] + width*0.5 - side*0.5
    rectangles[:, 1] = rectangles[:, 1] + height*0.5 - side*0.5
    # The bottom-right corner is the new top-left corner plus the side length.
    rectangles[:, 2:4] = rectangles[:, 0:2] + side[:, np.newaxis]
    return rectangles
def NMS(rectangles,threshold):
    """Greedy non-maximum suppression.

    Args:
        rectangles: sequence of rows whose first five values are x1, y1, x2, y2, score.
        threshold: boxes whose IoU with an already selected box exceeds this are dropped.

    Returns:
        ``rectangles`` itself when it is empty; otherwise a list of the kept rows
        (as lists), ordered from highest to lowest score.
    """
    if len(rectangles) == 0:
        return rectangles
    boxes = np.array(rectangles)
    left, top, right, bottom, score = (boxes[:, c] for c in range(5))
    area = (right - left + 1) * (bottom - top + 1)
    # Ascending by score, so the best remaining box is always the last entry.
    order = score.argsort()
    keep = []
    while len(order) > 0:
        best, rest = order[-1], order[:-1]
        # Overlap between the best box and every other remaining box.
        ix1 = np.maximum(left[best], left[rest])
        iy1 = np.maximum(top[best], top[rest])
        ix2 = np.minimum(right[best], right[rest])
        iy2 = np.minimum(bottom[best], bottom[rest])
        inter = np.maximum(0.0, ix2 - ix1 + 1) * np.maximum(0.0, iy2 - iy1 + 1)
        iou = inter / (area[best] + area[rest] - inter)
        keep.append(best)
        order = rest[iou <= threshold]
    return boxes[keep].tolist()
# 2.9 The three networks combined into the MTCNN detector
class mtcnn():
    """Three-stage face detector built from P-Net, R-Net and O-Net."""

    def __init__(self):
        # Weight files are read from fixed paths under model_data/.
        self.Pnet = create_Pnet('model_data/pnet.h5')
        self.Rnet = create_Rnet('model_data/rnet.h5')
        self.Onet = create_Onet('model_data/onet.h5')

    @staticmethod
    def _crop_batch(image, rectangles, side):
        """Crop every rectangle out of ``image`` and resize it to ``side`` x ``side``."""
        return np.array([
            cv2.resize(image[int(r[1]):int(r[3]), int(r[0]):int(r[2])], (side, side))
            for r in rectangles
        ])

    def detectFace(self,img,threshold):
        """Detect faces in ``img``.

        Args:
            img: image array of shape (height, width, channels).
            threshold: three score thresholds, one each for P-Net, R-Net and O-Net.

        Returns:
            The rows produced by ``filter_face_48net``, or an empty result as soon
            as a stage leaves no candidates.
        """
        normalized = (img.copy() - 127.5) / 127.5
        origin_h, origin_w, _ = normalized.shape  # size of the original image
        scales = calculateScales(img)

        # Stage 1: run P-Net on every pyramid level (one image per predict call).
        pnet_outputs = []
        for scale in scales:
            hs = int(origin_h*scale)
            ws = int(origin_w*scale)
            level = cv2.resize(normalized, (ws, hs))
            pnet_outputs.append(self.Pnet.predict(level.reshape(1, *level.shape)))

        rectangles = []
        for scale, output in zip(scales, pnet_outputs):
            cls_prob = output[0][0][:, :, 1]  # face probability at every output location
            roi = output[1][0]
            out_h, out_w = cls_prob.shape  # size of the P-Net output map
            candidates = detect_face_12net(cls_prob, roi, max(out_h, out_w), 1/scale,
                                           origin_w, origin_h, threshold[0])
            rectangles.extend(candidates)
        rectangles = NMS(rectangles, 0.7)
        if len(rectangles) == 0:
            return rectangles

        # Stage 2: refine the candidates with R-Net on 24x24 crops.
        rnet_out = self.Rnet.predict(self._crop_batch(normalized, rectangles, 24))
        cls_prob = np.array(rnet_out[0])
        roi_prob = np.array(rnet_out[1])
        rectangles = filter_face_24net(cls_prob, roi_prob, rectangles,
                                       origin_w, origin_h, threshold[1])
        if len(rectangles) == 0:
            return rectangles

        # Stage 3: final boxes and landmarks from O-Net on 48x48 crops.
        onet_out = self.Onet.predict(self._crop_batch(normalized, rectangles, 48))
        cls_prob, roi_prob, pts_prob = onet_out[0], onet_out[1], onet_out[2]
        return filter_face_48net(cls_prob, roi_prob, pts_prob, rectangles,
                                 origin_w, origin_h, threshold[2])

# 3. MobileNet network used to classify the face crops

IMAGE_ORDERING='channels_last'
# Index of the channel dimension: 1 for channels-first tensors, otherwise the last axis.
# (The comparison string used to be misspelled, so channels-first was never detected.)
channel_axis=1 if IMAGE_ORDERING=='channels_first' else -1
def relu6(x):
    """ReLU activation with its output capped at 6."""
    return K.relu(x,max_value=6)
def _conv_block(inputs,filters,alpha,kernel=(3,3),strides=(1,1)):
    """Standard convolution block: zero-pad, convolution, batch norm, ReLU6.

    Args:
        inputs: input tensor.
        filters: base number of filters, multiplied by ``alpha``.
        alpha: width multiplier.
        kernel: convolution kernel size.
        strides: convolution strides.

    Returns:
        The output tensor of the ReLU6 activation.
    """
    n_filters = int(filters * alpha)
    padded = ZeroPadding2D(padding=(1, 1), name='conv1_pad',
                           data_format=IMAGE_ORDERING)(inputs)
    conv = Conv2D(n_filters, kernel,
                  data_format=IMAGE_ORDERING,
                  padding='valid',
                  use_bias=False,
                  strides=strides,
                  name='conv1')(padded)
    normed = BatchNormalization(axis=channel_axis, name='conv1_bn')(conv)
    return Activation(relu6, name='conv1_relu')(normed)
def _depthwise_conv_block(inputs,pointwise_conv_filters,alpha,depth_multiplier=1,strides=(1,1),block_id=1):
    """Depthwise-separable convolution block.

    A zero-padded 3x3 depthwise convolution is followed by a 1x1 pointwise
    convolution; each is followed by batch normalisation and ReLU6. All layer
    names carry ``block_id``.

    Args:
        inputs: input tensor.
        pointwise_conv_filters: base number of pointwise filters, multiplied by ``alpha``.
        alpha: width multiplier.
        depth_multiplier: depth multiplier of the depthwise convolution.
        strides: strides of the depthwise convolution.
        block_id: integer used to build unique layer names.

    Returns:
        The output tensor of the final ReLU6 activation.
    """
    n_pointwise = int(pointwise_conv_filters * alpha)

    # Depthwise stage.
    out = ZeroPadding2D((1, 1), data_format=IMAGE_ORDERING,
                        name='conv_pad_%d' % block_id)(inputs)
    out = DepthwiseConv2D((3, 3),
                          data_format=IMAGE_ORDERING,
                          padding='valid',
                          depth_multiplier=depth_multiplier,
                          strides=strides,
                          use_bias=False,
                          name='conv_dw_%d' % block_id)(out)
    out = BatchNormalization(axis=channel_axis, name='conv_dw_%d_bn' % block_id)(out)
    out = Activation(relu6, name='conv_dw_%d_relu' % block_id)(out)

    # Pointwise stage.
    out = Conv2D(n_pointwise, (1, 1),
                 data_format=IMAGE_ORDERING,
                 padding='same',
                 use_bias=False,
                 strides=(1, 1),
                 name='conv_pw_%d' % block_id)(out)
    out = BatchNormalization(axis=channel_axis, name='conv_pw_%d_bn' % block_id)(out)
    return Activation(relu6, name='conv_pw_%d_relu' % block_id)(out)
def get_mobilenet_encoder(input_height=416,input_width=416,classes=1000):
    """Build a MobileNet classifier.

    Args:
        input_height: height of the input images.
        input_width: width of the input images.
        classes: number of output classes.

    Returns:
        A Keras ``Model`` named ``'mobilenet'`` that maps a
        (input_height, input_width, 3) image to ``classes`` softmax scores.
    """
    alpha = 1.0
    depth_multiplier = 1
    dropout = 1e-3

    # (pointwise filters, strides) for depthwise blocks 1..13; a (2, 2) stride
    # halves the spatial size.
    block_specs = (
        [(64, (1, 1)),
         (128, (2, 2)), (128, (1, 1)),
         (256, (2, 2)), (256, (1, 1)),
         (512, (2, 2))]
        + [(512, (1, 1))] * 5
        + [(1024, (2, 2)), (1024, (1, 1))]
    )

    img_input = Input(shape=(input_height, input_width, 3))
    # The initial standard convolution halves the spatial size.
    x = _conv_block(img_input, 32, alpha, strides=(2, 2))
    for block_id, (filters, strides) in enumerate(block_specs, start=1):
        x = _depthwise_conv_block(x, filters, alpha, depth_multiplier,
                                  strides=strides, block_id=block_id)

    # Classification head.
    x = GlobalAveragePooling2D()(x)
    x = Reshape((1, 1, 1024))(x)
    x = Dropout(dropout)(x)
    x = Conv2D(classes, (1, 1), padding='same')(x)
    x = Activation('softmax')(x)
    x = Reshape((classes,))(x)
    return Model(img_input, x, name='mobilenet')

# 4. Load the image data and train MobileNet to classify masked / unmasked faces

def rand(a=0, b=1):
    """Return a random float drawn uniformly from [a, b) using NumPy's global RNG."""
    span = b - a
    return a + span * np.random.rand()
def get_random_data(image, input_shape, random=True, jitter=.1, hue=.1, sat=1.2, val=1.2, proc_img=True):
    """Return a randomly augmented copy of ``image`` as an array.

    The image is resized with a random aspect ratio and scale, pasted at a
    random offset onto a black canvas of size ``input_shape``, flipped
    horizontally with probability 0.5 and jittered in HSV space.

    Args:
        image: object providing ``resize`` and ``transpose`` and accepted by
            ``Image.paste`` (presumably a PIL image - confirm with callers).
        input_shape: ``(h, w)`` of the output canvas.
        random: not referenced in the body.
        jitter: bound of the random aspect-ratio distortion.
        hue: bound of the random hue shift.
        sat: upper bound of the random saturation factor (or of its reciprocal).
        val: upper bound of the random value factor (or of its reciprocal).
        proc_img: not referenced in the body.

    Returns:
        The result of ``hsv_to_rgb(...) * 255``, i.e. RGB values scaled to 0-255.
    """
    h, w = input_shape

    # random aspect ratio and scale of the resized image
    new_ar = w/h * rand(1-jitter,1+jitter)/rand(1-jitter,1+jitter)
    scale = rand(.7, 1.3)
    if new_ar < 1:
        nh = int(scale*h)
        nw = int(nh*new_ar)
    else:
        nw = int(scale*w)
        nh = int(nw/new_ar)
    image = image.resize((nw,nh), Image.BICUBIC)

    # place the resized image at a random offset on a black (w, h) canvas
    dx = int(rand(0, w-nw))
    dy = int(rand(0, h-nh))
    new_image = Image.new('RGB', (w,h), (0,0,0))
    new_image.paste(image, (dx, dy))
    image = new_image

    # flip image horizontally with probability 0.5
    flip = rand()<.5
    if flip: image = image.transpose(Image.FLIP_LEFT_RIGHT)

    # distort image in HSV space
    hue = rand(-hue, hue)
    sat = rand(1, sat) if rand()<.5 else 1/rand(1, sat)
    val = rand(1, val) if rand()<.5 else 1/rand(1, val)
    x = rgb_to_hsv(np.array(image)/255.)
    x[..., 0] += hue
    # wrap the hue channel back into [0, 1]
    x[..., 0][x[..., 0]>1] -= 1
    x[..., 0][x[..., 0]<0] += 1
    x[..., 1] *= sat
    x[..., 2] *= val
    # clamp every channel to [0, 1]
    x[x>1] = 1
    x[x<0] = 0
    image_data = hsv_to_rgb(x)*255 # numpy array scaled to 0-255 (not 0-1)
    return image_data
# Use the TensorFlow tensor layout (channels last). set_image_dim_ordering is the
# legacy name and is missing from newer Keras releases, so prefer the current API
# and fall back to the legacy call only when the new one is unavailable.
if hasattr(K, 'set_image_data_format'):
    K.set_image_data_format('channels_last')
else:
    K.set_image_dim_ordering('tf')
BASE_WEIGHT_PATH = ('https://github.com/fchollet/deep-learning-models/releases/download/v0.6/')
HEIGHT=160  # MobileNet input height
WIDTH=160  # MobileNet input width
NUM_CLASSES=2
def letterbox_image(image,size):
    """Resize ``image`` to fit inside ``size`` keeping its aspect ratio, centred on black.

    Args:
        image: image object exposing ``size`` as (width, height) and ``resize``.
        size: target ``(w, h)`` of the returned canvas.

    Returns:
        A new RGB image of ``size`` with the resized input pasted in the centre.
    """
    src_w, src_h = image.size
    dst_w, dst_h = size
    # The largest scale at which the whole image still fits.
    ratio = min(dst_w/src_w, dst_h/src_h)
    fit_w = int(src_w*ratio)
    fit_h = int(src_h*ratio)
    resized = image.resize((fit_w, fit_h), Image.BICUBIC)
    canvas = Image.new('RGB', size, (0, 0, 0))  # black background
    canvas.paste(resized, ((dst_w - fit_w)//2, (dst_h - fit_h)//2))
    return canvas
# 4.1 Endless generator that yields batches of images and one-hot labels
def generate_arrays_from_file(lines,batch_size,train):
    """Yield ``(images, labels)`` batches forever.

    Args:
        lines: list of ``"<file name>;<class index>"`` strings; it is shuffled in
            place every time the read position wraps around to 0.
        batch_size: number of samples per batch.
        train: when equal to ``True`` the images are randomly augmented, otherwise
            they are letterboxed to the network input size.

    Yields:
        A tuple of the preprocessed image batch and the one-hot label batch.
    """
    n = len(lines)
    i = 0
    while True:
        images = []
        labels = []
        for _ in range(batch_size):
            if i == 0:
                np.random.shuffle(lines)
            fields = lines[i].split(';')
            # One image is read per step; i advances (and wraps) after each one.
            img = Image.open('./data/image/train' + '/' + fields[0])
            if train == True:
                # Training data: random augmentation.
                prepared = get_random_data(img, [HEIGHT, WIDTH])
            else:
                # Validation data: pad with black borders to the target size.
                prepared = letterbox_image(img, [HEIGHT, WIDTH])
            images.append(np.array(prepared, dtype=np.float64))
            labels.append(fields[1])
            i = (i + 1) % n
        x_train = preprocess_input(np.array(images).reshape(-1, HEIGHT, WIDTH, 3))
        y_train = keras.utils.to_categorical(np.array(labels), num_classes=NUM_CLASSES)
        yield (x_train, y_train)
# 4.2 Train MobileNet
if __name__=='__main__':
    log_dir='./logs/'
    # Checkpoints and the final weights are written here; create it up front so
    # saving does not fail on a fresh checkout.
    os.makedirs(log_dir, exist_ok=True)
    with open('./data/train.txt','r') as f:
        lines=f.readlines()
    num_val=int(len(lines)*0.1)  # the last 10% of the lines are used for validation
    num_train=len(lines)-num_val  # the rest is used for training
    model= get_mobilenet_encoder(HEIGHT,WIDTH,classes=NUM_CLASSES)
    # Start from the published MobileNet weights (without the classification top).
    model_name='mobilenet_1_0_224_tf_no_top.h5'
    weight_path=BASE_WEIGHT_PATH+model_name
    weights_path=get_file(model_name,weight_path,cache_subdir='models')
    model.load_weights(weights_path,by_name=True)
    checkpoint_period1=ModelCheckpoint(log_dir + 'ep{epoch:03d}-loss{loss:.3f}-val_loss{val_loss:.3f}.h5',monitor='acc',save_weights_only=False,save_best_only=True,period=3 )
    reduce_lr = ReduceLROnPlateau(monitor='acc', factor=0.5, patience=3,  verbose=1 )
    early_stopping = EarlyStopping( monitor='val_loss',  min_delta=0, patience=10, verbose=1)
    model.compile(loss = 'categorical_crossentropy',optimizer = Adam(lr=1e-3), metrics = ['accuracy'])
    batch_size=8
    # early_stopping was created but never registered; it is now passed to fit.
    model.fit_generator(generate_arrays_from_file(lines[:num_train], batch_size, True),
            steps_per_epoch=max(1, num_train//batch_size),
            validation_data=generate_arrays_from_file(lines[num_train:], batch_size, False),
            validation_steps=max(1, num_val//batch_size),
            epochs=2,
            initial_epoch=0,
            callbacks=[checkpoint_period1, reduce_lr, early_stopping])
    model.save_weights(log_dir+'middle_one.h5')

# 5. Connect MTCNN and MobileNet for mask detection
def Alignment_1(img,landmark):
    """Rotate ``img`` so that the line between the two eye landmarks is horizontal.

    Args:
        img: image array.
        landmark: array of (x, y) rows; with 68 rows the eyes are rows 36 and 45,
            with 5 rows they are rows 0 and 1.

    Returns:
        A tuple ``(new_img, new_landmark)``: the rotated image and the landmarks
        transformed by the same rotation matrix.
    """
    if landmark.shape[0] == 68:
        first, second = 36, 45
    elif landmark.shape[0] == 5:
        first, second = 0, 1
    x = landmark[first, 0] - landmark[second, 0]
    y = landmark[first, 1] - landmark[second, 1]

    # Tilt of the eye line relative to the horizontal, in degrees.
    angle = 0 if x == 0 else math.atan(y/x)*180/math.pi

    height, width = img.shape[0], img.shape[1]
    center = (width//2, height//2)

    # Rotate around the image centre without scaling.
    RotationMatrix = cv2.getRotationMatrix2D(center, angle, 1)
    new_img = cv2.warpAffine(img, RotationMatrix, (width, height))

    # Apply the same affine transform to every landmark.
    rot = np.array(RotationMatrix)
    new_landmark = np.array([
        [rot[0, 0]*landmark[i, 0] + rot[0, 1]*landmark[i, 1] + rot[0, 2],
         rot[1, 0]*landmark[i, 0] + rot[1, 1]*landmark[i, 1] + rot[1, 2]]
        for i in range(landmark.shape[0])
    ])

    return new_img, new_landmark
class face_rec():
    """Detect faces with MTCNN and label each one with the MobileNet mask classifier."""

    def __init__(self):
        self.mtcnn_model=mtcnn()
        self.threshold=[0.5,0.6,0.8]  # score thresholds for P-Net, R-Net, O-Net
        self.Crop_HEIGHT=160
        self.Crop_WIDTH=160
        self.classes_path='model_data/classes.txt'
        self.NUM_CLASSES=2
        self.mask_model=get_mobilenet_encoder(self.Crop_HEIGHT,self.Crop_WIDTH,classes=self.NUM_CLASSES)
        self.mask_model.load_weights('./logs/middle_one.h5')
        self.class_name=self._get_class()

    def _get_class(self):
        """Read the class names, one per line, from ``self.classes_path``."""
        classes_path=os.path.expanduser(self.classes_path)
        with open(classes_path) as f:
            class_names=f.readlines()
        class_names=[c.strip() for c in class_names]
        return class_names

    def recognize(self,draw):
        """Detect and classify the faces in ``draw`` and annotate it in place.

        Args:
            draw: BGR image array of shape (height, width, channels).

        Returns:
            ``draw`` with boxes and labels drawn on it, or ``None`` when no face
            was detected (``draw`` is left untouched in that case).
        """
        height,width,_=np.shape(draw)
        draw_rgb=cv2.cvtColor(draw,cv2.COLOR_BGR2RGB)
        rectangles=self.mtcnn_model.detectFace(draw_rgb,self.threshold)
        if len(rectangles)==0:
            return
        rectangles=np.array(rectangles,dtype=np.int32)
        # Keep the detected boxes inside the image.
        rectangles[:,[0,2]]=np.clip(rectangles[:,[0,2]],0,width)
        rectangles[:,[1,3]]=np.clip(rectangles[:,[1,3]],0,height)
        # Square copies of the boxes are used for cropping; clamp them as well.
        squares=rect2square(rectangles.copy())
        squares[:,[0,2]]=np.clip(squares[:,[0,2]],0,width)
        squares[:,[1,3]]=np.clip(squares[:,[1,3]],0,height)

        crop_size=np.array([self.Crop_WIDTH,self.Crop_HEIGHT])
        labelled=[]
        for box,square in zip(rectangles,squares):
            x1,y1,x2,y2=(int(v) for v in square[:4])
            if x2<=x1 or y2<=y1:
                # An empty crop cannot be resized or classified.
                continue
            # Landmarks expressed in the coordinates of the resized crop: x is
            # scaled by the crop width and y by the crop height, because the crop
            # is stretched to the classifier input size.
            landmark=(np.reshape(square[5:15],(5,2))-np.array([x1,y1]))/np.array([x2-x1,y2-y1])*crop_size
            crop_img=draw_rgb[y1:y2,x1:x2]
            # cv2.resize expects the target size as (width, height).
            crop_img=cv2.resize(crop_img,(self.Crop_WIDTH,self.Crop_HEIGHT))
            new_img,_=Alignment_1(crop_img,landmark)  # level the eyes
            new_img=preprocess_input(np.reshape(np.array(new_img,np.float64),[1,self.Crop_HEIGHT,self.Crop_WIDTH,3]))
            label=self.class_name[np.argmax(self.mask_model.predict(new_img)[0])]
            labelled.append((box,label))

        # Draw the (non-squared) boxes and their labels.
        font=cv2.FONT_HERSHEY_SIMPLEX
        for box,label in labelled:
            # Plain ints: some OpenCV builds reject NumPy integer scalars as points.
            left,top,right,bottom=(int(v) for v in box[:4])
            cv2.rectangle(draw,(left,top),(right,bottom),(0,0,255),2)
            cv2.putText(draw,label,(left,bottom-15),font,0.75,(255,255,255),2)
        return draw

# 6. Entry point: run mask detection on the default camera
if __name__=='__main__':
    out=face_rec()
    video_capture=cv2.VideoCapture(0)
    try:
        while True:
            ret,draw=video_capture.read()
            if not ret:
                # No frame was grabbed (camera missing or stream ended); draw is
                # not a valid image in that case.
                break
            out.recognize(draw)  # annotates draw in place
            cv2.imshow('video',draw)
            if cv2.waitKey(20)&0xFF==ord('q'):
                break
    finally:
        # Release the camera and close the window even if recognition raises.
        video_capture.release()
        cv2.destroyAllWindows()

本文内容由网友自发贡献，版权归原作者所有，本站不承担相应法律责任。如您发现有涉嫌抄袭侵权的内容，请联系:hwhale#tublm.com(使用前将#替换为@)

AIGC

python

深度学习

人工智能

4.人脸检测mtcnn+mobilenet戴口罩分类的相关文章

尽管极其懒惰，但如何在 Python 中模拟 IMAP 服务器？

我很好奇是否有一种简单的方法来模拟 IMAP 服务器例如imaplib模块在Python中 without做很多工作是否有预先存在的解决方案理想情况下我可以连接到现有的 IMAP 服务器进行转储并让模拟服务器在真实的邮箱电子
下载 PyQt6 的 Qt Designer 并使用 pyuic6 将 .ui 文件转换为 .py 文件

如何下载 PyQt6 的 QtDesigner 如果没有适用于 PyQt6 的 QtDesigner 我也可以使用 PyQt5 的 QtDesigner 但是如何将此 ui 文件转换为使用 PyQt6 库而不是 PyQt5 的 py 文件
Django REST序列化器：创建对象而不保存

我已经开始使用 Django REST 框架我想做的是使用一些 JSON 发布请求从中创建一个 Django 模型对象然后使用该对象而不保存它我的 Django 模型称为 SearchRequest 我所拥有的是 api view
将字符串转换为带有毫秒和时区的日期时间 - Python

我有以下 python 片段 from datetime import datetime timestamp 05 Jan 2015 17 47 59 000 0800 datetime object datetime strptime t
Python PAM 模块的安全问题？

我有兴趣编写一个 PAM 模块该模块将利用流行的 Unix 登录身份验证机制我过去的大部分编程经验都是使用 Python 进行的并且我正在交互的系统已经有一个 Python API 我用谷歌搜索发现pam python http pa
如何在android上的python kivy中关闭应用程序后使服务继续工作

我希望我的服务在关闭应用程序后继续工作但我做不到我听说我应该使用startForeground 但如何在Python中做到这一点呢应用程序代码 from kivy app import App from kivy uix floatl
DreamPie 不适用于 Python 3.2

我最喜欢的 Python shell 是DreamPie http dreampie sourceforge net 我想将它与 Python 3 2 一起使用我使用了添加解释器 DreamPie 应用程序并添加了 Python 3 2
更改自动插入 tkinter 小部件的文本颜色

我有一个文本框小部件其中插入了三条消息一条是开始消息一条是结束消息一条是在单位被摧毁时发出警报的消息我希望开始和结束消息是黑色的但被毁坏的消息参见我在代码中评论的位置插入小部件时颜色为红色我不太确定如何去做这件事我看
Python 多处理示例不起作用

我正在尝试学习如何使用multiprocessing但我无法让它发挥作用这是代码文档 http docs python org 2 library multiprocessing html from multiprocessing imp
Spark的distinct()函数是否仅对每个分区中的不同元组进行洗牌

据我了解 distinct 哈希分区 RDD 来识别唯一键但它是否针对仅移动每个分区的不同元组进行了优化想象一个具有以下分区的 RDD 1 2 2 1 4 2 2 1 3 3 5 4 5 5 5 在此 RDD 上的不同键上所有重复键
在循环中每次迭代开始时将变量重新分配给原始值（在循环之前定义）

在Python中你使用在每次迭代开始时将变量重新分配给原始值在循环之前定义时也就是说 original 1D o o o for i in range 0 3 new original 1D revert back to orig
运行多个 scrapy 蜘蛛的正确方法

我只是尝试使用在同一进程中运行多个蜘蛛新的 scrapy 文档 http doc scrapy org en 1 0 topics practices html但我得到 AttributeError CrawlerProcess objec
在 NumPy 中获取 ndarray 的索引和值

我有一个 ndarrayA任意维数N 我想创建一个数组B元组数组或列表其中第一个N每个元组中的元素是索引最后一个元素是该索引的值A 例如 A array 1 2 3 4 5 6 Then B 0 0 1 0 1 2 0 2 3 1 0
Abaqus 将曲面转化为集合

我一直试图在模型中找到两个表面的中心参见照片但未能成功它们是元素表面面查询中没有选项可以查找元素表面的中心只能查找元素集的中心找到节点集的中心也很好但是我的节点集没有出现在工具 gt 查询 gt 质量属性选项中而且我找不到
Python：字符串不会转换为浮点数[重复]

这个问题在这里已经有答案了我几个小时前写了这个程序 while True print What would you like me to double line raw input gt if line done break else f
Python - 在窗口最小化或隐藏时使用 pywinauto 控制窗口

我正在尝试做的事情我正在尝试使用 pywinauto 在 python 中创建一个脚本以在后台自动安装 notepad 隐藏或最小化 notepad 只是一个示例因为我将编辑它以与其他软件一起使用 Problem 问题是我想在安装程序
从 pygame 获取 numpy 数组

我想通过 python 访问我的网络摄像头不幸的是由于网络摄像头的原因 openCV 无法工作 Pygame camera 使用以下代码就像魅力一样 from pygame import camera display camera in
在Python中重置生成器对象

我有一个由多个yield 返回的生成器对象准备调用该生成器是相当耗时的操作这就是为什么我想多次重复使用生成器 y FunctionWithYield for x in y print x here must be something t
用于运行可执行文件的python多线程进程

我正在尝试将一个在 Windows 上运行可执行文件并管理文本输出文件的 python 脚本升级到使用多线程进程的版本以便我可以利用多个核心我有四个独立版本的可执行文件每个线程都知道要访问它们这部分工作正常我遇到问题的地方是当它们
Python - 字典和列表相交

给定以下数据结构找出这两种数据结构共有的交集键的最有效方法是什么 dict1 2A 3A 4B list1 2A 4B Expected output 2A 4B 如果这也能产生更快的输出我可以将列表不是 dict1 组织到任何其他数

随机推荐

超链接标签以及应用

a 顶部 a a href led 跳转到底部 a a href 1 我的第一个网页 html target blank 点击我跳转到页面一 a
计算期货均线数据

import tushare as ts import pandas as pd pro ts pro api 接口 df pro fut daily ts code FU2005 SHF start date 20190506 end d
Linux 多线程原理深剖

目录传统艺能 Linux 线程 phread 二级页表线程优点线程缺点线程异常进程与线程多线程共享 Linux线程控制 POSIX线程库线程的创建获取线程id 线程等待线程终止线程分离进程地址空间布局传统艺能小编是
【技术经验分享】计算机毕业设计Hadoop+Spark知识图谱股票基金推荐与预测系统股票基金可视化股票基金推荐系统股票基金可视化系统股票基金数据分析股票基金爬虫大数据

开发技术前端开发 vue js element ui echarts websocket 后端开发 springboot mybatis 数据库 mysql关系型数据库 neo4j图数据库大数据分析 hadoop spark flink
applicationContext.xml解析
单点登录--cookie技术实现

第一种为自己实现的单点登录未使用CAS 主要是cookie跨域实现代码如下 package com bochy filter import java io IOException import java security NoSuchA
多媒体技术复习题

多媒体技术复习题一选择题 1 所谓媒体是指 b A 二进制代码 B 表示和传播信息的载体 C 计算机输入与输出的信息 D 计算机屏幕显示的信息 2 帧频率为25帧秒的电视制式有 b A PAL NTSC B PAL SECAM C S
SURF算法原理

1 先对图像进行高斯滤波 2 选用二阶标准高斯函数作为滤波器通过特定核间的卷积计算二阶偏导数计算出Hessian矩阵 3 计算判别式的值根据判别式取值的正负来判断该点是不是极值点 4 利用非极大值抑制初步确定的特征点 5 精确定位极
STM32单片机PT100温度采集控制系统

实践制作DIY GC0030 PT100温度采集控制系统一功能说明基于STM32单片机设计 PT100温度采集控制系统功能介绍 STM32F103C系列最小系统班 PT100温度传感器 LCD1602显示器 12mA恒流源电路继电
Failed to resolve import “element-plus/lib/theme-chalk/index.css“ from “src\...

Failed to resolve import element plus lib theme chalk index css from src 学习vue3 ts中遇到的问题 vue3 ts搭建参考掘金文章很详细希望我能早日学会这套东
最小二乘法求解圆方程圆形及半径

ci最小二乘法定义摘抄于百度百科基本思路摘抄于百度百科简单的来说最小二乘法为一类线性算法将需要求解的系数当作未知数 f x 与x当作已知数通过多组对应关系求得系数的方法所以最小二乘法仅适合系数为一次项方程式例如 k与b作
贝叶斯软件genle教程_贝叶斯网络可视化软件GeNIe使用说明

实例简介详细的介绍了贝叶斯网络可视化软件GeNIe使用说明适合初学者 Table of contents 3 1 Read me first 2 Hello gentel 13 3 Introduction 31 3 1 Guide t
js替换所有的回车换行符

替换所有的回车换行 function TransferString content var string content try string string replace r n g br string string replace n
Intelij IDEA 配置Tomcat时找不到 “Application Server”

由于公司突然断电再打开idea的时候 tomcat就消失了然后在网上搜了一下没搜到自己乱点了一下如图 plugins gt gt application servers View 是报红色所以我在搜索栏搜索了tomcat 如果箭头
Java的replaceAll（）方法

replaceAll 方法实际是采用正则表达式的规则去匹配的在regex中表示一个在java中一个也要用表示这样前一个代表regex中的后一个代表java中的所以字符串转义一次正则转义一次那么一个斜杠要写4个 1
R语言实现常用的5种分析方法（主成分+因子+多维标度+判别+聚类

来源 R友舍 R语言多元分析系列之一主成分分析主成分分析 principal components analysis PCA 是一种分析简化数据集的技术它把原始数据变换到一个新的坐标系统中使得任何数据投影的第一大方差在第一个坐标
linux下的qt可以调用脚本吗,QT下实现对Linux Shell调用的几种方法

使用QProcess QThread include int main QProcess execute ls return 0 QProcess poc new QProcess poc gt start ping 222 207 53
vue学习十七 Vue路由和http请求

路由的实现首先需要cmd将路由模块装上然后重启项目多打几遍就熟悉了npm run dev 在下面的黑窗口中我之前已经装过了路由模块显示如下 npm install vue router save dev npm run dev 然
什么？到现在你还不知道什么是访问修饰限定符吗？

导航小助手前言一 public 访问修饰限定符二 private 访问修饰限定符三 default 访问修饰限定符 3 1 包的概念 3 2 导入包中的类 3 3 自定义包 3 4 包访问权限 3 5 常见的包四 protecte
4.人脸检测mtcnn+mobilenet戴口罩分类

from keras models import Model Sequential import tensorflow as tf import numpy as np import cv2 import os from functools

4.人脸检测mtcnn+mobilenet戴口罩分类

4.人脸检测mtcnn+mobilenet戴口罩分类 的相关文章

随机推荐

热门标签

4.人脸检测mtcnn+mobilenet戴口罩分类的相关文章