Opening the camera and running face detection with caffe and mxnet
阿新 • Published 2018-12-14
# -*- coding:utf-8 -*-
import os
import random
import sys

import cv2
import mxnet as mx
import numpy as np
from scipy import misc
from sklearn import preprocessing

from mtcnn_detector import MtcnnDetector

caffe_root = '../../caffe-ssd/python'  # point the working environment at the caffe-ssd build
sys.path.insert(0, caffe_root)
import caffe

sys.path.append(os.path.join(os.path.dirname(__file__), '..', 'src', 'common'))  # add the face_preprocess path
import face_preprocess

caffe.set_device(0)
caffe.set_mode_gpu()
model_def = '../models/sfd/deploy.prototxt'
model_weights = '../models/sfd/SFD.caffemodel'
net = caffe.Net(model_def, model_weights, caffe.TEST)  # build a Net from the prototxt and weights above


# ******************************** SFD ********************************
def sfd_detection(frame, threshold, mode):
    image = frame
    height = image.shape[0]
    width = image.shape[1]
    # Shrink the long side to a fixed size while keeping the aspect ratio,
    # so frames whose width and height differ are handled correctly.
    if mode == 'reg':
        im_shrink = 80.0 / max(image.shape[0], image.shape[1])
    elif mode == 'global':
        im_shrink = 320.0 / max(image.shape[0], image.shape[1])
    elif mode == 'cached':
        im_shrink = 160.0 / max(image.shape[0], image.shape[1])
    # Resize the input so it fits the network, e.g. 320x320x3 in 'global' mode.
    image = cv2.resize(image, None, None, fx=im_shrink, fy=im_shrink,
                       interpolation=cv2.INTER_LINEAR)
    net.blobs['data'].reshape(1, 3, image.shape[0], image.shape[1])
    # matplotlib-style images are RGB with pixels in [0, 1], while caffe wants
    # BGR with pixels in [0, 255], so convert with a Transformer.
    transformer = caffe.io.Transformer({'data': net.blobs['data'].data.shape})
    transformer.set_transpose('data', (2, 0, 1))              # move channels first
    transformer.set_mean('data', np.array([104, 117, 123]))  # subtract channel means
    transformer.set_raw_scale('data', 255)                   # rescale pixels to [0, 255]
    transformer.set_channel_swap('data', (2, 1, 0))          # RGB -> BGR
    transformed_image = transformer.preprocess('data', image)
    net.blobs['data'].data[...] = transformed_image
    # Forward pass; take the output of the network's last layer, 'detection_out'.
    # It is a 4-D blob (e.g. 1 x 1 x N x 7) holding one 7-tuple per candidate:
    # [image_id, class_id, confidence, xmin, ymin, xmax, ymax]; the number of
    # tuples is the number of possible targets in the image.
    detections = net.forward()['detection_out']
    det_conf = detections[0, 0, :, 2]
    det_xmin = detections[0, 0, :, 3]
    det_ymin = detections[0, 0, :, 4]
    det_xmax = detections[0, 0, :, 5]
    det_ymax = detections[0, 0, :, 6]
    bbox = []
    for i in range(det_conf.shape[0]):
        xmin = max(0, int(round(det_xmin[i] * width)))
        ymin = max(0, int(round(det_ymin[i] * height)))
        xmax = min(width - 1, int(round(det_xmax[i] * width)))
        ymax = min(height - 1, int(round(det_ymax[i] * height)))
        score = det_conf[i]
        if score < threshold or xmin >= xmax or ymin >= ymax:
            continue
        bbox.append([xmin, ymin, xmax, ymax])
    # e.g. [[0, 0, 239, 239], ...] — face pixel coordinates in the original frame
    return bbox
# ******************************** SFD ********************************
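# --- Aside (not in the original post): a minimal smoke test for sfd_detection.
# The image path and output name are placeholders, and the drawing step mirrors
# the commented-out cv2.rectangle debugging in the original code.
def _demo_sfd(path='test.jpg'):
    img = cv2.imread(path)  # placeholder path — point this at any test image
    for xmin, ymin, xmax, ymax in sfd_detection(img, 0.5, 'global'):
        cv2.rectangle(img, (xmin, ymin), (xmax, ymax), (255, 0, 0), 2)
    cv2.imwrite('sfd_demo.jpg', img)  # placeholder output name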
def do_flip(data):
    # Horizontally flip every channel of a CHW image in place.
    for idx in range(data.shape[0]):
        data[idx, :, :] = np.fliplr(data[idx, :, :])


# *********************************** MTCNN ***********************************
# ---- output face-chip size ----
image_size = '112,112'
_vec = image_size.split(',')               # split the string into width/height parts
assert len(_vec) == 2
image_size = (int(_vec[0]), int(_vec[1]))  # cast both parts to int

# ---- bind the pretrained recognition (embedding) model ----
ctx = mx.gpu(0)
model = '../models/model-r50-am-lfw/model,0'
_vec = model.split(',')                    # separate the checkpoint prefix from the epoch label
assert len(_vec) == 2
prefix = _vec[0]
epoch = int(_vec[1])
# Load the checkpoint: returns sym (the network symbol), arg_params (the weight
# dictionary) and aux_params (the auxiliary-state dictionary).
sym, arg_params, aux_params = mx.model.load_checkpoint(prefix, epoch)
all_layers = sym.get_internals()           # inspect the intermediate layers
sym = all_layers['fc1_output']             # keep the embedding layer as the output
model = mx.mod.Module(symbol=sym, context=ctx, label_names=None)
model.bind(data_shapes=[('data', (1, 3, image_size[0], image_size[1]))])
model.set_params(arg_params, aux_params)   # set the weights

# ---- bind the pretrained MTCNN detector ----
mtcnn_path = os.path.join(os.path.dirname(__file__), 'mtcnn-model')  # MTCNN model directory
detector = MtcnnDetector(model_folder=mtcnn_path, ctx=ctx, num_worker=1,
                         accurate_landmark=True, threshold=[0.0, 0.0, 0.2])


def get_feature(ssd_bbox, detector, model):
    # Merges the original get_feature and get_input; ssd_bbox is a BGR face crop.
    # det_type=2 means using the R+O nets; otherwise only the O net is used.
    ret = detector.detect_face_limited(ssd_bbox, det_type=2)
    if ret is None:
        return None
    bbox, points = ret                     # bounding boxes and the 5 facial landmarks
    if bbox.shape[0] == 0:
        return None
    bbox = bbox[0, 0:4]
    points = points[0, :].reshape((2, 5)).T   # the 5 landmark points
    # Optionally save the MTCNN labels: np.savetxt("../label/msra_lmk", (bbox, points))
    flip = 0  # no flip augmentation; set to 1 to average flipped embeddings
    # Align and crop a 112x112 face chip from the MTCNN bbox/landmarks,
    # replacing the raw cv2 crop with a landmark-aligned one.
    nimg = face_preprocess.preprocess(ssd_bbox, bbox, points, image_size='112,112')
    cv2.imwrite('./feature/' + str(random.random()) + '.jpg', nimg)
    nimg = cv2.cvtColor(nimg, cv2.COLOR_BGR2RGB)
    aligned = np.transpose(nimg, (2, 0, 1))   # HWC -> CHW
    embedding = None
    for flipid in [0, 1]:
        if flipid == 1:
            if flip == 0:
                break
            do_flip(aligned)
        input_blob = np.expand_dims(aligned, axis=0)
        data = mx.nd.array(input_blob)
        db = mx.io.DataBatch(data=(data,))
        model.forward(db, is_train=False)
        _embedding = model.get_outputs()[0].asnumpy()
        if embedding is None:
            embedding = _embedding
        else:
            embedding += _embedding
    embedding = preprocessing.normalize(embedding).flatten()  # L2-normalized feature
    return embedding
# *********************************** MTCNN ***********************************
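# --- Aside (not in the original post): because get_feature returns an
# L2-normalized vector, two face crops can be compared with a plain dot
# product (cosine similarity for unit vectors). The 0.5 threshold is an
# illustrative guess, not a tuned value.
def _demo_compare(crop_a, crop_b, threshold=0.5):
    f1 = get_feature(crop_a, detector, model)
    f2 = get_feature(crop_b, detector, model)
    if f1 is None or f2 is None:
        return None  # MTCNN failed on one of the crops
    return float(np.dot(f1, f2)) > threshold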
if __name__ == '__main__':
    # The Caffe SFD net, the MXNet embedding model and the MTCNN detector are
    # already set up at module level, so they are not rebuilt here.
    image = cv2.imread('/home/chenyu/3.jpg')
    bbox = sfd_detection(image, 0.5, 'global')  # args: frame, threshold, mode
    print('detected face boxes:', bbox)

    # ---- SFD extension: grow each face box to approximate the body region ----
    offset_height = 160
    offset_width = 160
    frame_height = image.shape[0]
    frame_width = image.shape[1]
    for tbbox in bbox:
        # Expand the face pixel coordinates, clamped to the frame, to locate the body.
        y1 = max(0, tbbox[1] - offset_height)
        y2 = min(frame_height, tbbox[3] + offset_height)
        x1 = max(0, tbbox[0] - offset_width)
        x2 = min(frame_width, tbbox[2] + offset_width)
        ssd_facetobody = image[y1:y2, x1:x2, :]                    # body crop
        ssd_bbox = image[tbbox[1]:tbbox[3], tbbox[0]:tbbox[2], :]  # face crop

        # Feed the SFD face crop into MTCNN alignment + the embedding network.
        feature_label = get_feature(ssd_bbox, detector, model)
        # Note: scipy.misc.imresize is deprecated in newer SciPy releases.
        tFace = misc.imresize(ssd_facetobody, (160, 160), interp='bilinear')
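The title promises reading from the camera, but the __main__ block above runs on a single still image. The loop below is a minimal sketch of the missing capture step: it assumes the default webcam at index 0 and uses the faster 'cached' (160 px) detection mode; none of these choices appear in the original code.

cap = cv2.VideoCapture(0)  # default webcam; the index is an assumption
while True:
    ret, frame = cap.read()
    if not ret:
        break
    for xmin, ymin, xmax, ymax in sfd_detection(frame, 0.5, 'cached'):
        cv2.rectangle(frame, (xmin, ymin), (xmax, ymax), (0, 255, 0), 2)
    cv2.imshow('faces', frame)
    if cv2.waitKey(1) & 0xFF == ord('q'):  # press q to quit
        break
cap.release()
cv2.destroyAllWindows()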