基于opencv和MTCNN进行人脸区域裁剪，使用了facenet的tensorflow模型进行人脸特征映射.zip资源-CSDN文库

共12个文件

java：10个

xml：1个

properties：1个

人工智能

深度学习

tensorflow

186 浏览量 · 2024-03-28 18:04:03 上传 · 评论 · 收藏 · 14KB · ZIP · 举报

资源推荐

资源详情

资源评论

收起资源包目录

基于opencv和MTCNN进行人脸区域裁剪，使用了facenet 的 tensorflow 模型进行人脸特征映射.zip （12个子文件）

face-detect-master

pom.xml 2KB

src

main

resources

log4j.properties 3KB

java

com

walt

face

utils

TensorflowUtils.java 490B

ResourceUtils.java 2KB

ImageUtils.java 1KB

mtcnn

Mtcnn.java 13KB

Box.java 3KB

UdfTest.java 668B

facenet

FaceNet.java 1KB

opencv

ImageData.java 2KB

FaceDetection.java 3KB

Main.java 3KB

package com.walt.face.mtcnn; import com.walt.face.utils.TensorflowUtils; import net.coobird.thumbnailator.Thumbnails; import org.slf4j.Logger; import org.slf4j.LoggerFactory; import org.tensorflow.Graph; import org.tensorflow.Session; import org.tensorflow.Tensor; import org.tensorflow.Tensors; import org.tensorflow.framework.ConfigProto; import org.tensorflow.framework.GPUOptions; import java.awt.image.BufferedImage; import java.io.IOException; import java.util.List; import java.util.Vector; import static java.lang.Math.max; import static java.lang.Math.min; import static java.util.stream.Collectors.toList; import static com.walt.face.utils.ResourceUtils.getResourceFilePath; /** * @author waltyou * @date 2018/12/06 */ public class Mtcnn { private static Logger logger = LoggerFactory.getLogger(Mtcnn.class); private static final float FACTOR = 0.709f; private static final float P_NET_THRESHOLD = 0.5f; private static final float R_NET_THRESHOLD = 0.5f; private static final float O_NET_THRESHOLD = 0.7f; private static final float IMAGE_MEAN = 127.5f; private static final float IMAGE_STD = 128; private static final String PD_PATH = "/models/mtcnn/mtcnn_freezed_model.pb"; private static final String P_NET_IN_NAME = "pnet/input:0"; private static final String[] P_NET_OUT_NAME = new String[] {"pnet/prob1:0", "pnet/conv4-2/BiasAdd:0"}; private static final String R_NET_IN_NAME = "rnet/input:0"; private static final String[] R_NET_OUT_NAME = new String[] {"rnet/prob1:0", "rnet/conv5-2/conv5-2:0",}; private static final String O_NET_IN_NAME = "onet/input:0"; private static final String[] O_NET_OUT_NAME = new String[] {"onet/prob1:0", "onet/conv6-2/conv6-2:0", "onet/conv6-3/conv6-3:0"}; private Session session; public Mtcnn() throws Exception { Graph graph = TensorflowUtils.getGraph(getResourceFilePath(PD_PATH)); byte[] config = setConfig(); session = new Session(graph, config); } private byte[] setConfig() { GPUOptions gpuOptions = GPUOptions.newBuilder() 
.setVisibleDeviceList("0") .setPerProcessGpuMemoryFraction(0.25) .setAllowGrowth(true) .build(); return ConfigProto.newBuilder() .setGpuOptions(gpuOptions) .setAllowSoftPlacement(true) .build().toByteArray(); } public Vector<Box> detectFaces(BufferedImage img, int minFaceSize) throws Exception { int w = img.getWidth(); int h = img.getHeight(); logger.info("【1】PNet generate candidate boxes..."); Vector<Box> boxes = pNet(img, minFaceSize, w, h); squareLimit(boxes, w, h); logger.info("PNet out boxes size:" + boxes.size()); if (boxes.size() == 0) { return boxes; } logger.info("【2】RNet"); boxes = rNet(img, boxes); squareLimit(boxes, w, h); logger.info("RNet out boxes size:" + boxes.size()); if (boxes.size() == 0) { return boxes; } logger.info("【3】ONet"); boxes = oNet(img, boxes); logger.info("ONet out boxes size:" + boxes.size()); return boxes; } private Vector<Box> pNet(BufferedImage img, int minFaceSize, int w, int h) throws IOException { int whMin = min(w, h); Vector<Box> totalBoxes = new Vector<>(); float currentFaceSize = minFaceSize; while (currentFaceSize <= whMin) { logger.info("currentFaceSize " + currentFaceSize); float scale = 12.0f / currentFaceSize; List<Box> list = pNetForword(img, scale); totalBoxes.addAll(list); //Face Size等比递增 currentFaceSize /= FACTOR; } //NMS 0.7 nms(totalBoxes, 0.7f, "Union"); return updateBoxes(totalBoxes); } private List<Box> pNetForword(BufferedImage img, float scale) throws IOException { //(1)Image Resize BufferedImage resizeImg = resize(img, scale); //(2)RUN CNN Tensor<Float> x = image2FloatTensor(resizeImg); List<Tensor<?>> outputs = predict(x, P_NET_IN_NAME, P_NET_OUT_NAME); Tensor<Float> outP = outputs.get(0).expect(Float.class); Tensor<Float> outB = outputs.get(1).expect(Float.class); long[] shape = outP.shape(); int pNetOutSizeH = (int) shape[1]; int pNetOutSizeW = (int) shape[2]; float[][][][] p = outP.copyTo(new float[1][pNetOutSizeH][pNetOutSizeW][2]); float[][][][] b = outB.copyTo(new 
float[1][pNetOutSizeH][pNetOutSizeW][4]); float[][][] pNetOutBias = b[0]; float[][] pNetOutProb = new float[pNetOutSizeH][pNetOutSizeW]; expandProb(p[0], pNetOutProb); //(3) data parse Vector<Box> curBoxes = new Vector<>(); generateBoxes(pNetOutProb, pNetOutBias, scale, curBoxes); //(4)nms 0.5 nms(curBoxes, 0.5f, "Union"); curBoxes.forEach(Box::calibrate); //(5)add to totalBoxes return curBoxes.stream().filter(box -> !box.deleted).collect(toList()); } private static BufferedImage resize(BufferedImage img, float scale) throws IOException { return Thumbnails.of(img).scale(scale).asBufferedImage(); } private List<Tensor<?>> predict(Tensor<Float> x, String inName, String[] outputNames) { Session.Runner runner = session.runner().feed(inName, x); for (String outName : outputNames) { runner.fetch(outName); } return runner.run(); } private Tensor<Float> image2FloatTensor(BufferedImage img) { float[][][][] floatValues = image2FloatArr(img); return Tensors.create(floatValues); } private float[][][][] image2FloatArr(BufferedImage img) { int w = img.getWidth(); int h = img.getHeight(); float[][][][] floatValues = new float[1][h][w][3]; for (int j = 0; j < h; j++) { for (int i = 0; i < w; i++) { int val = img.getRGB(i, j); floatValues[0][j][i][0] = (((val >> 16) & 0xFF) - IMAGE_MEAN) / IMAGE_STD; floatValues[0][j][i][1] = (((val >> 8) & 0xFF) - IMAGE_MEAN) / IMAGE_STD; floatValues[0][j][i][2] = ((val & 0xFF) - IMAGE_MEAN) / IMAGE_STD; } } return floatValues; } private void expandProb(float[][][] src, float[][] dst) { for (int i = 0; i < src.length; i++) { for (int j = 0; j < src[0].length; j++) { dst[i][j] = src[i][j][0]; } } } private void generateBoxes(float[][] prob, float[][][] bias, float scale, Vector<Box> boxes) { int h = prob.length; int w = prob[0].length; for (int y = 0; y < h; y++) { for (int x = 0; x < w; x++) { float score = prob[y][x]; //only accept prob >threadshold(0.6 here) if (score > P_NET_THRESHOLD) { Box box = new Box(); //score box.score = score; //box 
box.box[0] = Math.round(x * 2 / scale); box.box[1] = Math.round(y * 2 / scale); box.box[2] = Math.round((x * 2 + 11) / scale); box.box[3] = Math.round((y * 2 + 11) / scale); //bbr System.arraycopy(bias[y][x], 0, box.bbr, 0, 4); // for (int i = 0; i < 4; i++) { // box.bbr[i] = bias[y][x][i]; // } //add boxes.addElement(box); } } } } /** * Non-Maximum Suppression * nms，不符合条件的deleted设置为true */ private void nms(Vector<Box> boxes, float threshold, String method) { //NMS.两两比对 /

评论 · 收藏

内容反馈