Python深度学习CNN卷积神经网络模型训练做人脸识别实例_卷积核大小输入通道输出通道资源-CSDN文库

共3个文件

py：2个

gif：1个

python

深度学习

人脸识别

图像识别

需积分: 5 157 浏览量 2023-06-30 14:50:37 上传评论 5 收藏 1.09MB ZIP 举报

资源推荐

资源详情

资源评论

收起资源包目录

DeepLearning_CNN_Model(olivettifaces).zip （3个子文件）

olivettifaces.gif 1.13MB

use_CNN_olivettifaces.py 6KB

train_CNN_olivettifaces.py 15KB

# -*-coding:utf8-*-# import os import sys import time import numpy from PIL import Image import theano import theano.tensor as T from theano.tensor.signal import downsample from theano.tensor.nnet import conv """ 加载图像数据的函数,dataset_path即图像olivettifaces的路径加载olivettifaces后，划分为train_data,valid_data,test_data三个数据集函数返回train_data,valid_data,test_data以及对应的label """ def load_data(dataset_path): img = Image.open(dataset_path) img_ndarray = numpy.asarray(img, dtype='float64')/256 faces=numpy.empty((400,2679)) for row in range(20): for column in range(20): faces[row*20+column]=numpy.ndarray.flatten(img_ndarray [row*57:(row+1)*57,column*47:(column+1)*47]) label=numpy.empty(400) for i in range(40): label[i*10:i*10+10]=i label=label.astype(numpy.int) #分成训练集、验证集、测试集，大小如下 train_data=numpy.empty((320,2679)) train_label=numpy.empty(320) valid_data=numpy.empty((40,2679)) valid_label=numpy.empty(40) test_data=numpy.empty((40,2679)) test_label=numpy.empty(40) for i in range(40): train_data[i*8:i*8+8]=faces[i*10:i*10+8] train_label[i*8:i*8+8]=label[i*10:i*10+8] valid_data[i]=faces[i*10+8] valid_label[i]=label[i*10+8] test_data[i]=faces[i*10+9] test_label[i]=label[i*10+9] #将数据集定义成shared类型，才能将数据复制进GPU，利用GPU加速程序。 def shared_dataset(data_x, data_y, borrow=True): shared_x = theano.shared(numpy.asarray(data_x, dtype=theano.config.floatX), borrow=borrow) shared_y = theano.shared(numpy.asarray(data_y, dtype=theano.config.floatX), borrow=borrow) return shared_x, T.cast(shared_y, 'int32') train_set_x, train_set_y = shared_dataset(train_data,train_label) valid_set_x, valid_set_y = shared_dataset(valid_data,valid_label) test_set_x, test_set_y = shared_dataset(test_data,test_label) rval = [(train_set_x, train_set_y), (valid_set_x, valid_set_y), (test_set_x, test_set_y)] return rval #分类器，即CNN最后一层，采用逻辑回归（softmax） class LogisticRegression(object): def __init__(self, input, n_in, n_out): self.W = theano.shared( value=numpy.zeros( (n_in, n_out), dtype=theano.config.floatX ), name='W', borrow=True ) self.b = theano.shared( value=numpy.zeros( (n_out,), dtype=theano.config.floatX ), name='b', borrow=True ) self.p_y_given_x = T.nnet.softmax(T.dot(input, self.W) + self.b) self.y_pred = T.argmax(self.p_y_given_x, axis=1) self.params = [self.W, self.b] def negative_log_likelihood(self, y): return -T.mean(T.log(self.p_y_given_x)[T.arange(y.shape[0]), y]) def errors(self, y): if y.ndim != self.y_pred.ndim: raise TypeError( 'y should have the same shape as self.y_pred', ('y', y.type, 'y_pred', self.y_pred.type) ) if y.dtype.startswith('int'): return T.mean(T.neq(self.y_pred, y)) else: raise NotImplementedError() #全连接层，分类器前一层 class HiddenLayer(object): def __init__(self, rng, input, n_in, n_out, W=None, b=None, activation=T.tanh): self.input = input if W is None: W_values = numpy.asarray( rng.uniform( low=-numpy.sqrt(6. / (n_in + n_out)), high=numpy.sqrt(6. / (n_in + n_out)), size=(n_in, n_out) ), dtype=theano.config.floatX ) if activation == theano.tensor.nnet.sigmoid: W_values *= 4 W = theano.shared(value=W_values, name='W', borrow=True) if b is None: b_values = numpy.zeros((n_out,), dtype=theano.config.floatX) b = theano.shared(value=b_values, name='b', borrow=True) self.W = W self.b = b lin_output = T.dot(input, self.W) + self.b self.output = ( lin_output if activation is None else activation(lin_output) ) # parameters of the model self.params = [self.W, self.b] #卷积+采样层（conv+maxpooling） class LeNetConvPoolLayer(object): def __init__(self, rng, input, filter_shape, image_shape, poolsize=(2, 2)): assert image_shape[1] == filter_shape[1] self.input = input fan_in = numpy.prod(filter_shape[1:]) fan_out = (filter_shape[0] * numpy.prod(filter_shape[2:]) / numpy.prod(poolsize)) # initialize weights with random weights W_bound = numpy.sqrt(6. / (fan_in + fan_out)) self.W = theano.shared( numpy.asarray( rng.uniform(low=-W_bound, high=W_bound, size=filter_shape), dtype=theano.config.floatX ), borrow=True ) # the bias is a 1D tensor -- one bias per output feature map b_values = numpy.zeros((filter_shape[0],), dtype=theano.config.floatX) self.b = theano.shared(value=b_values, borrow=True) # 卷积 conv_out = conv.conv2d( input=input, filters=self.W, filter_shape=filter_shape, image_shape=image_shape ) # 子采样 pooled_out = downsample.max_pool_2d( input=conv_out, ds=poolsize, ignore_border=True ) self.output = T.tanh(pooled_out + self.b.dimshuffle('x', 0, 'x', 'x')) # store parameters of this layer self.params = [self.W, self.b] #保存训练参数的函数 def save_params(param1,param2,param3,param4): import cPickle write_file = open('params.pkl', 'wb') cPickle.dump(param1, write_file, -1) cPickle.dump(param2, write_file, -1) cPickle.dump(param3, write_file, -1) cPickle.dump(param4, write_file, -1) write_file.close() """ 上面定义好了CNN的一些基本构件，下面的函数将CNN应用于olivettifaces这个数据集，CNN的模型基于LeNet。采用的优化算法是批量随机梯度下降算法，minibatch SGD，所以下面很多参数都带有batch_size，比如image_shape=(batch_size, 1, 57, 47) 可以设置的参数有： batch_size,但应注意n_train_batches、n_valid_batches、n_test_batches的计算都依赖于batch_size nkerns=[5, 10]即第一二层的卷积核个数可以设置全连接层HiddenLayer的输出神经元个数n_out可以设置，要同时更改分类器的输入n_in 另外，还有一个很重要的就是学习速率learning_rate. """ def evaluate_olivettifaces(learning_rate=0.05, n_epochs=200, dataset='olivettifaces.gif', nkerns=[5, 10], batch_size=40): #随机数生成器，用于初始化参数 rng = numpy.random.RandomState(23455) #加载数据 datasets = load_data(dataset) train_set_x, train_set_y = datasets[0] valid_set_x, valid_set_y = datasets[1] test_set_x, test_set_y = datasets[2] #计算各数据集的batch个数 n_train_batches = train_set_x.get_value(borrow=True).shape[0] n_valid_batches = valid_set_x.get_value(borrow=True).shape[0] n_test_batches = test_set_x.get_value(borrow=True).shape[0] n_train_batches /= batch_size n_valid_batches /= batch_size n_test_batches /= batch_size #定义几个变量，x代表人脸数据，作为layer0的输入 index = T.lscalar() x = T.matrix('x') y = T.ivector('y') ###################### #建立

评论收藏

内容反馈