# coding: utf-8
# In[1]:
import tensorflow as tf
import cv2
import numpy as np
slim = tf.contrib.slim
import time
import os
from tensorflow.python.ops import control_flow_ops
# In[2]:
# Residual network building blocks
def convBlock(inputs, numOut, is_training, scope=''):
    """Bottleneck block: 1x1 -> 3x3 -> 1x1 convolutions, each with BN + ReLU."""
    with slim.arg_scope([slim.conv2d], padding='SAME',
                        activation_fn=tf.nn.relu,
                        weights_initializer=tf.contrib.layers.xavier_initializer(),
                        normalizer_fn=slim.batch_norm,
                        normalizer_params={'is_training': is_training, 'decay': 0.95}):
        net = slim.conv2d(inputs, numOut // 2, kernel_size=[1, 1], scope=scope + 'cb1')
        net = slim.conv2d(net, numOut // 2, kernel_size=[3, 3], scope=scope + 'cb2')
        net = slim.conv2d(net, numOut, kernel_size=[1, 1], scope=scope + 'cb3')
        return net

def skipLayer(inputs, numOut, scope=''):
    """Identity shortcut, or a 1x1 conv when the channel count has to change."""
    numIn = inputs.shape[-1]
    if numIn == numOut:
        return inputs
    else:
        return slim.conv2d(inputs, numOut, kernel_size=[1, 1], activation_fn=None, scope=scope + 'sk')

def residual(inputs, numOut, is_training, scope=''):
    """Residual unit: bottleneck branch plus shortcut."""
    convb = convBlock(inputs, numOut, is_training, scope)
    skip = skipLayer(inputs, numOut, scope)
    return tf.add_n([convb, skip], name=scope + 're')
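# In[ ]:
# Sanity-check sketch for the residual unit (added for illustration, not part
# of the original notebook; the placeholder shape is an assumption). Mapping a
# 128-channel input to 256 channels should preserve the spatial size. Built in
# a throwaway graph so it does not pollute the model graph below.
with tf.Graph().as_default():
    x = tf.placeholder(tf.float32, [None, 64, 64, 128])
    y = residual(x, 256, is_training=False, scope='demo_res')
    print(y.get_shape().as_list())  # expected: [None, 64, 64, 256]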
# In[3]:
# Hourglass module
def hourglass(inputs, n, numOut, is_training, name='hourglass'):
    """Hourglass Module
    Args:
        inputs      : Input tensor
        n           : Number of downsampling steps (the module pools n + 1 times)
        numOut      : Number of output features (channels)
        is_training : Whether batch norm runs in training mode
        name        : Name of the block
    """
    with tf.name_scope(name):
        # Upper branch: keeps the input resolution
        up_1 = residual(inputs, numOut, is_training, scope=str(n) + 'up_1')
        # Lower branch: downsample, recurse (or bottom out), then upsample back
        low_ = slim.max_pool2d(inputs, [2, 2], stride=2, padding='VALID')
        low_1 = residual(low_, numOut, is_training, scope=str(n) + 'low_1')
        if n > 0:
            low_2 = hourglass(low_1, n - 1, numOut, is_training, name=str(n) + 'low_2')
        else:
            low_2 = residual(low_1, numOut, is_training, scope=str(n) + 'low_2')
        low_3 = residual(low_2, numOut, is_training, scope=str(n) + 'low_3')
        up_2 = tf.image.resize_nearest_neighbor(low_3, tf.shape(low_3)[1:3] * 2, name=str(n) + 'upsampling')
        return tf.add_n([up_2, up_1], name=name + 'out_hg')
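# In[ ]:
# Shape check for the hourglass recursion (added for illustration, not part of
# the original notebook). With n = 4 the module max-pools n + 1 = 5 times
# before upsampling back, so the input side length must be divisible by
# 2 ** (n + 1) = 32; the 64x64 grid used by the model below satisfies this.
with tf.Graph().as_default():
    feat = tf.placeholder(tf.float32, [1, 64, 64, 256])
    hg_out = hourglass(feat, 4, 256, is_training=False, name='demo_hg')
    print(hg_out.get_shape().as_list())  # expected: [1, 64, 64, 256]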
# In[4]:
# 1x1 convolution ("linear" layer) with BN + ReLU
def lin(inputs, numOut, is_training, scope=''):
    with slim.arg_scope([slim.conv2d], padding='SAME',
                        activation_fn=tf.nn.relu,
                        weights_initializer=tf.contrib.layers.xavier_initializer(),
                        normalizer_fn=slim.batch_norm,
                        normalizer_params={'is_training': is_training, 'decay': 0.95}):
        return slim.conv2d(inputs, numOut, kernel_size=[1, 1], scope=scope + 'lin')
# In[9]:
class HgModel():
    def __init__(self, stages, joints):
        self.stages = stages
        self.stage_heatmap = []
        self.stage_loss = [0] * stages
        self.total_loss = 0
        self.input_image = None
        self.gt_heatmap = None
        self.learning_rate = 0
        self.merged_summary = None
        self.joints = joints
        self.batch_size = 16

    def build_model(self, input_image, iftrain):
        # Stem: 256x256 input -> 64x64 feature map (stride-2 conv + pool)
        with tf.variable_scope('processing'):
            with slim.arg_scope([slim.conv2d], padding='SAME',
                                activation_fn=tf.nn.relu,
                                weights_initializer=tf.contrib.layers.xavier_initializer(),
                                normalizer_fn=slim.batch_norm,
                                normalizer_params={'is_training': iftrain, 'decay': 0.95}):
                # net = tf.pad(input_image, np.array([[0, 0], [3, 3], [3, 3], [0, 0]]))
                net = slim.conv2d(input_image, 64, kernel_size=[7, 7], stride=2, scope='conv1')
                net = residual(net, 128, iftrain, scope='conv2')
                net = slim.max_pool2d(net, kernel_size=[2, 2], stride=2, padding='SAME', scope='pool1')
                net = residual(net, 128, iftrain, scope='conv3')
                inter = residual(net, 256, iftrain, scope='conv4')
        out = []
        for i in range(self.stages):
            with tf.variable_scope('stage_' + str(i + 1)):
                hg = hourglass(inter, 4, 256, iftrain, name='hg')
                l1 = residual(hg, 256, iftrain, scope='l1')
                l1 = lin(l1, 256, iftrain, scope='l2')
                # Per-stage heatmap prediction for intermediate supervision
                tmpout = slim.conv2d(l1, self.joints, kernel_size=[1, 1], activation_fn=None, scope='l3')
                out.append(tmpout)
                if i < self.stages - 1:  # no re-injection needed after the final stage
                    # Project features and predictions back to 256 channels and
                    # add them to the representation fed into the next stage
                    l1_ = slim.conv2d(l1, 256, kernel_size=[1, 1], activation_fn=None, scope='l4')
                    tmpout_ = slim.conv2d(tmpout, 256, kernel_size=[1, 1], activation_fn=None, scope='l5')
                    inter = tf.add_n([inter, l1_, tmpout_])
        self.stage_heatmap = out
    def build_loss(self, gt_heatmap, lr, lr_decay_rate, lr_decay_step, optimizer='Adam'):
        self.gt_heatmap = gt_heatmap
        self.total_loss = 0
        self.learning_rate = lr
        self.lr_decay_rate = lr_decay_rate
        self.lr_decay_step = lr_decay_step
        self.optimizer_name = optimizer
        # Per-stage L2 loss against the ground-truth heatmaps
        # (use the first self.joints channels instead of a hard-coded 13)
        for stage in range(self.stages):
            with tf.variable_scope('stage' + str(stage + 1) + '_loss'):
                self.stage_loss[stage] = tf.nn.l2_loss(
                    self.stage_heatmap[stage] - self.gt_heatmap[:, :, :, :self.joints],
                    name='l2_loss') / self.batch_size
            tf.summary.scalar('stage' + str(stage + 1) + '_loss', self.stage_loss[stage])
        with tf.variable_scope('total_loss'):
            for stage in range(self.stages):
                self.total_loss += self.stage_loss[stage]
            tf.summary.scalar('total_loss', self.total_loss)
        with tf.variable_scope('train'):
            self.global_step = tf.contrib.framework.get_or_create_global_step()
            self.cur_lr = tf.train.exponential_decay(self.learning_rate,
                                                     global_step=self.global_step,
                                                     decay_rate=self.lr_decay_rate,
                                                     decay_steps=self.lr_decay_step)
            tf.summary.scalar('learning_rate', self.cur_lr)
            # Honor the optimizer argument (the original hard-coded RMSProp)
            if self.optimizer_name == 'Adam':
                self.optimizer = tf.train.AdamOptimizer(learning_rate=self.cur_lr)
            else:
                self.optimizer = tf.train.RMSPropOptimizer(learning_rate=self.cur_lr)
            self.train_step = slim.learning.create_train_op(self.total_loss, self.optimizer,
                                                            global_step=self.global_step)
            # Tie the batch-norm moving-average updates to the reported loss
            update_ops = tf.get_collection(tf.GraphKeys.UPDATE_OPS)
            if update_ops:
                updates = tf.group(*update_ops)
                self.total_loss = control_flow_ops.with_dependencies([updates], self.total_loss)
        self.merged_summary = tf.summary.merge_all()
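# In[ ]:
# End-to-end wiring sketch (added for illustration, not part of the original
# notebook). A 4-stage model for 13 joints; the placeholder shapes, 64x64x13
# ground-truth heatmap layout, and learning-rate schedule are assumptions
# chosen to be consistent with the code above. Built in a throwaway graph so
# it does not clash with variables created later in the notebook.
with tf.Graph().as_default():
    demo_model = HgModel(stages=4, joints=13)
    demo_images = tf.placeholder(tf.float32, [None, 256, 256, 3])
    demo_gt = tf.placeholder(tf.float32, [None, 64, 64, 13])
    demo_model.build_model(demo_images, iftrain=True)
    demo_model.build_loss(demo_gt, lr=2.5e-4, lr_decay_rate=0.96, lr_decay_step=10000)
    # one heatmap per stage, each 64x64 with one channel per joint
    print([hm.get_shape().as_list() for hm in demo_model.stage_heatmap])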
# In[6]:
def print_current_training_stats(global_step, cur_lr, total_loss, total_loss1, time_elapsed):
    stats = 'Step: {}/{} ----- Cur_lr: {:1.7f} ----- Time: {:>2.2f} sec.'.format(
        global_step, 300000, cur_lr, time_elapsed)
    print(stats)
    print('Training total_loss: {:>7.2f}  Testing total_loss: {:>7.2f}'.format(total_loss, total_loss1))
# In[7]:
def read_and_decode(filename):
    filename_queue = tf.train.string_input_producer(filename)
    reader = tf.TFRecordReader()
    _, serialized_example = reader.read(filename_queue)  # returns the filename and the serialized example
    features = tf.parse_single_example(serialized_example,
                                       features={
                                           'label': tf.FixedLenFeature([], tf.string),
                                           'img_raw': tf.FixedLenFeature([], tf.string),
                                       })
    img = tf.decode_raw(features['img_raw'], tf.uint8)
    img = tf.reshape(img, [256, 256, 3])
    img = tf.cast(img, tf.float32)
    # The original cell is truncated here; a plausible completion (the label
    # dtype below is an assumption) decodes the serialized heatmap label and
    # returns both tensors:
    label = tf.decode_raw(features['label'], tf.float64)
    return img, label
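# In[ ]:
# Input-pipeline sketch (added for illustration, not part of the original
# notebook). The TFRecord filename, the label dtype/layout, and the batching
# parameters are assumptions; adjust them to match how the records were
# written. shuffle_batch needs fully-defined shapes, hence the reshape.
with tf.Graph().as_default():
    img, label = read_and_decode(['train.tfrecords'])  # assumed filename
    label = tf.reshape(tf.cast(label, tf.float32), [64, 64, 13])  # assumed layout
    img_batch, label_batch = tf.train.shuffle_batch(
        [img, label], batch_size=16, capacity=1000, min_after_dequeue=500)
    print(img_batch.get_shape().as_list(), label_batch.get_shape().as_list())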