使用二维数据构造简单卷积神经网络

觉得有用的话,欢迎一起讨论相互学习~

TensorflowTutorial_二维数据构造简单CNN
图像和一些时序数据集都可以用二维数据的形式表现，我们此次使用随机分布的二位数据构造一个简单的CNN—网络卷积-最大池化-全连接
参考代码

# Implementing Different Layers

# ---------------------------------------

#

# We will illustrate how to use different types

# of layers in TensorFlow

#

# The layers of interest are:

#  (1) Convolutional Layer卷积层

#  (2) Activation Layer激活层

#  (3) Max-Pool Layer池化层

#  (4) Fully Connected Layer 全连接层

#

# We will generate two different data sets for this

#  script, a 1-D data set (row of data) and

#  a 2-D data set (similar to picture)

import tensorflow as tf

import matplotlib.pyplot as plt

import csv

import os

import random

import numpy as np

import random

from tensorflow.python.framework import ops

# ---------------------------------------------------|

# -------------------2D-data-------------------------|

# ---------------------------------------------------|

# Reset Graph 重置图模型

ops.reset_default_graph()

sess = tf.Session()

# parameters for the run 运行参数

row_size = 10  # 2D图形高

col_size = 10  # 2D图形长

conv_size = 2

conv_stride_size = 2  # 卷积步长

maxpool_size = 2

maxpool_stride_size = 1  # 池化步长

# ensure reproducibility 确保复现性

seed = 13

np.random.seed(seed)

tf.set_random_seed(seed)

# Generate 2D data生成随机二维数据

data_size = [row_size, col_size]

data_2d = np.random.normal(size=data_size)

# --------Placeholder--------

x_input_2d = tf.placeholder(dtype=tf.float32, shape=data_size)

# Convolution 卷积层

def conv_layer_2d(input_2d, my_filter, stride_size):

    # TensorFlow's 'conv2d()' function only works with 4D arrays:

    # [batch, height, width, channels], we have 1 batch, and

    # 1 channel, but we do have width AND height this time.

    # So next we create the 4D array by inserting dimension 1's.

    # Tensorflow的卷积操作默认输入有四个维度[batch_size, height, width, channels]

    # 此处我们将维度增加到四维

    input_3d = tf.expand_dims(input_2d, 0)

    input_4d = tf.expand_dims(input_3d, 3)

    convolution_output = tf.nn.conv2d(input_4d, filter=my_filter,

                                      strides=[1, stride_size, stride_size, 1], padding="VALID")

    # filter表示卷积核，数据维度为[卷积核高度，卷积核长度，输入通道数，输出通道数]

    # stride_size表示步长，数据维度为[批处理数据大小,步长高，步长宽，通道数]，其中批处理数据大小和通道数一般跨度都为1，不需要修改。

    # Get rid of unnecessary dimensions

    # 将维数为1的维度去掉，保留数值数据。

    conv_output_2d = tf.squeeze(convolution_output)

    return (conv_output_2d)

# Create Convolutional Filter

my_filter = tf.Variable(tf.random_normal(shape=[conv_size, conv_size, 1, 1]))

# Create Convolutional Layer

my_convolution_output = conv_layer_2d(x_input_2d, my_filter, stride_size=conv_stride_size)

# --------Activation--------

def activation(input_1d):

    return (tf.nn.relu(input_1d))

# Create Activation Layer 激活层

my_activation_output = activation(my_convolution_output)

# --------Max Pool--------

def max_pool(input_2d, width, height, stride):

    # Just like 'conv2d()' above, max_pool() works with 4D arrays.

    # [batch_size=1, height=given, width=given, channels=1]

    input_3d = tf.expand_dims(input_2d, 0)

    input_4d = tf.expand_dims(input_3d, 3)

    # Perform the max pooling with strides = [1,1,1,1]

    # If we wanted to increase the stride on our data dimension, say by

    # a factor of '2', we put strides = [1, 2, 2, 1]

    pool_output = tf.nn.max_pool(input_4d, ksize=[1, height, width, 1],

                                 strides=[1, stride, stride, 1],

                                 padding='VALID')

    # Get rid of unnecessary dimensions

    pool_output_2d = tf.squeeze(pool_output)

    return (pool_output_2d)

# Create Max-Pool Layer 最大池化层

# 即选择窗口中的最大值作为输出，池化层的窗口格式定义和卷积核的不一样

# 其四维数组格式定义和卷积步长，池化步长一致，和输入格式相同，即

# [batch_size, height, width, channels]

my_maxpool_output = max_pool(my_activation_output,

                             width=maxpool_size, height=maxpool_size, stride=maxpool_stride_size)

# --------Fully Connected--------

def fully_connected(input_layer, num_outputs):

    # 扁平化/光栅化处理使最大池化层输出为一维向量形式

    flat_input = tf.reshape(input_layer, [-1])

    # 设定weight的形状

    weight_shape = tf.squeeze(tf.stack([tf.shape(flat_input), [num_outputs]]))

    # 初始化weight

    weight = tf.random_normal(weight_shape, stddev=0.1)

    # 初始化bias

    bias = tf.random_normal(shape=[num_outputs])

    # 将一维输入还原为二维

    input_2d = tf.expand_dims(flat_input, 0)

    # 计算输出

    full_output = tf.add(tf.matmul(input_2d, weight), bias)

    # 降维，去掉维度为1的维度，便于进行观察

    full_output_2d = tf.squeeze(full_output)

    return (full_output_2d)

# Create Fully Connected Layer

my_full_output = fully_connected(my_maxpool_output, 5)

# Run graph

# Initialize Variables

init = tf.global_variables_initializer()

sess.run(init)

feed_dict = {x_input_2d: data_2d}

print('\n>>>> 2D Data <<<<')

# Convolution Output

print('Input = %s array'%(x_input_2d.shape.as_list()))

print('%s Convolution, stride size = [%d, %d] , results in the %s array'%

      (my_filter.get_shape().as_list()[:2], conv_stride_size, conv_stride_size, my_convolution_output.shape.as_list()))

print(sess.run(my_convolution_output, feed_dict=feed_dict))

# Activation Output

print('\nInput = the above %s array'%(my_convolution_output.shape.as_list()))

print('ReLU element wise returns the %s array'%(my_activation_output.shape.as_list()))

print(sess.run(my_activation_output, feed_dict=feed_dict))

# Max Pool Output

print('\nInput = the above %s array'%(my_activation_output.shape.as_list()))

print('MaxPool, stride size = [%d, %d], results in %s array'%

      (maxpool_stride_size, maxpool_stride_size, my_maxpool_output.shape.as_list()))

print(sess.run(my_maxpool_output, feed_dict=feed_dict))

# Fully Connected Output 全连接层

print('\nInput = the above %s array'%(my_maxpool_output.shape.as_list()))

# 全连接层输出除掉batch_size和channel维度后剩余维度为[4,4]

print('Fully connected layer on all %d rows results in %s outputs:'%

      (my_maxpool_output.shape.as_list()[0], my_full_output.shape.as_list()[0]))

# 由于全连接层神经元为5个所以输出维度为5

print(sess.run(my_full_output, feed_dict=feed_dict))

'''对于卷积层输出维度[batch_size,output_size,output_size',channels]

其中output_size及output_size'表示为对应维度上通过(W-F+2P)/S+1得到的结果

W为数据维度，F为卷积核或池化窗口的宽或高，P为Padding大小，其中设置卷积为Valid时，Padding为0若设置为SAME卷积，则会有Padding，S是步长大小

本例子中卷积层计算公式为[(10-2)+0]/2+1=5，池化层计算公式为[(5-2)+0]/1+1=4'''

# >>>> 2D Data <<<<

# Input = [10, 10] array

# [2, 2] Convolution, stride size = [2, 2] , results in the [5, 5] array

# [[ 0.14431179  0.72783369  1.51149166 -1.28099763  1.78439188]

#  [-2.54503059  0.76156765 -0.51650006  0.77131093  0.37542343]

#  [ 0.49345911  0.01592223  0.38653135 -1.47997665  0.6952765 ]

#  [-0.34617192 -2.53189754 -0.9525758  -1.4357065   0.66257358]

#  [-1.98540258  0.34398788  2.53760481 -0.86784822 -0.3100495 ]]

#

# Input = the above [5, 5] array

# ReLU element wise returns the [5, 5] array

# [[ 0.14431179  0.72783369  1.51149166  0.          1.78439188]

#  [ 0.          0.76156765  0.          0.77131093  0.37542343]

#  [ 0.49345911  0.01592223  0.38653135  0.          0.6952765 ]

#  [ 0.          0.          0.          0.          0.66257358]

#  [ 0.          0.34398788  2.53760481  0.          0.        ]]

#

# Input = the above [5, 5] array

# MaxPool, stride size = [1, 1], results in [4, 4] array

# [[ 0.76156765  1.51149166  1.51149166  1.78439188]

#  [ 0.76156765  0.76156765  0.77131093  0.77131093]

#  [ 0.49345911  0.38653135  0.38653135  0.6952765 ]

#  [ 0.34398788  2.53760481  2.53760481  0.66257358]]

#

# Input = the above [4, 4] array

# Fully connected layer on all 4 rows results in 5 outputs:

# [ 0.08245847 -0.16351229 -0.55429065 -0.24322605 -0.99900764]
参考文献

TensorFlow机器学习实战指南
秒客网

TensorflowTutorial_二维数据构造简单CNN

使用二维数据构造简单卷积神经网络

觉得有用的话,欢迎一起讨论相互学习~

参考代码

相关文章