cifar10-classification/ConvNet.py at master · autasi/cifar10-classification · GitHub

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
from __future__ import absolute_import
from __future__ import division
from __future__ import print_function

import tensorflow as tf, math

WEIGHT_DECAY = 0.0005
BN = False
MOMENTUM = 0.9
EPSILON = 1e-4

class ConvNet(object):

    def _activation_summary(self,x):
        tensor_name = x.op.name
        tf.histogram_summary(tensor_name + '/activations', x)
        tf.scalar_summary(tensor_name + '/sparsity', tf.nn.zero_fraction(x))

    def _variable_trunc_normal(self,name, shape, trainable=True):
        return tf.get_variable(name, shape,
            initializer=tf.truncated_normal_initializer(stddev=0.01),
            trainable=trainable)

    def _variable_constant(self,name, shape, value, trainable=True):
        return tf.get_variable(name, shape,
            initializer=tf.constant_initializer(value),
            trainable=trainable)

    def _batch_normalization(self, x, n_out, momentum_list):
        gamma = tf.get_variable('gamma', [n_out],
            initializer = tf.constant_initializer(1.0), trainable=True)
        beta = tf.get_variable('beta', [n_out],
            initializer = tf.constant_initializer(0.0), trainable=True)

        batch_mean, batch_var = tf.nn.moments(x, momentum_list, \
                    name='moments')
        ema = tf.train.ExponentialMovingAverage(decay=MOMENTUM)
        def update():
            ema_apply_op = ema.apply([batch_mean, batch_var])
            with tf.control_dependencies([ema_apply_op]):
                return (tf.identity(batch_mean), tf.identity(batch_var))
        mean, var = tf.cond(self.train_mode,
            update,
            lambda: (ema.average(batch_mean), ema.average(batch_var)))
        x = tf.nn.batch_normalization(x, mean, var, \
            beta, gamma, EPSILON)
        return x

    def _add_weight_decay(self, var):
        if self.weight_decay:
            weight_decay = tf.mul(tf.nn.l2_loss(var), self.weight_decay,
                    name='weight_loss')
            tf.add_to_collection('weight_losses', weight_decay)

    def _conv(self, input, shape, strides, name, alpha=0.1):
        """
        args:
            shape : [3, 3, in, out]
        """

        if self.bn_mode:
            with tf.variable_scope(name) as scope:
                kernel = self._variable_trunc_normal('weights', shape)
                conv = tf.nn.conv2d(input, kernel, strides, padding='SAME')
                bn_conv = self._batch_normalization(conv, shape[-1], [0, 1, 2])
                conv_ = tf.maximum(bn_conv, alpha*bn_conv, name=scope.name)
                if tf.get_variable_scope().reuse is False:
                    self._add_weight_decay(kernel)
                    self._activation_summary(conv_)
        else:
            with tf.variable_scope(name) as scope:
                kernel = self._variable_trunc_normal('weights', shape)
                conv = tf.nn.conv2d(input,kernel,strides, padding='SAME')
                biases = self._variable_constant('biases', shape[-1], value=0.01)
                bias = tf.nn.bias_add(conv, biases)
                conv_ = tf.maximum(bias, alpha*bias, name=scope.name)
                if tf.get_variable_scope().reuse is False:
                    self._add_weight_decay(kernel)
                    self._activation_summary(conv_)

        return conv_

    def _fc(self, input, shape, name, alpha=0.1, last=False):

        if self.bn_mode and not last:
            with tf.variable_scope(name) as scope:
                weights = self._variable_trunc_normal('weights', shape)
                fc = tf.matmul(input, weights)
                fc = self._batch_normalization(fc, shape[-1], [0])
                fc = tf.maximum(fc, alpha*fc, name=scope.name)
                if tf.get_variable_scope().reuse is False:
                    self._add_weight_decay(weights)
                    self._activation_summary(fc)
        else:
            with tf.variable_scope(name) as scope:
                weights = self._variable_trunc_normal('weights', shape)
                biases = self._variable_constant('biases', shape[-1], value=0.0)
                fc = tf.matmul(input, weights) + biases
                if not last:
                    fc = tf.maximum(fc, alpha*fc, name=scope.name)
                if tf.get_variable_scope().reuse is False:
                    self._add_weight_decay(weights)
                    self._activation_summary(fc)
        return fc

    def ConvLayer(self, input, in_filter, out_filter, layer_num):
        conv_strides = [1,1,1,1]
        pool_strides = [1,2,2,1]
        ksize = [1,2,2,1]

        _conv1 = self._conv(input, [3,3,in_filter,out_filter], conv_strides,
                name = 'conv%d1'%layer_num)
        _conv2 = self._conv(_conv1, [3,3,out_filter,out_filter], conv_strides,
                name = 'conv%d2'%layer_num)
        _pool = tf.nn.max_pool(_conv2, ksize, pool_strides, padding='VALID',
                name = 'pool%d'%layer_num)
        _drop = tf.nn.dropout(_pool, self.dropout)

        return _drop

    def __init__(self, dropout = 0.5, hidden_dim = 600, bn_mode = False):
        self.weight_decay = WEIGHT_DECAY
        self.dropout = dropout
        self.hidden_dim = hidden_dim
        self.bn_mode = bn_mode

    def inference(self, images, batch_size, train_mode):
        self.train_mode = train_mode
        self.dropout = tf.cond(train_mode,
            lambda: tf.Variable(self.dropout, trainable=False),
            lambda: tf.Variable(1.0, trainable=False))


        layer0 = self.ConvLayer(images, 3, 32, 0)
        layer1 = self.ConvLayer(layer0, 32, 64, 1)
        layer2 = self.ConvLayer(layer1, 64, 128, 2)
        layer3 = self.ConvLayer(layer2, 128, 256, 3)

        # fc layer
        dim = 1
        for d in layer3.get_shape()[1:].as_list():
            dim *= d
        nn_in = tf.reshape(layer3, [batch_size, dim])
        nn_in = tf.nn.dropout(nn_in, self.dropout)

        fc1 = self._fc(nn_in, [dim, self.hidden_dim], name = 'fc1')
        drop_f1 = tf.nn.dropout(fc1, self.dropout)
        fc2 = self._fc(drop_f1, [self.hidden_dim,10], name='fc2', last=True)

        return fc2