# tf_tutorial_ipi/tutorial_4_build_run_network.py at master · Childhoo/tf_tutorial_ipi · GitHub

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
import tensorflow as tf
import numpy as np
from tensorflow.python.tools import inspect_checkpoint as chkp

"""
-------------------------------------------------------------------------------
basic module defined below
"""
def conv_relu(input, kernel_shape, bias_shape):
    """Build a convolution + bias + ReLU layer and register its summaries.

    The "weights" and "biases" variables are obtained with
    ``tf.get_variable``, so their full names depend on the variable scope
    that is active when this function is called.

    Args:
        input: Tensor handed to ``tf.nn.conv2d`` as the layer input.
        kernel_shape: Shape of the convolution kernel variable.
        bias_shape: Shape of the bias variable.

    Returns:
        The tensor produced by applying ReLU to ``conv + biases``.
    """
    # Kernel drawn from a normal distribution, bias starting at zero.
    kernel = tf.get_variable(
        "weights", shape=kernel_shape,
        initializer=tf.random_normal_initializer())
    offset = tf.get_variable(
        "biases", shape=bias_shape,
        initializer=tf.constant_initializer(0.0))

    # Unit stride in every dimension, 'VALID' padding.
    conv_out = tf.nn.conv2d(
        input, kernel, strides=[1, 1, 1, 1], padding='VALID')
    activated = tf.nn.relu(conv_out + offset)

    # TensorBoard summaries for both variables and the raw convolution,
    # plus a histogram of the activations.
    for tensor in (kernel, offset, conv_out):
        variable_summaries(tensor)
    tf.summary.histogram('relu_activations', activated)
    return activated

def conv_relu_maxpool(input, kernel_shape, bias_shape):
    """Build a convolution + bias + ReLU + 2x2 max-pool layer with summaries.

    The "weights" and "biases" variables are obtained with
    ``tf.get_variable``, so their full names depend on the variable scope
    that is active when this function is called.

    Args:
        input: Tensor handed to ``tf.nn.conv2d`` as the layer input.
        kernel_shape: Shape of the convolution kernel variable.
        bias_shape: Shape of the bias variable.

    Returns:
        The max-pooled tensor (window 2x2, stride 2, 'VALID' padding).
    """
    # Kernel drawn from a normal distribution, bias starting at zero.
    kernel = tf.get_variable(
        "weights", shape=kernel_shape,
        initializer=tf.random_normal_initializer())
    offset = tf.get_variable(
        "biases", shape=bias_shape,
        initializer=tf.constant_initializer(0.0))

    # Unit-stride convolution followed by the ReLU non-linearity.
    conv_out = tf.nn.conv2d(
        input, kernel, strides=[1, 1, 1, 1], padding='VALID')
    activated = tf.nn.relu(conv_out + offset)

    # Pool over the two middle dimensions of the activation tensor.
    pooled = tf.nn.max_pool(
        activated,
        ksize=[1, 2, 2, 1],
        strides=[1, 2, 2, 1],
        padding='VALID',
        name='max-pool')

    # TensorBoard summaries for both variables and the raw convolution,
    # plus a histogram of the (pre-pooling) activations.
    for tensor in (kernel, offset, conv_out):
        variable_summaries(tensor)
    tf.summary.histogram('relu_activations', activated)
    return pooled

#define a function for summary variables
def variable_summaries(var):
    """Register TensorBoard summaries for a tensor.

    Adds scalar summaries for the mean, standard deviation, maximum and
    minimum of ``var`` and a histogram of its values, all created inside a
    'summaries' name scope.

    Args:
        var: Tensor or variable to summarize.
    """
    with tf.name_scope('summaries'):
        avg = tf.reduce_mean(var)
        tf.summary.scalar('mean', avg)

        # Standard deviation: square root of the mean squared deviation.
        with tf.name_scope('stddev'):
            squared_dev = tf.square(var - avg)
            spread = tf.sqrt(tf.reduce_mean(squared_dev))
        tf.summary.scalar('stddev', spread)

        for tag, reducer in (('max', tf.reduce_max), ('min', tf.reduce_min)):
            tf.summary.scalar(tag, reducer(var))
        tf.summary.histogram('histogram', var)
"""
end of basic module definition
-------------------------------------------------------------------------------
"""


"""
+++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++
randomly generate training data

"""
# Generate random data for a test run of the network.
data = np.random.rand(300, 32, 32, 3)  # 300 random samples of shape 32x32x3
# Generate random integer class labels in [0, 10) and one-hot encode them.
values = np.random.randint(10, size=300)
# The class count is fixed rather than derived from the drawn labels
# (np.max(values) + 1): otherwise the one-hot width would shrink whenever
# the largest class index happens not to be drawn, and the labels would no
# longer be 10 columns wide.
n_values = 10
print(n_values)
# Row i of the identity matrix is the one-hot vector for class i.
labels_gt = np.eye(n_values)[values]

"""
+++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++
"""


"""
-------------------------------------------------------------------------------
define the graph
"""
# start to define the network which is used for classification
#build 3 conv-relu-maxpool layers. The 3rd layer without pooling

# When variables are created, they are automatically added to the graph's
# TRAINABLE_VARIABLES collection (retrievable via tf.trainable_variables()).
g1 = tf.Graph()
with g1.as_default():
    # Placeholders for the network input and the one-hot ground-truth labels.
    input_img = tf.placeholder(tf.float32, shape=(None, 32, 32, 3))
    labels = tf.placeholder(tf.float32, shape=(None, 10))

    # Each layer lives in its own variable scope so that the "weights" and
    # "biases" variables created by the helpers get distinct names.
    with tf.variable_scope("1st-layer"):
        output_1 = conv_relu_maxpool(input_img, [5, 5, 3, 10], [10])

    with tf.variable_scope("2nd-layer"):
        output_2 = conv_relu_maxpool(output_1, [5, 5, 10, 20], [20])
    with tf.variable_scope("3rd-layer"):
        output_3 = conv_relu(output_2, [5, 5, 20, 50], [50])

    # Build 2 fully connected layers.
    # With 32x32 inputs the spatial size shrinks 32 -> 28 -> 14 -> 10 -> 5 -> 1,
    # so output_3 is (batch, 1, 1, 50); the reshape alone flattens it to
    # (batch, 50), no separate squeeze is required.
    output_3 = tf.reshape(output_3, [-1, 50])
    fc_1 = tf.layers.dense(output_3, units=200, activation=tf.nn.relu)
    # The last layer produces raw logits: softmax / softmax cross-entropy
    # below expect unscaled scores, so no ReLU is applied here (a ReLU would
    # clamp every logit to be non-negative).
    fc_2 = tf.layers.dense(fc_1, units=10, activation=None)

    # Predictions of the network.
    predictions = {
        # Index of the highest-scoring class for every sample.
        "classes": tf.argmax(input=fc_2, axis=1),
        # Class probabilities; the op is named `softmax_tensor` so it can be
        # looked up by name.
        "probabilities": tf.nn.softmax(fc_2, name="softmax_tensor")
    }

    # Loss of the network.
    loss = tf.losses.softmax_cross_entropy(labels, fc_2)
    tf.summary.scalar("loss", loss)

    # The optimizer can do forward and backward propagation in one call:
    #    train_op = tf.train.AdagradOptimizer(0.001).minimize(loss)
    # Here the gradients are instead computed, post-processed and applied
    # explicitly (DIY style).
    optimizer = tf.train.AdagradOptimizer(0.001)
    # Variables created above were automatically added to trainable_variables.
    grad_var_list = optimizer.compute_gradients(loss, tf.trainable_variables())

    # Clip large gradients. compute_gradients returns None for a variable
    # that does not influence the loss; such pairs are skipped because
    # clip_by_norm cannot handle None.
    new_grads_and_vars = [
        (tf.clip_by_norm(grad, 50), var)
        for grad, var in grad_var_list
        if grad is not None
    ]
    grad_var_list = new_grads_and_vars

    # Gradient histograms for TensorBoard. var.op.name is used instead of
    # var.name because the latter ends in ":0", which is not a legal
    # summary name.
    for grad, var in grad_var_list:
        tf.summary.histogram(var.op.name + '/gradient', grad)
    optim_selfbuild = optimizer.apply_gradients(grad_var_list)

    # Ops to save and restore all variables in the graph.
    # Passing a list of selected variables to save is also possible.
    saver = tf.train.Saver()
    merge_summary_op = tf.summary.merge_all()
#saver_part = tf.train.Saver({"fc_1":fc_1,"output_3":output_3})
"""
-------------------------------------------------------------------------------
"""


"""
+++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++
run graph in a session with the randomly generated data and label
"""
with tf.Session(graph=g1) as sess:
    writer = tf.summary.FileWriter("/tmp/log/", sess.graph)
    # try/finally guarantees the event file writer is closed even when
    # restoring, training or saving raises.
    try:
        # If there are pretrained weights, restore them; otherwise train
        # from scratch.
        latest_checkpoint = tf.train.latest_checkpoint('/tmp/log/')
        if latest_checkpoint is not None:
            saver.restore(sess, latest_checkpoint)
            # Debugging hint: the checkpoint contents can be listed with
            # chkp.print_tensors_in_checkpoint_file("/tmp/model.ckpt",
            #                                       tensor_name='', all_tensors=True)
        else:
            sess.run(tf.global_variables_initializer())

        # The same full batch is fed at every step, so build the feed once.
        feed_dict = {input_img: data, labels: labels_gt}

        for i in range(100):
            if i % 10 == 0:
                # Every 10 steps also fetch the summaries and the loss. The
                # loss comes from the same run call as the training step, so
                # no extra forward pass is needed just for printing.
                summary, _, loss_value = sess.run(
                    [merge_summary_op, optim_selfbuild, loss], feed_dict)
                writer.add_summary(summary, i)
                writer.flush()
                print("loss in %5d th step: %.4f" % (i, loss_value))
            else:
                sess.run(optim_selfbuild, feed_dict)

        # Save variables to a checkpoint file.
        save_path = saver.save(sess, "/tmp/log/model.ckpt")
        print("Model saved in path: %s" % save_path)
    finally:
        writer.close()
"""
+++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++
"""