質問編集履歴
2
コメント追記。
test
CHANGED
File without changes
|
test
CHANGED
@@ -13,6 +13,10 @@
|
|
13
13
|
(小数点4桁くらい表示していますが、まったく変化せず)。
|
14
14
|
|
15
15
|
計算グラフがうまくできておらず、誤差逆伝播ができていないのかと推察しています。
|
16
|
+
|
17
|
+
|
18
|
+
|
19
|
+
以下、インデントが上手くされておらず、読みにくいコードになっておりすみません。
|
16
20
|
|
17
21
|
|
18
22
|
|
1
#つきのコメントを削除
test
CHANGED
File without changes
|
test
CHANGED
@@ -16,17 +16,11 @@
|
|
16
16
|
|
17
17
|
|
18
18
|
|
19
|
-
# ResNet
|
20
|
-
|
21
|
-
def _shortcut(inputs, residual): #inputs: ResBlockへの入力そのもの(ショートカットしたデータ), residual: ResBlockの中で処理されたデータ
|
22
|
-
|
23
|
-
|
19
|
+
def _shortcut(inputs, residual)
|
24
20
|
|
25
21
|
n_filters = residual.shape[3]
|
26
22
|
|
27
23
|
print('n_filters=',n_filters)
|
28
|
-
|
29
|
-
# inputsのチャンネル数をresidualのチャンネル数に合わせる(1x1畳み込み)
|
30
24
|
|
31
25
|
shortcut = tf.layers.Conv2D(n_filters, kernel_size=[1, 1], strides=[1, 1], padding='VALID')(inputs)
|
32
26
|
|
@@ -58,8 +52,6 @@
|
|
58
52
|
|
59
53
|
|
60
54
|
|
61
|
-
### ネットワーク ###
|
62
|
-
|
63
55
|
tf.reset_default_graph()
|
64
56
|
|
65
57
|
is_training = tf.placeholder(tf.bool, shape=())
|
@@ -72,49 +64,51 @@
|
|
72
64
|
|
73
65
|
|
74
66
|
|
75
|
-
### ネットワーク本体 ###
|
76
|
-
|
77
67
|
h = tf.layers.Conv2D(filters=32, kernel_size=[7, 7], strides=[1, 1], kernel_initializer=initializer, padding='SAME')(x)
|
78
68
|
|
79
69
|
h = tf.layers.BatchNormalization()(h, training=is_training)
|
80
70
|
|
81
71
|
h = tf.nn.relu(h)
|
82
72
|
|
83
|
-
h = tf.layers.MaxPooling2D(pool_size=[2, 2], strides=2)(h)
|
73
|
+
h = tf.layers.MaxPooling2D(pool_size=[2, 2], strides=2)(h)
|
84
74
|
|
85
75
|
|
86
|
-
|
87
|
-
h = _resblock(n_filters=64)(h) # 16x16x32 -> 16x16x64
|
88
76
|
|
89
77
|
h = _resblock(n_filters=64)(h)
|
90
78
|
|
91
79
|
h = _resblock(n_filters=64)(h)
|
92
80
|
|
93
|
-
h =
|
81
|
+
h = _resblock(n_filters=64)(h)
|
94
82
|
|
95
|
-
h =
|
83
|
+
h = tf.layers.MaxPooling2D(pool_size=[2, 2], strides=2)(h)
|
84
|
+
|
85
|
+
|
96
86
|
|
97
87
|
h = _resblock(n_filters=128)(h)
|
98
88
|
|
99
89
|
h = _resblock(n_filters=128)(h)
|
100
90
|
|
101
|
-
h =
|
91
|
+
h = _resblock(n_filters=128)(h)
|
102
92
|
|
93
|
+
h = tf.layers.MaxPooling2D(pool_size=[2, 2], strides=2)(h)
|
94
|
+
|
95
|
+
|
96
|
+
|
103
|
-
h = _resblock(n_filters=256)(h)
|
97
|
+
h = _resblock(n_filters=256)(h)
|
104
98
|
|
105
99
|
h = _resblock(n_filters=256)(h)
|
106
100
|
|
107
101
|
h = _resblock(n_filters=256)(h)
|
108
102
|
|
109
|
-
# Global Average Pooling
|
110
103
|
|
111
|
-
h = tf.keras.layers.GlobalAveragePooling2D()(h) # 4x4x256 -> 256
|
112
104
|
|
113
|
-
|
105
|
+
h = tf.keras.layers.GlobalAveragePooling2D()(h)
|
106
|
+
|
107
|
+
|
114
108
|
|
115
109
|
h = tf.layers.Dense(units=128, activation=tf.nn.relu)(h)
|
116
110
|
|
117
|
-
y = tf.layers.Dense(units=10, activation=tf.nn.softmax)(h)
|
111
|
+
y = tf.layers.Dense(units=10, activation=tf.nn.softmax)(h)
|
118
112
|
|
119
113
|
|
120
114
|
|
@@ -126,9 +120,7 @@
|
|
126
120
|
|
127
121
|
with tf.control_dependencies(update_ops):
|
128
122
|
|
129
|
-
|
123
|
+
optimizer = tf.train.AdamOptimizer(0.01).minimize(cost)
|
130
|
-
|
131
|
-
optimizer = tf.train.GradientDecentOptimizer(0.01).minimize(cost)
|
132
124
|
|
133
125
|
|
134
126
|
|