質問編集履歴
1
プログラムを全文記載しました。
test
CHANGED
File without changes
|
test
CHANGED
@@ -28,13 +28,97 @@
|
|
28
28
|
|
29
29
|
```python3
|
30
30
|
|
31
|
+
def target_category_loss(x, category_index, nb_classes):
    """Mask a class-score tensor so only the target class survives.

    Builds a one-hot vector for ``category_index`` over ``nb_classes``
    classes and multiplies ``x`` by it elementwise, zeroing every other
    class's score.
    """
    one_hot_mask = K.one_hot([category_index], nb_classes)
    return tf.multiply(x, one_hot_mask)
|
34
|
+
|
35
|
+
|
36
|
+
|
37
|
+
def target_category_loss_output_shape(input_shape):
    """Shape function for the masking Lambda layer.

    The one-hot multiplication is elementwise, so the output shape is
    simply the input shape, unchanged.
    """
    return input_shape
|
40
|
+
|
41
|
+
|
42
|
+
|
43
|
+
def normalize(x):
    """Scale a tensor to (approximately) unit RMS.

    Divides by the root-mean-square of the elements, with a small epsilon
    to avoid division by zero for an all-zero tensor.
    """
    rms = K.sqrt(K.mean(K.square(x)))
    return x / (rms + 1e-5)
|
46
|
+
|
47
|
+
|
48
|
+
|
49
|
+
def load_image(path):
    """Load an image file as a preprocessed VGG16 input batch.

    Reads the file at ``path``, resizes it to 224x224, converts it to a
    float array, adds a leading batch axis, and applies the Keras VGG16
    ``preprocess_input`` transform. Returns an array of shape
    (1, 224, 224, 3).
    """
    img = image.load_img(path, target_size=(224, 224))
    arr = image.img_to_array(img)
    batch = np.expand_dims(arr, axis=0)
    return preprocess_input(batch)
|
62
|
+
|
63
|
+
|
64
|
+
|
65
|
+
|
66
|
+
|
67
|
+
def register_gradient():
    """Register a custom 'GuidedBackProp' gradient for ReLU, once per process.

    The membership check guards against double registration, which would
    raise a KeyError from TensorFlow's gradient registry.
    NOTE(review): this pokes the private TF1 attribute
    ops._gradient_registry._registry — confirm it exists in the installed
    TensorFlow version.
    """
    if "GuidedBackProp" not in ops._gradient_registry._registry:
        @ops.RegisterGradient("GuidedBackProp")
        def _GuidedBackProp(op, grad):
            # Guided backprop: propagate the gradient only where BOTH the
            # incoming gradient and the forward-pass input are positive.
            dtype = op.inputs[0].dtype
            return grad * tf.cast(grad > 0., dtype) * \
                tf.cast(op.inputs[0] > 0., dtype)
|
80
|
+
|
81
|
+
|
82
|
+
|
83
|
+
|
84
|
+
|
85
|
+
def compile_saliency_function(model, activation_layer='block5_conv3'):
    """Build a backend function computing input-space saliency.

    The saliency is the gradient of sum(max over channels of the named
    layer's activation) with respect to the model input. Returns a
    ``K.function`` taking [input_batch, learning_phase] and returning
    [saliency].
    """
    input_img = model.input
    layers_by_name = {layer.name: layer for layer in model.layers[1:]}
    target_output = layers_by_name[activation_layer].output
    channel_max = K.max(target_output, axis=3)
    saliency = K.gradients(K.sum(channel_max), input_img)[0]
    return K.function([input_img, K.learning_phase()], [saliency])
|
98
|
+
|
99
|
+
|
100
|
+
|
101
|
+
|
102
|
+
|
103
|
+
def modify_backprop(model, name):
    """Rebuild VGG16 inside a gradient-override context.

    Within the override map, every 'Relu' op created gets the gradient
    registered under ``name`` (e.g. 'GuidedBackProp'), so backprop through
    the returned model uses the custom gradient.
    Note: the ``model`` argument is accepted for interface compatibility
    but is not read here — a fresh VGG16 is instantiated instead.
    """
    graph = tf.get_default_graph()
    with graph.gradient_override_map({'Relu': name}):
        new_model = VGG16(weights='imagenet')
    return new_model
|
112
|
+
|
113
|
+
|
114
|
+
|
115
|
+
|
116
|
+
|
31
|
-
|
117
|
+
def deprocess_image(x):
|
32
118
|
|
33
119
|
if np.ndim(x) > 3:
|
34
120
|
|
35
|
-
x = np.squeeze(x)
|
121
|
+
x = np.squeeze(x)
|
36
|
-
|
37
|
-
# normalize tensor: center on 0., ensure std is 0.1
|
38
122
|
|
39
123
|
x -= x.mean()
|
40
124
|
|
@@ -44,16 +128,12 @@
|
|
44
128
|
|
45
129
|
|
46
130
|
|
47
|
-
# clip to [0, 1]
|
48
|
-
|
49
131
|
x += 0.5
|
50
132
|
|
51
133
|
x = np.clip(x, 0, 1)
|
52
134
|
|
53
135
|
|
54
136
|
|
55
|
-
# convert to RGB array
|
56
|
-
|
57
137
|
x *= 255
|
58
138
|
|
59
139
|
if K.image_dim_ordering() == 'tf':
|
@@ -66,6 +146,112 @@
|
|
66
146
|
|
67
147
|
|
68
148
|
|
149
|
+
|
150
|
+
|
151
|
+
def grad_cam(input_model, image, category_index, layer_name):
    """Compute a Grad-CAM heatmap and overlay for one class.

    Parameters
    ----------
    input_model : Keras model — an ImageNet classifier (1000 classes assumed).
    image : preprocessed input batch; the code indexes ``image[0, :]``, so a
        leading batch axis of size 1 is expected (presumably (1, 224, 224, 3)
        from ``load_image`` — confirm against caller).
    category_index : int — class index whose evidence is visualized.
    layer_name : str — name of the conv layer whose activations/gradients
        drive the CAM.

    Returns
    -------
    (np.uint8 color overlay image, float heatmap normalized to [0, 1]).
    """
    nb_classes = 1000
    target_layer = lambda x: target_category_loss(x, category_index, nb_classes)

    # Append a masking layer so the loss reduces to the target class's score.
    x = input_model.layers[-1].output
    x = Lambda(target_layer, output_shape=target_category_loss_output_shape)(x)
    model = keras.models.Model(input_model.layers[0].input, x)

    loss = K.sum(model.layers[-1].output)
    # BUGFIX: compare layer names with ==, not `is`. Identity comparison on
    # strings only works when CPython happens to intern both, and silently
    # yields an empty list (IndexError here) otherwise.
    conv_output = [l for l in model.layers if l.name == layer_name][0].output

    grads = normalize(K.gradients(loss, conv_output)[0])
    gradient_function = K.function([model.layers[0].input], [conv_output, grads])

    output, grads_val = gradient_function([image])
    # Drop the batch axis.
    output, grads_val = output[0, :], grads_val[0, :, :, :]

    # Channel weights: global-average-pool the gradients over spatial dims.
    weights = np.mean(grads_val, axis=(0, 1))
    # NOTE(review): canonical Grad-CAM starts from zeros; ones is kept here
    # to preserve this script's original output — confirm intent.
    cam = np.ones(output.shape[0:2], dtype=np.float32)

    for i, w in enumerate(weights):
        cam += w * output[:, :, i]

    cam = cv2.resize(cam, (224, 224))
    cam = np.maximum(cam, 0)            # ReLU: keep positive evidence only
    heatmap = cam / np.max(cam)

    # Roughly undo mean-subtraction preprocessing for display purposes.
    image = image[0, :]
    image -= np.min(image)
    image = np.minimum(image, 255)

    # Colorize the heatmap and blend it with the (approximate) input image.
    cam = cv2.applyColorMap(np.uint8(255 * heatmap), cv2.COLORMAP_JET)
    cam = np.float32(cam) + np.float32(image)
    cam = 255 * cam / np.max(cam)
    return np.uint8(cam), heatmap
|
220
|
+
|
221
|
+
|
222
|
+
|
223
|
+
# --- Driver: classify an example image with VGG16 and write its Grad-CAM ---

# Load and preprocess the example image into a (1, 224, 224, 3) batch.
preprocessed_input = load_image("./dog_cat.jpg")

model = VGG16(weights='imagenet')

# Report the top-1 ImageNet prediction for the image.
predictions = model.predict(preprocessed_input)
top_1 = decode_predictions(predictions)[0][0]
print('Predicted class:')
print('%s (%s) with probability %.2f' % (top_1[1], top_1[0], top_1[2]))

# Use the argmax class index as the Grad-CAM target class.
predicted_class = np.argmax(predictions)
print(predicted_class)

cam, heatmap = grad_cam(model, preprocessed_input, predicted_class, "block5_conv3")

cv2.imwrite("gradcam.jpg", cam)
|
252
|
+
|
253
|
+
|
254
|
+
|
69
255
|
# Install the guided-backprop ReLU gradient, then rebuild VGG16 under the
# override so backprop through `guided_model` is guided (used further below
# to produce the guided Grad-CAM image).
register_gradient()

guided_model = modify_backprop(model, 'GuidedBackProp')
|
@@ -76,11 +262,7 @@
|
|
76
262
|
|
77
263
|
gradcam = saliency[0] * heatmap[..., np.newaxis]
|
78
264
|
|
79
|
-
|
80
|
-
|
81
|
-
cv2.imwrite("guied_gradcam.jpg", deprocess_image(gradcam))
|
265
|
+
cv2.imwrite("guided_gradcam.jpg", deprocess_image(gradcam))
|
82
|
-
|
83
|
-
|
84
266
|
|
85
267
|
|
86
268
|
|