回答編集履歴

2018/11/10 16:37

投稿

スコア21960

answer CHANGED Viewed

@@ -109,4 +109,66 @@
 # 計算した値が numpy と TensorFlow で一致するか
 print(np.allclose(loss1, loss2))
+```
+## 追記
+各処理がなにをやっているのか簡単な例を追加しました。
+TensorFlow のテンソルに対しては、numpy の indexing のような操作ができないようなので、少々わかりづらいやり方を取らざるを得なくなっています。
+```python
+    import tensorflow as tf
+    with tf.Session() as sess:
+        label_dim = 6
+        labels = tf.constant([[1, 2, 3, 4, 5, 6],
+                              [7, 8, 9, 10, 11, 12],
+                              [13, 14, 15, 16, 17, 18]])
+        # ラベルから Y_true を抽出する。
+        mask = tf.tile([True, True, False], (label_dim // 3,))
+        print(mask.eval())  # [ True  True False  True  True False]
+        # 各サンプルの 1, 2, 4, 5 列目を抜き出している。
+        Y_true = tf.boolean_mask(labels, mask, axis=1)
+        print(Y_true.eval())
+        # [[ 1  2  4  5]
+        #  [ 7  8 10 11]
+        #  [13 14 16 17]]
+        # ラベルから重み係数を抽出する。
+        mask = tf.math.logical_not(mask)
+        print(mask.eval())  # [False False  True False False  True]
+        # 各サンプルの 3, 6 列目を抜き出している。
+        coeff = tf.boolean_mask(labels, mask, axis=1)
+        print(coeff.eval())
+        # [[ 3  6]
+        #  [ 9 12]
+        #  [15 18]]
+        # 末尾に次元を1つ追加している。ones のほうも同様
+        print(tf.shape(coeff).eval())  # [3 2]
+        print(tf.shape(coeff[..., tf.newaxis]).eval())  # [3 2 1]
+        # 次元を1つ増やし、axis=-1 で結合している。
+        ones = tf.ones_like(coeff)
+        concat = tf.concat([ones[..., tf.newaxis], coeff[..., tf.newaxis]], axis=-1)
+        print(concat.eval())
+        # [[[ 1  3]
+        #   [ 1  6]]
+        #  [[ 1  9]
+        #   [ 1 12]]
+        #  [[ 1 15]
+        #   [ 1 18]]]
+        # [3 2 2] を [3, 4] に戻している。
+        W = tf.reshape(concat, [tf.shape(ones)[0], -1])
+        print(tf.shape(concat).eval())  # [3 2 2]
+        print(tf.shape(W).eval())  # [3 4]
+        print(W.eval())
+        # [[ 1  3  1  6]
+        #  [ 1  9  1 12]
+        #  [ 1 15  1 18]]
 ```

2018/11/10 16:37

投稿

tiitoi

スコア21960

answer CHANGED Viewed

@@ -3,66 +3,110 @@
 ## 問題設定
-簡単にするため、バッチ次元及び最後の2つの次元は除いています。
+BatchSize=30, LabelDim=75, OutputDim=50
-モデルの入力データ X: (InputDims) の numpy 配列
+モデルの入力 data: (BatchSize, 16, 16, 1) の配列
-モデルの出力データ Y_pred: (InputDims // 3 * 2) の numpy 配列
+モデルの出力 Y_pred: (BatchSize, OutputDim) の配列
+ラベル labels: (BatchSize, LabelDim) の配列
-まず入力データ X を　MSE を計算する際の正解データと重み係数に分解します。
-配列 X のうち、1, 2, 4, 5, 7, 8, ... というように3の倍数以外のインデックスの要素を抽出した部分配列を作り、
-これを Y_true とします。
+## サンプルコード
-また配列 X のうち、3, 6, 9, ... というように3の倍数のインデックスの要素を抽出した部分配列を作り、W とします。
-W の要素に w_1, w_2, w_3, ... に交互に1を加えて、
-W = [1, w_1, 1, w_2, ...] とします。
+### テスト用に入力及びラベルを作成する。
+```python
-すると、サンプル1つの損失関数は以下のように表せます。
+import numpy as np
-mean((Y_true - Y_pred) ** 2 * W)
+batch_size = 30  # バッチサイズ
+input_shape = (16, 16, 1)  # モデルの入力サイズ
+label_dim = 75  # ラベルの次元数
+output_dim = 50  # 出力の次元数
-## numpy のサンプルコード
+# ダミーの入力データ及びラベルを作成する。
+data = np.random.randn(batch_size, *input_shape)  # データ
+labels = np.random.randn(batch_size, label_dim)  # ラベル
+print('data.shape', data.shape)  # data.shape (30, 16, 16, 1)
+print('labels.shape', labels.shape)  # labels.shape (30, 75)
+```
+### テスト用に簡単なモデルを作成する。
 ```python
-batch_size = 30
-input_dim = 75
+import tensorflow as tf
-assert 75 % 3 == 0  # input_dim は3で割り切れないとおかしい
+from keras.models import Sequential
-output_dim = input_dim // 3 * 2
+from keras.layers import Conv2D, GlobalMaxPooling2D
-# ダミーの入力データ及び出力データを作成する。
-input_tensor = np.random.randn(batch_size, input_dim, 1, 1)
+# 入力が (BatchSize, 16, 16, 1) で出力が (BatchSize, 50) のダミーのモデルを作成する。
-Y_pred = np.random.randn(batch_size, output_dim, 1, 1)
+model = Sequential()
-print('input_tensor.shape', input_tensor.shape)  # input_tensor.shape (30, 75, 1, 1)
+model.add(Conv2D(output_dim, kernel_size=(3, 3), input_shape=input_shape))
-print('Y_pred.shape', output_tensor.shape)  # Y_pred.shape (3, 8, 1, 1)
+model.add(GlobalMaxPooling2D())
+model.summary()
+```
+```
-# 入力データ X を　MSE を計算する際の正解データと重み係数に分解
+_________________________________________________________________
-##############################################################
+Layer (type)                 Output Shape              Param #
+=================================================================
+conv2d_1 (Conv2D)            (None, 14, 14, 50)        500
+_________________________________________________________________
+global_max_pooling2d_1 (Glob (None, 50)                0
+=================================================================
+Total params: 500
+Trainable params: 500
+Non-trainable params: 0
+_________________________________________________________________
+```
-# 1, 2, 4, 5, 7, 8, ... というように3の倍数以外が True のマスク
-Y_true_indices = np.mod(np.arange(input_dim) + 1, 3) != 0
-print(Y_true_indices)
+### 損失関数の定義
-# [ True  True False  True  True False  True  True False  True  True False]
-# 3, 6, 9, ... というように3の倍数が True のマスク
+```python
-W_indices = np.logical_not(Y_true_indices)
+def custom_loss(labels, Y_pred):
+    # ラベルから Y_true を抽出する。
-# [False False  True False False  True False False  True False False  True]
+    mask = tf.tile([True, True, False], (label_dim // 3,))
-print(W_indices)
+    Y_true = tf.boolean_mask(labels, mask, axis=1)
+    # ラベルから重み係数を抽出する。
-Y_true = input_tensor[:, Y_true_indices, ...]
+    mask = tf.math.logical_not(mask)
-coeff = input_tensor[:, W_indices, ...]
+    coeff = tf.boolean_mask(labels, mask, axis=1)
-print('Y_true.shape', Y_true.shape)  # Y_true.shape (30, 50, 1, 1)
-print('coeff.shape', coeff.shape)  # coeff.shape (30, 25, 1, 1)
+    # 重み係数を作成する。
+    ones = tf.ones_like(coeff)
+    W = tf.reshape(
+        tf.concat([ones[..., tf.newaxis], coeff[..., tf.newaxis]], axis=-1),
+        [tf.shape(ones)[0], -1])
+    return tf.reduce_mean((Y_true - Y_pred) ** 2 * W)
+```
+### 損失関数の値計算
+```python
+model.compile(loss=custom_loss, optimizer='adam')
+model.fit(data, labels, epochs=3)
+loss1 = model.evaluate(data, labels)
+print(loss1)  # 0.6780742406845093
+```
+### numpy での計算
+```python
+# モデルの出力
+Y_pred = model.predict(data)
+# ラベルから Y_true を抽出する。
+mask = np.ones(labels.shape[1], dtype=bool)
+mask[2::3] = False
+Y_true = labels[:, mask]
+# ラベルから重み係数を抽出する。
+mask = np.logical_not(mask)
+coeff = labels[:, mask]
 # 重み係数を作成する。
 W = np.ones_like(Y_true)
-W[:, 1::2, ...] = coeff
+W[:, 1::2] = coeff
-print('W.shape', W.shape)  # W.shape (30, 50, 1, 1)
-# 重み付き2乗誤差
-loss = np.mean((Y_true - Y_pred) ** 2 * W)
+loss2 = np.mean((Y_true - Y_pred) ** 2 * W)
-print(loss)
-```
-## Keras でこれと同じことを行うには
-Keras の Lambda 関数内では TensorFlow の関数を利用できます。
+# 計算した値が numpy と TensorFlow で一致するか
-numpy でできることは TensorFlow の関数を使ってもできるので、同じ方針で作りましょう。
+print(np.allclose(loss1, loss2))
+```

2018/11/10 14:24

投稿

tiitoi

スコア21960

answer CHANGED Viewed

@@ -1,7 +1,7 @@
 Python では数値計算を行うための for 文は基本的に遅くなるため NG です。
 for 文を使わないで計算できるようにしましょう。
-## 問題設定とその理解
+## 問題設定
 簡単にするため、バッチ次元及び最後の2つの次元は除いています。