質問編集履歴

おそらくエラーの原因と思われるデータローダのコードを補足しました。

2024/01/17 05:25

投稿

hataaaaa

スコア0

title CHANGED Viewed

File without changes

body CHANGED Viewed

@@ -176,4 +176,98 @@
 データローダーに問題があると思われるが原因が分からなかった。
 ### 補足
+class DataTransform():
+    """
+    Preprocessing for an image and its annotation image. Behaves differently for training and validation.
+    Resizes the image to input_size x input_size.
+    Applies data augmentation during training.
+    Attributes
+    ----------
+    (These are constructor arguments; only `data_transform`, a dict of
+    per-phase pipelines keyed by 'train' and 'val', is stored on the instance.)
+    input_size : int
+        Size the image is resized to.
+    color_mean : (R, G, B)
+        Mean value of each color channel.
+    color_std : (R, G, B)
+        Standard deviation of each color channel.
+    """
+    def __init__(self, input_size, color_mean, color_std):
+        self.data_transform = {
+            'train': Compose([
+                Scale(scale=[0.5, 1.5]),  # scale the image
+                RandomRotation(angle=[-10, 10]),  # rotation
+                RandomMirror(),  # random mirror
+                Resize(input_size),  # resize (input_size)
+                Normalize_Tensor(color_mean, color_std)  # normalize color information and convert to a tensor
-特になし
+            ]),
+            'val': Compose([
+                Resize(input_size),  # resize (input_size)
+                Normalize_Tensor(color_mean, color_std)  # normalize color information and convert to a tensor
+            ])
+        }
+    def __call__(self, phase, img, anno_class_img):
+        """
+        Run the pipeline registered for `phase` on the image / annotation pair.
+
+        Parameters
+        ----------
+        phase : 'train' or 'val'
+            Selects the preprocessing mode (key into `self.data_transform`).
+        img, anno_class_img
+            Passed unchanged to the selected pipeline.
+
+        Returns
+        -------
+        Whatever the selected pipeline returns for (img, anno_class_img).
+        """
+        return self.data_transform[phase](img, anno_class_img)
+class VOCDataset(data.Dataset):
+    """
+    Class that builds a Dataset for VOC2012. Inherits from PyTorch's Dataset class.
+    Attributes
+    ----------
+    img_list : list
+        List of image file paths.
+    anno_list : list
+        List of paths to the annotation files.
+    phase : 'train' or 'test'
+        Selects the mode; forwarded as the first argument to `transform`.
+        NOTE(review): the DataTransform shown alongside this class only defines
+        the keys 'train' and 'val' - confirm which values callers actually pass.
+    transform : object
+        Instance of the preprocessing class.
+    """
+    def __init__(self, img_list, anno_list, phase, transform):
+        self.img_list = img_list
+        self.anno_list = anno_list
+        self.phase = phase
+        self.transform = transform
+    def __len__(self):
+        '''Return the number of images.'''
+        return len(self.img_list)
+    def __getitem__(self, index):
+        '''
+        Return the preprocessed image (described as Tensor-format data) and its annotation.
+        '''
+        img, anno_class_img = self.pull_item(index)
+        # NOTE(review): pull_item has already applied self.transform, so the
+        # "Before transformation" prints below report post-transform values.
+        print("Before transformation - img shape:", img.shape)
+        print("Before transformation - anno_class_img shape:", anno_class_img.shape)
+        return img, anno_class_img
+    def pull_item(self, index):
+        '''Load the image and annotation at `index`, preprocess them, and return both.'''
+        # 1. Load the image
+        image_file_path = self.img_list[index]
+        img = Image.open(image_file_path)   # [height][width][color RGB]
+        # 2. Load the annotation image
+        anno_file_path = self.anno_list[index]
+        anno_class_img = Image.open(anno_file_path)   # [height][width]
+        # 3. Apply preprocessing
+        img, anno_class_img = self.transform(self.phase, img, anno_class_img)
+        print("After transformation - img shape:", img.shape)
+        print("After transformation - anno_class_img shape:", anno_class_img.shape)
+        return img, anno_class_img

Jupyter Visual Studio Python