質問編集履歴

情報の詳細化

2017/08/16 09:09

投稿

bof

スコア18

title CHANGED Viewed

File without changes

body CHANGED Viewed

@@ -148,4 +148,5 @@
     print("expected: ", className[classId], ", actual: ", actual, result)
 print("suceess percentage:", success/(success+fail))
-```
+```
+取り込んだ画像をpatchにしたものから特徴点(keypoint)を抽出する段階で、特徴点をpatchの中心に指定したいのですが、そこがうまくいっていません。

情報の詳細化

2017/08/16 09:09

投稿

bof

スコア18

title CHANGED Viewed

File without changes

body CHANGED Viewed

@@ -71,8 +71,7 @@
     # 特徴点とその特徴を計算
     while x<9604:
         #keypoints, descriptors= detector.detectAndCompute(patches, None)
-        keypoints = cv2.KeyPoint(patches[x][1][1].pt,size=9, angele=-1, response=0, octave=0, class_id=-1)
+        keypoints = cv2.KeyPoint(patches[x][1][0],patches[x][0][1],size=9, angele=-1, response=0, octave=0, class_id=-1)
-        #keypoints = [cv2.KeyPoint(patches[x][1][1], 1) for x in range(9604)]
         descriptors = detector.compute(patches[x], keypoints)
         #print(patches[x].dtype, keypoints)
         x=x+1

情報の詳細化

2017/08/16 09:04

投稿

bof

スコア18

title CHANGED Viewed

File without changes

body CHANGED Viewed

@@ -12,4 +12,141 @@
 keypoints, descriptors= detector.detectAndCompute(patches[x], None)
 ```
 patches[x].dtypeはuint8なのですが、descriptorsがNoneTypeになってしまいます。
-どのように修正すればよいのか教えていただければ幸いです。
+どのように修正すればよいのか教えていただければ幸いです。
+```python
+# -*- coding: utf-8 -*-
+import os
+import sys
+import cv2
+import numpy as np
+from sklearn.feature_extraction import image
+## 画像データのクラスIDとパスを取得
+#
+# @param dir_path 検索ディレクトリ
+# @return data_sets [クラスID, 画像データのパス]のリスト
+def getDataSet(dir_path):
+    data_sets = []
+    sub_dirs = os.listdir(dir_path)
+    for classId in sub_dirs:
+        sub_dir_path = dir_path + '/' + classId
+        img_files = os.listdir(sub_dir_path)
+        for f in img_files:
+            data_sets.append([classId, sub_dir_path + '/' + f])
+    return data_sets
+"""
+main
+"""
+# 定数定義
+GRAYSCALE = 0
+# SIFT特徴量抽出器
+detector = cv2.xfeatures2d.SIFT_create()
+"""
+train
+"""
+print("train start")
+# 訓練データのパスを取得
+train_set = getDataSet('train_img')
+# 辞書サイズ
+dictionarySize = 9
+# Bag Of Visual Words分類器
+bowTrainer = cv2.BOWKMeansTrainer(dictionarySize)
+x=0
+# 各画像を分析
+for i, (classId, data_path) in enumerate(train_set):
+    # 進捗表示
+    sys.stdout.write(".")
+    # カラーで画像読み込み
+    color = cv2.imread(data_path, cv2.IMREAD_COLOR)
+    size = (100,100)
+    colora = cv2.resize(color,size)
+    patches = image.extract_patches_2d(colora, (3, 3))
+    patches = patches.astype(np.uint8)
+    #print(color.shape, patches.shape, patches.dtype)
+    # 特徴点とその特徴を計算
+    while x<9604:
+        #keypoints, descriptors= detector.detectAndCompute(patches, None)
+        keypoints = cv2.KeyPoint(patches[x][1][1].pt,size=9, angele=-1, response=0, octave=0, class_id=-1)
+        #keypoints = [cv2.KeyPoint(patches[x][1][1], 1) for x in range(9604)]
+        descriptors = detector.compute(patches[x], keypoints)
+        #print(patches[x].dtype, keypoints)
+        x=x+1
+    #descriptors = detector.compute(patches, keypoints)
+    # intからfloat32に変換
+        descriptors = descriptors.astype(np.float32)
+    # 特徴ベクトルをBag Of Visual Words分類器にセット
+        bowTrainer.add(descriptors)
+# Bag Of Visual Words分類器で特徴ベクトルを分類
+codebook = bowTrainer.cluster()
+# 訓練完了
+print("train finish")
+"""
+test
+"""
+print("test start")
+# テストデータのパス取得
+test_set = getDataSet("test_img")
+# KNNを使って総当たりでマッチング
+matcher = cv2.BFMatcher()
+# Bag Of Visual Words抽出器
+bowExtractor = cv2.BOWImgDescriptorExtractor(detector, matcher)
+# トレーニング結果をセット
+bowExtractor.setVocabulary(codebook)
+success = 0
+fail = 0
+# 正しく学習できたか検証する
+for i, (classId, data_path) in enumerate(test_set):
+    # カラーで読み込み(cv2.IMREAD_COLORを指定しているためグレースケールではない)
+    gray = cv2.imread(data_path, cv2.IMREAD_COLOR)
+    # 特徴点と特徴ベクトルを計算
+    print(gray.dtype)
+    size = (100,100)
+    graya = cv2.resize(gray,size)
+    patches = image.extract_patches_2d(graya, (3, 3))
+    print(patches.shape)
+    while x<9604:
+        keypoints, descriptors= detector.detectAndCompute(patches[x], None)
+    # intからfloat32に変換 特徴量
+        descriptors = descriptors.astype(np.float32)
+    # Bag Of Visual Wordsの計算 ヒストグラム
+        bowDescriptors = bowExtractor.compute(patches[x], keypoints)
+    # 結果表示
+    className = {"0": "airplane",
+                 "1": "ferry",
+                 "2": "laptop"}
+    actual = "???"
+    if bowDescriptors[0][0] > bowDescriptors[0][1] and bowDescriptors[0][0] > bowDescriptors[0][2]:
+        actual = className["0"]
+    elif bowDescriptors[0][0] < bowDescriptors[0][1] and bowDescriptors[0][2] < bowDescriptors[0][1]:
+        actual = className["1"]
+    else:
+        actual = className["2"]
+    result = ""
+    if actual == "???":
+        result = " => unknown."
+    elif className[classId] == actual:
+        result = " => success!!"
+        success = success + 1
+    else:
+        result = " => fail"
+        fail = fail + 1
+    print("expected: ", className[classId], ", actual: ", actual, result)
+print("suceess percentage:", success/(success+fail))
+```