Question edit history

3

Corrected the problem description.

2021/01/19 01:51

Posted

porcini

Score 0

test CHANGED
File without changes
test CHANGED
@@ -10,7 +10,9 @@
 
 The problem I am stuck on is that I cannot take the detected coordinates and display the clothing image at them.
 
- In the lower part of the first source code, I am trying to output the clothing image in the part marked with an asterisk (*).
+ In the lower part of the first source code, I am trying to output the clothing image in the part marked with an **asterisk (*)**.
+
+ The intended behavior is: once the upper body has been recognized, the button is pressed and the clothing image is displayed at the Upper body coordinates.
 
 Also, the second source code basically contains the details of how the object detection is performed.
 
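The flow described in this revision (recognize the upper body, press the button, then show the clothing image at the detected coordinates) could be expressed by keeping the most recently detected rectangle in a property and reading it from the button action. The following is only a rough sketch under that assumption; `latestUpperBodyBounds` and `didDetectUpperBody(in:)` are hypothetical names that do not appear in the posted code.

```Swift
import UIKit

final class OverlaySketchViewController: UIViewController {

    // Hypothetical property: updated from the Vision completion handler
    // whenever the top label is "Upper body" (already converted to view coordinates).
    private var latestUpperBodyBounds: CGRect?

    private let clothingImageView = UIImageView(image: UIImage(named: "Upper body"))

    // Illustrative hook called from the detection callback.
    func didDetectUpperBody(in viewRect: CGRect) {
        latestUpperBodyBounds = viewRect
    }

    // Button action: place the clothing image over the last detected region.
    @IBAction func tapBtn(_ sender: Any) {
        guard let bounds = latestUpperBodyBounds else {
            print("No upper body has been detected yet")
            return
        }
        clothingImageView.frame = bounds
        if clothingImageView.superview == nil {
            view.addSubview(clothingImageView)
        }
    }
}
```

The main difference from the posted `imageset(_:identifier:)` is that the label check happens when the observation arrives (against `topLabelObservation.identifier`), not against the `name` of a freshly created `CATextLayer`, which is always nil.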

2

Changed the timing of displaying the clothing image so that it runs when the Button is pressed. Along with this, I added a Button and modified part of the source code.

2021/01/19 01:51

Posted

porcini

Score 0

test CHANGED
File without changes
test CHANGED
@@ -78,342 +78,350 @@
 
 **********************
 
- @IBOutlet weak var UIImageView: UIImageView!
+   @IBOutlet weak var UIImageView: UIImageView!
+
-
+   @IBAction func tapBtn(_ sender: Any) {
+
- func imageset(_ bounds: CGRect, identifier: String) -> UIImageView {
+ func imageset(_ bounds: CGRect, identifier: String) -> UIImageView {
+
+ let textLayer = CATextLayer()
+
+ let images = UIKit.UIImageView()
+
+ images.bounds = bounds
+
+ if textLayer.name == "Upper body"{
+
+ images.image = UIImage(named: "Upper body")
+
+ images.frame = CGRect(x: bounds.midX, y: bounds.midY, width: bounds.size.height, height: bounds.size.width)
+
+ images.center = CGPoint(x: bounds.midX, y: bounds.minY)
+
+ self.view.addSubview(images)
+
+ }else{
+
+ print("error")
+
+ }
+
+ return images
+
+ }
+
+ }
+
+ ***********************
+
+ ```
+
+ ```Swift
120
+
121
+ import UIKit
122
+
123
+ import AVFoundation
124
+
125
+ import Vision
126
+
127
+
128
+
129
+ class VisionObjectRecognitionViewController: ViewController {
130
+
131
+
132
+
133
+ private var detectionOverlay: CALayer! = nil
134
+
135
+
136
+
137
+ // Vision parts
138
+
139
+ private var requests = [VNRequest]()
140
+
141
+
142
+
143
+ @discardableResult
144
+
145
+ func setupVision() -> NSError? {
146
+
147
+ // Set up the Vision parts
148
+
149
+ let error: NSError! = nil
150
+
151
+
152
+
153
+ // Specify the ML model and the Vision model
154
+
155
+ guard let modelURL = Bundle.main.url(forResource: "MyObjectDetector7", withExtension: "mlmodelc") else {
156
+
157
+ return NSError(domain: "VisionObjectRecognitionViewController", code: -1, userInfo: [NSLocalizedDescriptionKey: "The model file is missing."])
158
+
159
+ }
160
+
161
+ do {
162
+
163
+ let visionModel = try VNCoreMLModel(for: MLModel(contentsOf: modelURL))
164
+
165
+ let objectRecognition = VNCoreMLRequest(model: visionModel, completionHandler: { (request, error) in
166
+
167
+ DispatchQueue.main.async(execute: {
168
+
169
+ // Perform all UI updates on the main queue
170
+
171
+ if let results = request.results {
172
+
173
+ self.drawVisionRequestResults(results)
174
+
175
+ }
176
+
177
+ })
178
+
179
+ })
180
+
181
+ self.requests = [objectRecognition]
182
+
183
+ } catch let error as NSError {
184
+
185
+ print("Modelが読み込めませんでした. (error)")
186
+
187
+ }
188
+
189
+
190
+
191
+ return error
192
+
193
+ }
194
+
195
+
196
+
197
+ func drawVisionRequestResults(_ results: [Any]) {
198
+
199
+ CATransaction.begin()
200
+
201
+ CATransaction.setValue(kCFBooleanTrue, forKey: kCATransactionDisableActions)
202
+
203
+ detectionOverlay.sublayers = nil // Remove the previously recognized objects
204
+
205
+ for observation in results where observation is VNRecognizedObjectObservation {
206
+
207
+ guard let objectObservation = observation as? VNRecognizedObjectObservation else {
208
+
209
+ continue
210
+
211
+ }
212
+
213
+ // Select only the label with the highest confidence
214
+
215
+ let topLabelObservation = objectObservation.labels[0] // Pick the most confident label
216
+
217
+ let objectBounds = VNImageRectForNormalizedRect(objectObservation.boundingBox, Int(bufferSize.width), Int(bufferSize.height))
218
+
219
+
220
+
221
+ let shapeLayer = self.createRoundedRectLayerWithBounds(objectBounds)
222
+
223
+
224
+
225
+ let textLayer = self.createTextSubLayerInBounds(objectBounds,
226
+
227
+ identifier: topLabelObservation.identifier,
228
+
229
+ confidence: topLabelObservation.confidence)
230
+
231
+ shapeLayer.addSublayer(textLayer)
232
+
233
+ detectionOverlay.addSublayer(shapeLayer)
234
+
235
+ }
236
+
237
+ self.updateLayerGeometry()
238
+
239
+ CATransaction.commit()
240
+
241
+ }
242
+
243
+
244
+
245
+ override func captureOutput(_ output: AVCaptureOutput, didOutput sampleBuffer: CMSampleBuffer, from connection: AVCaptureConnection) {
246
+
247
+ guard let pixelBuffer = CMSampleBufferGetImageBuffer(sampleBuffer) else {
248
+
249
+ return
250
+
251
+ }
252
+
253
+
254
+
255
+ let exifOrientation = exifOrientationFromDeviceOrientation()
256
+
257
+
258
+
259
+ let imageRequestHandler = VNImageRequestHandler(cvPixelBuffer: pixelBuffer, orientation: exifOrientation, options: [:])
260
+
261
+ do {
262
+
263
+ try imageRequestHandler.perform(self.requests)
264
+
265
+ } catch {
266
+
267
+ print(error)
268
+
269
+ }
270
+
271
+ }
272
+
273
+
274
+
275
+ override func setupAVCapture() {
276
+
277
+ super.setupAVCapture()
278
+
279
+
280
+
281
+ // Set up the Vision parts
282
+
283
+ setupLayers()
284
+
285
+ updateLayerGeometry()
286
+
287
+ setupVision()
288
+
289
+
290
+
291
+ // Start the capture session
292
+
293
+ startCaptureSession()
294
+
295
+ }
296
+
297
+
298
+
299
+ func setupLayers() {
300
+
301
+ detectionOverlay = CALayer() // Container layer for all the rendered observations
302
+
303
+ detectionOverlay.name = "DetectionOverlay"
304
+
305
+ detectionOverlay.bounds = CGRect(x: 0.0,
306
+
307
+ y: 0.0,
308
+
309
+ width: bufferSize.width,
310
+
311
+ height: bufferSize.height)
312
+
313
+ detectionOverlay.position = CGPoint(x: rootLayer.bounds.midX, y: rootLayer.bounds.midY)
314
+
315
+ rootLayer.addSublayer(detectionOverlay)
316
+
317
+ }
318
+
319
+
320
+
321
+ func updateLayerGeometry() {
322
+
323
+ let bounds = rootLayer.bounds
324
+
325
+ var scale: CGFloat
326
+
327
+
328
+
329
+ let xScale: CGFloat = bounds.size.width / bufferSize.height
330
+
331
+ let yScale: CGFloat = bounds.size.height / bufferSize.width
332
+
333
+
334
+
335
+ scale = fmax(xScale, yScale)
336
+
337
+ if scale.isInfinite {
338
+
339
+ scale = 1.0
340
+
341
+ }
342
+
343
+ CATransaction.begin()
344
+
345
+ CATransaction.setValue(kCFBooleanTrue, forKey: kCATransactionDisableActions)
346
+
347
+
348
+
349
+ // Rotate the layer into screen orientation, then scale and mirror
350
+
351
+ detectionOverlay.setAffineTransform(CGAffineTransform(rotationAngle: CGFloat(.pi / 2.0)).scaledBy(x: scale, y: -scale))
352
+
353
+ // Center the layer
354
+
355
+ detectionOverlay.position = CGPoint(x: bounds.midX, y: bounds.midY)
356
+
357
+
358
+
359
+ CATransaction.commit()
360
+
361
+
362
+
363
+ }
364
+
365
+
366
+
367
+ func createTextSubLayerInBounds(_ bounds: CGRect, identifier: String, confidence: VNConfidence) -> CATextLayer {
84
368
 
85
369
  let textLayer = CATextLayer()
86
370
 
87
- let images = UIKit.UIImageView()
88
-
89
- images.bounds = bounds
90
-
91
- if textLayer.name == "Upper body"{
371
+ textLayer.name = "Object Label"
372
+
92
-
373
+ let formattedString = NSMutableAttributedString(string: String(format: "\(identifier)\nConfidence: %.2f", confidence))
374
+
93
- images.image = UIImage(named: "Upper body")
375
+ let largeFont = UIFont(name: "Helvetica", size: 24.0)!
376
+
94
-
377
+ formattedString.addAttributes([NSAttributedString.Key.font: largeFont], range: NSRange(location: 0, length: identifier.count))
378
+
379
+ textLayer.string = formattedString
380
+
95
- images.frame = CGRect(x: bounds.midX, y: bounds.midY, width: bounds.size.height, height: bounds.size.width)
381
+ textLayer.bounds = CGRect(x: 0, y: 0, width: bounds.size.height - 10, height: bounds.size.width - 10)
96
-
382
+
97
- images.center = CGPoint(x: bounds.midX, y: bounds.minY)
383
+ textLayer.position = CGPoint(x: bounds.midX, y: bounds.midY)
98
-
384
+
99
- self.view.addSubview(images)
385
+ textLayer.shadowOpacity = 0.7
386
+
100
-
387
+ textLayer.shadowOffset = CGSize(width: 2, height: 2)
388
+
389
+ textLayer.foregroundColor = CGColor(colorSpace: CGColorSpaceCreateDeviceRGB(), components: [0.0, 0.0, 0.0, 1.0])
390
+
391
+ textLayer.contentsScale = 2.0 // retina rendering
392
+
393
+ // Rotate the layer into screen orientation, scale, and mirror it
394
+
395
+ textLayer.setAffineTransform(CGAffineTransform(rotationAngle: CGFloat(.pi / 2.0)).scaledBy(x: 1.0, y: -1.0))
396
+
397
+ return textLayer
398
+
101
- }
399
+ }
400
+
401
+
402
+
102
-
403
+ // Display a rectangle at the recognized coordinates
404
+
405
+ func createRoundedRectLayerWithBounds(_ bounds: CGRect) -> CALayer {
406
+
407
+ let shapeLayer = CALayer()
408
+
409
+ shapeLayer.bounds = bounds
410
+
411
+ shapeLayer.position = CGPoint(x: bounds.midX, y: bounds.midY)
412
+
413
+ shapeLayer.name = "Found Object"
414
+
415
+ shapeLayer.backgroundColor = CGColor(colorSpace: CGColorSpaceCreateDeviceRGB(), components: [1.0, 1.0, 1.0, 0.4])
416
+
417
+ shapeLayer.cornerRadius = 7
418
+
103
- return images
419
+ return shapeLayer
104
-
420
+
105
- }
421
+ }
106
-
422
+
107
- ***********************
423
+ }
424
+
425
+
108
426
 
109
427
  ```
110
-
111
- ```Swift
112
-
113
- import UIKit
114
-
115
- import AVFoundation
116
-
117
- import Vision
118
-
119
-
120
-
121
- class VisionObjectRecognitionViewController: ViewController {
122
-
123
-
124
-
125
- private var detectionOverlay: CALayer! = nil
126
-
127
-
128
-
129
- // Visionパーツ
130
-
131
- private var requests = [VNRequest]()
132
-
133
-
134
-
135
- @discardableResult
136
-
137
- func setupVision() -> NSError? {
138
-
139
- // Visionパーツのセットアップ
140
-
141
- let error: NSError! = nil
142
-
143
-
144
-
145
- // MLモデルの指定, Visionモデルの指定
146
-
147
- guard let modelURL = Bundle.main.url(forResource: "MyObjectDetector7", withExtension: "mlmodelc") else {
148
-
149
- return NSError(domain: "VisionObjectRecognitionViewController", code: -1, userInfo: [NSLocalizedDescriptionKey: "Modelファイルがありません."])
150
-
151
- }
152
-
153
- do {
154
-
155
- let visionModel = try VNCoreMLModel(for: MLModel(contentsOf: modelURL))
156
-
157
- let objectRecognition = VNCoreMLRequest(model: visionModel, completionHandler: { (request, error) in
158
-
159
- DispatchQueue.main.async(execute: {
160
-
161
- // メインキューで全てのUI更新を実行
162
-
163
- if let results = request.results {
164
-
165
- self.drawVisionRequestResults(results)
166
-
167
- }
168
-
169
- })
170
-
171
- })
172
-
173
- self.requests = [objectRecognition]
174
-
175
- } catch let error as NSError {
176
-
177
- print("Modelが読み込めませんでした. (error)")
178
-
179
- }
180
-
181
-
182
-
183
- return error
184
-
185
- }
186
-
187
-
188
-
189
- func drawVisionRequestResults(_ results: [Any]) {
190
-
191
- CATransaction.begin()
192
-
193
- CATransaction.setValue(kCFBooleanTrue, forKey: kCATransactionDisableActions)
194
-
195
- detectionOverlay.sublayers = nil // 古い認識したオブジェクトの値を削除
196
-
197
- for observation in results where observation is VNRecognizedObjectObservation {
198
-
199
- guard let objectObservation = observation as? VNRecognizedObjectObservation else {
200
-
201
- continue
202
-
203
- }
204
-
205
- // 最も信頼性の高いラベルのみを選択
206
-
207
- let topLabelObservation = objectObservation.labels[0] //最も信頼度の高い値を選ぶ
208
-
209
- let objectBounds = VNImageRectForNormalizedRect(objectObservation.boundingBox, Int(bufferSize.width), Int(bufferSize.height))
210
-
211
-
212
-
213
- let shapeLayer = self.createRoundedRectLayerWithBounds(objectBounds)
214
-
215
-
216
-
217
- let textLayer = self.createTextSubLayerInBounds(objectBounds,
218
-
219
- identifier: topLabelObservation.identifier,
220
-
221
- confidence: topLabelObservation.confidence)
222
-
223
- shapeLayer.addSublayer(textLayer)
224
-
225
- detectionOverlay.addSublayer(shapeLayer)
226
-
227
- }
228
-
229
- self.updateLayerGeometry()
230
-
231
- CATransaction.commit()
232
-
233
- }
234
-
235
-
236
-
237
- override func captureOutput(_ output: AVCaptureOutput, didOutput sampleBuffer: CMSampleBuffer, from connection: AVCaptureConnection) {
238
-
239
- guard let pixelBuffer = CMSampleBufferGetImageBuffer(sampleBuffer) else {
240
-
241
- return
242
-
243
- }
244
-
245
-
246
-
247
- let exifOrientation = exifOrientationFromDeviceOrientation()
248
-
249
-
250
-
251
- let imageRequestHandler = VNImageRequestHandler(cvPixelBuffer: pixelBuffer, orientation: exifOrientation, options: [:])
252
-
253
- do {
254
-
255
- try imageRequestHandler.perform(self.requests)
256
-
257
- } catch {
258
-
259
- print(error)
260
-
261
- }
262
-
263
- }
264
-
265
-
266
-
267
- override func setupAVCapture() {
268
-
269
- super.setupAVCapture()
270
-
271
-
272
-
273
- // セットアップVisionパーツ
274
-
275
- setupLayers()
276
-
277
- updateLayerGeometry()
278
-
279
- setupVision()
280
-
281
-
282
-
283
- // キャプチャセッションをスタート
284
-
285
- startCaptureSession()
286
-
287
- }
288
-
289
-
290
-
291
- func setupLayers() {
292
-
293
- detectionOverlay = CALayer() // 観測された全てのコンテナレイヤー(レンダリングを含む)
294
-
295
- detectionOverlay.name = "DetectionOverlay"
296
-
297
- detectionOverlay.bounds = CGRect(x: 0.0,
298
-
299
- y: 0.0,
300
-
301
- width: bufferSize.width,
302
-
303
- height: bufferSize.height)
304
-
305
- detectionOverlay.position = CGPoint(x: rootLayer.bounds.midX, y: rootLayer.bounds.midY)
306
-
307
- rootLayer.addSublayer(detectionOverlay)
308
-
309
- }
310
-
311
-
312
-
313
- func updateLayerGeometry() {
314
-
315
- let bounds = rootLayer.bounds
316
-
317
- var scale: CGFloat
318
-
319
-
320
-
321
- let xScale: CGFloat = bounds.size.width / bufferSize.height
322
-
323
- let yScale: CGFloat = bounds.size.height / bufferSize.width
324
-
325
-
326
-
327
- scale = fmax(xScale, yScale)
328
-
329
- if scale.isInfinite {
330
-
331
- scale = 1.0
332
-
333
- }
334
-
335
- CATransaction.begin()
336
-
337
- CATransaction.setValue(kCFBooleanTrue, forKey: kCATransactionDisableActions)
338
-
339
-
340
-
341
- //レイヤーを画面の向きにし, スケールとミラーリング
342
-
343
- detectionOverlay.setAffineTransform(CGAffineTransform(rotationAngle: CGFloat(.pi / 2.0)).scaledBy(x: scale, y: -scale))
344
-
345
- //レーヤーを中央に配置
346
-
347
- detectionOverlay.position = CGPoint(x: bounds.midX, y: bounds.midY)
348
-
349
-
350
-
351
- CATransaction.commit()
352
-
353
-
354
-
355
- }
356
-
357
-
358
-
359
- func createTextSubLayerInBounds(_ bounds: CGRect, identifier: String, confidence: VNConfidence) -> CATextLayer {
360
-
361
- let textLayer = CATextLayer()
362
-
363
- textLayer.name = "Object Label"
364
-
365
- let formattedString = NSMutableAttributedString(string: String(format: "(identifier)\nConfidence: %.2f", confidence))
366
-
367
- let largeFont = UIFont(name: "Helvetica", size: 24.0)!
368
-
369
- formattedString.addAttributes([NSAttributedString.Key.font: largeFont], range: NSRange(location: 0, length: identifier.count))
370
-
371
- textLayer.string = formattedString
372
-
373
- textLayer.bounds = CGRect(x: 0, y: 0, width: bounds.size.height - 10, height: bounds.size.width - 10)
374
-
375
- textLayer.position = CGPoint(x: bounds.midX, y: bounds.midY)
376
-
377
- textLayer.shadowOpacity = 0.7
378
-
379
- textLayer.shadowOffset = CGSize(width: 2, height: 2)
380
-
381
- textLayer.foregroundColor = CGColor(colorSpace: CGColorSpaceCreateDeviceRGB(), components: [0.0, 0.0, 0.0, 1.0])
382
-
383
- textLayer.contentsScale = 2.0 // retina rendering
384
-
385
- //レイヤーを画面の向きに回転させ, 拡大縮小してミラーリングする
386
-
387
- textLayer.setAffineTransform(CGAffineTransform(rotationAngle: CGFloat(.pi / 2.0)).scaledBy(x: 1.0, y: -1.0))
388
-
389
- return textLayer
390
-
391
- }
392
-
393
-
394
-
395
- //認識した座標に矩形を表示
396
-
397
- func createRoundedRectLayerWithBounds(_ bounds: CGRect) -> CALayer {
398
-
399
- let shapeLayer = CALayer()
400
-
401
- shapeLayer.bounds = bounds
402
-
403
- shapeLayer.position = CGPoint(x: bounds.midX, y: bounds.midY)
404
-
405
- shapeLayer.name = "Found Object"
406
-
407
- shapeLayer.backgroundColor = CGColor(colorSpace: CGColorSpaceCreateDeviceRGB(), components: [1.0, 1.0, 1.0, 0.4])
408
-
409
- shapeLayer.cornerRadius = 7
410
-
411
- return shapeLayer
412
-
413
- }
414
-
415
- }
416
-
417
-
418
-
419
- ```
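One point worth noting about the code above: `VNImageRectForNormalizedRect` returns a rectangle in capture-buffer coordinates, and those only reach the screen through the transform applied to `detectionOverlay` in `updateLayerGeometry()`. A `UIImageView` added directly with `view.addSubview`, as in `imageset(_:identifier:)`, is positioned in view coordinates, so it needs its own conversion. The sketch below is a simplified illustration of such a conversion; it ignores the 90° rotation the sample applies for portrait display, and `bufferSize` and the root view are assumed to come from the capture setup.

```Swift
import UIKit
import Vision

// Map a normalized Vision bounding box into a view's coordinate space so a
// UIImageView can be placed over the detection. Orientation handling is
// intentionally simplified (no 90° rotation as in the Apple sample).
func viewRect(for boundingBox: CGRect, bufferSize: CGSize, in rootView: UIView) -> CGRect {
    // Normalized (origin bottom-left, 0...1) -> pixel coordinates in the buffer.
    let imageRect = VNImageRectForNormalizedRect(boundingBox,
                                                 Int(bufferSize.width),
                                                 Int(bufferSize.height))

    // Scale to the view size and flip the y axis (UIKit's origin is top-left).
    let scaleX = rootView.bounds.width / bufferSize.width
    let scaleY = rootView.bounds.height / bufferSize.height
    return CGRect(x: imageRect.minX * scaleX,
                  y: rootView.bounds.height - imageRect.maxY * scaleY,
                  width: imageRect.width * scaleX,
                  height: imageRect.height * scaleY)
}
```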

1

Added a link to the sample program I am using.

2021/01/15 12:27

Posted

porcini

Score 0

test CHANGED
File without changes
test CHANGED
@@ -16,6 +16,10 @@
 
 The camera session and related setup are omitted.
 
+ **I am planning to modify the sample below so that the image can be displayed.**
+
+ 【https://developer.apple.com/documentation/vision/recognizing_objects_in_live_capture】
+
 ### Relevant source code
 
 ```Swift