質問編集履歴

コードの記載を修正

2022/03/19 05:59

投稿

Shimizukei

スコア6

test CHANGED Viewed

File without changes

test CHANGED Viewed

@@ -5,29 +5,54 @@
 [https://hituji-ws.com/code/python/python-gcp-ocr/](https://hituji-ws.com/code/python/python-gcp-ocr/)
 ```
+import requests
+import base64
-from pathlib import Path
+import json
-from google.cloud import vision
+API_KEY = ''
+GOOGLE_CLOUD_VISION_API_URL = 'https://vision.googleapis.com/v1/images:annotate?key='
+# TEXT_DETECTION: 比較的短いテキスト向け
-def render_doc_text(filein):
+# DOCUMENT_TEXT_DETECTION: 文書などテキスト量の多い画像向け
+DETECTION_TYPE = "DOCUMENT_TEXT_DETECTION"
+def request_cloud_vison_api(image_base64, type="DOCUMENT_TEXT_DETECTION"):
+    """ http のリクエストでVisionAPIにアクセス """
+    api_url = GOOGLE_CLOUD_VISION_API_URL + API_KEY
+    req_body = json.dumps({
+        'requests': [{
+            'image': {
+                'content': image_base64.decode('utf-8')
+            },
+            'features': [{
+                'type': type,
+                'maxResults': 10,
+            }]
+        }]
+    })
-    client = vision.ImageAnnotatorClient()
+    res = requests.post(api_url, data=req_body)
+    return res.json()
-    p = Path(__file__).parent / filein
-    with p.open('rb') as image_file:
-        content = image_file.read()
+def img_to_base64(filepath):
+    """ 画像データをエンコード """
+    with open(filepath, 'rb') as img:
+        img_byte = img.read()
-    image = vision.Image(content=content)
+    return base64.b64encode(img_byte)
+def render_doc_text(file_path):
+    result = request_cloud_vison_api(image_base64=img_to_base64(file_path),
+                                     type=DETECTION_TYPE)
     data_list = []
-    response = client.document_text_detection(image=image)
-    document = response.full_text_annotation
+    # データの取得: textAnnotations には座標とテキスト、fullTextAnnotation にはテキスト全体が入る
-    for page in document.pages:
+    result_list = result["responses"][0]["textAnnotations"]
-        for block in page.blocks:
+    for d in result_list:
-            for paragraph in block.paragraphs:
-                for word in paragraph.words:
-                    box = [{'x':v.x, 'y':v.y} for v in word.bounding_box.vertices]
+        data_list.append([d['boundingPoly']['vertices'], d['description']])
-                    text = [symbol.text for symbol in word.symbols]
+    # 1つ目の要素は検出されたテキスト全体なので除外する
-                    data_list.append([box, ''.join(text)])
+    data_list = data_list[1:len(data_list)]
     return data_list
 ```

Google Cloud Platform Django Python