Vision PDF/OCR (GoogleCloudPlatform#622)

sirtorry · bshaffer · commit f49b65975b21 · 2018-08-15T12:39:30.000-07:00
diff --git a/vision/README.md b/vision/README.md
@@ -39,6 +39,7 @@ Vision API from PHP.
   text           Detect text in an image using Google Cloud Vision API
   crop-hints     Detect crop hints in an image using Google Cloud Vision API
   document-text  Detect document text in an image using Google Cloud Vision API
+  pdf            Detect text in a PDF/TIFF using Google Cloud Vision API
   web            Detect web entities in an image using Google Cloud Vision API
   web-geo        Detect web entities in an image with geo metadata using
                  Google Cloud Vision API
diff --git a/vision/composer.json b/vision/composer.json
@@ -2,7 +2,7 @@
     "name": "google/vision",
     "type": "project",
     "require": {
-        "google/cloud-vision": "^0.10",
+        "google/cloud-vision": "^0.13",
         "google/cloud-storage": "^1.3",
         "symfony/console": "^3.1"
     },
@@ -32,7 +32,8 @@
             "src/detect_web.php",
             "src/detect_web_gcs.php",
             "src/detect_web_with_geo_metadata.php",
-            "src/detect_web_with_geo_metadata_gcs.php"
+            "src/detect_web_with_geo_metadata_gcs.php",
+            "src/detect_pdf_gcs.php"
         ]
     },
     "require-dev": {
diff --git a/vision/composer.lock b/vision/composer.lock
diff --git a/vision/src/detect_crop_hints.php b/vision/src/detect_crop_hints.php
@@ -47,5 +47,7 @@ function detect_crop_hints($path)
     } else {
         print('No crop hints' . PHP_EOL);
     }
+    
+    $imageAnnotator->close();
 }
 // [END vision_crop_hint_detection]
diff --git a/vision/src/detect_crop_hints_gcs.php b/vision/src/detect_crop_hints_gcs.php
@@ -46,5 +46,7 @@ function detect_crop_hints_gcs($path)
     } else {
         print('No crop hints' . PHP_EOL);
     }
+
+    $imageAnnotator->close();
 }
 // [END vision_crop_hint_detection_gcs]
diff --git a/vision/src/detect_document_text.php b/vision/src/detect_document_text.php
@@ -63,5 +63,7 @@ function detect_document_text($path)
     } else {
         print('No text found' . PHP_EOL);
     }
+
+    $imageAnnotator->close();
 }
 // [END vision_fulltext_detection]
diff --git a/vision/src/detect_document_text_gcs.php b/vision/src/detect_document_text_gcs.php
@@ -63,5 +63,7 @@ function detect_document_text_gcs($path)
     } else {
         print('No text found' . PHP_EOL);
     }
+
+    $imageAnnotator->close();
 }
 // [END vision_fulltext_detection_gcs]
diff --git a/vision/src/detect_face.php b/vision/src/detect_face.php
@@ -103,6 +103,8 @@ function detect_face($path, $outFile = null)
         printf('Output image written to %s' . PHP_EOL, $outFile);
         # [END vision_face_detection_tutorial_run_application]
     }
+
+    $imageAnnotator->close();
     // [START vision_face_detection]
 }
 // [END vision_face_detection]
diff --git a/vision/src/detect_face_gcs.php b/vision/src/detect_face_gcs.php
@@ -54,5 +54,7 @@ function detect_face_gcs($path)
         print('Bounds: ' . join(', ',$bounds) . PHP_EOL);
         print(PHP_EOL);
     }
+
+    $imageAnnotator->close();
 }
 // [END vision_face_detection_gcs]
diff --git a/vision/src/detect_image_property.php b/vision/src/detect_image_property.php
@@ -40,5 +40,7 @@ function detect_image_property($path)
         printf("Blue: %s" . PHP_EOL, $color->getBlue());
         print(PHP_EOL);
     }
+
+    $imageAnnotator->close();
 }
 // [END vision_image_property_detection]
diff --git a/vision/src/detect_image_property_gcs.php b/vision/src/detect_image_property_gcs.php
@@ -44,5 +44,7 @@ function detect_image_property_gcs($path)
     } else {
         print('No Results.' . PHP_EOL);
     }
+
+    $imageAnnotator->close();
 }
 // [END vision_image_property_detection_gcs]
diff --git a/vision/src/detect_label.php b/vision/src/detect_label.php
@@ -39,5 +39,7 @@ function detect_label($path)
     } else {
         print('No label found' . PHP_EOL);
     }
+
+    $imageAnnotator->close();
 }
 // [END vision_label_detection]
diff --git a/vision/src/detect_label_gcs.php b/vision/src/detect_label_gcs.php
@@ -38,5 +38,7 @@ function detect_label_gcs($path)
     } else {
         print('No label found' . PHP_EOL);
     }
+
+    $imageAnnotator->close();
 }
 // [END vision_label_detection_gcs]
diff --git a/vision/src/detect_landmark.php b/vision/src/detect_landmark.php
@@ -35,5 +35,7 @@ function detect_landmark($path)
     foreach ($landmarks as $landmark) {
         print($landmark->getDescription() . PHP_EOL);
     }
+
+    $imageAnnotator->close();
 }
 // [END vision_landmark_detection]
diff --git a/vision/src/detect_landmark_gcs.php b/vision/src/detect_landmark_gcs.php
@@ -34,5 +34,7 @@ function detect_landmark_gcs($path)
     foreach ($landmarks as $landmark) {
         print($landmark->getDescription() . PHP_EOL);
     }
+
+    $imageAnnotator->close();
 }
 // [END vision_landmark_detection_gcs]
diff --git a/vision/src/detect_logo.php b/vision/src/detect_logo.php
@@ -35,5 +35,7 @@ function detect_logo($path)
     foreach ($logos as $logo) {
         print($logo->getDescription() . PHP_EOL);
     }
+
+    $imageAnnotator->close();
 }
 // [END vision_logo_detection]
diff --git a/vision/src/detect_logo_gcs.php b/vision/src/detect_logo_gcs.php
@@ -34,5 +34,7 @@ function detect_logo_gcs($path)
     foreach ($logos as $logo) {
         print($logo->getDescription() . PHP_EOL);
     }
+
+    $imageAnnotator->close();
 }
 // [END vision_logo_detection_gcs]
diff --git a/vision/src/detect_pdf_gcs.php b/vision/src/detect_pdf_gcs.php
@@ -0,0 +1,107 @@
+<?php
+/**
+ * Copyright 2018 Google Inc.
+ *
+ * Licensed under the Apache License, Version 2.0 (the "License");
+ * you may not use this file except in compliance with the License.
+ * You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+// [START vision_text_detection_pdf_gcs]
+namespace Google\Cloud\Samples\Vision;
+
+use Google\Cloud\Storage\StorageClient;
+use Google\Cloud\Vision\V1\AnnotateFileResponse;
+use Google\Cloud\Vision\V1\AsyncAnnotateFileRequest;
+use Google\Cloud\Vision\V1\Feature;
+use Google\Cloud\Vision\V1\Feature_Type;
+use Google\Cloud\Vision\V1\GcsDestination;
+use Google\Cloud\Vision\V1\GcsSource;
+use Google\Cloud\Vision\V1\ImageAnnotatorClient;
+use Google\Cloud\Vision\V1\InputConfig;
+use Google\Cloud\Vision\V1\OutputConfig;
+
+// $path = 'gs://path/to/your/document.pdf'
+// $output = 'gs://path/to/store/results/'
+
+/**
+ * Run asynchronous document text detection (OCR) on a PDF or TIFF file stored
+ * in Cloud Storage, list the result files written under $output, and print the
+ * text contained in the first result file.
+ *
+ * @param string $path   GCS URI of the file to annotate,
+ *                       e.g. 'gs://my-bucket/document.pdf'.
+ * @param string $output GCS URI prefix the JSON results are written to,
+ *                       e.g. 'gs://my-bucket/ocr-output/'.
+ *
+ * @throws \InvalidArgumentException if $output is not of the form
+ *                                   gs://bucket/prefix.
+ * @throws \RuntimeException         if the operation fails or no result file
+ *                                   is found under $output.
+ */
+function detect_pdf_gcs($path, $output)
+{
+    # split $output into bucket name and object prefix up front, so that a
+    # malformed destination is rejected before the long-running request starts.
+    if (preg_match('/^gs:\/\/([a-z0-9\._\-]+)\/(\S+)$/', $output, $match) !== 1) {
+        throw new \InvalidArgumentException(sprintf(
+            'Expected $output to look like gs://bucket/prefix, got "%s"',
+            $output
+        ));
+    }
+    $bucketName = $match[1];
+    $prefix = $match[2];
+
+    # select ocr feature
+    $feature = (new Feature())
+        ->setType(Feature_Type::DOCUMENT_TEXT_DETECTION);
+
+    # set $path (file to OCR) as source
+    $gcsSource = (new GcsSource())
+        ->setUri($path);
+    # supported mime_types are: 'application/pdf' and 'image/tiff'.
+    # anything that does not end in .tif/.tiff is treated as a PDF.
+    $mimeType = preg_match('/\.tiff?$/i', $path) === 1
+        ? 'image/tiff'
+        : 'application/pdf';
+    $inputConfig = (new InputConfig())
+        ->setGcsSource($gcsSource)
+        ->setMimeType($mimeType);
+
+    # set $output as destination
+    $gcsDestination = (new GcsDestination())
+        ->setUri($output);
+    # how many pages should be grouped into each json output file.
+    $batchSize = 2;
+    $outputConfig = (new OutputConfig())
+        ->setGcsDestination($gcsDestination)
+        ->setBatchSize($batchSize);
+
+    # prepare request using configs set above
+    $request = (new AsyncAnnotateFileRequest())
+        ->setFeatures([$feature])
+        ->setInputConfig($inputConfig)
+        ->setOutputConfig($outputConfig);
+    $requests = [$request];
+
+    $imageAnnotator = new ImageAnnotatorClient();
+    try {
+        # make request
+        $operation = $imageAnnotator->asyncBatchAnnotateFiles($requests);
+        print('Waiting for operation to finish.' . PHP_EOL);
+        $operation->pollUntilComplete();
+
+        # do not go looking for output files if the operation itself failed.
+        if (!$operation->operationSucceeded()) {
+            $error = $operation->getError();
+            throw new \RuntimeException(
+                'Annotation of ' . $path . ' failed: ' .
+                ($error ? $error->getMessage() : 'operation did not succeed')
+            );
+        }
+
+        # once the request has completed and the output has been
+        # written to GCS, we can list all the output files.
+        $storage = new StorageClient();
+        $bucket = $storage->bucket($bucketName);
+        $objects = $bucket->objects(['prefix' => $prefix]);
+
+        # list objects with the given prefix and remember the first result
+        # file for the sample below. Only *.json objects are considered:
+        # NOTE(review): the listing can presumably also contain non-result
+        # objects such as a folder placeholder for the prefix - confirm.
+        print('Output files:' . PHP_EOL);
+        $firstObject = null;
+        foreach ($objects as $object) {
+            print($object->name() . PHP_EOL);
+            if ($firstObject === null && substr($object->name(), -5) === '.json') {
+                $firstObject = $object;
+            }
+        }
+        if ($firstObject === null) {
+            throw new \RuntimeException(
+                'No JSON output files found under ' . $output
+            );
+        }
+
+        # process the first output file from GCS.
+        # since we specified batch_size=2, the first response contains
+        # the first two pages of the input file.
+        $jsonString = $firstObject->downloadAsString();
+        $firstBatch = new AnnotateFileResponse();
+        $firstBatch->mergeFromJsonString($jsonString);
+
+        # get annotation and print text; responses without a full text
+        # annotation are skipped rather than dereferenced.
+        foreach ($firstBatch->getResponses() as $response) {
+            $annotation = $response->getFullTextAnnotation();
+            if ($annotation !== null) {
+                print($annotation->getText());
+            }
+        }
+    } finally {
+        # release the client even when a call above throws.
+        $imageAnnotator->close();
+    }
+}
+// [END vision_text_detection_pdf_gcs]
diff --git a/vision/src/detect_safe_search.php b/vision/src/detect_safe_search.php
@@ -46,5 +46,7 @@ function detect_safe_search($path)
     printf("Spoof: %s" . PHP_EOL, $likelihoodName[$spoof]);
     printf("Violence: %s" . PHP_EOL, $likelihoodName[$violence]);
     printf("Racy: %s" . PHP_EOL, $likelihoodName[$racy]);
+
+    $imageAnnotator->close();
 }
 // [END vision_safe_search_detection]
diff --git a/vision/src/detect_safe_search_gcs.php b/vision/src/detect_safe_search_gcs.php
@@ -49,5 +49,7 @@ function detect_safe_search_gcs($path)
     } else {
         print('No Results.' . PHP_EOL);
     }
+
+    $imageAnnotator->close();
 }
 // [END vision_safe_search_detection_gcs]
diff --git a/vision/src/detect_text.php b/vision/src/detect_text.php
@@ -43,5 +43,7 @@ function detect_text($path)
         }
         print('Bounds: ' . join(', ',$bounds) . PHP_EOL);
     }
+
+    $imageAnnotator->close();
 }
 // [END vision_text_detection]
diff --git a/vision/src/detect_text_gcs.php b/vision/src/detect_text_gcs.php
@@ -42,5 +42,7 @@ function detect_text_gcs($path)
         }
         print('Bounds: ' . join(', ',$bounds) . PHP_EOL);
     }
+
+    $imageAnnotator->close();
 }
 // [END vision_text_detection_gcs]
diff --git a/vision/src/detect_web.php b/vision/src/detect_web.php
@@ -79,5 +79,7 @@ function detect_web($path)
             $entity->getDescription(),
             $entity->getScore());
     }
+
+    $imageAnnotator->close();
 }
 // [END vision_web_detection]
diff --git a/vision/src/detect_web_gcs.php b/vision/src/detect_web_gcs.php
@@ -81,5 +81,7 @@ function detect_web_gcs($path)
     } else {
         print('No Results.' . PHP_EOL);
     }
+
+    $imageAnnotator->close();
 }
 // [END vision_web_detection_gcs]
diff --git a/vision/src/detect_web_with_geo_metadata.php b/vision/src/detect_web_with_geo_metadata.php
@@ -52,5 +52,7 @@ function detect_web_with_geo_metadata($path)
             print(PHP_EOL);
         }
     }
+
+    $imageAnnotator->close();
 }
 // [END vision_web_detection_include_geo]
diff --git a/vision/src/detect_web_with_geo_metadata_gcs.php b/vision/src/detect_web_with_geo_metadata_gcs.php
@@ -53,5 +53,7 @@ function detect_web_with_geo_metadata_gcs($path)
     } else {
         print('No Results.' . PHP_EOL);
     }
+
+    $imageAnnotator->close();
 }
 // [END vision_web_detection_include_geo_gcs]
diff --git a/vision/test/visionTest.php b/vision/test/visionTest.php
@@ -271,6 +271,16 @@ public function testDocumentTextCommandGcs()
         $this->assertContains('Bounds:', $output);
     }
 
+    /**
+     * Runs the `pdf` command on HodgeConj.pdf from the test bucket, writing
+     * results under OCR_PDF_TEST_OUTPUT/, and checks that the command output
+     * contains the 'Output files:' heading.
+     */
+    public function testPdfGcs()
+    {
+        $this->requireCloudStorage();
+
+        // Source and destination both live in the configured test bucket.
+        $bucketUri = 'gs://' . $this->bucketName;
+        $commandOutput = $this->runCommand(
+            'pdf',
+            $bucketUri . '/HodgeConj.pdf',
+            $bucketUri . '/OCR_PDF_TEST_OUTPUT/'
+        );
+
+        $this->assertContains('Output files:', $commandOutput);
+    }
+
     public function testDetectWebNoGeoCommand()
     {
         $path = __DIR__ . '/data/geotagged.jpg';
diff --git a/vision/vision.php b/vision/vision.php

Original file line number	Diff line number	Diff line change
`@@ -47,5 +47,7 @@ function detect_crop_hints($path)`
`47`	`47`	`} else {`
`48`	`48`	`print('No crop hints' . PHP_EOL);`
`49`	`49`	`}`
	`50`	`+`
	`51`	`+ $imageAnnotator->close();`
`50`	`52`	`}`
`51`	`53`	`// [END vision_crop_hint_detection]`
Original file line number	Diff line number	Diff line change
`@@ -46,5 +46,7 @@ function detect_crop_hints_gcs($path)`
`46`	`46`	`} else {`
`47`	`47`	`print('No crop hints' . PHP_EOL);`
`48`	`48`	`}`
	`49`	`+`
	`50`	`+ $imageAnnotator->close();`
`49`	`51`	`}`
`50`	`52`	`// [END vision_crop_hint_detection_gcs]`
Original file line number	Diff line number	Diff line change
`@@ -63,5 +63,7 @@ function detect_document_text($path)`
`63`	`63`	`} else {`
`64`	`64`	`print('No text found' . PHP_EOL);`
`65`	`65`	`}`
	`66`	`+`
	`67`	`+ $imageAnnotator->close();`
`66`	`68`	`}`
`67`	`69`	`// [END vision_fulltext_detection]`
Original file line number	Diff line number	Diff line change
`@@ -103,6 +103,8 @@ function detect_face($path, $outFile = null)`
`103`	`103`	`printf('Output image written to %s' . PHP_EOL, $outFile);`
`104`	`104`	`# [END vision_face_detection_tutorial_run_application]`
`105`	`105`	`}`
	`106`	`+`
	`107`	`+ $imageAnnotator->close();`
`106`	`108`	`// [START vision_face_detection]`
`107`	`109`	`}`
`108`	`110`	`// [END vision_face_detection]`
Original file line number	Diff line number	Diff line change
`@@ -54,5 +54,7 @@ function detect_face_gcs($path)`
`54`	`54`	`print('Bounds: ' . join(', ',$bounds) . PHP_EOL);`
`55`	`55`	`print(PHP_EOL);`
`56`	`56`	`}`
	`57`	`+`
	`58`	`+ $imageAnnotator->close();`
`57`	`59`	`}`
`58`	`60`	`// [END vision_face_detection_gcs]`
Original file line number	Diff line number	Diff line change
`@@ -40,5 +40,7 @@ function detect_image_property($path)`
`40`	`40`	`printf("Blue: %s" . PHP_EOL, $color->getBlue());`
`41`	`41`	`print(PHP_EOL);`
`42`	`42`	`}`
	`43`	`+`
	`44`	`+ $imageAnnotator->close();`
`43`	`45`	`}`
`44`	`46`	`// [END vision_image_property_detection]`
Original file line number	Diff line number	Diff line change
`@@ -44,5 +44,7 @@ function detect_image_property_gcs($path)`
`44`	`44`	`} else {`
`45`	`45`	`print('No Results.' . PHP_EOL);`
`46`	`46`	`}`
	`47`	`+`
	`48`	`+ $imageAnnotator->close();`
`47`	`49`	`}`
`48`	`50`	`// [END vision_image_property_detection_gcs]`
Original file line number	Diff line number	Diff line change
`@@ -39,5 +39,7 @@ function detect_label($path)`
`39`	`39`	`} else {`
`40`	`40`	`print('No label found' . PHP_EOL);`
`41`	`41`	`}`
	`42`	`+`
	`43`	`+ $imageAnnotator->close();`
`42`	`44`	`}`
`43`	`45`	`// [END vision_label_detection]`
Original file line number	Diff line number	Diff line change
`@@ -38,5 +38,7 @@ function detect_label_gcs($path)`
`38`	`38`	`} else {`
`39`	`39`	`print('No label found' . PHP_EOL);`
`40`	`40`	`}`
	`41`	`+`
	`42`	`+ $imageAnnotator->close();`
`41`	`43`	`}`
`42`	`44`	`// [END vision_label_detection_gcs]`
Original file line number	Diff line number	Diff line change
`@@ -35,5 +35,7 @@ function detect_landmark($path)`
`35`	`35`	`foreach ($landmarks as $landmark) {`
`36`	`36`	`print($landmark->getDescription() . PHP_EOL);`
`37`	`37`	`}`
	`38`	`+`
	`39`	`+ $imageAnnotator->close();`
`38`	`40`	`}`
`39`	`41`	`// [END vision_landmark_detection]`