Speech Sep 2018 GA (GoogleCloudPlatform#718)

sirtorry · bshaffer · commit 699de152bc06 · 2018-10-04T15:50:27.000-07:00
diff --git a/speech/README.md b/speech/README.md
@@ -52,7 +52,10 @@ To run the Speech Samples:
       transcribe-async        Transcribe an audio file asynchronously using Google Cloud Speech API
       transcribe-async-gcs    Transcribe audio asynchronously from a Storage Object using Google Cloud Speech API
       transcribe-async-words  Transcribe an audio file asynchronously and print word time offsets using Google Cloud Speech API
+      transcribe-enhanced     Transcribe an audio file, with an enhanced model, using Google Cloud Speech API
       transcribe-gcs          Transcribe audio from a Storage Object using Google Cloud Speech API
+      transcribe-model        Transcribe an audio file, with selected model, using Google Cloud Speech API
+      transcribe-punctuation  Transcribe an audio file, with proper punctuation, using Google Cloud Speech API
       transcribe-stream       Transcribe a stream of audio using Google Cloud Speech API
       transcribe-words        Transcribe an audio file and print word time offsets using Google Cloud Speech API
 
diff --git a/speech/composer.json b/speech/composer.json
@@ -1,11 +1,12 @@
 {
     "require": {
-        "google/cloud-speech": "^0.11",
+        "google/cloud-speech": "~0.17",
         "google/cloud-storage": "^1.3.1",
         "symfony/console": "^3.0"
     },
     "require-dev": {
-        "phpunit/phpunit": "~4.8"
+        "phpunit/phpunit": "^5",
+        "google/cloud-tools": "^0.8.5"
     },
     "autoload": {
         "psr-4": {
@@ -16,6 +17,9 @@
             "src/transcribe_async.php",
             "src/transcribe_async_gcs.php",
             "src/transcribe_async_words.php",
+            "src/transcribe_auto_punctuation.php",
+            "src/transcribe_enhanced_model.php",
+            "src/transcribe_model_selection.php",
             "src/transcribe_sync.php",
             "src/transcribe_sync_gcs.php",
             "src/transcribe_sync_words.php"
diff --git a/speech/speech.php b/speech/speech.php
@@ -28,6 +28,7 @@
 
 $inputDefinition = new InputDefinition([
     new InputArgument('audio-file', InputArgument::REQUIRED, 'The audio file to transcribe'),
+    new InputOption('model', null, InputOption::VALUE_REQUIRED, 'The model to use'),
     new InputOption('encoding', null, InputOption::VALUE_REQUIRED,
         'The encoding of the audio file. This is required if the encoding is ' .
         'unable to be determined. '
@@ -111,6 +112,55 @@
         ]);
     });
 
+// transcribe-model: transcribe a local file with the model passed via --model
+$application->add(new Command('transcribe-model'))
+    ->setDefinition($inputDefinition)
+    ->setDescription('Transcribe an audio file, with selected model, using Google Cloud Speech API')
+    ->setHelp(<<<EOF
+The <info>%command.name%</info> command transcribes audio from a file, with the 
+selected model, using the Google Cloud Speech API.
+
+<info>php %command.full_name% audio_file.wav --model=model_name</info>
+
+EOF
+    )
+    ->setCode(function (InputInterface $input, OutputInterface $output) {
+        $audioFile = $input->getArgument('audio-file');
+        transcribe_model_selection($audioFile, $input->getOption('model'));
+    });
+
+// transcribe-enhanced: transcribe a local file using the enhanced-model sample
+$application->add(new Command('transcribe-enhanced'))
+    ->setDefinition($inputDefinition)
+    ->setDescription('Transcribe an audio file, with an enhanced model, using Google Cloud Speech API')
+    ->setHelp(<<<EOF
+The <info>%command.name%</info> command transcribes audio from a file, with an enhanced 
+model, using the Google Cloud Speech API.
+
+<info>php %command.full_name% audio_file.wav</info>
+
+EOF
+    )
+    ->setCode(function (InputInterface $input, OutputInterface $output) {
+        transcribe_enhanced_model($input->getArgument('audio-file'));
+    });
+
+// transcribe-punctuation: transcribe a local file using the auto-punctuation sample
+$application->add(new Command('transcribe-punctuation'))
+    ->setDefinition($inputDefinition)
+    ->setDescription('Transcribe an audio file, with proper punctuation, using Google Cloud Speech API')
+    ->setHelp(<<<EOF
+The <info>%command.name%</info> command transcribes audio from a file, with 
+proper punctuation, using the Google Cloud Speech API.
+
+<info>php %command.full_name% audio_file.wav</info>
+
+EOF
+    )
+    ->setCode(function (InputInterface $input, OutputInterface $output) {
+        transcribe_auto_punctuation($input->getArgument('audio-file'));
+    });
+
 $application->add(new Command('transcribe-async'))
     ->setDefinition($inputDefinition)
     ->setDescription('Transcribe an audio file asynchronously using Google Cloud Speech API')
diff --git a/speech/src/streaming_recognize.php b/speech/src/streaming_recognize.php
@@ -18,7 +18,7 @@
 /**
  * For instructions on how to run the full sample:
  *
- * @see https://github.com/GoogleCloudPlatform/php-docs-samples/tree/master/speech/api/README.md
+ * @see https://github.com/GoogleCloudPlatform/php-docs-samples/tree/master/speech/README.md
  */
 
 namespace Google\Cloud\Samples\Speech;
@@ -28,13 +28,13 @@
 use Google\Cloud\Speech\V1\RecognitionConfig;
 use Google\Cloud\Speech\V1\StreamingRecognitionConfig;
 use Google\Cloud\Speech\V1\StreamingRecognizeRequest;
-use Google\Cloud\Speech\V1\RecognitionConfig_AudioEncoding;
+use Google\Cloud\Speech\V1\RecognitionConfig\AudioEncoding;
 
 /**
  * Transcribe an audio file using Google Cloud Speech API
  * Example:
  * ```
- * $audoEncoding =  Google\Cloud\Speech\V1\RecognitionConfig_AudioEncoding::WAV
+ * $audioEncoding = Google\Cloud\Speech\V1\RecognitionConfig\AudioEncoding::LINEAR16
  * streaming_recognize('/path/to/audiofile.wav', 'en-US');
  * ```.
  *
@@ -59,7 +59,7 @@ function streaming_recognize($audioFile, $languageCode, $encoding, $sampleRateHe
         $config->setLanguageCode($languageCode);
         $config->setSampleRateHertz($sampleRateHertz);
         // encoding must be an enum, convert from string
-        $encodingEnum = constant(RecognitionConfig_AudioEncoding::class . '::' . $encoding);
+        $encodingEnum = constant(AudioEncoding::class . '::' . $encoding);
         $config->setEncoding($encodingEnum);
 
         $strmConfig = new StreamingRecognitionConfig();
diff --git a/speech/src/transcribe_async.php b/speech/src/transcribe_async.php
@@ -18,7 +18,7 @@
 /**
  * For instructions on how to run the full sample:
  *
- * @see https://github.com/GoogleCloudPlatform/php-docs-samples/tree/master/speech/api/README.md
+ * @see https://github.com/GoogleCloudPlatform/php-docs-samples/tree/master/speech/README.md
  */
 
 namespace Google\Cloud\Samples\Speech;
diff --git a/speech/src/transcribe_async_gcs.php b/speech/src/transcribe_async_gcs.php
@@ -18,7 +18,7 @@
 /**
  * For instructions on how to run the full sample:
  *
- * @see https://github.com/GoogleCloudPlatform/php-docs-samples/tree/master/speech/api/README.md
+ * @see https://github.com/GoogleCloudPlatform/php-docs-samples/tree/master/speech/README.md
  */
 
 namespace Google\Cloud\Samples\Speech;
diff --git a/speech/src/transcribe_async_words.php b/speech/src/transcribe_async_words.php
@@ -18,7 +18,7 @@
 /**
  * For instructions on how to run the full sample:
  *
- * @see https://github.com/GoogleCloudPlatform/php-docs-samples/tree/master/speech/api/README.md
+ * @see https://github.com/GoogleCloudPlatform/php-docs-samples/tree/master/speech/README.md
  */
 
 namespace Google\Cloud\Samples\Speech;
diff --git a/speech/src/transcribe_auto_punctuation.php b/speech/src/transcribe_auto_punctuation.php
@@ -0,0 +1,72 @@
+<?php
+/**
+ * Copyright 2018 Google Inc.
+ *
+ * Licensed under the Apache License, Version 2.0 (the "License");
+ * you may not use this file except in compliance with the License.
+ * You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+/**
+ * For instructions on how to run the full sample:
+ *
+ * @see https://github.com/GoogleCloudPlatform/php-docs-samples/tree/master/speech/README.md
+ */
+
+namespace Google\Cloud\Samples\Speech;
+
+# [START speech_transcribe_auto_punctuation]
+use Google\Cloud\Speech\V1\SpeechClient;
+use Google\Cloud\Speech\V1\RecognitionAudio;
+use Google\Cloud\Speech\V1\RecognitionConfig;
+use Google\Cloud\Speech\V1\RecognitionConfig\AudioEncoding;
+
+/**
+ * Transcribe the given audio file with automatic punctuation enabled.
+ *
+ * @param string $path Path to the audio file (sent as 32000 Hz LINEAR16, en-US).
+ * @throws \RuntimeException if the audio file cannot be read.
+ */
+function transcribe_auto_punctuation($path)
+{
+    // get contents of a file into a string, failing fast if it is unreadable
+    $content = file_get_contents($path);
+    if ($content === false) {
+        throw new \RuntimeException(sprintf('Unable to read audio file: %s', $path));
+    }
+
+    // set string as audio content
+    $audio = (new RecognitionAudio())->setContent($content);
+
+    // set config
+    $config = (new RecognitionConfig())
+        ->setEncoding(AudioEncoding::LINEAR16)
+        ->setSampleRateHertz(32000)
+        ->setLanguageCode('en-US')
+        ->setEnableAutomaticPunctuation(true);
+
+    // create the speech client
+    $client = new SpeechClient();
+
+    try {
+        // make the API call and print the first alternative of each result
+        $response = $client->recognize($config, $audio);
+        foreach ($response->getResults() as $result) {
+            $mostLikely = $result->getAlternatives()[0];
+            printf('Transcript: %s' . PHP_EOL, $mostLikely->getTranscript());
+            printf('Confidence: %s' . PHP_EOL, $mostLikely->getConfidence());
+        }
+    } finally {
+        // always release the client, even if the API call throws
+        $client->close();
+    }
+}
+# [END speech_transcribe_auto_punctuation]
diff --git a/speech/src/transcribe_enhanced_model.php b/speech/src/transcribe_enhanced_model.php
@@ -0,0 +1,73 @@
+<?php
+/**
+ * Copyright 2018 Google Inc.
+ *
+ * Licensed under the Apache License, Version 2.0 (the "License");
+ * you may not use this file except in compliance with the License.
+ * You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+/**
+ * For instructions on how to run the full sample:
+ *
+ * @see https://github.com/GoogleCloudPlatform/php-docs-samples/tree/master/speech/README.md
+ */
+
+namespace Google\Cloud\Samples\Speech;
+
+# [START speech_transcribe_enhanced_model]
+use Google\Cloud\Speech\V1\SpeechClient;
+use Google\Cloud\Speech\V1\RecognitionAudio;
+use Google\Cloud\Speech\V1\RecognitionConfig;
+use Google\Cloud\Speech\V1\RecognitionConfig\AudioEncoding;
+
+/**
+ * Transcribe the given audio file using the enhanced 'phone_call' model.
+ *
+ * @param string $path Path to the audio file (sent as 8000 Hz LINEAR16, en-US).
+ * @throws \RuntimeException if the audio file cannot be read.
+ */
+function transcribe_enhanced_model($path)
+{
+    // get contents of a file into a string, failing fast if it is unreadable
+    $content = file_get_contents($path);
+    if ($content === false) {
+        throw new \RuntimeException(sprintf('Unable to read audio file: %s', $path));
+    }
+
+    // set string as audio content
+    $audio = (new RecognitionAudio())->setContent($content);
+
+    // set config
+    $config = (new RecognitionConfig())
+        ->setEncoding(AudioEncoding::LINEAR16)
+        ->setSampleRateHertz(8000)
+        ->setLanguageCode('en-US')
+        ->setUseEnhanced(true)
+        ->setModel('phone_call');
+
+    // create the speech client
+    $client = new SpeechClient();
+
+    try {
+        // make the API call and print the first alternative of each result
+        $response = $client->recognize($config, $audio);
+        foreach ($response->getResults() as $result) {
+            $mostLikely = $result->getAlternatives()[0];
+            printf('Transcript: %s' . PHP_EOL, $mostLikely->getTranscript());
+            printf('Confidence: %s' . PHP_EOL, $mostLikely->getConfidence());
+        }
+    } finally {
+        // always release the client, even if the API call throws
+        $client->close();
+    }
+}
+# [END speech_transcribe_enhanced_model]
diff --git a/speech/src/transcribe_model_selection.php b/speech/src/transcribe_model_selection.php
@@ -0,0 +1,72 @@
+<?php
+/**
+ * Copyright 2018 Google Inc.
+ *
+ * Licensed under the Apache License, Version 2.0 (the "License");
+ * you may not use this file except in compliance with the License.
+ * You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+/**
+ * For instructions on how to run the full sample:
+ *
+ * @see https://github.com/GoogleCloudPlatform/php-docs-samples/tree/master/speech/README.md
+ */
+
+namespace Google\Cloud\Samples\Speech;
+
+# [START speech_transcribe_model_selection]
+use Google\Cloud\Speech\V1\SpeechClient;
+use Google\Cloud\Speech\V1\RecognitionAudio;
+use Google\Cloud\Speech\V1\RecognitionConfig;
+use Google\Cloud\Speech\V1\RecognitionConfig\AudioEncoding;
+
+/**
+ * Transcribe the given audio file synchronously with the selected model.
+ *
+ * @param string $speechFile Path to the audio file (sent as 32000 Hz LINEAR16, en-US).
+ * @param string $model Name of the recognition model passed to setModel().
+ * @throws \RuntimeException if the audio file cannot be read.
+ */
+function transcribe_model_selection($speechFile, $model)
+{
+    // get contents of a file into a string, failing fast if it is unreadable
+    $content = file_get_contents($speechFile);
+    if ($content === false) {
+        throw new \RuntimeException(sprintf('Unable to read audio file: %s', $speechFile));
+    }
+
+    // set string as audio content
+    $audio = (new RecognitionAudio())->setContent($content);
+
+    // set config
+    $config = (new RecognitionConfig())
+        ->setEncoding(AudioEncoding::LINEAR16)
+        ->setSampleRateHertz(32000)
+        ->setLanguageCode('en-US')
+        ->setModel($model);
+
+    // create the speech client
+    $client = new SpeechClient();
+    try {
+        // make the API call and print the first alternative of each result
+        $response = $client->recognize($config, $audio);
+        foreach ($response->getResults() as $result) {
+            $mostLikely = $result->getAlternatives()[0];
+            printf('Transcript: %s' . PHP_EOL, $mostLikely->getTranscript());
+            printf('Confidence: %s' . PHP_EOL, $mostLikely->getConfidence());
+        }
+    } finally {
+        // always release the client, even if the API call throws
+        $client->close();
+    }
+}
+# [END speech_transcribe_model_selection]
diff --git a/speech/src/transcribe_sync.php b/speech/src/transcribe_sync.php
@@ -18,7 +18,7 @@
 /**
  * For instructions on how to run the full sample:
  *
- * @see https://github.com/GoogleCloudPlatform/php-docs-samples/tree/master/speech/api/README.md
+ * @see https://github.com/GoogleCloudPlatform/php-docs-samples/tree/master/speech/README.md
  */
 
 namespace Google\Cloud\Samples\Speech;
diff --git a/speech/src/transcribe_sync_gcs.php b/speech/src/transcribe_sync_gcs.php
@@ -18,7 +18,7 @@
 /**
  * For instructions on how to run the full sample:
  *
- * @see https://github.com/GoogleCloudPlatform/php-docs-samples/tree/master/speech/api/README.md
+ * @see https://github.com/GoogleCloudPlatform/php-docs-samples/tree/master/speech/README.md
  */
 
 namespace Google\Cloud\Samples\Speech;
diff --git a/speech/src/transcribe_sync_words.php b/speech/src/transcribe_sync_words.php
diff --git a/speech/test/data/commercial_mono.wav b/speech/test/data/commercial_mono.wav
diff --git a/speech/test/speechTest.php b/speech/test/speechTest.php

Original file line number	Diff line number	Diff line change
`@@ -18,7 +18,7 @@`
`18`	`18`	`/**`
`19`	`19`	`* For instructions on how to run the full sample:`
`20`	`20`	`*`
`21`		`- * @see https://github.com/GoogleCloudPlatform/php-docs-samples/tree/master/speech/api/README.md`
	`21`	`+ * @see https://github.com/GoogleCloudPlatform/php-docs-samples/tree/master/speech/README.md`
`22`	`22`	`*/`
`23`	`23`
`24`	`24`	`namespace Google\Cloud\Samples\Speech;`