GoogleCloudPlatform · theacodes · Feb 7, 2017 · Feb 6, 2017 · Feb 7, 2017 · Feb 7, 2017
diff --git a/speech/cloud-client/README.rst b/speech/cloud-client/README.rst
@@ -93,18 +93,20 @@ To run this sample:
 
     $ python transcribe.py
 
-    usage: transcribe.py [-h] speech_file
+    usage: transcribe.py [-h] path
 
     Google Cloud Speech API sample application using the REST API for batch
     processing.
 
-    Example usage: python transcribe.py resources/audio.raw
+    Example usage:
+        python transcribe.py resources/audio.raw
+        python transcribe.py gs://cloud-samples-tests/speech/brooklyn.flac
 
     positional arguments:
-      speech_file  Full path of audio file to be recognized
+      path        File or GCS path for audio file to be recognized
 
     optional arguments:
-      -h, --help   show this help message and exit
+      -h, --help  show this help message and exit
 
 
 Transcribe async
@@ -118,18 +120,20 @@ To run this sample:
 
     $ python transcribe_async.py
 
-    usage: transcribe_async.py [-h] speech_file
+    usage: transcribe_async.py [-h] path
 
     Google Cloud Speech API sample application using the REST API for async
     batch processing.
 
-    Example usage: python transcribe_async.py resources/audio.raw
+    Example usage:
+        python transcribe_async.py resources/audio.raw
+        python transcribe_async.py gs://cloud-samples-tests/speech/brooklyn.flac
 
     positional arguments:
-      speech_file  Full path of audio file to be recognized
+      path        File or GCS path for audio file to be recognized
 
     optional arguments:
-      -h, --help   show this help message and exit
+      -h, --help  show this help message and exit
 
 
 

diff --git a/speech/cloud-client/transcribe.py b/speech/cloud-client/transcribe.py
@@ -17,7 +17,9 @@
 """Google Cloud Speech API sample application using the REST API for batch
 processing.
 
-Example usage: python transcribe.py resources/audio.raw
+Example usage:
+    python transcribe.py resources/audio.raw
+    python transcribe.py gs://cloud-samples-tests/speech/brooklyn.flac
 """
 
 # [START import_libraries]
@@ -26,12 +28,8 @@
 # [END import_libraries]
 
 
-def main(speech_file):
-    """Transcribe the given audio file.
-
-    Args:
-        speech_file: the name of the audio file.
-    """
+def transcribe_file(speech_file):
+    """Transcribe the given audio file."""
     # [START authenticating]
     # Application default credentials provided by env variable
     # GOOGLE_APPLICATION_CREDENTIALS
@@ -57,13 +55,48 @@ def main(speech_file):
     # [END send_request]
 
 
+def transcribe_gcs(gcs_uri):
+    """Transcribes the audio file specified by the gcs_uri."""
+    # [START authenticating_gcs]
+    # Application default credentials provided by env variable
+    # GOOGLE_APPLICATION_CREDENTIALS
+    from google.cloud import speech
+    speech_client = speech.Client()
+    # [END authenticating_gcs]
+
+    # [START construct_request_gcs]
+    audio_sample = speech_client.sample(
+        None,
+        source_uri=gcs_uri,
+        encoding='FLAC',
+        sample_rate=16000)
+    # [END construct_request_gcs]
+
+    # [START send_request_gcs]
+    alternatives = speech_client.speech_api.sync_recognize(audio_sample)
+    for alternative in alternatives:
+        print('Transcript: {}'.format(alternative.transcript))
+    # [END send_request_gcs]
+
+
+def main(path):
+    """Transcribe the given audio file.
+    Args:
+        path: a local audio file path, or a gs:// URI of the audio file.
+    """
+    if path.startswith('gs://'):
+        transcribe_gcs(path)
+    else:
+        transcribe_file(path)
+
+
 # [START run_application]
 if __name__ == '__main__':
     parser = argparse.ArgumentParser(
         description=__doc__,
         formatter_class=argparse.RawDescriptionHelpFormatter)
     parser.add_argument(
-        'speech_file', help='Full path of audio file to be recognized')
+        'path', help='File or GCS path for audio file to be recognized')
     args = parser.parse_args()
-    main(args.speech_file)
+    main(args.path)
     # [END run_application]
diff --git a/speech/cloud-client/transcribe_async.py b/speech/cloud-client/transcribe_async.py
@@ -17,7 +17,9 @@
 """Google Cloud Speech API sample application using the REST API for async
 batch processing.
 
-Example usage: python transcribe_async.py resources/audio.raw
+Example usage:
+    python transcribe_async.py resources/audio.raw
+    python transcribe_async.py gs://cloud-samples-tests/speech/brooklyn.flac
 """
 
 # [START import_libraries]
@@ -27,12 +29,8 @@
 # [END import_libraries]
 
 
-def main(speech_file):
-    """Transcribe the given audio file asynchronously.
-
-    Args:
-        speech_file: the name of the audio file.
-    """
+def transcribe_file(speech_file):
+    """Transcribe the given audio file asynchronously."""
     # [START authenticating]
     # Application default credentials provided by env variable
     # GOOGLE_APPLICATION_CREDENTIALS
@@ -71,13 +69,62 @@ def main(speech_file):
     # [END send_request]
 
 
+def transcribe_gcs(gcs_uri):
+    """Asynchronously transcribes the audio file specified by the gcs_uri."""
+    # [START authenticating_gcs]
+    # Application default credentials provided by env variable
+    # GOOGLE_APPLICATION_CREDENTIALS
+    from google.cloud import speech
+    speech_client = speech.Client()
+    # [END authenticating_gcs]
+
+    # [START construct_request_gcs]
+    # References the audio by its GCS URI; no content is passed inline
+    audio_sample = speech_client.sample(
+        content=None,
+        source_uri=gcs_uri,
+        encoding='FLAC',
+        sample_rate=16000)
+    # [END construct_request_gcs]
+
+    # [START send_request_gcs]
+    operation = speech_client.speech_api.async_recognize(audio_sample)
+
+    retry_count = 100
+    while retry_count > 0 and not operation.complete:
+        retry_count -= 1
+        time.sleep(2)
+        operation.poll()
+
+    if not operation.complete:
+        print("Operation not complete and retry limit reached.")
+        return
+
+    alternatives = operation.results
+    for alternative in alternatives:
+        print('Transcript: {}'.format(alternative.transcript))
+        print('Confidence: {}'.format(alternative.confidence))
+    # [END send_request_gcs]
+
+
+def main(path):
+    """Transcribe the given audio file.
+    Args:
+        path: a local audio file path, or a gs:// URI of the audio file.
+    """
+    if path.startswith('gs://'):
+        transcribe_gcs(path)
+    else:
+        transcribe_file(path)
+
+
 # [START run_application]
 if __name__ == '__main__':
     parser = argparse.ArgumentParser(
         description=__doc__,
         formatter_class=argparse.RawDescriptionHelpFormatter)
     parser.add_argument(
-        'speech_file', help='Full path of audio file to be recognized')
+        'path', help='File or GCS path for audio file to be recognized')
     args = parser.parse_args()
-    main(args.speech_file)
+    main(args.path)
     # [END run_application]
diff --git a/speech/cloud-client/transcribe_async_test.py b/speech/cloud-client/transcribe_async_test.py
@@ -16,8 +16,15 @@
 from transcribe_async import main
 
 
-def test_main(resource, capsys):
+def test_transcribe(resource, capsys):
     main(resource('audio.raw'))
     out, err = capsys.readouterr()
 
     assert re.search(r'how old is the Brooklyn Bridge', out, re.DOTALL | re.I)
+
+
+def test_transcribe_gcs(resource, capsys):
+    main('gs://cloud-samples-tests/speech/brooklyn.flac')
+    out, err = capsys.readouterr()
+
+    assert re.search(r'how old is the Brooklyn Bridge', out, re.DOTALL | re.I)
diff --git a/speech/cloud-client/transcribe_test.py b/speech/cloud-client/transcribe_test.py
@@ -21,3 +21,10 @@ def test_main(resource, capsys):
     out, err = capsys.readouterr()
 
     assert re.search(r'how old is the Brooklyn Bridge', out, re.DOTALL | re.I)
+
+
+def test_main_gcs(resource, capsys):
+    main('gs://cloud-samples-tests/speech/brooklyn.flac')
+    out, err = capsys.readouterr()
+
+    assert re.search(r'how old is the Brooklyn Bridge', out, re.DOTALL | re.I)