#!/usr/bin/env python

# Copyright 2017 Google Inc. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
#      http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.

"""Google Cloud Speech API sample application using the REST API for async
batch processing.
Example usage:
    python transcribe_async.py resources/audio.raw
    python transcribe_async.py gs://cloud-samples-tests/speech/vr.flac
"""

import argparse
import io


# [START speech_transcribe_async]
def transcribe_file(speech_file):
    """Transcribe a local audio file with a long-running recognition request.

    The file is read fully into memory and sent inline with the request,
    configured as LINEAR16 audio at 16000 Hz with language code "en-US".
    The call blocks for up to 90 seconds waiting for the operation to
    finish, then prints the transcript and confidence of the first
    alternative of every result.

    Args:
        speech_file: Path of the local audio file to transcribe.
    """
    from google.cloud import speech

    client = speech.SpeechClient()

    # [START speech_python_migration_async_request]
    with io.open(speech_file, "rb") as audio_file:
        content = audio_file.read()

    # Note that transcription is limited to a 60 seconds audio file.
    # Use a GCS file for audio longer than 1 minute.
    audio = speech.RecognitionAudio(content=content)

    config = speech.RecognitionConfig(
        encoding=speech.RecognitionConfig.AudioEncoding.LINEAR16,
        sample_rate_hertz=16000,
        language_code="en-US",
    )

    # [START speech_python_migration_async_response]

    operation = client.long_running_recognize(config=config, audio=audio)
    # [END speech_python_migration_async_request]

    print("Waiting for operation to complete...")
    # NOTE(review): presumably raises if the operation is not done within
    # the timeout -- confirm against the google-api-core Operation docs.
    response = operation.result(timeout=90)

    # Each result is for a consecutive portion of the audio. Iterate through
    # them to get the transcripts for the entire audio file.
    for result in response.results:
        # The first alternative is the most likely one for this portion.
        best = result.alternatives[0]
        print("Transcript: {}".format(best.transcript))
        print("Confidence: {}".format(best.confidence))
    # [END speech_python_migration_async_response]


# [END speech_transcribe_async]


# [START speech_transcribe_async_gcs]
def transcribe_gcs(gcs_uri):
    """Asynchronously transcribe the audio file specified by ``gcs_uri``.

    The audio is referenced by URI rather than uploaded, and is configured
    as FLAC at 16000 Hz with language code "en-US". The call blocks for up
    to 90 seconds waiting for the operation to finish, then prints the
    transcript and confidence of the first alternative of every result.

    Args:
        gcs_uri: URI of the audio object, passed to ``RecognitionAudio``
            as ``uri`` (the command line routes ``gs://`` paths here).
    """
    from google.cloud import speech

    client = speech.SpeechClient()

    audio = speech.RecognitionAudio(uri=gcs_uri)
    config = speech.RecognitionConfig(
        encoding=speech.RecognitionConfig.AudioEncoding.FLAC,
        sample_rate_hertz=16000,
        language_code="en-US",
    )

    operation = client.long_running_recognize(config=config, audio=audio)

    print("Waiting for operation to complete...")
    response = operation.result(timeout=90)

    # Each result is for a consecutive portion of the audio. Iterate through
    # them to get the transcripts for the entire audio file.
    for result in response.results:
        # The first alternative is the most likely one for this portion.
        best = result.alternatives[0]
        print("Transcript: {}".format(best.transcript))
        print("Confidence: {}".format(best.confidence))


# [END speech_transcribe_async_gcs]


def main():
    """Parse the command line and transcribe the given path.

    Paths starting with ``gs://`` go to ``transcribe_gcs``; anything else
    is treated as a local file and goes to ``transcribe_file``.
    """
    parser = argparse.ArgumentParser(
        description=__doc__, formatter_class=argparse.RawDescriptionHelpFormatter
    )
    parser.add_argument("path", help="File or GCS path for audio file to be recognized")
    args = parser.parse_args()
    if args.path.startswith("gs://"):
        transcribe_gcs(args.path)
    else:
        transcribe_file(args.path)


if __name__ == "__main__":
    main()