GoogleCloudPlatform · happyhuman · Jul 20, 2018 · Jul 19, 2018 · Jul 19, 2018 · Jul 20, 2018
diff --git a/speech/cloud-client/README.rst b/speech/cloud-client/README.rst
@@ -221,7 +221,7 @@ To run this sample:
 
     $ python beta_snippets.py
 
-    usage: beta_snippets.py [-h] command path first second
+    usage: beta_snippets.py [-h] command path [first] [second]
 
     Google Cloud Speech API sample that demonstrates enhanced models
     and recognition metadata.

diff --git a/speech/cloud-client/beta_snippets.py b/speech/cloud-client/beta_snippets.py
@@ -46,7 +46,6 @@ def transcribe_file_with_enhanced_model(speech_file):
     audio = speech.types.RecognitionAudio(content=content)
     config = speech.types.RecognitionConfig(
         encoding=speech.enums.RecognitionConfig.AudioEncoding.LINEAR16,
-        sample_rate_hertz=8000,
         language_code='en-US',
         # Enhanced models are only available to projects that
         # opt in for audio data collection.
@@ -95,7 +94,6 @@ def transcribe_file_with_metadata(speech_file):
     audio = speech.types.RecognitionAudio(content=content)
     config = speech.types.RecognitionConfig(
         encoding=speech.enums.RecognitionConfig.AudioEncoding.LINEAR16,
-        sample_rate_hertz=8000,
         language_code='en-US',
         # Add this in the request to send metadata.
         metadata=metadata)
@@ -125,7 +123,6 @@ def transcribe_file_with_auto_punctuation(speech_file):
     audio = speech.types.RecognitionAudio(content=content)
     config = speech.types.RecognitionConfig(
         encoding=speech.enums.RecognitionConfig.AudioEncoding.LINEAR16,
-        sample_rate_hertz=8000,
         language_code='en-US',
         # Enable automatic punctuation
         enable_automatic_punctuation=True)
@@ -156,21 +153,18 @@ def transcribe_file_with_diarization(speech_file):
 
     config = speech.types.RecognitionConfig(
         encoding=speech.enums.RecognitionConfig.AudioEncoding.LINEAR16,
-        sample_rate_hertz=16000,
         language_code='en-US',
         enable_speaker_diarization=True,
         diarization_speaker_count=2)
 
     print('Waiting for operation to complete...')
     response = client.recognize(config, audio)
 
-    for i, result in enumerate(response.results):
-        alternative = result.alternatives[0]
-        print('-' * 20)
-        print('First alternative of result {}: {}'
-              .format(i, alternative.transcript))
-        print('Speaker Tag for the first word: {}'
-              .format(alternative.words[0].speaker_tag))
+    result = response.results[-1]
+    words_info = result.alternatives[0].words
+    pieces = ['%s (%s)' % (word_info.word, word_info.speaker_tag)
+              for word_info in words_info]
+    print(' '.join(pieces))
     # [END speech_transcribe_diarization]
 
 

diff --git a/speech/cloud-client/beta_snippets_test.py b/speech/cloud-client/beta_snippets_test.py
@@ -51,10 +51,10 @@ def test_transcribe_file_with_auto_punctuation(capsys):
 
 def test_transcribe_diarization(capsys):
     transcribe_file_with_diarization(
-        os.path.join(RESOURCES, 'Google_Gnome.wav'))
+        os.path.join(RESOURCES, 'commercial_mono.wav'))
     out, err = capsys.readouterr()
 
-    assert 'OK Google stream stranger things from Netflix to my TV' in out
+    assert "I'm (1) here (1) hi (2)" in out
 
 
 def test_transcribe_multichannel_file(capsys):

diff --git a/texttospeech/cloud-client/audio_profile.py b/texttospeech/cloud-client/audio_profile.py
@@ -18,7 +18,7 @@
 
 Example usage:
     python audio_profile.py --text "hello" --effects_profile_id
-        "telephony-class-application"
+        "telephony-class-application" --output "output.mp3"
 """
 
 import argparse