-
Notifications
You must be signed in to change notification settings - Fork 1.5k
Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
Update enhanced models and auto punctuation to GA [(#1702)](GoogleCloudPlatform/python-docs-samples#1702)
* Update enhanced models and auto punctuation to GA
* Update model-selection to GA
- Loading branch information
1 parent
c810b46
commit 2795bfe
Showing
8 changed files
with
258 additions
and
7 deletions.
There are no files selected for viewing
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
2 changes: 1 addition & 1 deletion
2
packages/google-cloud-python-speech/samples/snippets/requirements.txt
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -1 +1 @@ | ||
google-cloud-speech==0.35.0 | ||
google-cloud-speech==0.36.0 |
64 changes: 64 additions & 0 deletions
64
packages/google-cloud-python-speech/samples/snippets/transcribe_auto_punctuation.py
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,64 @@ | ||
#!/usr/bin/env python | ||
|
||
# Copyright 2018 Google LLC | ||
# | ||
# Licensed under the Apache License, Version 2.0 (the "License"); | ||
# you may not use this file except in compliance with the License. | ||
# You may obtain a copy of the License at | ||
# | ||
# http://www.apache.org/licenses/LICENSE-2.0 | ||
# | ||
# Unless required by applicable law or agreed to in writing, software | ||
# distributed under the License is distributed on an "AS IS" BASIS, | ||
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. | ||
# See the License for the specific language governing permissions and | ||
# limitations under the License. | ||
|
||
"""Google Cloud Speech API sample that demonstrates auto punctuation | ||
and recognition metadata. | ||
Example usage: | ||
python transcribe_auto_punctuation.py resources/commercial_mono.wav | ||
""" | ||
|
||
import argparse | ||
import io | ||
|
||
|
||
def transcribe_file_with_auto_punctuation(path):
    """Recognize a local audio file with automatic punctuation turned on.

    The whole file at ``path`` is read into memory and submitted in a single
    ``recognize`` call. For every result in the response, the transcript of
    its first alternative is printed to stdout.

    Args:
        path: Location of the audio file to read. The request is configured
            for LINEAR16 audio at 8000 Hz in US English.
    """
    # [START speech_transcribe_auto_punctuation]
    from google.cloud import speech
    client = speech.SpeechClient()

    # path = 'resources/commercial_mono.wav'
    with io.open(path, 'rb') as wav_handle:
        audio_bytes = wav_handle.read()

    audio = speech.types.RecognitionAudio(content=audio_bytes)
    linear16 = speech.enums.RecognitionConfig.AudioEncoding.LINEAR16
    config = speech.types.RecognitionConfig(
        encoding=linear16,
        sample_rate_hertz=8000,
        language_code='en-US',
        # Enable automatic punctuation
        enable_automatic_punctuation=True)

    response = client.recognize(config, audio)

    for index, result in enumerate(response.results):
        # Only the first alternative of each result is reported.
        best = result.alternatives[0]
        print('-' * 20)
        print('First alternative of result {}'.format(index))
        print('Transcript: {}'.format(best.transcript))
    # [END speech_transcribe_auto_punctuation]
|
||
|
||
if __name__ == '__main__':
    # Reuse the module docstring as the --help description; the raw
    # formatter keeps its line breaks so the usage example stays readable.
    parser = argparse.ArgumentParser(
        description=__doc__,
        formatter_class=argparse.RawDescriptionHelpFormatter)
    # The sample reads the whole file and sends it in one synchronous
    # recognize request, so the help text must not describe streaming.
    parser.add_argument('path', help='Path to the audio file to transcribe')

    args = parser.parse_args()

    transcribe_file_with_auto_punctuation(args.path)
26 changes: 26 additions & 0 deletions
26
packages/google-cloud-python-speech/samples/snippets/transcribe_auto_punctuation_test.py
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,26 @@ | ||
# Copyright 2018, Google LLC | ||
# Licensed under the Apache License, Version 2.0 (the "License"); | ||
# you may not use this file except in compliance with the License. | ||
# You may obtain a copy of the License at | ||
# | ||
# http://www.apache.org/licenses/LICENSE-2.0 | ||
# | ||
# Unless required by applicable law or agreed to in writing, software | ||
# distributed under the License is distributed on an "AS IS" BASIS, | ||
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. | ||
# See the License for the specific language governing permissions and | ||
# limitations under the License. | ||
|
||
import os | ||
|
||
import transcribe_auto_punctuation | ||
|
||
# Directory holding the sample audio, resolved relative to this test file so
# the test does not depend on the directory pytest is launched from.
RESOURCES = os.path.join(os.path.dirname(__file__), 'resources')


def test_transcribe_file_with_auto_punctuation(capsys):
    """Run the auto punctuation sample and check the printed transcript.

    The expected text contains sentence punctuation, so the assertion only
    holds when automatic punctuation was applied to the transcript.
    """
    transcribe_auto_punctuation.transcribe_file_with_auto_punctuation(
        os.path.join(RESOURCES, 'commercial_mono.wav'))
    out, _ = capsys.readouterr()

    assert 'Okay. Sure.' in out
67 changes: 67 additions & 0 deletions
67
packages/google-cloud-python-speech/samples/snippets/transcribe_enhanced_model.py
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,67 @@ | ||
#!/usr/bin/env python | ||
|
||
# Copyright 2018 Google LLC | ||
# | ||
# Licensed under the Apache License, Version 2.0 (the "License"); | ||
# you may not use this file except in compliance with the License. | ||
# You may obtain a copy of the License at | ||
# | ||
# http://www.apache.org/licenses/LICENSE-2.0 | ||
# | ||
# Unless required by applicable law or agreed to in writing, software | ||
# distributed under the License is distributed on an "AS IS" BASIS, | ||
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. | ||
# See the License for the specific language governing permissions and | ||
# limitations under the License. | ||
|
||
"""Google Cloud Speech API sample that demonstrates enhanced models | ||
and recognition metadata. | ||
Example usage: | ||
python transcribe_enhanced_model.py resources/commercial_mono.wav | ||
""" | ||
|
||
import argparse | ||
import io | ||
|
||
|
||
def transcribe_file_with_enhanced_model(path):
    """Recognize a local audio file using the enhanced ``phone_call`` model.

    The whole file at ``path`` is read into memory and submitted in a single
    ``recognize`` call. For every result in the response, the transcript of
    its first alternative is printed to stdout.

    Args:
        path: Location of the audio file to read. The request is configured
            for LINEAR16 audio at 8000 Hz in US English.
    """
    # [START speech_transcribe_enhanced_model]
    from google.cloud import speech
    client = speech.SpeechClient()

    # path = 'resources/commercial_mono.wav'
    with io.open(path, 'rb') as wav_handle:
        audio_bytes = wav_handle.read()

    audio = speech.types.RecognitionAudio(content=audio_bytes)
    linear16 = speech.enums.RecognitionConfig.AudioEncoding.LINEAR16
    config = speech.types.RecognitionConfig(
        encoding=linear16,
        sample_rate_hertz=8000,
        language_code='en-US',
        # Enhanced models are only available to projects that
        # opt in for audio data collection.
        use_enhanced=True,
        # A model must be specified to use enhanced model.
        model='phone_call')

    response = client.recognize(config, audio)

    for index, result in enumerate(response.results):
        # Only the first alternative of each result is reported.
        best = result.alternatives[0]
        print('-' * 20)
        print('First alternative of result {}'.format(index))
        print('Transcript: {}'.format(best.transcript))
    # [END speech_transcribe_enhanced_model]
|
||
|
||
if __name__ == '__main__':
    # Reuse the module docstring as the --help description; the raw
    # formatter keeps its line breaks so the usage example stays readable.
    parser = argparse.ArgumentParser(
        description=__doc__,
        formatter_class=argparse.RawDescriptionHelpFormatter)
    # The sample reads the whole file and sends it in one synchronous
    # recognize request, so the help text must not describe streaming.
    parser.add_argument('path', help='Path to the audio file to transcribe')

    args = parser.parse_args()

    transcribe_file_with_enhanced_model(args.path)
26 changes: 26 additions & 0 deletions
26
packages/google-cloud-python-speech/samples/snippets/transcribe_enhanced_model_test.py
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,26 @@ | ||
# Copyright 2018, Google LLC | ||
# Licensed under the Apache License, Version 2.0 (the "License"); | ||
# you may not use this file except in compliance with the License. | ||
# You may obtain a copy of the License at | ||
# | ||
# http://www.apache.org/licenses/LICENSE-2.0 | ||
# | ||
# Unless required by applicable law or agreed to in writing, software | ||
# distributed under the License is distributed on an "AS IS" BASIS, | ||
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. | ||
# See the License for the specific language governing permissions and | ||
# limitations under the License. | ||
|
||
import os | ||
|
||
import transcribe_enhanced_model | ||
|
||
# Directory holding the sample audio, resolved relative to this test file so
# the test does not depend on the directory pytest is launched from.
RESOURCES = os.path.join(os.path.dirname(__file__), 'resources')


def test_transcribe_file_with_enhanced_model(capsys):
    """Run the enhanced model sample and check the printed transcript."""
    transcribe_enhanced_model.transcribe_file_with_enhanced_model(
        os.path.join(RESOURCES, 'commercial_mono.wav'))
    out, _ = capsys.readouterr()

    assert 'Chrome' in out
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters