Skip to content

Commit 2a1a539

Browse files
dizcology authored and Jon Wayne Parrott committed
add word time offsets to async sample (#1042)
1 parent c9209ba commit 2a1a539

File tree

2 files changed

+22
-1
lines changed

2 files changed

+22
-1
lines changed

speech/cloud-client/transcribe_async.py

Lines changed: 11 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -79,7 +79,8 @@ def transcribe_gcs(gcs_uri):
7979
config = types.RecognitionConfig(
8080
encoding=enums.RecognitionConfig.AudioEncoding.FLAC,
8181
sample_rate_hertz=16000,
82-
language_code='en-US')
82+
language_code='en-US',
83+
enable_word_time_offsets=True)
8384

8485
operation = client.long_running_recognize(config, audio)
8586

@@ -96,6 +97,15 @@ def transcribe_gcs(gcs_uri):
9697
for alternative in alternatives:
9798
print('Transcript: {}'.format(alternative.transcript))
9899
print('Confidence: {}'.format(alternative.confidence))
100+
101+
for word_info in alternative.words:
102+
word = word_info.word
103+
start_time = word_info.start_time
104+
end_time = word_info.end_time
105+
print('Word: {}, start_time: {}, end_time: {}'.format(
106+
word,
107+
start_time.seconds + start_time.nanos * 1e-9,
108+
end_time.seconds + end_time.nanos * 1e-9))
99109
# [END def_transcribe_gcs]
100110

101111

speech/cloud-client/transcribe_async_test.py

Lines changed: 11 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -33,3 +33,14 @@ def test_transcribe_gcs(capsys):
3333
out, err = capsys.readouterr()
3434

3535
assert re.search(r'how old is the Brooklyn Bridge', out, re.DOTALL | re.I)
36+
37+
38+
def test_transcribe_gcs_word_time_offsets(capsys):
39+
transcribe_async.transcribe_gcs(
40+
'gs://python-docs-samples-tests/speech/audio.flac')
41+
out, err = capsys.readouterr()
42+
43+
match = re.search(r'Bridge, start_time: ([0-9.]+)', out, re.DOTALL | re.I)
44+
time = float(match.group(1))
45+
46+
assert time > 0

0 commit comments

Comments
 (0)