-
-
Save note103/04e53fb9fc4fddef8ffc7f76660f1678 to your computer and use it in GitHub Desktop.
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
# !/usr/bin/env python | |
# coding: utf-8 | |
import argparse | |
import io | |
import sys | |
import codecs | |
import datetime | |
import locale | |
def transcribe_gcs(gcs_uri, language_code='ja-JP', sample_rate_hertz=16000):
    """Transcribe a FLAC audio file stored in Google Cloud Storage.

    Submits a long-running recognition request for the audio at ``gcs_uri``,
    waits for the operation result, and writes every alternative transcript
    (one per line, UTF-8) to ``output-YYYYmmdd-HHMMSS.txt`` in the current
    working directory.

    Args:
        gcs_uri: URI of the audio object, passed to ``RecognitionAudio(uri=...)``.
        language_code: Language tag sent in the recognition config.
            Defaults to ``'ja-JP'``.
        sample_rate_hertz: Sample rate sent in the recognition config.
            Defaults to ``16000``.

    Returns:
        None. The transcript is written to disk as a side effect.
    """
    # Imported inside the function so the third-party client is only needed
    # when a transcription is actually requested.
    from google.cloud import speech
    from google.cloud.speech import enums
    from google.cloud.speech import types

    client = speech.SpeechClient()
    audio = types.RecognitionAudio(uri=gcs_uri)
    # The encoding is fixed to FLAC; AudioEncoding.LINEAR16 is the alternative
    # the original author kept around for other input files.
    config = types.RecognitionConfig(
        encoding=enums.RecognitionConfig.AudioEncoding.FLAC,
        sample_rate_hertz=sample_rate_hertz,
        language_code=language_code)

    operation = client.long_running_recognize(config, audio)
    print('Waiting for operation to complete...')
    response = operation.result()

    # The timestamp is taken after recognition finishes, so the file name
    # reflects when the transcript was written.
    timestamp = datetime.datetime.today().strftime('-%Y%m%d-%H%M%S')
    output_path = 'output{}.txt'.format(timestamp)

    # The context manager closes the file even if a write fails.
    # newline='' disables newline translation, matching what codecs.open
    # (binary mode underneath) produced before.
    with io.open(output_path, 'a', encoding='utf-8', newline='') as fout:
        for result in response.results:
            for alternative in result.alternatives:
                fout.write(u'{}\n'.format(alternative.transcript))
if __name__ == '__main__':
    # Command-line entry point: takes one positional argument, the GCS path
    # of the audio file, and hands it to transcribe_gcs().
    cli = argparse.ArgumentParser(
        formatter_class=argparse.RawDescriptionHelpFormatter,
        description=__doc__,
    )
    cli.add_argument('path', help='GCS path for audio file to be recognized')
    options = cli.parse_args()
    transcribe_gcs(options.path)
Sign up for free
to join this conversation on GitHub.
Already have an account?
Sign in to comment