# -*- coding: utf-8 -*- # # Copyright 2024 Google LLC. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. """Cloud Speech-to-text recognizers run short audio command.""" from __future__ import absolute_import from __future__ import division from __future__ import unicode_literals from googlecloudsdk.api_lib.ml.speech import client from googlecloudsdk.calliope import base from googlecloudsdk.command_lib.ml.speech import flag_validations from googlecloudsdk.command_lib.ml.speech import flags_v2 @base.UniverseCompatible @base.ReleaseTracks(base.ReleaseTrack.ALPHA) class RunBatch(base.Command): """Get transcripts of long (more than 60 seconds) audio from a gcloud uri.""" def ValidateRunBatchFlags(self, args): """Validates run batch flags.""" flag_validations.ValidateDecodingConfig(args) flag_validations.ValidateAudioSource(args, batch=True) @staticmethod def Args(parser): """Register flags for this command.""" flags_v2.AddRecognizeRequestFlagsToParser(parser, add_async_flag=True) def Run(self, args): resource = args.CONCEPTS.recognizer.Parse() speech_client = client.SpeechV2Client() self.ValidateRunBatchFlags(args) recognition_config_update_mask = [] recognition_config, recognition_config_update_mask = ( speech_client.InitializeRecognitionConfig( args.model, args.language_codes, recognition_config_update_mask ) ) recognition_config, recognition_config_update_mask = ( speech_client.InitializeDecodingConfigFromArgs( recognition_config, args, default_to_auto_decoding_config=True, update_mask=recognition_config_update_mask, ) ) recognition_config.features, recognition_config_update_mask = ( speech_client.InitializeASRFeaturesFromArgs( args, update_mask=recognition_config_update_mask ) ) if args.hint_phrases or args.hint_phrase_sets: recognition_config.adaptation, recognition_config_update_mask = ( speech_client.InitializeAdaptationConfigFromArgs( args, update_mask=recognition_config_update_mask ) ) operation = speech_client.RunBatch( resource, args.audio, recognition_config, update_mask=recognition_config_update_mask, ) if args.async_: return operation return speech_client.WaitForBatchRecognizeOperation( location=resource.Parent().Name(), operation_ref=operation.name, message='waiting for batch recognize to finish', )