114 lines
3.7 KiB
Python
114 lines
3.7 KiB
Python
# -*- coding: utf-8 -*- #
|
|
# Copyright 2024 Google LLC. All Rights Reserved.
|
|
#
|
|
# Licensed under the Apache License, Version 2.0 (the "License");
|
|
# you may not use this file except in compliance with the License.
|
|
# You may obtain a copy of the License at
|
|
#
|
|
# http://www.apache.org/licenses/LICENSE-2.0
|
|
#
|
|
# Unless required by applicable law or agreed to in writing, software
|
|
# distributed under the License is distributed on an "AS IS" BASIS,
|
|
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
# See the License for the specific language governing permissions and
|
|
# limitations under the License.
|
|
"""Vertex AI endpoints direct raw predict command."""
|
|
|
|
from __future__ import absolute_import
|
|
from __future__ import division
|
|
from __future__ import unicode_literals
|
|
|
|
import base64
|
|
|
|
from googlecloudsdk.api_lib.ai.endpoints import client
|
|
from googlecloudsdk.calliope import base
|
|
from googlecloudsdk.command_lib.ai import constants
|
|
from googlecloudsdk.command_lib.ai import endpoint_util
|
|
from googlecloudsdk.command_lib.ai import endpoints_util
|
|
from googlecloudsdk.command_lib.ai import flags
|
|
from googlecloudsdk.command_lib.ai import region_util
|
|
|
|
|
|
def _AddArgs(parser):
|
|
flags.AddEndpointResourceArg(
|
|
parser,
|
|
'to do online direct raw prediction',
|
|
prompt_func=region_util.PromptForOpRegion,
|
|
)
|
|
flags.AddDirectRawPredictInputArg(parser)
|
|
|
|
|
|
def _Run(args, version):
|
|
"""Run Vertex AI online direct raw prediction."""
|
|
endpoint_ref = args.CONCEPTS.endpoint.Parse()
|
|
args.region = endpoint_ref.AsDict()['locationsId']
|
|
with endpoint_util.AiplatformEndpointOverrides(
|
|
version, region=args.region, is_prediction=True
|
|
):
|
|
endpoints_client = client.EndpointsClient(version=version)
|
|
|
|
# Decode the base64 encoded input, because it will be encoded by the
|
|
# apitools client.
|
|
input_json = endpoints_util.ReadInputFromArgs(args.json_request)
|
|
input_json['input'] = base64.b64decode(input_json['input']).decode('utf-8')
|
|
if version == constants.GA_VERSION:
|
|
results = endpoints_client.DirectRawPredict(endpoint_ref, input_json)
|
|
else:
|
|
results = endpoints_client.DirectRawPredictBeta(endpoint_ref, input_json)
|
|
|
|
# Decode the base64 encoded output.
|
|
results.output = base64.b64decode(results.output)
|
|
|
|
if not args.IsSpecified('format'):
|
|
# default format is based on the response.
|
|
args.format = endpoints_util.GetDefaultFormat(
|
|
results.output, key_name='output'
|
|
)
|
|
return results
|
|
|
|
|
|
@base.UniverseCompatible
|
|
@base.ReleaseTracks(base.ReleaseTrack.GA)
|
|
class DirectRawPredictGa(base.Command):
|
|
"""Run Vertex AI online direct raw prediction.
|
|
|
|
`{command}` sends a direct raw prediction request to Vertex AI endpoint for
|
|
the given input. The request limit is 10MB.
|
|
|
|
## EXAMPLES
|
|
|
|
To direct predict against an endpoint ``123'' under project ``example'' in
|
|
region ``us-central1'', run:
|
|
|
|
$ {command} 123 --project=example --region=us-central1
|
|
--json-request=input.json
|
|
"""
|
|
|
|
@staticmethod
|
|
def Args(parser):
|
|
_AddArgs(parser)
|
|
|
|
def Run(self, args):
|
|
return _Run(args, constants.GA_VERSION)
|
|
|
|
|
|
@base.UniverseCompatible
|
|
@base.ReleaseTracks(base.ReleaseTrack.BETA, base.ReleaseTrack.ALPHA)
|
|
class DirectRawPredictBeta(DirectRawPredictGa):
|
|
"""Run Vertex AI online direct raw prediction.
|
|
|
|
`{command}` sends a direct raw prediction request to Vertex AI endpoint for
|
|
the given input. The request limit is 10MB.
|
|
|
|
## EXAMPLES
|
|
|
|
To direct raw predict against an endpoint ``123'' under project ``example'' in
|
|
region ``us-central1'', run:
|
|
|
|
$ {command} 123 --project=example --region=us-central1
|
|
--json-request=input.json
|
|
"""
|
|
|
|
def Run(self, args):
|
|
return _Run(args, constants.BETA_VERSION)
|