205 lines
6.5 KiB
Python
205 lines
6.5 KiB
Python
# -*- coding: utf-8 -*- #
|
|
# Copyright 2021 Google LLC. All Rights Reserved.
|
|
#
|
|
# Licensed under the Apache License, Version 2.0 (the "License");
|
|
# you may not use this file except in compliance with the License.
|
|
# You may obtain a copy of the License at
|
|
#
|
|
# http://www.apache.org/licenses/LICENSE-2.0
|
|
#
|
|
# Unless required by applicable law or agreed to in writing, software
|
|
# distributed under the License is distributed on an "AS IS" BASIS,
|
|
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
# See the License for the specific language governing permissions and
|
|
# limitations under the License.
|
|
"""Command to SSH into a Cloud TPU VM Node."""
|
|
|
|
from __future__ import absolute_import
|
|
from __future__ import division
|
|
from __future__ import unicode_literals
|
|
|
|
import argparse
|
|
import os.path
|
|
|
|
from googlecloudsdk.calliope import base
|
|
from googlecloudsdk.calliope import exceptions
|
|
from googlecloudsdk.command_lib.compute import completers
|
|
from googlecloudsdk.command_lib.compute import flags
|
|
from googlecloudsdk.command_lib.compute import ssh_utils
|
|
from googlecloudsdk.command_lib.compute.tpus.tpu_vm import ssh as tpu_ssh_utils
|
|
from googlecloudsdk.core import properties
|
|
|
|
|
|
def AddCommandArgGroup(parser):
|
|
"""Argument group for running commands using SSH."""
|
|
command_group = parser.add_argument_group(
|
|
help='These arguments are used to run commands using SSH.')
|
|
command_group.add_argument(
|
|
'--command',
|
|
help="""\
|
|
Command to run on the Cloud TPU VM.
|
|
|
|
Runs the command on the target Cloud TPU VM and then exits.
|
|
|
|
Note: in the case of a TPU Pod, it will only run the command in the
|
|
workers specified with the `--worker` flag (defaults to worker 0 if not
|
|
set).
|
|
""")
|
|
command_group.add_argument(
|
|
'--output-directory',
|
|
help="""\
|
|
Path to the directory to output the logs of the commands.
|
|
|
|
The path can be relative or absolute. The directory must already exist.
|
|
|
|
If not specified, standard output will be used.
|
|
|
|
The logs will be written in files named {WORKER_ID}.log. For example:
|
|
"2.log".
|
|
""")
|
|
|
|
|
|
def AddSSHArgs(parser):
|
|
"""Additional flags and positional args to be passed to *ssh(1)*."""
|
|
parser.add_argument(
|
|
'--ssh-flag',
|
|
action='append',
|
|
help="""\
|
|
Additional flags to be passed to *ssh(1)*. It is recommended that flags
|
|
be passed using an assignment operator and quotes. Example:
|
|
|
|
$ {command} example-instance --zone=us-central1-a --ssh-flag="-vvv" --ssh-flag="-L 80:localhost:80"
|
|
|
|
This flag will replace occurences of ``%USER%'' and ``%TPU%'' with
|
|
their dereferenced values. For example, passing ``80:%TPU%:80`` into
|
|
the flag is equivalent to passing ``80:162.222.181.197:80'' to *ssh(1)*
|
|
if the external IP address of 'example-instance' is 162.222.181.197.
|
|
|
|
If connecting to the instance's external IP, then %TPU% is replaced
|
|
with that, otherwise it is replaced with the internal IP.
|
|
""")
|
|
|
|
parser.add_argument(
|
|
'user_tpu',
|
|
completer=completers.InstancesCompleter,
|
|
metavar='[USER@]TPU',
|
|
help="""\
|
|
Specifies the Cloud TPU VM to SSH into.
|
|
|
|
``USER'' specifies the username with which to SSH. If omitted, the user
|
|
login name is used.
|
|
|
|
``TPU'' specifies the name of the Cloud TPU VM to SSH into.
|
|
""")
|
|
|
|
parser.add_argument(
|
|
'ssh_args',
|
|
nargs=argparse.REMAINDER,
|
|
help="""\
|
|
Flags and positionals passed to the underlying ssh implementation.
|
|
""",
|
|
example="""\
|
|
$ {command} example-instance --zone=us-central1-a -- -vvv -L 80:%TPU%:80
|
|
""")
|
|
|
|
|
|
@base.ReleaseTracks(base.ReleaseTrack.GA)
|
|
class Ssh(base.Command):
|
|
"""SSH into a Cloud TPU VM."""
|
|
|
|
# IAP and Batching are not available for GA.
|
|
_ENABLE_IAP = False
|
|
_ENABLE_BATCHING = False
|
|
|
|
@classmethod
|
|
def Args(cls, parser):
|
|
"""Set up arguments for this command.
|
|
|
|
Args:
|
|
parser: An argparse.ArgumentParser.
|
|
"""
|
|
ssh_utils.BaseSSHCLIHelper.Args(parser)
|
|
AddSSHArgs(parser)
|
|
tpu_ssh_utils.AddTPUSSHArgs(parser, enable_iap=cls._ENABLE_IAP,
|
|
enable_batching=cls._ENABLE_BATCHING)
|
|
AddCommandArgGroup(parser)
|
|
flags.AddZoneFlag(parser, resource_type='tpu', operation_type='ssh')
|
|
|
|
def Run(self, args):
|
|
user, tpu_name = ssh_utils.GetUserAndInstance(args.user_tpu)
|
|
|
|
# If zone is not set, retrieve the one from the config.
|
|
if args.zone is None:
|
|
args.zone = properties.VALUES.compute.zone.Get(required=True)
|
|
# Validate the output path.
|
|
if args.output_directory:
|
|
if not args.command:
|
|
raise exceptions.InvalidArgumentException(
|
|
'--output_directory', 'cannot be specified without the `--command` '
|
|
'flag. Please specify the `--command` flag or remove the '
|
|
'--output-directory flag.')
|
|
output_directory_path = os.path.abspath(
|
|
os.path.expandvars(os.path.expanduser(args.output_directory)))
|
|
if not os.path.isdir(output_directory_path):
|
|
raise exceptions.InvalidArgumentException(
|
|
'--output_directory', 'Failed to find directory {}. Please create '
|
|
'it or specify another directory'.format(output_directory_path))
|
|
|
|
username_requested = '@' in args.user_tpu
|
|
prepped_node = [None]
|
|
tpu_ssh_utils.PrepareNodeForSSH(
|
|
tpu_name,
|
|
user,
|
|
args,
|
|
self.ReleaseTrack(),
|
|
self._ENABLE_BATCHING,
|
|
username_requested,
|
|
prepped_node,
|
|
0,
|
|
)
|
|
|
|
ssh_batch_size = 1
|
|
if self._ENABLE_BATCHING and prepped_node[0]:
|
|
ssh_batch_size = tpu_ssh_utils.ParseBatchSize(
|
|
args.batch_size, len(prepped_node[0].worker_ips)
|
|
)
|
|
|
|
tpu_ssh_utils.SSHIntoPreppedNodes(
|
|
prepped_node,
|
|
args,
|
|
ssh_batch_size,
|
|
)
|
|
|
|
|
|
@base.ReleaseTracks(base.ReleaseTrack.ALPHA)
|
|
class SshAlpha(Ssh):
|
|
"""SSH into a Cloud TPU VM (Alpha)."""
|
|
_ENABLE_IAP = True
|
|
_ENABLE_BATCHING = True
|
|
|
|
|
|
Ssh.detailed_help = {
|
|
'brief':
|
|
'SSH into a Cloud TPU VM.',
|
|
'EXAMPLES':
|
|
"""
|
|
To SSH into a Cloud TPU VM, run:
|
|
|
|
$ {command} my-tpu
|
|
|
|
To SSH into worker 1 on a Cloud TPU VM Pod, run:
|
|
|
|
$ {command} my-tpu --worker=1
|
|
|
|
To run an SSH command in a Cloud TPU VM (for example, to print the
|
|
time since last boot), run:
|
|
|
|
$ {command} my-tpu --command="last boot"
|
|
|
|
To run the same command in all workers in a Cloud TPU VM simultaneously,
|
|
run:
|
|
|
|
$ {command} my-tpu --command="last boot" --worker=all
|
|
"""
|
|
}
|