File: //snap/google-cloud-cli/current/lib/googlecloudsdk/command_lib/ml/vision/util.py
# -*- coding: utf-8 -*- #
# Copyright 2017 Google LLC. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
"""Utilities for gcloud ml vision commands."""
from __future__ import absolute_import
from __future__ import division
from __future__ import unicode_literals
import os
import re
from googlecloudsdk.api_lib.util import apis
from googlecloudsdk.core import exceptions
from googlecloudsdk.core.util import files
VISION_API = 'vision'
VISION_API_VERSION = 'v1'
IMAGE_URI_FORMAT = r'^(https{,1}?|gs)://'
FILE_URI_FORMAT = r'gs://([^/]+)/(.+)'
FILE_PREFIX = r'gs://([^/]+)(/.*)*'
class Error(exceptions.Error):
"""Error for gcloud ml vision commands."""
class ImagePathError(Error):
"""Error if an image path is improperly formatted."""
class GcsSourceError(Error):
"""Error if a gcsSource path is improperly formatted."""
class GcsDestinationError(Error):
"""Error if a gcsDestination path is improperly formatted."""
def GetImageFromPath(path):
"""Builds an Image message from a path.
Args:
path: the path arg given to the command.
Raises:
ImagePathError: if the image path does not exist and does not seem to be
a remote URI.
Returns:
vision_v1_messages.Image: an image message containing information for the
API on the image to analyze.
"""
messages = apis.GetMessagesModule(VISION_API, VISION_API_VERSION)
image = messages.Image()
if os.path.isfile(path):
image.content = files.ReadBinaryFileContents(path)
elif re.match(IMAGE_URI_FORMAT, path):
image.source = messages.ImageSource(imageUri=path)
else:
raise ImagePathError(
'The image path does not exist locally or is not properly formatted. '
'A URI for a remote image must be a Google Cloud Storage image URI, '
'which must be in the form `gs://bucket_name/object_name`, or a '
'publicly accessible image HTTP/HTTPS URL. Please double-check your '
'input and try again.')
return image
def GetGcsSourceFromPath(input_file):
"""Validate a Google Cloud Storage location to read the PDF/TIFF file from.
Args:
input_file: the input file path arg given to the command.
Raises:
GcsSourceError: if the file is not a Google Cloud Storage object.
Returns:
vision_v1_messages.GcsSource: Google Cloud Storage URI for the input file.
This must only be a Google Cloud Storage object.
Wildcards are not currently supported.
"""
messages = apis.GetMessagesModule(VISION_API, VISION_API_VERSION)
gcs_source = messages.GcsSource()
if re.match(FILE_URI_FORMAT, input_file):
gcs_source.uri = input_file
else:
raise GcsSourceError(
'The URI for the input file must be a Google Cloud Storage object, '
'which must be in the form `gs://bucket_name/object_name.'
'Please double-check your input and try again.')
return gcs_source
def GetGcsDestinationFromPath(path):
"""Validate a Google Cloud Storage location to write the output to.
Args:
path: the path arg given to the command.
Raises:
GcsDestinationError: if the file is not a Google Cloud Storage object.
Returns:
vision_v1_messages.GcsDestination:Google Cloud Storage URI prefix
where the results will be stored.
This must only be a Google Cloud Storage object.
Wildcards are not currently supported.
"""
messages = apis.GetMessagesModule(VISION_API, VISION_API_VERSION)
gcs_destination = messages.GcsDestination()
if re.match(FILE_PREFIX, path):
gcs_destination.uri = path
else:
raise GcsDestinationError(
'The URI for the input file must be a Google Cloud Storage object, '
'which must be in the File prefix format `gs://bucket_name/here/file_name_prefix.'
'or directory prefix format `gs://bucket_name/some/location/. '
'Please double-check your input and try again.')
return gcs_destination