odps/models/volumes.py (189 lines of code) (raw):

#!/usr/bin/env python
# -*- coding: utf-8 -*-
# Copyright 1999-2025 Alibaba Group Holding Ltd.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
#      http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.

import json
import warnings

from .. import errors, serializers, utils
from ..compat import Enum, six
from ..errors import InternalServerError
from .cache import cache
from .core import Iterable, LazyLoad


class Volume(LazyLoad):
    """
    Volume is the file-accessing object provided by ODPS.

    Instantiating ``Volume`` dispatches on the ``type`` keyword to a concrete
    class (see :meth:`_get_cls`). When no type is supplied, the volume's
    metadata is fetched first so that the type can be determined.
    """

    # Keys under which ``location`` / ``rolearn`` keyword arguments are
    # stored inside ``properties`` (see ``__init__``).
    EXTERNAL_VOLUME_LOCATION_KEY = "external.location"
    EXTERNAL_VOLUME_ROLEARN_KEY = "odps.properties.rolearn"

    class Type(Enum):
        # Volume kinds; each one maps to a class in ``Volume._get_cls``.
        NEW = "NEW"
        OLD = "OLD"
        EXTERNAL = "EXTERNAL"
        UNKNOWN = "UNKNOWN"

    _root = "Meta"
    _type_indicator = "type"

    name = serializers.XMLNodeField("Name")
    owner = serializers.XMLNodeField("Owner")
    comment = serializers.XMLNodeField("Comment")
    # Parsed case-insensitively into ``Volume.Type``; serialized as its value.
    type = serializers.XMLNodeField(
        "Type",
        parse_callback=lambda t: Volume.Type(t.upper()),
        serialize_callback=lambda t: t.value,
    )
    length = serializers.XMLNodeField("Length", parse_callback=int)
    file_number = serializers.XMLNodeField("FileNumber", parse_callback=int)
    creation_time = serializers.XMLNodeField(
        "CreationTime", parse_callback=utils.parse_rfc822
    )
    last_modified_time = serializers.XMLNodeField(
        "LastModifiedTime", parse_callback=utils.parse_rfc822
    )
    # Carried as a JSON document inside the XML node.
    properties = serializers.XMLNodeField(
        "Properties", parse_callback=json.loads, serialize_callback=json.dumps
    )

    @classmethod
    def _get_cls(cls, typo):
        """
        Select the class implementing a given volume type.

        :param typo: a :class:`Volume.Type`, a type name in any letter case,
            or None
        :return: ``cls`` itself when ``typo`` is None, otherwise the class
            mapped to the type (``Volume`` for ``UNKNOWN``)
        """
        if typo is None:
            return cls
        if isinstance(typo, six.string_types):
            typo = Volume.Type(typo.upper())

        # The concrete classes are imported lazily inside each branch.
        # NOTE(review): presumably to avoid a circular import - confirm.
        if typo == Volume.Type.OLD:
            from . import PartedVolume

            return PartedVolume
        elif typo == Volume.Type.NEW:
            from . import FSVolume

            return FSVolume
        elif typo == Volume.Type.EXTERNAL:
            from . import ExternalVolume

            return ExternalVolume
        elif typo == Volume.Type.UNKNOWN:
            return Volume

    @staticmethod
    def _filter_cache(_, **kwargs):
        """
        Tell whether ``kwargs`` carries a known volume type, i.e. ``type`` is
        present, not None and not ``UNKNOWN``.

        NOTE(review): presumably consulted by the ``cache`` decorator to
        decide whether an instance may be cached - confirm in ``.cache``.
        """
        return kwargs.get("type") is not None and kwargs["type"] != Volume.Type.UNKNOWN

    @cache
    def __new__(cls, *args, **kwargs):
        """
        Allocate a volume object of the appropriate class.

        When ``type`` is given, or when ``cls`` is a proper subclass of
        ``Volume``, an instance of the class returned by :meth:`_get_cls` is
        allocated directly. Otherwise a placeholder typed ``UNKNOWN`` is
        built and reloaded, and a new ``Volume`` is created from what
        ``extract()`` returns for the reloaded placeholder. If the reload
        raises ``InternalServerError``, a warning is issued and the
        placeholder is returned instead.
        """
        typo = kwargs.get("type")
        if typo is not None or (cls != Volume and issubclass(cls, Volume)):
            return object.__new__(cls._get_cls(typo))

        kwargs["type"] = Volume.Type.UNKNOWN
        obj = Volume(**kwargs)
        try:
            obj.reload()
            # NOTE(review): extract() presumably yields the loaded attributes
            # (including the real type) as keyword arguments - confirm.
            return Volume(**obj.extract())
        except InternalServerError as ex:
            warnings.warn(
                "Cannot reload volume %s due to error %s" % (obj.name, str(ex))
            )
            return obj

    def __init__(self, **kwargs):
        """
        Initialize the volume from keyword arguments.

        ``location`` and ``rolearn`` are removed from ``kwargs`` and, when
        truthy, stored in ``properties`` under
        ``EXTERNAL_VOLUME_LOCATION_KEY`` and ``EXTERNAL_VOLUME_ROLEARN_KEY``.
        A string ``type`` is converted, case-insensitively, to
        :class:`Volume.Type`. Remaining arguments go to the parent class.
        """
        typo = kwargs.get("type")
        properties = kwargs.get("properties")
        location = kwargs.pop("location", None)
        rolearn = kwargs.pop("rolearn", None)

        if location or rolearn:
            # Work on a copy so the mapping passed in by the caller is never
            # modified in place.
            properties = dict(properties or {})
            if location:
                properties[self.EXTERNAL_VOLUME_LOCATION_KEY] = location
            if rolearn:
                properties[self.EXTERNAL_VOLUME_ROLEARN_KEY] = rolearn
        if properties:
            kwargs["properties"] = properties

        if isinstance(typo, six.string_types):
            kwargs["type"] = Volume.Type(typo.upper())
        super(Volume, self).__init__(**kwargs)

    def reload(self):
        """
        Fetch the volume's metadata (``meta`` action on its resource) and
        parse the response into this object.
        """
        params = {}
        schema_name = self._get_schema_name()
        if schema_name is not None:
            params["curr_schema"] = schema_name
        resp = self._client.get(self.resource(), action="meta", params=params)
        self.parse(self._client, resp, obj=self)

    def drop(self, auto_remove_dir=False, recursive=False):
        """
        Delete this volume by delegating to ``self.parent.delete``.

        :param auto_remove_dir: forwarded to the parent's ``delete``
        :param recursive: forwarded to the parent's ``delete``
        :return: whatever the parent's ``delete`` returns
        """
        return self.parent.delete(
            self, auto_remove_dir=auto_remove_dir, recursive=recursive
        )


class Volumes(Iterable):
    """
    Collection of :class:`Volume` objects, supporting membership tests,
    iteration, creation and deletion.
    """

    marker = serializers.XMLNodeField("Marker")
    volumes = serializers.XMLNodesReferencesField(Volume, "Volume")

    def _get(self, item):
        """
        Build the volume named ``item`` without a type; ``Volume.__new__``
        then reloads it to find out its type.
        """
        return Volume(client=self._client, parent=self, name=item)

    def _get_parent_typed(self, item):
        """
        Build an ``UNKNOWN``-typed volume named ``item``; because a type is
        given, ``Volume.__new__`` does not reload it.
        """
        return Volume(
            client=self._client, parent=self, name=item, type=Volume.Type.UNKNOWN
        )

    def __contains__(self, item):
        """
        Tell whether a volume exists.

        :param item: a volume name or a :class:`Volume` instance
        :return: True if loading the volume succeeds, False if it raises
            ``errors.NoSuchObject`` or if ``item`` is of another type
        """
        if isinstance(item, six.string_types):
            try:
                # as reload() will be done in constructor of Volume, building
                # the object is enough to check for existence.
                self._get(item)
                return True
            except errors.NoSuchObject:
                return False
        elif isinstance(item, Volume):
            volume = item
            try:
                volume.reload()
                return True
            except errors.NoSuchObject:
                return False
        else:
            return False

    def __iter__(self):
        """Iterate over all volumes; same as ``iterate()`` without filters."""
        return self.iterate()

    def iterate(self, name=None, owner=None):
        """
        Iterate over volumes, fetching them page by page.

        :param name: the prefix of volume name
        :param owner: sent as the ``owner`` request parameter when not None
        :return: a generator yielding volumes
        """
        schema_name = self._get_schema_name()

        params = {"expectmarker": "true"}
        if name is not None:
            params["name"] = name
        if owner is not None:
            params["owner"] = owner
        if schema_name is not None:
            params["curr_schema"] = schema_name

        def _it():
            # Fetch one page. A marker that is present but empty means the
            # previous page was the last one, so None is returned.
            last_marker = params.get("marker")
            if "marker" in params and (last_marker is None or len(last_marker) == 0):
                return

            url = self.resource()
            resp = self._client.get(url, params=params)

            v = Volumes.parse(self._client, resp, obj=self)
            # Remember where the next page starts.
            params["marker"] = v.marker

            return v.volumes

        while True:
            volumes = _it()
            if volumes is None:
                break
            for volume in volumes:
                yield volume

    def _create(self, obj=None, **kwargs):
        """
        Create a volume on the service and return it.

        :param obj: a volume object to create; when it is missing or falsy, a
            :class:`Volume` is built from the remaining keyword arguments
            (which are otherwise not used)
        :param auto_create_dir: when truthy, an empty ``autoMkDir`` request
            parameter is sent
        :param accelerate: when truthy, an empty ``accelerate`` request
            parameter is sent
        :return: the created volume, looked up as ``self[volume.name]``
        """
        auto_create_dir = kwargs.pop("auto_create_dir", False)
        accelerate = kwargs.pop("accelerate", False)
        volume = obj or Volume(parent=self, client=self._client, **kwargs)

        # Attach a caller-supplied object to this collection and its client.
        if volume.parent is None:
            volume._parent = self
        if volume._client is None:
            volume._client = self._client

        headers = {"Content-Type": "application/xml"}
        data = volume.serialize()

        params = {}
        if auto_create_dir:
            params["autoMkDir"] = ""
        if accelerate:
            params["accelerate"] = ""

        self._client.post(
            self.resource(),
            data,
            headers=headers,
            params=params,
            curr_schema=self._get_schema_name(),
        )
        return self[volume.name]

    def create_parted(self, obj=None, **kwargs):
        """Create a volume of type ``old``; see :meth:`_create`."""
        return self._create(obj=obj, type="old", **kwargs)

    def create_fs(self, obj=None, **kwargs):
        """Create a volume of type ``new``; see :meth:`_create`."""
        return self._create(obj=obj, type="new", **kwargs)

    def create_external(self, obj=None, **kwargs):
        """Create a volume of type ``external``; see :meth:`_create`."""
        return self._create(obj=obj, type="external", **kwargs)

    def delete(self, name, auto_remove_dir=False, recursive=False):
        """
        Delete a volume.

        :param name: a volume name or a :class:`Volume` instance
        :param auto_remove_dir: when truthy, an empty ``autoRmDir`` request
            parameter is sent
        :param recursive: when truthy, ``recursive=true`` is sent
        """
        if not isinstance(name, Volume):
            # A name is enough to delete; no need to load the real type.
            volume = self._get_parent_typed(name)
        else:
            volume = name
            name = name.name
        del self[name]  # release cache

        params = {}
        if auto_remove_dir:
            params["autoRmDir"] = ""
        if recursive:
            params["recursive"] = "true"

        url = volume.resource()
        self._client.delete(url, params=params, curr_schema=self._get_schema_name())