575 lines
18 KiB
Python
575 lines
18 KiB
Python
# -*- coding: utf-8 -*-
|
|
# MinIO Python Library for Amazon S3 Compatible Cloud Storage, (C)
|
|
# 2020 MinIO, Inc.
|
|
#
|
|
# Licensed under the Apache License, Version 2.0 (the "License");
|
|
# you may not use this file except in compliance with the License.
|
|
# You may obtain a copy of the License at
|
|
#
|
|
# http://www.apache.org/licenses/LICENSE-2.0
|
|
#
|
|
# Unless required by applicable law or agreed to in writing, software
|
|
# distributed under the License is distributed on an "AS IS" BASIS,
|
|
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
# See the License for the specific language governing permissions and
|
|
# limitations under the License.
|
|
|
|
"""Common request/response configuration of S3 APIs."""
|
|
# pylint: disable=invalid-name
|
|
|
|
from __future__ import absolute_import, annotations
|
|
|
|
from abc import ABCMeta
|
|
from datetime import datetime
|
|
from typing import Type, TypeVar, cast
|
|
from xml.etree import ElementTree as ET
|
|
|
|
from .error import MinioException
|
|
from .helpers import quote
|
|
from .sse import SseCustomerKey
|
|
from .time import to_http_header
|
|
from .xml import SubElement, find, findall, findtext
|
|
|
|
COPY = "COPY"
|
|
REPLACE = "REPLACE"
|
|
DISABLED = "Disabled"
|
|
ENABLED = "Enabled"
|
|
GOVERNANCE = "GOVERNANCE"
|
|
COMPLIANCE = "COMPLIANCE"
|
|
_MAX_KEY_LENGTH = 128
|
|
_MAX_VALUE_LENGTH = 256
|
|
_MAX_OBJECT_TAG_COUNT = 10
|
|
_MAX_TAG_COUNT = 50
|
|
|
|
A = TypeVar("A", bound="Tags")
|
|
|
|
|
|
class Tags(dict):
|
|
"""dict extended to bucket/object tags."""
|
|
|
|
def __init__(self, for_object: bool = False):
|
|
self._for_object = for_object
|
|
super().__init__()
|
|
|
|
def __setitem__(self, key: str, value: str):
|
|
limit = _MAX_OBJECT_TAG_COUNT if self._for_object else _MAX_TAG_COUNT
|
|
if len(self) == limit:
|
|
tag_type = "object" if self._for_object else "bucket"
|
|
raise ValueError(f"only {limit} {tag_type} tags are allowed")
|
|
if not key or len(key) > _MAX_KEY_LENGTH or "&" in key:
|
|
raise ValueError(f"invalid tag key '{key}'")
|
|
if value is None or len(value) > _MAX_VALUE_LENGTH or "&" in value:
|
|
raise ValueError(f"invalid tag value '{value}'")
|
|
super().__setitem__(key, value)
|
|
|
|
@classmethod
|
|
def new_bucket_tags(cls: Type[A]) -> A:
|
|
"""Create new bucket tags."""
|
|
return cls()
|
|
|
|
@classmethod
|
|
def new_object_tags(cls: Type[A]) -> A:
|
|
"""Create new object tags."""
|
|
return cls(True)
|
|
|
|
@classmethod
|
|
def fromxml(cls: Type[A], element: ET.Element) -> A:
|
|
"""Create new object with values from XML element."""
|
|
elements = findall(element, "Tag")
|
|
obj = cls()
|
|
for tag in elements:
|
|
key = cast(str, findtext(tag, "Key", True))
|
|
value = cast(str, findtext(tag, "Value", True))
|
|
obj[key] = value
|
|
return obj
|
|
|
|
def toxml(self, element: ET.Element | None) -> ET.Element:
|
|
"""Convert to XML."""
|
|
if element is None:
|
|
raise ValueError("element must be provided")
|
|
for key, value in self.items():
|
|
tag = SubElement(element, "Tag")
|
|
SubElement(tag, "Key", key)
|
|
SubElement(tag, "Value", value)
|
|
return element
|
|
|
|
|
|
B = TypeVar("B", bound="Tag")
|
|
|
|
|
|
class Tag:
|
|
"""Tag."""
|
|
|
|
def __init__(self, key: str, value: str):
|
|
if not key:
|
|
raise ValueError("key must be provided")
|
|
if value is None:
|
|
raise ValueError("value must be provided")
|
|
self._key = key
|
|
self._value = value
|
|
|
|
@property
|
|
def key(self) -> str:
|
|
"""Get key."""
|
|
return self._key
|
|
|
|
@property
|
|
def value(self) -> str:
|
|
"""Get value."""
|
|
return self._value
|
|
|
|
@classmethod
|
|
def fromxml(cls: Type[B], element: ET.Element) -> B:
|
|
"""Create new object with values from XML element."""
|
|
element = cast(ET.Element, find(element, "Tag", True))
|
|
key = cast(str, findtext(element, "Key", True))
|
|
value = cast(str, findtext(element, "Value", True))
|
|
return cls(key, value)
|
|
|
|
def toxml(self, element: ET.Element | None) -> ET.Element:
|
|
"""Convert to XML."""
|
|
if element is None:
|
|
raise ValueError("element must be provided")
|
|
element = SubElement(element, "Tag")
|
|
SubElement(element, "Key", self._key)
|
|
SubElement(element, "Value", self._value)
|
|
return element
|
|
|
|
|
|
C = TypeVar("C", bound="AndOperator")
|
|
|
|
|
|
class AndOperator:
|
|
"""AND operator."""
|
|
|
|
def __init__(self, prefix: str | None = None, tags: Tags | None = None):
|
|
if prefix is None and not tags:
|
|
raise ValueError("at least prefix or tags must be provided")
|
|
self._prefix = prefix
|
|
self._tags = tags
|
|
|
|
@property
|
|
def prefix(self) -> str | None:
|
|
"""Get prefix."""
|
|
return self._prefix
|
|
|
|
@property
|
|
def tags(self) -> Tags | None:
|
|
"""Get tags."""
|
|
return self._tags
|
|
|
|
@classmethod
|
|
def fromxml(cls: Type[C], element: ET.Element) -> C:
|
|
"""Create new object with values from XML element."""
|
|
element = cast(ET.Element, find(element, "And", True))
|
|
prefix = findtext(element, "Prefix")
|
|
tags = (
|
|
None if find(element, "Tag") is None
|
|
else Tags.fromxml(element)
|
|
)
|
|
return cls(prefix, tags)
|
|
|
|
def toxml(self, element: ET.Element | None) -> ET.Element:
|
|
"""Convert to XML."""
|
|
if element is None:
|
|
raise ValueError("element must be provided")
|
|
element = SubElement(element, "And")
|
|
if self._prefix is not None:
|
|
SubElement(element, "Prefix", self._prefix)
|
|
if self._tags is not None:
|
|
self._tags.toxml(element)
|
|
return element
|
|
|
|
|
|
D = TypeVar("D", bound="Filter")
|
|
|
|
|
|
class Filter:
|
|
"""Lifecycle rule filter."""
|
|
|
|
def __init__(
|
|
self,
|
|
and_operator: AndOperator | None = None,
|
|
prefix: str | None = None,
|
|
tag: Tag | None = None,
|
|
):
|
|
valid = (
|
|
(and_operator is not None) ^
|
|
(prefix is not None) ^
|
|
(tag is not None)
|
|
)
|
|
if not valid:
|
|
raise ValueError("only one of and, prefix or tag must be provided")
|
|
self._and_operator = and_operator
|
|
self._prefix = prefix
|
|
self._tag = tag
|
|
|
|
@property
|
|
def and_operator(self) -> AndOperator | None:
|
|
"""Get AND operator."""
|
|
return self._and_operator
|
|
|
|
@property
|
|
def prefix(self) -> str | None:
|
|
"""Get prefix."""
|
|
return self._prefix
|
|
|
|
@property
|
|
def tag(self) -> Tag | None:
|
|
"""Get tag."""
|
|
return self._tag
|
|
|
|
@classmethod
|
|
def fromxml(cls: Type[D], element: ET.Element) -> D:
|
|
"""Create new object with values from XML element."""
|
|
element = cast(ET.Element, find(element, "Filter", True))
|
|
and_operator = (
|
|
None if find(element, "And") is None
|
|
else AndOperator.fromxml(element)
|
|
)
|
|
prefix = findtext(element, "Prefix")
|
|
tag = None if find(element, "Tag") is None else Tag.fromxml(element)
|
|
return cls(and_operator, prefix, tag)
|
|
|
|
def toxml(self, element: ET.Element | None) -> ET.Element:
|
|
"""Convert to XML."""
|
|
if element is None:
|
|
raise ValueError("element must be provided")
|
|
element = SubElement(element, "Filter")
|
|
if self._and_operator:
|
|
self._and_operator.toxml(element)
|
|
if self._prefix is not None:
|
|
SubElement(element, "Prefix", self._prefix)
|
|
if self._tag is not None:
|
|
self._tag.toxml(element)
|
|
return element
|
|
|
|
|
|
class BaseRule:
|
|
"""Base rule class for Replication and Lifecycle."""
|
|
__metaclass__ = ABCMeta
|
|
|
|
def __init__(
|
|
self,
|
|
rule_filter: Filter | None = None,
|
|
rule_id: str | None = None,
|
|
):
|
|
if rule_id is not None:
|
|
rule_id = rule_id.strip()
|
|
if not rule_id:
|
|
raise ValueError("rule ID must be non-empty string")
|
|
if len(rule_id) > 255:
|
|
raise ValueError("rule ID must not exceed 255 characters")
|
|
self._rule_filter = rule_filter
|
|
self._rule_id = rule_id
|
|
|
|
@property
|
|
def rule_filter(self) -> Filter | None:
|
|
"""Get replication rule filter."""
|
|
return self._rule_filter
|
|
|
|
@property
|
|
def rule_id(self) -> str | None:
|
|
"""Get rule ID."""
|
|
return self._rule_id
|
|
|
|
@staticmethod
|
|
def parsexml(element: ET.Element) -> tuple[Filter | None, str | None]:
|
|
"""Parse XML and return filter and ID."""
|
|
return (
|
|
None if find(element, "Filter") is None
|
|
else Filter.fromxml(element)
|
|
), findtext(element, "ID")
|
|
|
|
def toxml(self, element: ET.Element | None) -> ET.Element:
|
|
"""Convert to XML."""
|
|
if element is None:
|
|
raise ValueError("element must be provided")
|
|
if self._rule_filter:
|
|
self._rule_filter.toxml(element)
|
|
if self._rule_id is not None:
|
|
SubElement(element, "ID", self._rule_id)
|
|
return element
|
|
|
|
|
|
def check_status(status: str):
|
|
"""Validate status."""
|
|
if status not in [ENABLED, DISABLED]:
|
|
raise ValueError("status must be 'Enabled' or 'Disabled'")
|
|
|
|
|
|
class ObjectConditionalReadArgs:
|
|
"""Base argument class holds condition properties for reading object."""
|
|
__metaclass__ = ABCMeta
|
|
|
|
def __init__(
|
|
self,
|
|
bucket_name: str,
|
|
object_name: str,
|
|
region: str | None = None,
|
|
version_id: str | None = None,
|
|
ssec: SseCustomerKey | None = None,
|
|
offset: int | None = None,
|
|
length: int | None = None,
|
|
match_etag: str | None = None,
|
|
not_match_etag: str | None = None,
|
|
modified_since: str | None = None,
|
|
unmodified_since: str | None = None,
|
|
):
|
|
if ssec is not None and not isinstance(ssec, SseCustomerKey):
|
|
raise ValueError("ssec must be SseCustomerKey type")
|
|
if offset is not None and offset < 0:
|
|
raise ValueError("offset should be zero or greater")
|
|
if length is not None and length <= 0:
|
|
raise ValueError("length should be greater than zero")
|
|
if match_etag is not None and match_etag == "":
|
|
raise ValueError("match_etag must not be empty")
|
|
if not_match_etag is not None and not_match_etag == "":
|
|
raise ValueError("not_match_etag must not be empty")
|
|
if (
|
|
modified_since is not None and
|
|
not isinstance(modified_since, datetime)
|
|
):
|
|
raise ValueError("modified_since must be datetime type")
|
|
if (
|
|
unmodified_since is not None and
|
|
not isinstance(unmodified_since, datetime)
|
|
):
|
|
raise ValueError("unmodified_since must be datetime type")
|
|
|
|
self._bucket_name = bucket_name
|
|
self._object_name = object_name
|
|
self._region = region
|
|
self._version_id = version_id
|
|
self._ssec = ssec
|
|
self._offset = offset
|
|
self._length = length
|
|
self._match_etag = match_etag
|
|
self._not_match_etag = not_match_etag
|
|
self._modified_since = modified_since
|
|
self._unmodified_since = unmodified_since
|
|
|
|
@property
|
|
def bucket_name(self) -> str:
|
|
"""Get bucket name."""
|
|
return self._bucket_name
|
|
|
|
@property
|
|
def object_name(self) -> str:
|
|
"""Get object name."""
|
|
return self._object_name
|
|
|
|
@property
|
|
def region(self) -> str | None:
|
|
"""Get region."""
|
|
return self._region
|
|
|
|
@property
|
|
def version_id(self) -> str | None:
|
|
"""Get version ID."""
|
|
return self._version_id
|
|
|
|
@property
|
|
def ssec(self) -> SseCustomerKey | None:
|
|
"""Get SSE-C."""
|
|
return self._ssec
|
|
|
|
@property
|
|
def offset(self) -> int | None:
|
|
"""Get offset."""
|
|
return self._offset
|
|
|
|
@property
|
|
def length(self) -> int | None:
|
|
"""Get length."""
|
|
return self._length
|
|
|
|
@property
|
|
def match_etag(self) -> str | None:
|
|
"""Get match ETag condition."""
|
|
return self._match_etag
|
|
|
|
@property
|
|
def not_match_etag(self) -> str | None:
|
|
"""Get not-match ETag condition."""
|
|
return self._not_match_etag
|
|
|
|
@property
|
|
def modified_since(self) -> str | None:
|
|
"""Get modified since condition."""
|
|
return self._modified_since
|
|
|
|
@property
|
|
def unmodified_since(self) -> str | None:
|
|
"""Get unmodified since condition."""
|
|
return self._unmodified_since
|
|
|
|
def gen_copy_headers(self) -> dict[str, str]:
|
|
"""Generate copy source headers."""
|
|
copy_source = quote("/" + self._bucket_name + "/" + self._object_name)
|
|
if self._version_id:
|
|
copy_source += "?versionId=" + quote(self._version_id)
|
|
|
|
headers = {"x-amz-copy-source": copy_source}
|
|
if self._ssec:
|
|
headers.update(self._ssec.copy_headers())
|
|
if self._match_etag:
|
|
headers["x-amz-copy-source-if-match"] = self._match_etag
|
|
if self._not_match_etag:
|
|
headers["x-amz-copy-source-if-none-match"] = self._not_match_etag
|
|
if self._modified_since:
|
|
headers["x-amz-copy-source-if-modified-since"] = (
|
|
to_http_header(self._modified_since)
|
|
)
|
|
if self._unmodified_since:
|
|
headers["x-amz-copy-source-if-unmodified-since"] = (
|
|
to_http_header(self._unmodified_since)
|
|
)
|
|
return headers
|
|
|
|
|
|
E = TypeVar("E", bound="CopySource")
|
|
|
|
|
|
class CopySource(ObjectConditionalReadArgs):
|
|
"""A source object definition for copy_object method."""
|
|
@classmethod
|
|
def of(cls: Type[E], src: ObjectConditionalReadArgs) -> E:
|
|
"""Create CopySource from another source."""
|
|
return cls(
|
|
src.bucket_name, src.object_name, src.region, src.version_id,
|
|
src.ssec, src.offset, src.length, src.match_etag,
|
|
src.not_match_etag, src.modified_since, src.unmodified_since,
|
|
)
|
|
|
|
|
|
F = TypeVar("F", bound="ComposeSource")
|
|
|
|
|
|
class ComposeSource(ObjectConditionalReadArgs):
|
|
"""A source object definition for compose_object method."""
|
|
|
|
def __init__(
|
|
self,
|
|
bucket_name: str,
|
|
object_name: str,
|
|
region: str | None = None,
|
|
version_id: str | None = None,
|
|
ssec: SseCustomerKey | None = None,
|
|
offset: int | None = None,
|
|
length: int | None = None,
|
|
match_etag: str | None = None,
|
|
not_match_etag: str | None = None,
|
|
modified_since: str | None = None,
|
|
unmodified_since: str | None = None,
|
|
):
|
|
super().__init__(
|
|
bucket_name, object_name, region, version_id, ssec, offset, length,
|
|
match_etag, not_match_etag, modified_since, unmodified_since,
|
|
)
|
|
self._object_size: int | None = None
|
|
self._headers: dict[str, str] | None = None
|
|
|
|
def _validate_size(self, object_size: int):
|
|
"""Validate object size with offset and length."""
|
|
def make_error(name, value):
|
|
ver = ("?versionId="+self._version_id) if self._version_id else ""
|
|
return ValueError(
|
|
f"Source {self._bucket_name}/{self._object_name}{ver}: "
|
|
f"{name} {value} is beyond object size {object_size}"
|
|
)
|
|
|
|
if self._offset is not None and self._offset >= object_size:
|
|
raise make_error("offset", self._offset)
|
|
if self._length is not None:
|
|
if self._length > object_size:
|
|
raise make_error("length", self._length)
|
|
offset = self._offset or 0
|
|
if offset+self._length > object_size:
|
|
raise make_error("compose size", offset+self._length)
|
|
|
|
def build_headers(self, object_size: int, etag: str):
|
|
"""Build headers."""
|
|
self._validate_size(object_size)
|
|
self._object_size = object_size
|
|
headers = self.gen_copy_headers()
|
|
headers["x-amz-copy-source-if-match"] = self._match_etag or etag
|
|
self._headers = headers
|
|
|
|
@property
|
|
def object_size(self) -> int | None:
|
|
"""Get object size."""
|
|
if self._object_size is None:
|
|
raise MinioException(
|
|
"build_headers() must be called prior to "
|
|
"this method invocation",
|
|
)
|
|
return self._object_size
|
|
|
|
@property
|
|
def headers(self) -> dict[str, str]:
|
|
"""Get headers."""
|
|
if self._headers is None:
|
|
raise MinioException(
|
|
"build_headers() must be called prior to "
|
|
"this method invocation",
|
|
)
|
|
return self._headers.copy()
|
|
|
|
@classmethod
|
|
def of(cls: Type[F], src: ObjectConditionalReadArgs) -> F:
|
|
"""Create ComposeSource from another source."""
|
|
return cls(
|
|
src.bucket_name, src.object_name, src.region, src.version_id,
|
|
src.ssec, src.offset, src.length, src.match_etag,
|
|
src.not_match_etag, src.modified_since, src.unmodified_since,
|
|
)
|
|
|
|
|
|
class SnowballObject:
|
|
"""A source object definition for upload_snowball_objects method."""
|
|
|
|
def __init__(
|
|
self,
|
|
object_name: str,
|
|
filename: str | None = None,
|
|
data: bytes | None = None,
|
|
length: int | None = None,
|
|
mod_time: datetime | None = None,
|
|
):
|
|
self._object_name = object_name
|
|
if (filename is not None) ^ (data is not None):
|
|
self._filename = filename
|
|
self._data = data
|
|
self._length = length
|
|
else:
|
|
raise ValueError("only one of filename or data must be provided")
|
|
if mod_time is not None and not isinstance(mod_time, datetime):
|
|
raise ValueError("mod_time must be datetime type")
|
|
self._mod_time = mod_time
|
|
|
|
@property
|
|
def object_name(self) -> str:
|
|
"""Get object name."""
|
|
return self._object_name
|
|
|
|
@property
|
|
def filename(self) -> str | None:
|
|
"""Get filename."""
|
|
return self._filename
|
|
|
|
@property
|
|
def data(self) -> bytes | None:
|
|
"""Get data."""
|
|
return self._data
|
|
|
|
@property
|
|
def length(self) -> int | None:
|
|
"""Get length."""
|
|
return self._length
|
|
|
|
@property
|
|
def mod_time(self) -> datetime | None:
|
|
"""Get modification time."""
|
|
return self._mod_time
|