summaryrefslogtreecommitdiff
diff options
context:
space:
mode:
authorCat Lee Ball 🎷🐛 <cball@google.com>2019-03-27 14:49:38 -0700
committerCat Lee Ball 🎷🐛 <cball@google.com>2019-03-27 14:49:38 -0700
commit5c9bdd0fa88a351e0a4014ec94d4ec8bd7465fcf (patch)
treed8076af4c451b24730eb5f8a8816e074c63d81a7
parent598bdfee04744b394ba446603818c7a1b09ced0f (diff)
downloadboto-5c9bdd0fa88a351e0a4014ec94d4ec8bd7465fcf.tar.gz
Added function get_utf8able_str
This function will ensure given objects are utf-8 encodable, used mainly for allowing for Python 2/3 compatibility.
-rw-r--r--boto/auth.py13
-rw-r--r--boto/gs/bucket.py5
-rwxr-xr-xboto/gs/connection.py5
-rw-r--r--boto/gs/key.py4
-rw-r--r--boto/s3/bucket.py3
-rw-r--r--boto/s3/connection.py6
-rw-r--r--boto/utils.py25
7 files changed, 45 insertions, 16 deletions
diff --git a/boto/auth.py b/boto/auth.py
index 21faa6bb..77c2c2bc 100644
--- a/boto/auth.py
+++ b/boto/auth.py
@@ -42,6 +42,7 @@ import posixpath
from boto.compat import urllib, encodebytes, parse_qs_safe, urlparse, six
from boto.auth_handler import AuthHandler
from boto.exception import BotoClientError
+from boto.utils import get_utf8able_str
try:
from hashlib import sha1 as sha
@@ -383,7 +384,7 @@ class HmacAuthV4Handler(AuthHandler, HmacKeys):
parameter_names = sorted(http_request.params.keys())
pairs = []
for pname in parameter_names:
- pval = six.ensure_str(http_request.params[pname])
+ pval = get_utf8able_str(http_request.params[pname])
pairs.append(urllib.parse.quote(pname, safe=''.encode('ascii')) +
'=' +
urllib.parse.quote(pval, safe='-_~'.encode('ascii')))
@@ -396,7 +397,7 @@ class HmacAuthV4Handler(AuthHandler, HmacKeys):
return ""
l = []
for param in sorted(http_request.params):
- value = six.ensure_str(http_request.params[param])
+ value = get_utf8able_str(http_request.params[param])
l.append('%s=%s' % (urllib.parse.quote(param, safe='-_.~'),
urllib.parse.quote(value, safe='-_.~')))
return '&'.join(l)
@@ -623,7 +624,7 @@ class S3HmacAuthV4Handler(HmacAuthV4Handler, AuthHandler):
# query string.
l = []
for param in sorted(http_request.params):
- value = six.ensure_str(http_request.params[param])
+ value = get_utf8able_str(http_request.params[param])
l.append('%s=%s' % (urllib.parse.quote(param, safe='-_.~'),
urllib.parse.quote(value, safe='-_.~')))
return '&'.join(l)
@@ -836,7 +837,7 @@ class STSAnonHandler(AuthHandler):
keys.sort(key=lambda x: x.lower())
pairs = []
for key in keys:
- val = six.ensure_str(params[key])
+ val = get_utf8able_str(params[key])
pairs.append(key + '=' + self._escape_value(six.ensure_str(val)))
return '&'.join(pairs)
@@ -897,7 +898,7 @@ class QuerySignatureV0AuthHandler(QuerySignatureHelper, AuthHandler):
keys.sort(cmp=lambda x, y: cmp(x.lower(), y.lower()))
pairs = []
for key in keys:
- val = six.ensure_str(params[key])
+ val = get_utf8able_str(params[key])
pairs.append(key + '=' + urllib.parse.quote(val))
qs = '&'.join(pairs)
return (qs, base64.b64encode(hmac.digest()))
@@ -948,7 +949,7 @@ class QuerySignatureV2AuthHandler(QuerySignatureHelper, AuthHandler):
keys = sorted(params.keys())
pairs = []
for key in keys:
- val = six.ensure_str(params[key])
+ val = get_utf8able_str(params[key])
pairs.append(urllib.parse.quote(key, safe='') + '=' +
urllib.parse.quote(val, safe='-_~'))
qs = '&'.join(pairs)
diff --git a/boto/gs/bucket.py b/boto/gs/bucket.py
index c11e239d..e4e057a8 100644
--- a/boto/gs/bucket.py
+++ b/boto/gs/bucket.py
@@ -40,6 +40,7 @@ from boto.gs.lifecycle import LifecycleConfig
from boto.gs.key import Key as GSKey
from boto.s3.acl import Policy
from boto.s3.bucket import Bucket as S3Bucket
+from boto.utils import get_utf8able_str
from boto.compat import quote
from boto.compat import six
@@ -643,7 +644,7 @@ class Bucket(S3Bucket):
:param str storage_class: A string containing the storage class.
:param dict headers: Additional headers to send with the request.
"""
- req_body = self.StorageClassBody % (six.ensure_str(storage_class))
+ req_body = self.StorageClassBody % (get_utf8able_str(storage_class))
self.set_subresource(STORAGE_CLASS_ARG, req_body, headers=headers)
# Method with same signature as boto.s3.bucket.Bucket.add_email_grant(),
@@ -882,7 +883,7 @@ class Bucket(S3Bucket):
body = self.WebsiteBody % (main_page_frag, error_frag)
response = self.connection.make_request(
- 'PUT', six.ensure_str(self.name), data=six.ensure_str(body),
+ 'PUT', get_utf8able_str(self.name), data=six.ensure_str(body),
query_args='websiteConfig', headers=headers)
body = response.read()
if response.status == 200:
diff --git a/boto/gs/connection.py b/boto/gs/connection.py
index ae9fab3d..70ce6ec6 100755
--- a/boto/gs/connection.py
+++ b/boto/gs/connection.py
@@ -24,6 +24,7 @@ from boto.s3.connection import S3Connection
from boto.s3.connection import SubdomainCallingFormat
from boto.s3.connection import check_lowercase_bucketname
from boto.compat import six
+from boto.utils import get_utf8able_str
class Location(object):
DEFAULT = 'US'
@@ -91,8 +92,8 @@ class GSConnection(S3Connection):
data = ('<CreateBucketConfiguration>%s%s</CreateBucketConfiguration>'
% (location_elem, storage_class_elem))
response = self.make_request(
- 'PUT', six.ensure_str(bucket_name), headers=headers,
- data=six.ensure_str(data))
+ 'PUT', get_utf8able_str(bucket_name), headers=headers,
+ data=get_utf8able_str(data))
body = response.read()
if response.status == 409:
raise self.provider.storage_create_error(
diff --git a/boto/gs/key.py b/boto/gs/key.py
index 30b96382..0f720bb5 100644
--- a/boto/gs/key.py
+++ b/boto/gs/key.py
@@ -28,7 +28,7 @@ from boto.compat import StringIO, six
from boto.exception import BotoClientError
from boto.s3.key import Key as S3Key
from boto.s3.keyfile import KeyFile
-from boto.utils import compute_hash
+from boto.utils import compute_hash, get_utf8able_str
class Key(S3Key):
"""
@@ -706,7 +706,7 @@ class Key(S3Key):
self.md5 = None
self.base64md5 = None
- fp = StringIO(six.ensure_str(s))
+ fp = StringIO(get_utf8able_str(s))
r = self.set_contents_from_file(fp, headers, replace, cb, num_cb,
policy, md5,
if_generation=if_generation)
diff --git a/boto/s3/bucket.py b/boto/s3/bucket.py
index e24d1a51..9a3f7bc4 100644
--- a/boto/s3/bucket.py
+++ b/boto/s3/bucket.py
@@ -51,6 +51,7 @@ import re
import base64
from collections import defaultdict
from boto.compat import BytesIO, six, StringIO, urllib
+from boto.utils import get_utf8able_str
# as per http://goo.gl/BDuud (02/19/2011)
@@ -852,7 +853,7 @@ class Bucket(object):
if isinstance(src_key_name, bytes):
src_key_name = src_key_name.decode('utf-8')
else:
- src_key_name = six.ensure_str(src_key_name)
+ src_key_name = get_utf8able_str(src_key_name)
if preserve_acl:
if self.name == src_bucket_name:
src_bucket = self
diff --git a/boto/s3/connection.py b/boto/s3/connection.py
index 22b06b7d..6893c309 100644
--- a/boto/s3/connection.py
+++ b/boto/s3/connection.py
@@ -88,7 +88,7 @@ class _CallingFormat(object):
return self.get_bucket_server(server, bucket)
def build_auth_path(self, bucket, key=''):
- key = six.ensure_str(key)
+ key = get_utf8able_str(key)
if isinstance(bucket, bytes):
bucket = bucket.decode('utf-8')
path = ''
@@ -97,7 +97,7 @@ class _CallingFormat(object):
return path + '/%s' % urllib.parse.quote(key)
def build_path_base(self, bucket, key=''):
- key = six.ensure_str(key)
+ key = get_utf8able_str(key)
return '/%s' % urllib.parse.quote(key)
@@ -121,7 +121,7 @@ class OrdinaryCallingFormat(_CallingFormat):
return server
def build_path_base(self, bucket, key=''):
- key = six.ensure_str(key)
+ key = get_utf8able_str(key)
path_base = '/'
if bucket:
path_base += "%s/" % bucket
diff --git a/boto/utils.py b/boto/utils.py
index 83b429b9..173594e2 100644
--- a/boto/utils.py
+++ b/boto/utils.py
@@ -1084,3 +1084,28 @@ def parse_host(hostname):
else:
return hostname.split(':', 1)[0]
+
+def get_utf8able_str(s, errors='strict'):
+ """Returns a UTF8-encodable string in PY3, UTF8 bytes in PY2.
+
+ This method is similar to six's `ensure_str()`, except it also
+ makes sure that any bytes passed in can be decoded using the
+ utf-8 codec (and raises a UnicodeDecodeError if not).
+ """
+ if six.PY2:
+ # We want to return utf-8 encoded bytes.
+ if isinstance(s, six.text_type):
+ return s.encode('utf-8', errors)
+ if isinstance(s, six.binary_type):
+ # Verify the bytes can be represented in utf-8
+ s.decode('utf-8')
+ return s
+ else:
+ # We want to return a unicode/str object.
+ if isinstance(s, six.text_type):
+ return s
+ if isinstance(s, six.binary_type):
+ s = s.decode('utf-8')
+ return s
+ raise TypeError('not expecting type "%s"' % type(s))
+