diff options
| author | Jason R. Coombs <jaraco@jaraco.com> | 2014-05-17 12:00:51 -0400 |
|---|---|---|
| committer | Jason R. Coombs <jaraco@jaraco.com> | 2014-05-17 12:00:51 -0400 |
| commit | f03d098eef9f80ee2bccba52e7e55c52bdb16804 (patch) | |
| tree | 350905bf5e2df630b111f93acef68e1e0dc18a95 /setuptools/unicode_utils.py | |
| parent | 337ce0deb26c4fa72b083001428f0ba1d456c0a3 (diff) | |
| parent | cade48d7d2751fe69d81957963f0a12d1606c9f6 (diff) | |
| download | python-setuptools-git-f03d098eef9f80ee2bccba52e7e55c52bdb16804.tar.gz | |
Merge 4 out of 5 commits from Philip Thiem's unicode_try_2. Ref #193
Diffstat (limited to 'setuptools/unicode_utils.py')
| -rw-r--r-- | setuptools/unicode_utils.py | 41 |
1 files changed, 41 insertions, 0 deletions
diff --git a/setuptools/unicode_utils.py b/setuptools/unicode_utils.py new file mode 100644 index 00000000..d2de941a --- /dev/null +++ b/setuptools/unicode_utils.py @@ -0,0 +1,41 @@ +import unicodedata +import sys +from setuptools.compat import unicode as decoded_string + + +# HFS Plus uses decomposed UTF-8 +def decompose(path): + if isinstance(path, decoded_string): + return unicodedata.normalize('NFD', path) + try: + path = path.decode('utf-8') + path = unicodedata.normalize('NFD', path) + path = path.encode('utf-8') + except UnicodeError: + pass # Not UTF-8 + return path + + +def filesys_decode(path): + """ + Ensure that the given path is decoded, + NONE when no expected encoding works + """ + + fs_enc = sys.getfilesystemencoding() + if isinstance(path, decoded_string): + return path + + for enc in (fs_enc, "utf-8"): + try: + return path.decode(enc) + except UnicodeDecodeError: + continue + + +def try_encode(string, enc): + "turn unicode encoding into a functional routine" + try: + return string.encode(enc) + except UnicodeEncodeError: + return None |
