From 1c274f550b03d68759d75784f99203f1c850b754 Mon Sep 17 00:00:00 2001 From: Michael Shuler Date: Tue, 24 Nov 2015 22:36:33 -0600 Subject: Add Python 3 support to ca-certificates. Thanks to Andrew Wilcox and Richard Ipsum for the patch! Closes: #789753 --- debian/changelog | 9 ++++---- mozilla/certdata2pem.py | 57 +++++++++++++++++++++++++++++++++++-------------- 2 files changed, 46 insertions(+), 20 deletions(-) diff --git a/debian/changelog b/debian/changelog index 025a092..d6dcd6a 100644 --- a/debian/changelog +++ b/debian/changelog @@ -1,12 +1,13 @@ -ca-certificates (20151022) UNRELEASED; urgency=medium +ca-certificates (20151124) UNRELEASED; urgency=medium * debian/{compat,control}: Updated d/compat to version 9 and updated Build-Depends. * debian/postinst: Handle /usr/local/share/ca-certificates permissions and ownership on upgrade. Closes: #611501 - * mozilla/{certdata.txt,nssckbi.h}: - Update Mozilla certificate authority bundle to version 2.5. + * mozilla/certdata2pem.py: + Add Python 3 support to ca-certificates. + Thanks to Andrew Wilcox and Richard Ipsum for the patch! Closes: #789753 * mozilla/{certdata.txt,nssckbi.h}: Update Mozilla certificate authority bundle to version 2.5. The following certificate authorities were added (+): @@ -21,7 +22,7 @@ ca-certificates (20151022) UNRELEASED; urgency=medium - "TC TrustCenter Universal CA I" - "TURKTRUST Certificate Services Provider Root 1" - -- Michael Shuler Thu, 22 Oct 2015 17:09:46 -0500 + -- Michael Shuler Tue, 24 Nov 2015 22:34:53 -0600 ca-certificates (20150426) unstable; urgency=medium diff --git a/mozilla/certdata2pem.py b/mozilla/certdata2pem.py index 0482894..7bd4d2d 100644 --- a/mozilla/certdata2pem.py +++ b/mozilla/certdata2pem.py @@ -25,13 +25,19 @@ import os.path import re import sys import textwrap +import io objects = [] # Dirty file parser. 
in_data, in_multiline, in_obj = False, False, False field, type, value, obj = None, None, None, dict() -for line in open('certdata.txt', 'r'): + +# Python 3 will not let us decode non-ascii characters if we +# have not specified an encoding, but Python 2's open does not +# have an option to set the encoding. Python 3's open is io.open +# and io.open has been backported to Python 2.6 and 2.7, so use io.open. +for line in io.open('certdata.txt', 'rt', encoding='utf8'): # Ignore the file header. if not in_data: if line.startswith('BEGINDATA'): @@ -53,7 +59,7 @@ for line in open('certdata.txt', 'r'): if type == 'MULTILINE_OCTAL': line = line.strip() for i in re.finditer(r'\\([0-3][0-7][0-7])', line): - value += chr(int(i.group(1), 8)) + value.append(int(i.group(1), 8)) else: value += line continue @@ -70,13 +76,13 @@ for line in open('certdata.txt', 'r'): field, type = line_parts value = None else: - raise NotImplementedError, 'line_parts < 2 not supported.' + raise NotImplementedError('line_parts < 2 not supported.') if type == 'MULTILINE_OCTAL': in_multiline = True - value = "" + value = bytearray() continue obj[field] = value -if len(obj.items()) > 0: +if len(obj) > 0: objects.append(obj) # Read blacklist. @@ -95,7 +101,7 @@ for obj in objects: if obj['CKA_CLASS'] not in ('CKO_NETSCAPE_TRUST', 'CKO_NSS_TRUST'): continue if obj['CKA_LABEL'] in blacklist: - print "Certificate %s blacklisted, ignoring." % obj['CKA_LABEL'] + print("Certificate %s blacklisted, ignoring." 
% obj['CKA_LABEL']) elif obj['CKA_TRUST_SERVER_AUTH'] in ('CKT_NETSCAPE_TRUSTED_DELEGATOR', 'CKT_NSS_TRUSTED_DELEGATOR'): trust[obj['CKA_LABEL']] = True @@ -104,13 +110,13 @@ for obj in objects: trust[obj['CKA_LABEL']] = True elif obj['CKA_TRUST_SERVER_AUTH'] in ('CKT_NETSCAPE_UNTRUSTED', 'CKT_NSS_NOT_TRUSTED'): - print '!'*74 - print "UNTRUSTED BUT NOT BLACKLISTED CERTIFICATE FOUND: %s" % obj['CKA_LABEL'] - print '!'*74 + print('!'*74) + print("UNTRUSTED BUT NOT BLACKLISTED CERTIFICATE FOUND: %s" % obj['CKA_LABEL']) + print('!'*74) else: - print "Ignoring certificate %s. SAUTH=%s, EPROT=%s" % \ + print("Ignoring certificate %s. SAUTH=%s, EPROT=%s" % \ (obj['CKA_LABEL'], obj['CKA_TRUST_SERVER_AUTH'], - obj['CKA_TRUST_EMAIL_PROTECTION']) + obj['CKA_TRUST_EMAIL_PROTECTION'])) for obj in objects: if obj['CKA_CLASS'] == 'CKO_CERTIFICATE': @@ -121,13 +127,32 @@ for obj in objects: .replace('(', '=')\ .replace(')', '=')\ .replace(',', '_') - bname = bname.decode('string_escape') - fname = bname + '.crt' + + # this is the only way to decode the way NSS stores multi-byte UTF-8 + # and we need an escaped string for checking existence of things + # otherwise we're dependent on the user's current locale. + if bytes != str: + # We're in python 3, convert the utf-8 string to a + # sequence of bytes that represents this utf-8 string + # then encode the byte-sequence as an escaped string that + # can be passed to open() and os.path.exists() + bname = bname.encode('utf-8').decode('unicode_escape').encode('latin-1') + else: + # Python 2 + # Convert the unicode string back to its original byte form + # (contents of files returned by io.open are returned as + # unicode strings) + # then to an escaped string that can be passed to open() + # and os.path.exists() + bname = bname.encode('utf-8').decode('string_escape') + + fname = bname + b'.crt' if os.path.exists(fname): - print "Found duplicate certificate name %s, renaming." 
% bname - fname = bname + '_2.crt' + print("Found duplicate certificate name %s, renaming." % bname) + fname = bname + b'_2.crt' f = open(fname, 'w') f.write("-----BEGIN CERTIFICATE-----\n") - f.write("\n".join(textwrap.wrap(base64.b64encode(obj['CKA_VALUE']), 64))) + encoded = base64.b64encode(obj['CKA_VALUE']).decode('utf-8') + f.write("\n".join(textwrap.wrap(encoded, 64))) f.write("\n-----END CERTIFICATE-----\n") -- cgit v1.2.1