diff options
author | Barry Warsaw <barry@python.org> | 2015-01-27 15:11:53 -0500 |
---|---|---|
committer | Barry Warsaw <barry@python.org> | 2015-01-27 15:11:53 -0500 |
commit | 96d130e7732f1242d71c65a32412ae56cb229abf (patch) | |
tree | 3fb39ac6dd43988f36507a1c0b82e8944dfe95ff /cloudinit/util.py | |
parent | 6e742d20e9ed56498925c7c850cd5da65d063b4b (diff) | |
download | vyos-cloud-init-96d130e7732f1242d71c65a32412ae56cb229abf.tar.gz vyos-cloud-init-96d130e7732f1242d71c65a32412ae56cb229abf.zip |
Respond to review:
- Refactor "fully" decoding the payload of a text/* part. In Python 3,
decode=True only means to decode according to Content-Transfer-Encoding, not
according to any charset in the Content-Type header. So do that.
Diffstat (limited to 'cloudinit/util.py')
-rw-r--r-- | cloudinit/util.py | 15 |
1 files changed, 15 insertions, 0 deletions
diff --git a/cloudinit/util.py b/cloudinit/util.py index 8916cc11..3a921afe 100644 --- a/cloudinit/util.py +++ b/cloudinit/util.py @@ -110,6 +110,21 @@ def b64e(source): return b64encode(source).decode('utf-8') +def fully_decoded_payload(part): + # In Python 3, decoding the payload will ironically hand us a bytes object. + # 'decode' means to decode according to Content-Transfer-Encoding, not + # according to any charset in the Content-Type. So, if we end up with + # bytes, first try to decode to str via CT charset, and failing that, try + # utf-8 using surrogate escapes. + cte_payload = part.get_payload(decode=True) + if ( six.PY3 and + part.get_content_maintype() == 'text' and + isinstance(cte_payload, bytes)): + charset = part.get_charset() or 'utf-8' + return cte_payload.decode(charset, errors='surrogateescape') + return cte_payload + + # Path for DMI Data DMI_SYS_PATH = "/sys/class/dmi/id" |