aboutsummaryrefslogtreecommitdiff
diff options
context:
space:
mode:
authorKonstantin Ryabitsev <konstantin@linuxfoundation.org>2021-06-08 16:20:43 -0400
committerKonstantin Ryabitsev <konstantin@linuxfoundation.org>2021-06-08 16:20:43 -0400
commita06304fcd63facb5e6fea86c8ff8ad42430c4439 (patch)
tree2e797a3b19fe44d80dcd3d393caaf41710c1f0a0
parentc45fba464ff3442d7dfa5f65092311b4b8d73757 (diff)
downloadb4-a06304fcd63facb5e6fea86c8ff8ad42430c4439.tar.gz
Perform an encoding bug avoidance dance
This is a kludge that I'm putting in place to avoid hitting an encoding bug with Python. We really shouldn't be making a fake RFC2822 message just so we can parse it again right away, so this is a temporary measure until I refactor how it's done. Signed-off-by: Konstantin Ryabitsev <konstantin@linuxfoundation.org>
-rw-r--r--b4/pr.py11
1 files changed, 10 insertions, 1 deletions
diff --git a/b4/pr.py b/b4/pr.py
index 0dc2bab..f0d990e 100644
--- a/b4/pr.py
+++ b/b4/pr.py
@@ -341,6 +341,8 @@ def explode(gitdir, lmsg, mailfrom=None, retrieve_links=True, fpopts=None):
cmsg.add_header('From', mailfrom)
cmsg.add_header('Subject', '[' + ' '.join(msubj.prefixes) + '] ' + lmsg.subject)
cmsg.add_header('Date', lmsg.msg.get('Date'))
+ cmsg.set_charset('utf-8')
+ cmsg.replace_header('Content-Transfer-Encoding', '8bit')
msg = cmsg
@@ -483,7 +485,14 @@ def get_pr_from_github(ghurl: str):
msg['Message-Id'] = utils.make_msgid(idstring=f'{rproj}-{rrepo}-pr-{rpull}', domain='github.com')
created_at = utils.format_datetime(datetime.strptime(prdata.get('created_at'), '%Y-%m-%dT%H:%M:%SZ'))
msg['Date'] = created_at
- lmsg = b4.LoreMessage(msg)
+ # We are going to turn it into bytes and then parse again
+ # in order to avoid bugs with python's message parsing routines that
+ # end up not doing the right thing when decoding 8bit message bodies
+ msg.set_charset('utf-8')
+ msg.replace_header('Content-Transfer-Encoding', '8bit')
+ bug_avoidance = msg.as_string(policy=b4.emlpolicy).encode()
+ cmsg = email.message_from_bytes(bug_avoidance)
+ lmsg = b4.LoreMessage(cmsg)
lmsg.pr_base_commit = base.get('sha')
lmsg.pr_repo = repo.get('clone_url')
lmsg.pr_ref = head.get('ref')