# Copyright (C) 2002-2007 Python Software Foundation
# Author: Ben Gertzfield
# Contact: email-sig@python.org

"""Base64 content transfer encoding per RFCs 2045-2047.

This module handles the content transfer encoding method defined in RFC 2045
to encode arbitrary 8-bit data using the three 8-bit bytes in four 7-bit
characters encoding known as Base64.

It is used in the MIME standards for email to attach images, audio, and text
using some 8-bit character sets to messages.

This module provides an interface to encode and decode both headers and bodies
with Base64 encoding.

RFC 2047 defines a method for including character set information in an
`encoded-word' in a header.  This method is commonly used for 8-bit real names
in To:, From:, Cc:, etc. fields, as well as Subject: lines.

This module does not do the line wrapping or end-of-line character conversion
necessary for proper internationalized headers; it only does dumb encoding and
decoding.  To deal with the various line wrapping issues, use the email.header
module.
"""

__all__ = [
    'body_decode',
    'body_encode',
    'decode',
    'decodestring',
    'header_encode',
    'header_length',
    ]


from base64 import b64encode
from binascii import b2a_base64, a2b_base64

CRLF = '\r\n'
NL = '\n'
EMPTYSTRING = ''

# See also Charset.py
MISC_LEN = 7


# Helpers
def header_length(bytearray):
    """Return the length of bytearray when it is encoded with base64.

    bytearray may be any sized object; only its len() is used.  The
    parameter name shadows the builtin but is kept so that existing keyword
    callers continue to work.
    """
    groups_of_3, leftover = divmod(len(bytearray), 3)
    # 4 bytes out for each 3 bytes (or nonzero fraction thereof) in.
    n = groups_of_3 * 4
    if leftover:
        n += 4
    return n


def header_encode(header_bytes, charset='iso-8859-1'):
    """Encode a single header line with Base64 encoding in a given charset.

    header_bytes may be a bytes-like object, or a str, in which case it is
    first encoded to bytes using charset.  An empty value yields "".

    charset names the character set to use to encode the header.  It defaults
    to iso-8859-1.  Base64 encoding is defined in RFC 2045.

    The result has the form '=?<charset>?b?<base64 text>?='.
    """
    if not header_bytes:
        return ""
    if isinstance(header_bytes, str):
        header_bytes = header_bytes.encode(charset)
    encoded = b64encode(header_bytes).decode("ascii")
    return '=?%s?b?%s?=' % (charset, encoded)


def body_encode(s, maxlinelen=76, eol=NL):
    r"""Encode a bytes-like object with base64, returning a str.

    Each line will be wrapped at, at most, maxlinelen characters (defaults to
    76 characters), not counting the line terminator.  A base64 group is four
    characters long, so the effective line length is maxlinelen rounded down
    to a multiple of 4, and never less than 4.

    Each line of encoded text will end with eol, which defaults to "\n".  Set
    this to "\r\n" if you will be using the result of this function directly
    in an email.

    An empty s yields "".
    """
    if not s:
        return ""

    # Each line must carry a whole number of 3-byte groups.  Otherwise every
    # line would end in "=" padding, which both overshoots maxlinelen and
    # makes a2b_base64() stop decoding at the end of the first line.  The
    # floor of one group per line also keeps the range() step positive.
    max_unencoded = max(3, maxlinelen // 4 * 3)

    encvec = []
    for i in range(0, len(s), max_unencoded):
        # b2a_base64() always appends "\n" to its output; swap it for the
        # requested terminator when that differs.
        enc = b2a_base64(s[i:i + max_unencoded]).decode("ascii")
        if enc.endswith(NL) and eol != NL:
            enc = enc[:-1] + eol
        encvec.append(enc)
    return EMPTYSTRING.join(encvec)


def decode(string):
    """Decode a raw base64 string, returning a bytes object.

    string may be a str or a bytes-like object.  A str is converted to bytes
    with the raw-unicode-escape codec before decoding.  An empty value yields
    an empty bytes object.

    This function does not parse a full MIME header value encoded with
    base64 (like =?iso-8859-1?b?bmloISBuaWgh?=) -- please use the high
    level email.header class for that functionality.
    """
    if not string:
        return bytes()
    elif isinstance(string, str):
        return a2b_base64(string.encode('raw-unicode-escape'))
    else:
        return a2b_base64(string)


# For convenience and backwards compatibility w/ standard base64 module
body_decode = decode
decodestring = decode