source: trunk/essentials/dev-lang/python/Lib/email/base64mime.py@ 3226

Last change on this file since 3226 was 3225, checked in by bird, 19 years ago

Python 2.5

File size: 5.7 KB
Line 
1# Copyright (C) 2002-2006 Python Software Foundation
2# Author: Ben Gertzfield
3# Contact: [email protected]
4
5"""Base64 content transfer encoding per RFCs 2045-2047.
6
7This module handles the content transfer encoding method defined in RFC 2045
8to encode arbitrary 8-bit data using the three 8-bit bytes in four 7-bit
9characters encoding known as Base64.
10
11It is used in the MIME standards for email to attach images, audio, and text
12using some 8-bit character sets to messages.
13
14This module provides an interface to encode and decode both headers and bodies
15with Base64 encoding.
16
17RFC 2047 defines a method for including character set information in an
18`encoded-word' in a header. This method is commonly used for 8-bit real names
19in To:, From:, Cc:, etc. fields, as well as Subject: lines.
20
21This module does not do the line wrapping or end-of-line character conversion
22necessary for proper internationalized headers; it only does dumb encoding and
23decoding. To deal with the various line wrapping issues, use the email.Header
24module.
25"""
26
# Public names of this module (what a star-import exposes).
__all__ = [
    # Helpers
    'base64_len',
    # Body/string codecs together with their compatibility aliases
    'body_decode', 'body_encode',
    'decode', 'decodestring',
    'encode', 'encodestring',
    # Header codec
    'header_encode',
]
37
38import re
39
40from binascii import b2a_base64, a2b_base64
41from email.utils import fix_eols
42
# String constants shared by the encoders and decoders below.
EMPTYSTRING = ''
NL = '\n'
CRLF = '\r\n'

# See also Charset.py
# Number of characters of RFC chrome that header_encode() wraps around each
# encoded chunk, not counting the charset name itself.
MISC_LEN = len('=?') + len('?b?') + len('?=')
49
50
51
52
53# Helpers
def base64_len(s):
    """Return the number of characters s occupies once base64-encoded.

    Base64 emits four output characters for every group of three input
    bytes; a trailing partial group (one or two bytes) is padded out to a
    full four characters as well.
    """
    # Ceiling division: round len(s) up to a whole number of 3-byte groups.
    return 4 * ((len(s) + 2) // 3)
63
64
65
66
def header_encode(header, charset='iso-8859-1', keep_eols=False,
                  maxlinelen=76, eol=NL):
    """Encode a single header line with Base64 encoding in a given charset.

    The header is cut into chunks and every chunk is emitted as one
    encoded-word using the "b" (Base64) encoding.  Each chunk is a whole
    number of 3-byte groups, so an encoded-word never grows past the space
    reserved for it and only the final one can carry "=" padding.
    Continuation lines start with a space.

    charset names the character set to use to encode the header.  It defaults
    to iso-8859-1.

    End-of-line characters (\\r, \\n, \\r\\n) will be automatically converted
    to the canonical email line separator \\r\\n unless the keep_eols
    parameter is True (the default is False).

    Each line of the header will be terminated in the value of eol, which
    defaults to "\\n".  Set this to "\\r\\n" if you are using the result of
    this function directly in email.

    The resulting string will be in the form:

    "=?charset?b?WW/5ciBtYXp66XLrIHf8eiBhIGhhbXBzdGHuciBBIFlv+XIgbWF6euly?=\\n
     =?charset?b?6yB3/HogYSBoYW1wc3Rh7nIgQkMgWW/5ciBtYXp66XLrIHf8eiBhIGhh?="

    with each line wrapped at, at most, maxlinelen characters (defaults to 76
    characters).  If maxlinelen is too small to hold the RFC chrome, the
    charset name and at least four Base64 characters, the limit cannot be
    honoured; each line then carries a single 3-byte group rather than
    failing or dropping the header text.

    An empty header is returned unchanged.
    """
    # Return empty headers unchanged
    if not header:
        return header

    if not keep_eols:
        header = fix_eols(header)

    # Room left for Base64 text on a line once the RFC chrome ("=?", the
    # charset name, "?b?" and "?=") has been accounted for.
    max_encoded = maxlinelen - len(charset) - MISC_LEN
    # Base64 turns every 3-byte group -- even a partial one -- into four
    # characters, so only whole groups may be counted against max_encoded;
    # rounding any other way overshoots the line length.  Never go below one
    # group: a zero or negative step would make range() raise or yield
    # nothing at all.
    max_unencoded = max(3, (max_encoded // 4) * 3)

    # NOTE: chunks are cut at fixed offsets without any knowledge of the
    # charset.
    lines = []
    for i in range(0, len(header), max_unencoded):
        encoded = b2a_base64(header[i:i + max_unencoded])
        # b2a_base64() appends a newline, which must stay out of the
        # encoded-word.
        if encoded.endswith(NL):
            encoded = encoded[:-1]
        # Add the chrome
        lines.append('=?%s?b?%s?=' % (charset, encoded))
    # Glue the lines together and return it.  BAW: should we be able to
    # specify the leading whitespace in the joiner?
    joiner = eol + ' '
    return joiner.join(lines)
122
123
124
125
def encode(s, binary=True, maxlinelen=76, eol=NL):
    """Encode a string with base64.

    Each line will be wrapped at, at most, maxlinelen characters (defaults to
    76 characters).  Input is consumed in whole 3-byte groups per line, so a
    line never exceeds maxlinelen and "=" padding can only appear at the very
    end of the output.  A maxlinelen below 4 cannot be honoured (one group
    already needs four characters); lines are then four characters long.

    If binary is False, end-of-line characters will be converted to the
    canonical email end-of-line sequence \\r\\n.  Otherwise they will be left
    verbatim (this is the default).

    Each line of encoded text will end with eol, which defaults to "\\n".  Set
    this to "\\r\\n" if you will be using the result of this function directly
    in an email.

    An empty s is returned unchanged.
    """
    if not s:
        return s

    if not binary:
        s = fix_eols(s)

    # Largest whole number of 3-byte groups whose encoding (4 characters per
    # group) fits in maxlinelen.  Clamp to one group so that range() never
    # gets a zero or negative step.
    max_unencoded = max(3, (maxlinelen // 4) * 3)

    encvec = []
    for i in range(0, len(s), max_unencoded):
        # BAW: should encode() inherit b2a_base64()'s dubious behavior in
        # adding a newline to the encoded string?
        enc = b2a_base64(s[i:i + max_unencoded])
        # Swap the newline b2a_base64() appended for the requested eol.
        if enc.endswith(NL) and eol != NL:
            enc = enc[:-1] + eol
        encvec.append(enc)
    return EMPTYSTRING.join(encvec)
156
157
# For convenience and backwards compatibility w/ standard base64 module:
# both names are plain aliases of encode().
body_encode = encodestring = encode
161
162
163
164
def decode(s, convert_eols=None):
    """Decode a raw base64 string.

    When convert_eols is a non-empty string, every canonical email line
    ending ("\\r\\n") found in the decoded text is replaced by that string.
    os.linesep is a good choice for convert_eols if you are decoding a text
    attachment.

    An empty s is handed back unchanged.

    This function does not parse a full MIME header value encoded with
    base64 (like =?iso-8859-1?b?bmloISBuaWgh?=) -- please use the high
    level email.Header class for that functionality.
    """
    if s:
        decoded = a2b_base64(s)
        if not convert_eols:
            return decoded
        # Translate the canonical CRLF into the caller's line ending.
        return decoded.replace(CRLF, convert_eols)
    # Nothing to decode.
    return s
184
185
# For convenience and backwards compatibility w/ standard base64 module:
# both names are plain aliases of decode().
body_decode = decodestring = decode
Note: See TracBrowser for help on using the repository browser.