summary | refs | log | tree | commit | diff | stats
path: root/Lib/mimify.py
diff options
context:
space:
mode:
author: Sjoerd Mullender <sjoerd@acm.org> 1996-02-14 10:40:03 (GMT)
committer: Sjoerd Mullender <sjoerd@acm.org> 1996-02-14 10:40:03 (GMT)
commit: e8a0a5c92a9fbfe0816a592d857cd75e7a875092 (patch)
tree: 1bb97a168b7dcc251a227ddad01ad8f8981db57b /Lib/mimify.py
parent: 5416e200375537b3559caa6f5722780844fbd9fe (diff)
download: cpython-e8a0a5c92a9fbfe0816a592d857cd75e7a875092.zip
cpython-e8a0a5c92a9fbfe0816a592d857cd75e7a875092.tar.gz
cpython-e8a0a5c92a9fbfe0816a592d857cd75e7a875092.tar.bz2
Module to convert a mail message to or from quoted-printable. The
message may consist of several MIME parts, in which case each part is converted independently of the others. A part is only converted when necessary.
Diffstat (limited to 'Lib/mimify.py')
-rwxr-xr-x Lib/mimify.py 415
1 files changed, 415 insertions, 0 deletions
diff --git a/Lib/mimify.py b/Lib/mimify.py
new file mode 100755
index 0000000..1582199
--- /dev/null
+++ b/Lib/mimify.py
@@ -0,0 +1,415 @@
#!/usr/local/bin/python

'''Mimification and unmimification of mail messages.

Decode quoted-printable parts of a mail message or encode using
quoted-printable.

Usage:
    mimify(input, output)
    unmimify(input, output)
to encode and decode respectively.  Input and output may be the name
of a file or an open file object.  Only a readline() method is used
on the input file, only a write() method is used on the output file.
When using file names, the input and output file names may be the
same.

Interactive usage:
    mimify.py [-l len] -e [infile [outfile]]
    mimify.py [-l len] -d [infile [outfile]]
to encode and decode respectively.  Infile defaults to standard
input and outfile to standard output.  The -l option replaces MAXLEN,
the line length above which a body is encoded as quoted-printable.
'''

# Configure
MAXLEN = 200            # if lines longer than this, encode as quoted-printable
CHARSET = 'ISO-8859-1'  # default charset for non-US-ASCII mail
QUOTE = '> '            # string replies are quoted with
# End configure
+
+import regex, regsub, string
+
# Patterns for recognising header lines.  They use the syntax of the old
# 'regex' module, where \( \) group and \| alternates.  The [\000-\377]*
# runs accept any character at all, so a pattern can also span the
# newlines embedded in a folded (multi-line) header.

# Content-Transfer-Encoding header that announces quoted-printable
qp = regex.compile('^content-transfer-encoding:[\000-\377]*quoted-printable',
                   regex.casefold)
# multipart Content-Type header; group 1 is the boundary string
mp = regex.compile('^content-type:[\000-\377]*multipart/[\000-\377]*boundary="?\\([^;"\n]*\\)',
                   regex.casefold)
# Content-Type header with a quoted charset: group 1 is the text up to and
# including the opening quote, group 2 the charset name, group 3 the rest
chrset = regex.compile('^\\(content-type:.*charset="\\)\\(us-ascii\\|iso-8859-[0-9]+\\)\\("[\000-\377]*\\)',
                       regex.casefold)
# end of the header: an empty line or a line consisting of dashes only
he = regex.compile('^-*$')
# one =XX escape; group 1 is the two hex digits
mime_code = regex.compile('=\\([0-9a-f][0-9a-f]\\)', regex.casefold)
# one =?iso-8859-1?q?...?= encoded word; group 1 is the encoded text
mime_head = regex.compile('=\\?iso-8859-1\\?q\\?\\([^?]+\\)\\?=',
                          regex.casefold)
# subject line of a reply ("Subject: Re: ...")
repl = regex.compile('^subject:[ \t]+re: ', regex.casefold)
+
class File:
    '''A simple fake file object that knows about limited
    read-ahead and boundaries.
    The only supported method is readline().

    readline() hands out the lines of the wrapped file until it meets
    the boundary line (boundary + newline) or the closing boundary line
    (boundary + '--' + newline).  That line is not returned; it is kept
    in self.peek and readline() returns '' from then on, so that the
    reader sees an end of file at the end of the current part.'''

    def __init__(self, file, boundary):
        # file: any object with a readline() method
        # boundary: boundary line without its newline, or None/'' when
        #           the input is not delimited
        self.file = file
        self.boundary = boundary
        # the boundary line that ended this part; None while none was seen
        self.peek = None

    def readline(self):
        '''Return the next line of the part, or '' at its end.'''
        if self.peek is not None:
            # the boundary was already reached: stay at "end of file"
            return ''
        line = self.file.readline()
        if not line:
            # real end of the underlying file
            return line
        if self.boundary and line in (self.boundary + '\n',
                                      self.boundary + '--\n'):
            # remember which boundary line ended the part
            self.peek = line
            return ''
        return line
+
class HeaderFile:
    '''File wrapper whose readline() returns complete header lines.

    A header line that is continued on following lines (lines starting
    with a space or a tab) is returned as one string with the newlines
    still embedded.  This needs one line of read-ahead, which is kept
    in self.peek between calls.  The only supported method is
    readline().'''

    def __init__(self, file):
        # file: any object with a readline() method
        self.file = file
        # line read ahead but not yet returned; None when there is none
        self.peek = None

    def readline(self):
        '''Return the next unfolded header line, or '' at end of file.'''
        if self.peek is not None:
            # use the line read ahead by the previous call
            line = self.peek
            self.peek = None
        else:
            line = self.file.readline()
        if not line:
            return line
        if he.match(line) >= 0:
            # the end-of-header line is never continued
            return line
        while 1:
            self.peek = self.file.readline()
            if len(self.peek) == 0 or \
               (self.peek[0] != ' ' and self.peek[0] != '\t'):
                # end of file or the start of the next header line;
                # it stays in self.peek for the next call
                return line
            # continuation line: glue it to the current header
            line = line + self.peek
            self.peek = None
+
def mime_decode(line):
    '''Decode a single line of quoted-printable text to 8bit.

    Every =XX escape (two hexadecimal digits, either case) is replaced
    by the character with that code; all other text is copied
    unchanged.  Returns the decoded string.'''
    newline = ''
    while 1:
        # index of the next escape, or -1 when there is none left
        i = mime_code.search(line)
        if i < 0:
            break
        newline = newline + line[:i] + \
                  chr(string.atoi(mime_code.group(1), 16))
        # skip the three characters of the escape
        line = line[i+3:]
    return newline + line
+
def mime_decode_header(line):
    '''Decode a header line to 8bit.

    Every encoded word matched by mime_head (=?iso-8859-1?q?...?=) is
    replaced by its decoded text; the rest of the line is copied
    unchanged.  Returns the decoded string.'''
    newline = ''
    while 1:
        i = mime_head.search(line)
        if i < 0:
            break
        # match[0] is the whole encoded word, match[1] the encoded text
        match = mime_head.group(0, 1)
        newline = newline + line[:i] + mime_decode(match[1])
        line = line[i + len(match[0]):]
    return newline + line
+
def unmimify_part(ifile, ofile):
    '''Convert a quoted-printable part of a MIME mail message to 8bit.

    ifile is a File object positioned at the start of the part's
    header; ofile is any object with a write() method.  The header is
    copied with its encoded words decoded, and a quoted-printable
    Content-Transfer-Encoding header is dropped.  The body is copied
    and, when that header was present, decoded.  The sub-parts of a
    multipart body are converted by recursive calls.'''
    multipart = None
    quoted_printable = 0
    # When the boundary itself starts with the reply quote string, the
    # whole part was quoted in a reply: strip that prefix before looking
    # at a line and put it back when writing the line.
    if ifile.boundary and ifile.boundary[:len(QUOTE)] == QUOTE:
        prefix = QUOTE
    else:
        prefix = ''

    # read header
    hfile = HeaderFile(ifile)
    while 1:
        line = hfile.readline()
        if not line:
            return
        if prefix and line[:len(prefix)] == prefix:
            line = line[len(prefix):]
            pref = prefix
        else:
            pref = ''
        line = mime_decode_header(line)
        if qp.match(line) >= 0:
            quoted_printable = 1
            continue        # skip this header
        ofile.write(pref + line)
        if mp.match(line) >= 0:
            multipart = '--' + mp.group(1)
        if he.match(line) >= 0:
            break

    # read body
    while 1:
        line = ifile.readline()
        if not line:
            return
        # strip the =?iso-8859-1?q?...?= wrapper from encoded words; the
        # =XX escapes inside are only decoded below, and only when the
        # part is quoted-printable
        line = regsub.gsub(mime_head, '\\1', line)
        if prefix and line[:len(prefix)] == prefix:
            line = line[len(prefix):]
            pref = prefix
        else:
            pref = ''
        while multipart:
            if line == multipart + '--\n':
                # closing boundary: the multipart section is finished
                ofile.write(pref + line)
                multipart = None
                line = None
                break
            if line == multipart + '\n':
                # boundary between parts: convert the part that follows
                ofile.write(pref + line)
                nifile = File(ifile, multipart)
                unmimify_part(nifile, ofile)
                # the boundary line that ended the sub-part, or None
                line = nifile.peek
                if not line:
                    # premature end of file inside the sub-part
                    break
                continue
            # not a boundary between parts
            break
        if line and quoted_printable:
            # a trailing '=' is a soft line break: join with the next line
            while line[-2:] == '=\n':
                line = line[:-2]
                newline = ifile.readline()
                if newline[:len(QUOTE)] == QUOTE:
                    newline = newline[len(QUOTE):]
                line = line + newline
            line = mime_decode(line)
        if line:
            ofile.write(pref + line)
+
def unmimify(infile, outfile):
    '''Convert quoted-printable parts of a MIME mail message to 8bit.

    infile and outfile are each either a file name or an open file
    object (readline() is used on the input, write() and flush() on the
    output).  When both are the same file name, the original file is
    first renamed to the same name with a ',' in front, so that it is
    kept as a backup while the new contents are written.

    Files opened here from a name are closed again before returning,
    also when the conversion fails; file objects passed in by the
    caller are only flushed.'''
    opened = []             # files opened here, to be closed again
    if type(infile) == type(''):
        ifile = open(infile)
        opened.append(ifile)
        if type(outfile) == type('') and infile == outfile:
            import os
            dirname, basename = os.path.split(infile)
            os.rename(infile, os.path.join(dirname, ',' + basename))
    else:
        ifile = infile
    try:
        if type(outfile) == type(''):
            ofile = open(outfile, 'w')
            opened.append(ofile)
        else:
            ofile = outfile
        nifile = File(ifile, None)
        unmimify_part(nifile, ofile)
        ofile.flush()
    finally:
        for fp in opened:
            fp.close()
+
# Characters that mime_encode() writes as =XX escapes.  Besides '=' (and
# '?' in headers, where it delimits encoded words) this is every octet
# from DEL (\177) upward: quoted-printable allows only printable ASCII to
# appear literally, so the octets \177-\237 have to be escaped as well,
# not just \240-\377.  Whether a body gets encoded at all is decided
# elsewhere (iso_char and MAXLEN in mimify_part).
mime_char = regex.compile('[=\177-\377]')           # quote these chars in body
mime_header_char = regex.compile('[=?\177-\377]')   # quote these in header
+
def mime_encode(line, header):
    '''Code a single line as quoted-printable.
    If header is set, quote some extra characters.

    line is the text to encode, including its newline if it has one.
    Every character matched by mime_char (mime_header_char when header
    is true) becomes an =XX escape with upper-case hex digits.  The
    result is then broken with soft line breaks ('=' + newline) into
    pieces of at most 74 characters.  Returns the encoded string.'''
    if header:
        reg = mime_header_char
    else:
        reg = mime_char
    newline = ''
    if len(line) >= 5 and line[:5] == 'From ':
        # quote 'From ' at the start of a line for stupid mailers
        newline = string.upper('=%02x' % ord('F'))
        line = line[1:]
    while 1:
        i = reg.search(line)
        if i < 0:
            break
        newline = newline + line[:i] + \
                  string.upper('=%02x' % ord(line[i]))
        line = line[i+1:]
    line = newline + line

    # fold long lines
    newline = ''
    while len(line) >= 75:
        i = 73
        # back up so that an =XX escape is never split over two lines
        while line[i] == '=' or line[i-1] == '=':
            i = i - 1
        i = i + 1
        newline = newline + line[:i] + '=\n'
        line = line[i:]
    return newline + line
+
# A word in a header that contains at least one character in the range
# \240-\377.  Group 1 is the delimiter before the word (space, tab or
# '('), group 2 the word itself, group 3 the delimiter after it (space,
# tab, ')' or the end of the line).
mime_header = regex.compile('\\([ \t(]\\)\\([-a-zA-Z0-9_+]*[\240-\377][-a-zA-Z0-9_+\240-\377]*\\)\\([ \t)]\\|$\\)')

def mime_encode_header(line):
    '''Code a single header line as quoted-printable.

    Every word matched by mime_header is replaced by an encoded word
    =?CHARSET?Q?...?= whose text comes from mime_encode(); the
    delimiters around the word and the rest of the line are copied
    unchanged.  Returns the encoded string.'''
    newline = ''
    while 1:
        i = mime_header.search(line)
        if i < 0:
            break
        newline = newline + line[:i] + mime_header.group(1) + \
                  '=?' + CHARSET + '?Q?' + \
                  mime_encode(mime_header.group(2), 1) + \
                  '?=' + mime_header.group(3)
        # continue after the whole match, delimiters included
        line = line[i+len(mime_header.group(0)):]
    return newline + line
+
# Patterns used by mimify_part().
# Mime-Version header
mv = regex.compile('^mime-version:', regex.casefold)
# any Content-Transfer-Encoding header, whatever the encoding
cte = regex.compile('^content-transfer-encoding:', regex.casefold)
# a character in the range \240-\377; its presence makes encoding necessary
iso_char = regex.compile('[\240-\377]')
+
def mimify_part(ifile, ofile, is_mime):
    '''Convert an 8bit part of a MIME mail message to quoted-printable.

    ifile is a File object positioned at the start of the part's
    header; ofile is any object with a write() method.  is_mime is
    true when a Mime-Version header is already known to be present
    (always the case for the sub-parts of a multipart message).

    The header and the body up to the first boundary are read
    completely before anything is written, because whether and how to
    encode depends on what the body contains: it is encoded when it
    holds a character matched by iso_char or a line longer than MAXLEN.
    The sub-parts of a multipart body are converted by recursive
    calls.'''
    has_cte = is_qp = 0
    multipart = None
    must_quote_body = must_quote_header = has_iso_chars = 0

    header = []
    header_end = ''
    message = []
    message_end = ''
    # read header
    hfile = HeaderFile(ifile)
    while 1:
        line = hfile.readline()
        if not line:
            break
        if not must_quote_header and iso_char.search(line) >= 0:
            must_quote_header = 1
        if mv.match(line) >= 0:
            is_mime = 1
        if cte.match(line) >= 0:
            has_cte = 1
            if qp.match(line) >= 0:
                is_qp = 1
        if mp.match(line) >= 0:
            multipart = '--' + mp.group(1)
        if he.match(line) >= 0:
            header_end = line
            break
        header.append(line)

    # read body
    while 1:
        line = ifile.readline()
        if not line:
            break
        if multipart:
            if line == multipart + '--\n':
                message_end = line
                break
            if line == multipart + '\n':
                message_end = line
                break
        if is_qp:
            # already quoted-printable: decode first, so that the text
            # is judged (and re-encoded) in its 8bit form
            while line[-2:] == '=\n':
                line = line[:-2]
                newline = ifile.readline()
                if newline[:len(QUOTE)] == QUOTE:
                    newline = newline[len(QUOTE):]
                line = line + newline
            line = mime_decode(line)
        message.append(line)
        if not has_iso_chars:
            if iso_char.search(line) >= 0:
                has_iso_chars = must_quote_body = 1
        if not must_quote_body:
            if len(line) > MAXLEN:
                must_quote_body = 1

    # convert and output header and body
    for line in header:
        if must_quote_header:
            line = mime_encode_header(line)
        if chrset.match(line) >= 0:
            if has_iso_chars:
                # change us-ascii into iso-8859-1
                if string.lower(chrset.group(2)) == 'us-ascii':
                    line = chrset.group(1) + \
                           CHARSET + chrset.group(3)
            else:
                # change iso-8859-* into us-ascii
                line = chrset.group(1) + 'us-ascii' + chrset.group(3)
        if has_cte and cte.match(line) >= 0:
            line = 'Content-Transfer-Encoding: '
            if must_quote_body:
                line = line + 'quoted-printable\n'
            else:
                line = line + '7bit\n'
        ofile.write(line)
    if (must_quote_header or must_quote_body) and not is_mime:
        ofile.write('Mime-Version: 1.0\n')
        ofile.write('Content-Type: text/plain; ')
        if has_iso_chars:
            ofile.write('charset="%s"\n' % CHARSET)
        else:
            ofile.write('charset="us-ascii"\n')
    if must_quote_body and not has_cte:
        ofile.write('Content-Transfer-Encoding: quoted-printable\n')
    ofile.write(header_end)

    for line in message:
        if must_quote_body:
            line = mime_encode(line, 0)
        ofile.write(line)
    ofile.write(message_end)

    # convert the sub-parts of a multipart message
    line = message_end
    while multipart:
        if line == multipart + '\n':
            nifile = File(ifile, multipart)
            mimify_part(nifile, ofile, 1)
            # the boundary line that ended the sub-part, or None
            line = nifile.peek
            if not line:
                # premature end of file inside the sub-part
                break
            ofile.write(line)
            continue
        # Either the closing boundary was seen or the input ended
        # without any boundary line.  Copy whatever is left of this
        # part; this always ends, because readline() returns '' at the
        # end of the file and at the enclosing part's boundary.
        while 1:
            line = ifile.readline()
            if not line:
                return
            if must_quote_body:
                line = mime_encode(line, 0)
            ofile.write(line)
+
def mimify(infile, outfile):
    '''Convert 8bit parts of a MIME mail message to quoted-printable.

    infile and outfile are each either a file name or an open file
    object (readline() is used on the input, write() and flush() on the
    output).  When both are the same file name, the original file is
    first renamed to the same name with a ',' in front, so that it is
    kept as a backup while the new contents are written.

    Files opened here from a name are closed again before returning,
    also when the conversion fails; file objects passed in by the
    caller are only flushed.'''
    opened = []             # files opened here, to be closed again
    if type(infile) == type(''):
        ifile = open(infile)
        opened.append(ifile)
        if type(outfile) == type('') and infile == outfile:
            import os
            dirname, basename = os.path.split(infile)
            os.rename(infile, os.path.join(dirname, ',' + basename))
    else:
        ifile = infile
    try:
        if type(outfile) == type(''):
            ofile = open(outfile, 'w')
            opened.append(ofile)
        else:
            ofile = outfile
        nifile = File(ifile, None)
        mimify_part(nifile, ofile, 0)
        ofile.flush()
    finally:
        for fp in opened:
            fp.close()
+
+import sys
# Command-line driver.  Runs when the file is executed as a script, or
# when the program was started under the name 'mimify'.
if __name__ == '__main__' or (len(sys.argv) > 0 and sys.argv[0] == 'mimify'):
    import getopt
    usage = 'Usage: mimify [-l len] -[ed] [infile [outfile]]'

    try:
        opts, args = getopt.getopt(sys.argv[1:], 'l:ed')
    except getopt.error:
        # unknown option or missing option argument
        print(usage)
        sys.exit(1)
    if len(args) not in (0, 1, 2):
        print(usage)
        sys.exit(1)
    # exactly one of -e and -d must be given
    if (('-e', '') in opts) == (('-d', '') in opts):
        print(usage)
        sys.exit(1)
    for o, a in opts:
        if o == '-e':
            encode = mimify
        elif o == '-d':
            encode = unmimify
        elif o == '-l':
            # replaces the module-level MAXLEN used by mimify_part()
            try:
                MAXLEN = string.atoi(a)
            except (string.atoi_error, ValueError):
                # the argument of -l is not a number
                print(usage)
                sys.exit(1)
    if len(args) == 0:
        encode(sys.stdin, sys.stdout)
    elif len(args) == 1:
        encode(args[0], sys.stdout)
    else:
        encode(args[0], args[1])