summaryrefslogtreecommitdiffstats
diff options
context:
space:
mode:
authorGuido van Rossum <guido@python.org>1996-07-30 16:29:16 (GMT)
committerGuido van Rossum <guido@python.org>1996-07-30 16:29:16 (GMT)
commit3534a8932a26ce1cc67595c7c6f059f7ddc40ddc (patch)
tree83b2673ee62da3bd3bfb052d0b3daaf7d5b0dca7
parent7698d12a8bb3a5b42d89843fd17a8caa8d4153cc (diff)
downloadcpython-3534a8932a26ce1cc67595c7c6f059f7ddc40ddc.zip
cpython-3534a8932a26ce1cc67595c7c6f059f7ddc40ddc.tar.gz
cpython-3534a8932a26ce1cc67595c7c6f059f7ddc40ddc.tar.bz2
New, improved parseaddr() by Sjoerd.
-rw-r--r--Lib/rfc822.py113
1 files changed, 83 insertions, 30 deletions
diff --git a/Lib/rfc822.py b/Lib/rfc822.py
index 64deaec..20abad8 100644
--- a/Lib/rfc822.py
+++ b/Lib/rfc822.py
@@ -297,35 +297,88 @@ def unquote(str):
# Parse an address into (name, address) tuple
def parseaddr(address):
- # This is probably not perfect
- address = string.strip(address)
- # Case 1: part of the address is in <xx@xx> form.
- pos = regex.search('<.*>', address)
- if pos >= 0:
- name = address[:pos]
- address = address[pos:]
- length = regex.match('<.*>', address)
- name = name + address[length:]
- address = address[:length]
- else:
- # Case 2: part of the address is in (comment) form
- pos = regex.search('(.*)', address)
- if pos >= 0:
- name = address[pos:]
- address = address[:pos]
- length = regex.match('(.*)', name)
- address = address + name[length:]
- name = name[:length]
+ import string
+ str = ''
+ email = ''
+ comment = ''
+ backslash = 0
+ dquote = 0
+ space = 0
+ paren = 0
+ bracket = 0
+ seen_bracket = 0
+ for c in address:
+ if backslash:
+ str = str + c
+ backslash = 0
+ continue
+ if c == '\\':
+ backslash = 1
+ continue
+ if dquote:
+ if c == '"':
+ dquote = 0
+ else:
+ str = str + c
+ continue
+ if c == '"':
+ dquote = 1
+ continue
+ if c in string.whitespace:
+ space = 1
+ continue
+ if space:
+ str = str + ' '
+ space = 0
+ if paren:
+ if c == '(':
+ paren = paren + 1
+ str = str + c
+ continue
+ if c == ')':
+ paren = paren - 1
+ if paren == 0:
+ comment = comment + str
+ str = ''
+ continue
+ if c == '(':
+ paren = paren + 1
+ if bracket:
+ email = email + str
+ str = ''
+ elif not seen_bracket:
+ email = email + str
+ str = ''
+ continue
+ if bracket:
+ if c == '>':
+ bracket = 0
+ email = email + str
+ str = ''
+ continue
+ if c == '<':
+ bracket = 1
+ seen_bracket = 1
+ comment = comment + str
+ str = ''
+ email = ''
+ continue
+ if c == '#' and not bracket and not paren:
+ # rest is comment
+ break
+ str = str + c
+ if str:
+ if seen_bracket:
+ if bracket:
+ email = str
+ else:
+ comment = comment + str
else:
- # Case 3: neither. Only an address
- name = ''
- name = string.strip(name)
- address = string.strip(address)
- if address and address[0] == '<' and address[-1] == '>':
- address = address[1:-1]
- if name and name[0] == '(' and name[-1] == ')':
- name = name[1:-1]
- return name, address
+ if paren:
+ comment = comment + str
+ else:
+ email = email + str
+ return string.strip(comment), string.strip(email)
# Parse a date field
@@ -376,8 +429,8 @@ def parsedate(data):
# message in RFC-822 format.
if __name__ == '__main__':
- import sys
- file = '/ufs/guido/Mail/drafts/,1'
+ import sys, os
+ file = os.path.join(os.environ['HOME'], 'Mail/drafts/,1')
if sys.argv[1:]: file = sys.argv[1]
f = open(file, 'r')
m = Message(f)