merge from 3.2

author: Senthil Kumaran <orsenthil@gmail.com> 2011-04-15 10:22:05 (GMT)
committer: Senthil Kumaran <orsenthil@gmail.com> 2011-04-15 10:22:05 (GMT)
commit: b496159603e5cc31904a894166ecce52fea01a1c (patch)
tree: 947788534cea9802e60046e3f74fb0c335999603 /Lib
parent: 0dea6484a05759258151800d0b604ea4820f6bb3 (diff)
parent: b4bd4af8c4adb03978803b5d94241a87e40bdaf9 (diff)
download: cpython-b496159603e5cc31904a894166ecce52fea01a1c.zip
cpython-b496159603e5cc31904a894166ecce52fea01a1c.tar.gz
cpython-b496159603e5cc31904a894166ecce52fea01a1c.tar.bz2
2 files changed, 15 insertions, 5 deletions
diff --git a/Lib/test/test_urlparse.py b/Lib/test/test_urlparse.py
index 628b8ec..c8d572c 100644
--- a/Lib/test/test_urlparse.py
+++ b/Lib/test/test_urlparse.py
@@ -228,6 +228,11 @@ class UrlParseTestCase(unittest.TestCase):
         #self.checkJoin(RFC1808_BASE, 'http:g', 'http:g')
         #self.checkJoin(RFC1808_BASE, 'http:', 'http:')
 
+    def test_RFC2368(self):
+        # Issue 11467: path that starts with a number is not parsed correctly
+        self.assertEqual(urllib.parse.urlparse('mailto:1337@example.org'),
+                ('mailto', '', '1337@example.org', '', '', ''))
+
     def test_RFC2396(self):
         # cases from RFC 2396
 
diff --git a/Lib/urllib/parse.py b/Lib/urllib/parse.py
index 9a3e42e..45ae202 100644
--- a/Lib/urllib/parse.py
+++ b/Lib/urllib/parse.py
@@ -340,12 +340,17 @@ def urlsplit(url, scheme='', allow_fragments=True):
             v = SplitResult(scheme, netloc, url, query, fragment)
             _parse_cache[key] = v
             return _coerce_result(v)
-        if url.endswith(':') or not url[i+1].isdigit():
-            for c in url[:i]:
-                if c not in scheme_chars:
-                    break
-            else:
+        for c in url[:i]:
+            if c not in scheme_chars:
+                break
+        else:
+            try:
+                # make sure "url" is not actually a port number (in which case
+                # "scheme" is really part of the path)
+                _testportnum = int(url[i+1:])
+            except ValueError:
                 scheme, url = url[:i].lower(), url[i+1:]
+
     if url[:2] == '//':
         netloc, url = _splitnetloc(url, 2)
         if (('[' in netloc and ']' not in netloc) or
author	Senthil Kumaran <orsenthil@gmail.com>	2011-04-15 10:22:05 (GMT)
committer	Senthil Kumaran <orsenthil@gmail.com>	2011-04-15 10:22:05 (GMT)
commit	b496159603e5cc31904a894166ecce52fea01a1c (patch)
tree	947788534cea9802e60046e3f74fb0c335999603 /Lib
parent	0dea6484a05759258151800d0b604ea4820f6bb3 (diff)
parent	b4bd4af8c4adb03978803b5d94241a87e40bdaf9 (diff)
download	cpython-b496159603e5cc31904a894166ecce52fea01a1c.zip cpython-b496159603e5cc31904a894166ecce52fea01a1c.tar.gz cpython-b496159603e5cc31904a894166ecce52fea01a1c.tar.bz2