summaryrefslogtreecommitdiffstats
path: root/Lib
diff options
context:
space:
mode:
authorSenthil Kumaran <orsenthil@gmail.com>2010-08-04 04:45:31 (GMT)
committerSenthil Kumaran <orsenthil@gmail.com>2010-08-04 04:45:31 (GMT)
commit0b5019fe2376ed6ef2aaf61ff9cbc8e6b090bc56 (patch)
tree33f9f2f49322aad97d20169ada9767fe8b411d01 /Lib
parent75a292e5be429977656acaf846345be9dc0a6b8e (diff)
downloadcpython-0b5019fe2376ed6ef2aaf61ff9cbc8e6b090bc56.zip
cpython-0b5019fe2376ed6ef2aaf61ff9cbc8e6b090bc56.tar.gz
cpython-0b5019fe2376ed6ef2aaf61ff9cbc8e6b090bc56.tar.bz2
Fix Issue754016 - urlparse goes wrong with IP:port without scheme
Diffstat (limited to 'Lib')
-rw-r--r--Lib/test/test_urlparse.py20
-rw-r--r--Lib/urlparse.py11
2 files changed, 26 insertions, 5 deletions
diff --git a/Lib/test/test_urlparse.py b/Lib/test/test_urlparse.py
index 80e4d91..8244017 100644
--- a/Lib/test/test_urlparse.py
+++ b/Lib/test/test_urlparse.py
@@ -478,6 +478,26 @@ class UrlParseTestCase(unittest.TestCase):
self.assertEqual(urlparse.urlparse("x-newscheme://foo.com/stuff"),
('x-newscheme','foo.com','/stuff','','',''))
+ def test_withoutscheme(self):
+ # Test urlparse without scheme
+ # Issue 754016: urlparse goes wrong with IP:port without scheme
+ # RFC 1808 specifies that netloc should start with //, urlparse expects
+ # the same, otherwise it classifies the portion of url as path.
+ self.assertEqual(urlparse.urlparse("path"),
+ ('','','path','','',''))
+ self.assertEqual(urlparse.urlparse("//www.python.org:80"),
+ ('','www.python.org:80','','','',''))
+ self.assertEqual(urlparse.urlparse("http://www.python.org:80"),
+ ('http','www.python.org:80','','','',''))
+
+ def test_portseparator(self):
+ # Issue 754016 makes changes for port separator ':' from scheme separator
+ self.assertEqual(urlparse.urlparse("path:80"),
+ ('','','path:80','','',''))
+ self.assertEqual(urlparse.urlparse("http:"),('http','','','','',''))
+ self.assertEqual(urlparse.urlparse("https:"),('https','','','','',''))
+ self.assertEqual(urlparse.urlparse("http://www.python.org:80"),
+ ('http','www.python.org:80','','','',''))
def test_main():
diff --git a/Lib/urlparse.py b/Lib/urlparse.py
index 6261b24..99ebe6a 100644
--- a/Lib/urlparse.py
+++ b/Lib/urlparse.py
@@ -187,11 +187,12 @@ def urlsplit(url, scheme='', allow_fragments=True):
v = SplitResult(scheme, netloc, url, query, fragment)
_parse_cache[key] = v
return v
- for c in url[:i]:
- if c not in scheme_chars:
- break
- else:
- scheme, url = url[:i].lower(), url[i+1:]
+ if url.endswith(':') or not url[i+1].isdigit():
+ for c in url[:i]:
+ if c not in scheme_chars:
+ break
+ else:
+ scheme, url = url[:i].lower(), url[i+1:]
if url[:2] == '//':
netloc, url = _splitnetloc(url, 2)