diff options
author | max <max@tclers.tk> | 2013-04-04 14:42:19 (GMT) |
---|---|---|
committer | max <max@tclers.tk> | 2013-04-04 14:42:19 (GMT) |
commit | 91b943a9a0a7d05e20c4b4dd02af0f86e7db48b7 (patch) | |
tree | 45959397b29bce6bd1bc6b815c0afa387f519613 /library | |
parent | c70e635d90321aba50e235fa636bcf1f78dfeda5 (diff) | |
download | tcl-91b943a9a0a7d05e20c4b4dd02af0f86e7db48b7.zip tcl-91b943a9a0a7d05e20c4b4dd02af0f86e7db48b7.tar.gz tcl-91b943a9a0a7d05e20c4b4dd02af0f86e7db48b7.tar.bz2 |
Allow URLs that have no path but do have a query, e.g. http://example.com?foo=bar.
Diffstat (limited to 'library')
-rw-r--r-- | library/http/http.tcl | 17 |
1 files changed, 13 insertions, 4 deletions
diff --git a/library/http/http.tcl b/library/http/http.tcl index ddf066e..57f665a 100644 --- a/library/http/http.tcl +++ b/library/http/http.tcl @@ -394,13 +394,16 @@ proc http::geturl {url args} { # First, before the colon, is the protocol scheme (e.g. http) # Second, for HTTP-like protocols, is the authority # The authority is preceded by // and lasts up to (but not including) - # the following / and it identifies up to four parts, of which only one, - # the host, is required (if an authority is present at all). All other - # parts of the authority (user name, password, port number) are optional. + # the following / or ? and it identifies up to four parts, of which + # only one, the host, is required (if an authority is present at all). + # All other parts of the authority (user name, password, port number) + # are optional. # Third is the resource name, which is split into two parts at a ? # The first part (from the single "/" up to "?") is the path, and the # second part (from that "?" up to "#") is the query. *HOWEVER*, we do # not need to separate them; we send the whole lot to the server. + # Both, path and query are allowed to be missing, including their + # delimiting character. # Fourth is the fragment identifier, which is everything after the first # "#" in the URL. The fragment identifier MUST NOT be sent to the server # and indeed, we don't bother to validate it (it could be an error to @@ -437,7 +440,7 @@ proc http::geturl {url args} { ) (?: : (\d+) )? # <port part of authority> )? - ( / [^\#]*)? # <path> (including query) + ( [/\?] [^\#]*)? # <path> (including query) (?: \# (.*) )? # <fragment> $ } @@ -481,6 +484,12 @@ proc http::geturl {url args} { } } if {$srvurl ne ""} { + # RFC 3986 allows empty paths (not even a /), but servers + # return 400 if the path in the HTTP request doesn't start + # with / , so add it here if needed. 
+ if {[string index $srvurl 0] ne "/"} { + set srvurl /$srvurl + } # Check for validity according to RFC 3986, Appendix A set validityRE {(?xi) ^ |