Skip to content

Navigation Menu

Sign in
Appearance settings

Search code, repositories, users, issues, pull requests...

Provide feedback

We read every piece of feedback, and take your input very seriously.

Saved searches

Use saved searches to filter your results more quickly

Appearance settings

Commit ddca295

Browse files
[3.9] gh-103848: Adds checks to ensure that bracketed hosts found by urlsplit are of IPv6 or IPvFuture format (#103849) (#126976)
Co-authored-by: Gregory P. Smith <greg@krypto.org> (cherry picked from commit 29f348e) Co-authored-by: JohnJamesUtley <81572567+JohnJamesUtley@users.noreply.github.com>
1 parent 307a762 commit ddca295
Copy full SHA for ddca295

File tree

3 files changed

+43
-1
lines changed
Filter options

3 files changed

+43
-1
lines changed

‎Lib/test/test_urlparse.py

Copy file name to clipboardExpand all lines: Lib/test/test_urlparse.py
+26Lines changed: 26 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -1135,6 +1135,32 @@ def test_issue14072(self):
11351135
self.assertEqual(p2.scheme, 'tel')
11361136
self.assertEqual(p2.path, '+31641044153')
11371137

1138+
def test_invalid_bracketed_hosts(self):
1139+
self.assertRaises(ValueError, urllib.parse.urlsplit, 'Scheme://user@[192.0.2.146]/Path?Query')
1140+
self.assertRaises(ValueError, urllib.parse.urlsplit, 'Scheme://user@[important.com:8000]/Path?Query')
1141+
self.assertRaises(ValueError, urllib.parse.urlsplit, 'Scheme://user@[v123r.IP]/Path?Query')
1142+
self.assertRaises(ValueError, urllib.parse.urlsplit, 'Scheme://user@[v12ae]/Path?Query')
1143+
self.assertRaises(ValueError, urllib.parse.urlsplit, 'Scheme://user@[v.IP]/Path?Query')
1144+
self.assertRaises(ValueError, urllib.parse.urlsplit, 'Scheme://user@[v123.]/Path?Query')
1145+
self.assertRaises(ValueError, urllib.parse.urlsplit, 'Scheme://user@[v]/Path?Query')
1146+
self.assertRaises(ValueError, urllib.parse.urlsplit, 'Scheme://user@[0439:23af::2309::fae7:1234]/Path?Query')
1147+
self.assertRaises(ValueError, urllib.parse.urlsplit, 'Scheme://user@[0439:23af:2309::fae7:1234:2342:438e:192.0.2.146]/Path?Query')
1148+
self.assertRaises(ValueError, urllib.parse.urlsplit, 'Scheme://user@]v6a.ip[/Path')
1149+
1150+
def test_splitting_bracketed_hosts(self):
1151+
p1 = urllib.parse.urlsplit('scheme://user@[v6a.ip]/path?query')
1152+
self.assertEqual(p1.hostname, 'v6a.ip')
1153+
self.assertEqual(p1.username, 'user')
1154+
self.assertEqual(p1.path, '/path')
1155+
p2 = urllib.parse.urlsplit('scheme://user@[0439:23af:2309::fae7%test]/path?query')
1156+
self.assertEqual(p2.hostname, '0439:23af:2309::fae7%test')
1157+
self.assertEqual(p2.username, 'user')
1158+
self.assertEqual(p2.path, '/path')
1159+
p3 = urllib.parse.urlsplit('scheme://user@[0439:23af:2309::fae7:1234:192.0.2.146%test]/path?query')
1160+
self.assertEqual(p3.hostname, '0439:23af:2309::fae7:1234:192.0.2.146%test')
1161+
self.assertEqual(p3.username, 'user')
1162+
self.assertEqual(p3.path, '/path')
1163+
11381164
def test_port_casting_failure_message(self):
11391165
message = "Port could not be cast to integer value as 'oracle'"
11401166
p1 = urllib.parse.urlparse('http://Server=sde; Service=sde:oracle')

‎Lib/urllib/parse.py

Copy file name to clipboardExpand all lines: Lib/urllib/parse.py
+15-1Lines changed: 15 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -36,6 +36,7 @@
3636
import types
3737
import collections
3838
import warnings
39+
import ipaddress
3940

4041
__all__ = ["urlparse", "urlunparse", "urljoin", "urldefrag",
4142
"urlsplit", "urlunsplit", "urlencode", "parse_qs",
@@ -442,6 +443,17 @@ def _checknetloc(netloc):
442443
raise ValueError("netloc '" + netloc + "' contains invalid " +
443444
"characters under NFKC normalization")
444445

446+
# Valid bracketed hosts are defined in
447+
# https://www.rfc-editor.org/rfc/rfc3986#page-49 and https://url.spec.whatwg.org/
448+
def _check_bracketed_host(hostname):
    """Validate the text found between '[' and ']' in a URL netloc.

    A bracketed host must be either an IPv6 address or an IPvFuture
    address (see RFC 3986 and the WHATWG URL spec).

    *hostname* is the bracketed text without the surrounding brackets.

    Returns None when the host is acceptable.  Raises ValueError when:
      * it starts with 'v' but does not look like "v<hex digits>.<something>";
      * it does not start with 'v' and is not a parseable IP address;
      * it parses as an IPv4 address, which may not appear in brackets.
    """
    if hostname.startswith('v'):
        # IPvFuture: only the overall "v<hex>.<non-empty tail>" shape is
        # enforced here; the tail's characters are not checked further.
        if not re.match(r"\Av[a-fA-F0-9]+\..+\Z", hostname):
            raise ValueError(f"IPvFuture address is invalid: {hostname!r}")
    else:
        # ip_address() raises ValueError itself when the text is neither a
        # valid IPv4 nor a valid IPv6 address.
        ip = ipaddress.ip_address(hostname)
        if isinstance(ip, ipaddress.IPv4Address):
            raise ValueError(
                f"An IPv4 address cannot be in brackets: {hostname!r}")
456+
445457
def urlsplit(url, scheme='', allow_fragments=True):
446458
"""Parse a URL into 5 components:
447459
<scheme>://<netloc>/<path>?<query>#<fragment>
@@ -488,12 +500,14 @@ def urlsplit(url, scheme='', allow_fragments=True):
488500
break
489501
else:
490502
scheme, url = url[:i].lower(), url[i+1:]
491-
492503
if url[:2] == '//':
493504
netloc, url = _splitnetloc(url, 2)
494505
if (('[' in netloc and ']' not in netloc) or
495506
(']' in netloc and '[' not in netloc)):
496507
raise ValueError("Invalid IPv6 URL")
508+
if '[' in netloc and ']' in netloc:
509+
bracketed_host = netloc.partition('[')[2].partition(']')[0]
510+
_check_bracketed_host(bracketed_host)
497511
if allow_fragments and '#' in url:
498512
url, fragment = url.split('#', 1)
499513
if '?' in url:
+2Lines changed: 2 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,2 @@
1+
Add checks to ensure that ``[`` bracketed ``]`` hosts found by
2+
:func:`urllib.parse.urlsplit` are of IPv6 or IPvFuture format.

0 commit comments

Comments
0 (0)
Morty Proxy This is a proxified and sanitized view of the page, visit original site.