nonHostChars = ['%', '/', '?', ';', '#'].concat(autoEscape),
hostEndingChars = ['/', '?', '#'],
hostnameMaxLen = 255,
- hostnamePartPattern = /^[a-z0-9A-Z_-]{0,63}$/,
- hostnamePartStart = /^([a-z0-9A-Z_-]{0,63})(.*)$/,
+ hostnamePatternString = '[^' + nonHostChars.join('') + ']{0,63}',
+ hostnamePartPattern = new RegExp('^' + hostnamePatternString + '$'),
+ hostnamePartStart = new RegExp('^(' + hostnamePatternString + ')(.*)$'),
// protocols that can allow "unsafe" and "unwise" chars.
unsafeProtocol = {
'javascript': true,
'path': '/Y'
},
+ // + not an invalid host character
+ // per https://url.spec.whatwg.org/#host-parsing
+ 'http://x.y.com+a/b/c' : {
+ 'href': 'http://x.y.com+a/b/c',
+ 'protocol': 'http:',
+ 'slashes': true,
+ 'host': 'x.y.com+a',
+ 'hostname': 'x.y.com+a',
+ 'pathname': '/b/c',
+ 'path': '/b/c'
+ },
+
// an unexpected invalid char in the hostname.
- 'HtTp://x.y.cOm*a/b/c?d=e#f g<h>i' : {
- 'href': 'http://x.y.com/*a/b/c?d=e#f%20g%3Ch%3Ei',
+ 'HtTp://x.y.cOm;a/b/c?d=e#f g<h>i' : {
+ 'href': 'http://x.y.com/;a/b/c?d=e#f%20g%3Ch%3Ei',
'protocol': 'http:',
'slashes': true,
'host': 'x.y.com',
'hostname': 'x.y.com',
- 'pathname': '/*a/b/c',
+ 'pathname': ';a/b/c',
'search': '?d=e',
'query': 'd=e',
'hash': '#f%20g%3Ch%3Ei',
- 'path': '/*a/b/c?d=e'
+ 'path': ';a/b/c?d=e'
},
// make sure that we don't accidentally lcast the path parts.
- 'HtTp://x.y.cOm*A/b/c?d=e#f g<h>i' : {
- 'href': 'http://x.y.com/*A/b/c?d=e#f%20g%3Ch%3Ei',
+ 'HtTp://x.y.cOm;A/b/c?d=e#f g<h>i' : {
+ 'href': 'http://x.y.com/;A/b/c?d=e#f%20g%3Ch%3Ei',
'protocol': 'http:',
'slashes': true,
'host': 'x.y.com',
'hostname': 'x.y.com',
- 'pathname': '/*A/b/c',
+ 'pathname': ';A/b/c',
'search': '?d=e',
'query': 'd=e',
'hash': '#f%20g%3Ch%3Ei',
- 'path': '/*A/b/c?d=e'
+ 'path': ';A/b/c?d=e'
},
'http://x...y...#p': {
'path': '/'
},
- 'http://www.Äffchen.cOm*A/b/c?d=e#f g<h>i' : {
- 'href': 'http://www.xn--ffchen-9ta.com/*A/b/c?d=e#f%20g%3Ch%3Ei',
+ 'http://www.Äffchen.cOm;A/b/c?d=e#f g<h>i' : {
+ 'href': 'http://www.xn--ffchen-9ta.com/;A/b/c?d=e#f%20g%3Ch%3Ei',
'protocol': 'http:',
'slashes': true,
'host': 'www.xn--ffchen-9ta.com',
'hostname': 'www.xn--ffchen-9ta.com',
- 'pathname': '/*A/b/c',
+ 'pathname': ';A/b/c',
'search': '?d=e',
'query': 'd=e',
'hash': '#f%20g%3Ch%3Ei',
- 'path': '/*A/b/c?d=e'
+ 'path': ';A/b/c?d=e'
},
'http://SÉLIER.COM/' : {