NotificationsYou must be signed in to change notification settings
Fork33.7k
Star70.4k

Commit 0a87812

and

authored

[3.8] gh-67693: Fix urlunparse() and urlunsplit() for URIs with path starting with multiple slashes and no authority (GH-113563) (#119028)

(cherry picked from commit e237b25) Co-authored-by: Łukasz Langa <lukasz@langa.pl>

1 parent 7d1f50c, commit 0a87812. Copy full SHA for 0a87812

File tree

3 files changed

+70

-4

lines changed

Lib
- test
  - test_urlparse.py
- urllib
  - parse.py
Misc/NEWS.d/next/Library
- 2019-08-27-01-16-50.gh-issue-67693.4NIAiy.rst

3 files changed

+70

-4

lines changed

`‎Lib/test/test_urlparse.py‎`

Lines changed: 67 additions & 3 deletions

Original file line number	Diff line number	Diff line change
`@@ -70,15 +70,17 @@`
`70`	`70`
`71`	`71`	`classUrlParseTestCase(unittest.TestCase):`
`72`	`72`
`73`		`-defcheckRoundtrips(self,url,parsed,split):`
	`73`	`+defcheckRoundtrips(self,url,parsed,split,url2=None):`
	`74`	`+ifurl2isNone:`
	`75`	`+url2=url`
`74`	`76`	`result=urllib.parse.urlparse(url)`
`75`	`77`	`self.assertEqual(result,parsed)`
`76`	`78`	`t= (result.scheme,result.netloc,result.path,`
`77`	`79`	`result.params,result.query,result.fragment)`
`78`	`80`	`self.assertEqual(t,parsed)`
`79`	`81`	`# put it back together and it should be the same`
`80`	`82`	`result2=urllib.parse.urlunparse(result)`
`81`		`-self.assertEqual(result2,url)`
	`83`	`+self.assertEqual(result2,url2)`
`82`	`84`	`self.assertEqual(result2,result.geturl())`
`83`	`85`
`84`	`86`	`# the result of geturl() is a fixpoint; we can always parse it`
`@@ -104,7 +106,7 @@ def checkRoundtrips(self, url, parsed, split):`
`104`	`106`	`result.query,result.fragment)`
`105`	`107`	`self.assertEqual(t,split)`
`106`	`108`	`result2=urllib.parse.urlunsplit(result)`
`107`		`-self.assertEqual(result2,url)`
	`109`	`+self.assertEqual(result2,url2)`
`108`	`110`	`self.assertEqual(result2,result.geturl())`
`109`	`111`
`110`	`112`	`# check the fixpoint property of re-parsing the result of geturl()`
`@@ -142,9 +144,39 @@ def test_qs(self):`
`142`	`144`
`143`	`145`	`deftest_roundtrips(self):`
`144`	`146`	`str_cases= [`
	`147`	`+ ('path/to/file',`
	`148`	`+ ('','','path/to/file','','',''),`
	`149`	`+ ('','','path/to/file','','')),`
	`150`	`+ ('/path/to/file',`
	`151`	`+ ('','','/path/to/file','','',''),`
	`152`	`+ ('','','/path/to/file','','')),`
	`153`	`+ ('//path/to/file',`
	`154`	`+ ('','path','/to/file','','',''),`
	`155`	`+ ('','path','/to/file','','')),`
	`156`	`+ ('////path/to/file',`
	`157`	`+ ('','','//path/to/file','','',''),`
	`158`	`+ ('','','//path/to/file','','')),`
	`159`	`+ ('scheme:path/to/file',`
	`160`	`+ ('scheme','','path/to/file','','',''),`
	`161`	`+ ('scheme','','path/to/file','','')),`
	`162`	`+ ('scheme:/path/to/file',`
	`163`	`+ ('scheme','','/path/to/file','','',''),`
	`164`	`+ ('scheme','','/path/to/file','','')),`
	`165`	`+ ('scheme://path/to/file',`
	`166`	`+ ('scheme','path','/to/file','','',''),`
	`167`	`+ ('scheme','path','/to/file','','')),`
	`168`	`+ ('scheme:////path/to/file',`
	`169`	`+ ('scheme','','//path/to/file','','',''),`
	`170`	`+ ('scheme','','//path/to/file','','')),`
`145`	`171`	`('file:///tmp/junk.txt',`
`146`	`172`	`('file','','/tmp/junk.txt','','',''),`
`147`	`173`	`('file','','/tmp/junk.txt','','')),`
	`174`	`+ ('file:////tmp/junk.txt',`
	`175`	`+ ('file','','//tmp/junk.txt','','',''),`
	`176`	`+ ('file','','//tmp/junk.txt','','')),`
	`177`	`+ ('file://///tmp/junk.txt',`
	`178`	`+ ('file','','///tmp/junk.txt','','',''),`
	`179`	`+ ('file','','///tmp/junk.txt','','')),`
`148`	`180`	`('imap://mail.python.org/mbox1',`
`149`	`181`	`('imap','mail.python.org','/mbox1','','',''),`
`150`	`182`	`('imap','mail.python.org','/mbox1','','')),`
`@@ -175,6 +207,38 @@ def _encode(t):`
`175`	`207`	`forurl,parsed,splitinstr_cases+bytes_cases:`
`176`	`208`	`self.checkRoundtrips(url,parsed,split)`
`177`	`209`
	`210`	`+deftest_roundtrips_normalization(self):`
	`211`	`+str_cases= [`
	`212`	`+ ('///path/to/file',`
	`213`	`+'/path/to/file',`
	`214`	`+ ('','','/path/to/file','','',''),`
	`215`	`+ ('','','/path/to/file','','')),`
	`216`	`+ ('scheme:///path/to/file',`
	`217`	`+'scheme:/path/to/file',`
	`218`	`+ ('scheme','','/path/to/file','','',''),`
	`219`	`+ ('scheme','','/path/to/file','','')),`
	`220`	`+ ('file:/tmp/junk.txt',`
	`221`	`+'file:///tmp/junk.txt',`
	`222`	`+ ('file','','/tmp/junk.txt','','',''),`
	`223`	`+ ('file','','/tmp/junk.txt','','')),`
	`224`	`+ ('http:/tmp/junk.txt',`
	`225`	`+'http:///tmp/junk.txt',`
	`226`	`+ ('http','','/tmp/junk.txt','','',''),`
	`227`	`+ ('http','','/tmp/junk.txt','','')),`
	`228`	`+ ('https:/tmp/junk.txt',`
	`229`	`+'https:///tmp/junk.txt',`
	`230`	`+ ('https','','/tmp/junk.txt','','',''),`
	`231`	`+ ('https','','/tmp/junk.txt','','')),`
	`232`	`+ ]`
	`233`	`+def_encode(t):`
	`234`	`+return (t[0].encode('ascii'),`
	`235`	`+t[1].encode('ascii'),`
	`236`	`+tuple(x.encode('ascii')forxint[2]),`
	`237`	`+tuple(x.encode('ascii')forxint[3]))`
	`238`	`+bytes_cases= [_encode(x)forxinstr_cases]`
	`239`	`+forurl,url2,parsed,splitinstr_cases+bytes_cases:`
	`240`	`+self.checkRoundtrips(url,parsed,split,url2)`
	`241`	`+`
`178`	`242`	`deftest_http_roundtrips(self):`
`179`	`243`	`# urllib.parse.urlsplit treats 'http:' as an optimized special case,`
`180`	`244`	`# so we test both 'http:' and 'https:' in all the following.`

`‎Lib/urllib/parse.py‎`

Lines changed: 1 addition & 1 deletion

Original file line number	Diff line number	Diff line change
`@@ -512,7 +512,7 @@ def urlunsplit(components):`
`512`	`512`	`empty query; the RFC states that these are equivalent)."""`
`513`	`513`	`scheme,netloc,url,query,fragment,_coerce_result= (`
`514`	`514`	`_coerce_args(*components))`
`515`		`-ifnetlocor (schemeandschemeinuses_netlocandurl[:2]!='//'):`
	`515`	`+ifnetlocor (schemeandschemeinuses_netloc)orurl[:2]=='//':`
`516`	`516`	`ifurlandurl[:1]!='/':url='/'+url`
`517`	`517`	`url='//'+ (netlocor'')+url`
`518`	`518`	`ifscheme:`

`‎Misc/NEWS.d/next/Library/2019-08-27-01-16-50.gh-issue-67693.4NIAiy.rst‎`

Lines changed: 2 additions & 0 deletions

Original file line number	Diff line number	Diff line change
`@@ -0,0 +1,2 @@`
	`1`	+Fix :func:`urllib.parse.urlunparse` and :func:`urllib.parse.urlunsplit` for URIs with path starting with multiple slashes and no authority.
	`2`	`+Based on patch by Ashwin Ramaswami.`

0 commit comments

Comments

(0)

Movatterモバイル変換

Navigation Menu

Search code, repositories, users, issues, pull requests...

Provide feedback

Saved searches

Use saved searches to filter your results more quickly

Uh oh!

Uh oh!

Commit 0a87812

File tree

3 files changed

3 files changed

`‎Lib/test/test_urlparse.py‎`

`‎Lib/urllib/parse.py‎`

`‎Misc/NEWS.d/next/Library/2019-08-27-01-16-50.gh-issue-67693.4NIAiy.rst‎`

0 commit comments