Browse Source

bpo-22347: Update mimetypes.guess_type to allow proper parsing of URLs (GH-15522)

https://bugs.python.org/issue22347
pull/15691/head
Dong-hee Na 6 years ago
committed by Miss Islington (bot)
parent
commit
87bd2071c7
  1. 3
      Lib/mimetypes.py
  2. 8
      Lib/test/test_mimetypes.py
  3. 2
      Lib/test/test_urllib2.py
  4. 2
      Misc/NEWS.d/next/Library/2019-08-27-01-03-26.bpo-22347._TRpYr.rst

3
Lib/mimetypes.py

@ -114,7 +114,8 @@ class MimeTypes:
but non-standard types.
"""
url = os.fspath(url)
scheme, url = urllib.parse._splittype(url)
p = urllib.parse.urlparse(url)
scheme, url = p.scheme, p.path
if scheme == 'data':
# syntax of data URLs:
# dataurl := "data:" [ mediatype ] [ ";base64" ] "," data

8
Lib/test/test_mimetypes.py

@ -51,6 +51,14 @@ class MimeTypesTestCase(unittest.TestCase):
eq(self.db.guess_type('foo.xul', strict=False), ('text/xul', None))
eq(self.db.guess_extension('image/jpg', strict=False), '.jpg')
def test_url(self):
# Regression test for URL handling in guess_type().
# This URL has only a scheme and a host: the ".html" belongs to the host
# name, not to a file path, so no type or encoding should be guessed.
result = self.db.guess_type('http://host.html')
msg = 'URL only has a host name, not a file'
self.assertSequenceEqual(result, (None, None), msg)
# Here the URL has a real path ending in ".html", so the guess is
# expected to be text/html with no encoding.
result = self.db.guess_type('http://example.com/host.html')
msg = 'Should be text/html'
self.assertSequenceEqual(result, ('text/html', None), msg)
def test_guess_all_types(self):
eq = self.assertEqual
unless = self.assertTrue

2
Lib/test/test_urllib2.py

@ -742,7 +742,7 @@ class HandlerTests(unittest.TestCase):
["foo", "bar"], "", None),
("ftp://localhost/baz.gif;type=a",
"localhost", ftplib.FTP_PORT, "", "", "A",
[], "baz.gif", None), # XXX really this should guess image/gif
[], "baz.gif", "image/gif"),
]:
req = Request(url)
req.timeout = None

2
Misc/NEWS.d/next/Library/2019-08-27-01-03-26.bpo-22347._TRpYr.rst

@ -0,0 +1,2 @@
Update mimetypes.guess_type to allow proper parsing of URLs with only a host name.
Patch by Dong-hee Na.
Loading…
Cancel
Save