Normalize the encoding names for Latin-1 and UTF-8 to 'latin-1' and 'utf-8'. These are optimized in the Python Unicode implementation to result in more direct processing, bypassing the codec registry. Also see issue11303.

commit: 8f36af7a4c9409a673412e4bdfbad76d700abc3a [log] [tgz]
author: Marc-André Lemburg <mal@egenix.com> Fri Feb 25 15:42:01 2011 +0000
committer: Marc-André Lemburg <mal@egenix.com> Fri Feb 25 15:42:01 2011 +0000
tree: 1b61599a07604a96539e98098b055c577cd7e6a8
parent: a391b11320f729f6eec6c772c00b3e62c2746eaf [diff] [blame]
diff --git a/Lib/test/test_tarfile.py b/Lib/test/test_tarfile.py
index 68e094d..a645bf2 100644
--- a/Lib/test/test_tarfile.py
+++ b/Lib/test/test_tarfile.py

@@ -1289,7 +1289,7 @@
         self._test_unicode_filename("utf7")
 
     def test_utf8_filename(self):
-        self._test_unicode_filename("utf8")
+        self._test_unicode_filename("utf-8")
 
     def _test_unicode_filename(self, encoding):
         tar = tarfile.open(tmpname, "w", format=self.format, encoding=encoding, errors="strict")
@@ -1368,7 +1368,7 @@
     def test_bad_pax_header(self):
         # Test for issue #8633. GNU tar <= 1.23 creates raw binary fields
         # without a hdrcharset=BINARY header.
-        for encoding, name in (("utf8", "pax/bad-pax-\udce4\udcf6\udcfc"),
+        for encoding, name in (("utf-8", "pax/bad-pax-\udce4\udcf6\udcfc"),
                 ("iso8859-1", "pax/bad-pax-\xe4\xf6\xfc"),):
             with tarfile.open(tarname, encoding=encoding, errors="surrogateescape") as tar:
                 try:
@@ -1383,7 +1383,7 @@
 
     def test_binary_header(self):
         # Test a POSIX.1-2008 compatible header with a hdrcharset=BINARY field.
-        for encoding, name in (("utf8", "pax/hdrcharset-\udce4\udcf6\udcfc"),
+        for encoding, name in (("utf-8", "pax/hdrcharset-\udce4\udcf6\udcfc"),
                 ("iso8859-1", "pax/hdrcharset-\xe4\xf6\xfc"),):
             with tarfile.open(tarname, encoding=encoding, errors="surrogateescape") as tar:
                 try:
commit	8f36af7a4c9409a673412e4bdfbad76d700abc3a	[log] [tgz]
author	Marc-André Lemburg <mal@egenix.com>	Fri Feb 25 15:42:01 2011 +0000
committer	Marc-André Lemburg <mal@egenix.com>	Fri Feb 25 15:42:01 2011 +0000
tree	1b61599a07604a96539e98098b055c577cd7e6a8
parent	a391b11320f729f6eec6c772c00b3e62c2746eaf [diff] [blame]