Commit b0caf329 authored by Ronald Oussoren's avatar Ronald Oussoren Committed by Ned Deily

bpo-18378: Recognize "UTF-8" as a valid name in locale._parse_localename (GH-14736)

parent fa220ec7
...@@ -492,6 +492,10 @@ def _parse_localename(localename): ...@@ -492,6 +492,10 @@ def _parse_localename(localename):
return tuple(code.split('.')[:2]) return tuple(code.split('.')[:2])
elif code == 'C': elif code == 'C':
return None, None return None, None
elif code == 'UTF-8':
# On macOS "LC_CTYPE=UTF-8" is a valid locale setting
# for getting UTF-8 handling for text.
return None, 'UTF-8'
raise ValueError('unknown locale: %s' % localename) raise ValueError('unknown locale: %s' % localename)
def _build_localename(localetuple): def _build_localename(localetuple):
......
...@@ -493,6 +493,42 @@ class NormalizeTest(unittest.TestCase): ...@@ -493,6 +493,42 @@ class NormalizeTest(unittest.TestCase):
class TestMiscellaneous(unittest.TestCase): class TestMiscellaneous(unittest.TestCase):
def test_defaults_UTF8(self):
# Issue #18378: on (at least) macOS setting LC_CTYPE to "UTF-8" is
# valid. Futhermore LC_CTYPE=UTF is used by the UTF-8 locale coercing
# during interpreter startup (on macOS).
import _locale
import os
self.assertEqual(locale._parse_localename('UTF-8'), (None, 'UTF-8'))
if hasattr(_locale, '_getdefaultlocale'):
orig_getlocale = _locale._getdefaultlocale
del _locale._getdefaultlocale
else:
orig_getlocale = None
orig_env = {}
try:
for key in ('LC_ALL', 'LC_CTYPE', 'LANG', 'LANGUAGE'):
if key in os.environ:
orig_env[key] = os.environ[key]
del os.environ[key]
os.environ['LC_CTYPE'] = 'UTF-8'
self.assertEqual(locale.getdefaultlocale(), (None, 'UTF-8'))
finally:
for k in orig_env:
os.environ[k] = orig_env[k]
if 'LC_CTYPE' not in orig_env:
del os.environ['LC_CTYPE']
if orig_getlocale is not None:
_locale._getdefaultlocale = orig_getlocale
def test_getpreferredencoding(self): def test_getpreferredencoding(self):
# Invoke getpreferredencoding to make sure it does not cause exceptions. # Invoke getpreferredencoding to make sure it does not cause exceptions.
enc = locale.getpreferredencoding() enc = locale.getpreferredencoding()
......
Recognize "UTF-8" as a valid value for LC_CTYPE in locale._parse_localename.
Markdown is supported
0%
or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment