MS_WINDOWS = (sys.platform == 'win32')
+POSIX_LOCALES = ('C', 'POSIX')  # locale names the tests treat as the POSIX locale
class UTF8ModeTests(unittest.TestCase):
def posix_locale(self):
loc = locale.setlocale(locale.LC_CTYPE, None)
- return (loc == 'C')
+ return (loc in POSIX_LOCALES)  # True for any name in POSIX_LOCALES, not only 'C'
def get_output(self, *args, failure=False, **kw):
kw = dict(self.DEFAULT_ENV, **kw)
def test_posix_locale(self):
code = 'import sys; print(sys.flags.utf8_mode)'
- out = self.get_output('-c', code, LC_ALL='C')
- self.assertEqual(out, '1')
+ for loc in POSIX_LOCALES:  # run the same check once per POSIX locale name
+ with self.subTest(LC_ALL=loc):  # report each locale name as its own sub-test
+ out = self.get_output('-c', code, LC_ALL=loc)
+ self.assertEqual(out, '1')  # presumably get_output returns the child's stdout, i.e. utf8_mode printed as 1 -- confirm
def test_xoption(self):
code = 'import sys; print(sys.flags.utf8_mode)'
out = self.get_output('-X', 'utf8', '-c', code)
self.assertEqual(out, 'UTF-8 UTF-8')
- out = self.get_output('-X', 'utf8', '-c', code, LC_ALL='C')
- self.assertEqual(out, 'UTF-8 UTF-8')
+ for loc in POSIX_LOCALES:
+ with self.subTest(LC_ALL=loc):
+ out = self.get_output('-X', 'utf8', '-c', code, LC_ALL=loc)
+ self.assertEqual(out, 'UTF-8 UTF-8')
@unittest.skipIf(MS_WINDOWS, 'test specific to Unix')
def test_cmd_line(self):
self.assertEqual(args, ascii(expected), out)
check('utf8', [arg_utf8])
+ for loc in POSIX_LOCALES:  # repeat the 'utf8' check with LC_ALL set to each POSIX locale name
+ with self.subTest(LC_ALL=loc):
+ check('utf8', [arg_utf8], LC_ALL=loc)  # same expected value as the call without LC_ALL above
+
if sys.platform == 'darwin' or support.is_android:
c_arg = arg_utf8
elif sys.platform.startswith("aix"):
c_arg = arg.decode('iso-8859-1')
else:
c_arg = arg_ascii
- check('utf8=0', [c_arg], LC_ALL='C')
+ for loc in POSIX_LOCALES:  # the 'utf8=0' check formerly ran with LC_ALL='C' only
+ with self.subTest(LC_ALL=loc):
+ check('utf8=0', [c_arg], LC_ALL=loc)  # c_arg is the platform-dependent expectation chosen above
def test_optim_level(self):
# CPython: check that Py_Main() doesn't increment Py_OptimizeFlag
#include "Python.h"
#include "internal/pystate.h"
+#include <locale.h>
#define DECODE_LOCALE_ERR(NAME, LEN) \
config_init_locale(_PyCoreConfig *config)
{
if (_Py_LegacyLocaleDetected()) {
- /* POSIX locale: enable C locale coercion and UTF-8 Mode */
- if (config->utf8_mode < 0) {
- config->utf8_mode = 1;
- }
+ /* The C locale enables the C locale coercion (PEP 538) */
if (config->coerce_c_locale < 0) {
config->coerce_c_locale = 1;
}
}
+#ifndef MS_WINDOWS  /* the UTF-8 Mode check below is compiled out on Windows */
+ const char *ctype_loc = setlocale(LC_CTYPE, NULL);  /* NULL: query the current LC_CTYPE locale without changing it */
+ if (ctype_loc != NULL
+ && (strcmp(ctype_loc, "C") == 0 || strcmp(ctype_loc, "POSIX") == 0)) {
+ /* The C locale and the POSIX locale enable the UTF-8 Mode (PEP 540) */
+ if (config->utf8_mode < 0) {  /* only while still negative; a 0 or positive value is left as is */
+ config->utf8_mode = 1;
+ }
+ }
+#endif  /* !MS_WINDOWS */
}