8000 bpo-28604: Fix localeconv() for different LC_MONETARY by vstinner · Pull Request #10606 · python/cpython · GitHub
[go: up one dir, main page]

Skip to content

bpo-28604: Fix localeconv() for different LC_MONETARY #10606

New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

Merged
merged 3 commits into from
Nov 20, 2018
Merged
Show file tree
Hide file tree
Changes from 1 commit
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
Next Next commit
bpo-28604: Fix localeconv() for different LC_MONETARY
locale.localeconv() now temporarily sets the LC_CTYPE locale to the
LC_MONETARY locale if the two locales are different and monetary
strings are non-ASCII. This temporary change affects other threads.

Changes:

* locale.localeconv() can now set LC_CTYPE to LC_MONETARY to decode
  monetary fields.
* Add LocaleInfo.grouping_buffer: copy localeconv() grouping string
  since it can be replaced at any time if a different thread calls
  localeconv().
* _Py_GetLocaleconvNumeric() now requires a "struct lconv *"
  structure, so locale.localeconv() no longer calls localeconv()
  twice. Moreover, the function now requires all arguments to be
  non-NULL.
* Rename STATIC_LOCALE_INFO_INIT to LOCALE_INFO_STATIC_INIT.
* Move _Py_GetLocaleconvNumeric() definition from fileutils.h
  to pycore_fileutils.h. pycore_fileutils.h now includes locale.h.
* The _locale module is now built with Py_BUILD_CORE defined.
  • Loading branch information
vstinner committed Nov 20, 2018
commit 4bdd0f2c7d3ed91d4ed512be6b74f5bb601a1d4a
6 changes: 2 additions & 4 deletions Doc/library/locale.rst
Original file line number Diff line number Diff line change
Expand Up @@ -148,10 +148,8 @@ The :mod:`locale` module defines the following exception and functions:
+--------------+-----------------------------------------+

The function sets temporarily the ``LC_CTYPE`` locale to the ``LC_NUMERIC``
locale to decode ``decimal_point`` and ``thousands_sep`` byte strings if
they are non-ASCII or longer than 1 byte, and the ``LC_NUMERIC`` locale is
different than the ``LC_CTYPE`` locale. This temporary change affects other
threads.
locale or the ``LC_MONETARY`` locale if locales are different and strings
are non-ASCII. This temporary change affects other threads.

.. versionchanged:: 3.7
The function now sets temporarily the ``LC_CTYPE`` locale to the
Expand Down
5 changes: 0 additions & 5 deletions Include/fileutils.h
Original file line number Diff line number Diff line change
Expand Up @@ -170,11 +170,6 @@ PyAPI_FUNC(int) _Py_get_blocking(int fd);
PyAPI_FUNC(int) _Py_set_blocking(int fd, int blocking);
#endif /* !MS_WINDOWS */

PyAPI_FUNC(int) _Py_GetLocaleconvNumeric(
PyObject **decimal_point,
PyObject **thousands_sep,
const char **grouping);

#endif /* Py_LIMITED_API */

#ifdef __cplusplus
Expand Down
8 changes: 8 additions & 0 deletions Include/internal/pycore_fileutils.h
Original file line number Diff line number Diff line change
Expand Up @@ -8,6 +8,8 @@ extern "C" {
# error "Py_BUILD_CORE must be defined to include this header"
#endif

#include <locale.h> /* struct lconv */

PyAPI_FUNC(int) _Py_DecodeUTF8Ex(
const char *arg,
Py_ssize_t arglen,
Expand All @@ -30,6 +32,12 @@ PyAPI_FUNC(wchar_t*) _Py_DecodeUTF8_surrogateescape(

PyAPI_FUNC(int) _Py_GetForceASCII(void);

/* Decode the numeric fields of a localeconv() result.

   lc is the "struct lconv *" to read from. The decimal_point and
   thousands_sep byte strings of lc are decoded with
   PyUnicode_DecodeLocale() and stored through the corresponding output
   pointers; *grouping is set to lc->grouping itself (the string is not
   copied, so callers that keep it must copy it).

   All pointer arguments must be non-NULL (the implementation asserts this
   for the three output pointers). The LC_CTYPE locale may be changed
   temporarily to the LC_NUMERIC locale while decoding.

   Callers treat a negative return value as failure. */
PyAPI_FUNC(int) _Py_GetLocaleconvNumeric(
struct lconv *lc,
PyObject **decimal_point,
PyObject **thousands_sep,
const char **grouping);

#ifdef __cplusplus
}
#endif
Expand Down
Original file line number Diff line number Diff line change
@@ -0,0 +1,3 @@
:func:`locale.localeconv` now temporarily sets the ``LC_CTYPE`` locale to the
``LC_MONETARY`` locale if the two locales are different and monetary strings
are non-ASCII. This temporary change affects other threads.
2 changes: 1 addition & 1 deletion Modules/Setup
Original file line number Diff line number Diff line change
Expand Up @@ -120,7 +120,7 @@ time -DPy_BUILD_CORE -I$(srcdir)/Include/internal timemodule.c # -lm # time oper
_thread -DPy_BUILD_CORE -I$(srcdir)/Include/internal _threadmodule.c # low-level threading interface

# access to ISO C locale support
_locale _localemodule.c # -lintl
_locale -DPy_BUILD_CORE _localemodule.c # -lintl

# Standard I/O baseline
_io -DPy_BUILD_CORE -I$(srcdir)/Include/internal -I$(srcdir)/Modules/_io _io/_iomodule.c _io/iobase.c _io/fileio.c _io/bytesio.c _io/bufferedio.c _io/textio.c _io/stringio.c
Expand Down
93 changes: 86 additions & 7 deletions Modules/_localemodule.c
Original file line number Diff line number Diff line change
Expand Up @@ -11,6 +11,7 @@ This software comes with no warranty. Use at your own risk.

#define PY_SSIZE_T_CLEAN
#include "Python.h"
#include "pycore_fileutils.h"

#include <stdio.h>
#include <locale.h>
Expand Down Expand Up @@ -128,6 +129,81 @@ PyLocale_setlocale(PyObject* self, PyObject* args)
return result_object;
}

/* Return 1 if every byte of the NUL-terminated string str is ASCII
   (value <= 127), 0 otherwise. The empty string is considered ASCII.

   The previous check only accepted strings of exactly one ASCII byte, so
   pure-ASCII values such as "USD " or "" were reported as non-ASCII and
   caused a needless temporary LC_CTYPE change. */
static int
locale_is_ascii(const char *str)
{
    const unsigned char *p;

    /* Compare as unsigned char: plain char may be signed, which would
       make bytes >= 0x80 negative. */
    for (p = (const unsigned char *)str; *p != '\0'; p++) {
        if (*p > 127) {
            return 0;
        }
    }
    return 1;
}

/* Decode the monetary string fields of lc (int_curr_symbol,
   currency_symbol, mon_decimal_point, mon_thousands_sep) and store each of
   them in dict under the key of the same name.

   If locale_is_ascii() rejects at least one of these fields and the
   LC_MONETARY locale differs from the LC_CTYPE locale, LC_CTYPE is set
   temporarily to the LC_MONETARY locale while the fields are decoded, then
   restored. setlocale() is process-wide, so this temporary change affects
   other threads.

   Return 0 on success, -1 on error. */
static int
locale_decode_monetary(PyObject *dict, struct lconv *lc)
{
    int res = -1;

    int change_locale;
    change_locale = (!locale_is_ascii(lc->int_curr_symbol)
                     || !locale_is_ascii(lc->currency_symbol)
                     || !locale_is_ascii(lc->mon_decimal_point)
                     || !locale_is_ascii(lc->mon_thousands_sep));

    /* Keep a copy of the LC_CTYPE locale */
    char *oldloc = NULL, *loc = NULL;
    if (change_locale) {
        oldloc = setlocale(LC_CTYPE, NULL);
        if (!oldloc) {
            PyErr_SetString(PyExc_RuntimeWarning,
                            "failed to get LC_CTYPE locale");
            return -1;
        }

        /* Duplicate the name: the string returned by setlocale() may be
           overwritten by the setlocale() calls below. */
        oldloc = _PyMem_Strdup(oldloc);
        if (!oldloc) {
            PyErr_NoMemory();
            return -1;
        }

        loc = setlocale(LC_MONETARY, NULL);
        if (loc != NULL && strcmp(loc, oldloc) == 0) {
            /* Same locale for both categories: nothing to switch. */
            loc = NULL;
        }

        if (loc != NULL) {
            /* Only set the LC_CTYPE locale temporarily to the LC_MONETARY
               locale if the two locales are different and at least one
               string is non-ASCII. */
            setlocale(LC_CTYPE, loc);
        }
    }

    /* Decode lc->ATTR with the current LC_CTYPE encoding and store it in
       dict[ATTR]; jump to the cleanup code on failure. */
#define RESULT_STRING(ATTR) \
    do { \
        PyObject *obj; \
        obj = PyUnicode_DecodeLocale(lc->ATTR, NULL); \
        if (obj == NULL) { \
            goto error; \
        } \
        if (PyDict_SetItemString(dict, Py_STRINGIFY(ATTR), obj) < 0) { \
            Py_DECREF(obj); \
            goto error; \
        } \
        Py_DECREF(obj); \
    } while (0)

    RESULT_STRING(int_curr_symbol);
    RESULT_STRING(currency_symbol);
    RESULT_STRING(mon_decimal_point);
    RESULT_STRING(mon_thousands_sep);
#undef RESULT_STRING

    res = 0;

error:
    /* loc is non-NULL only if LC_CTYPE was actually changed above. */
    if (loc != NULL) {
        setlocale(LC_CTYPE, oldloc);
    }
    PyMem_Free(oldloc);
    return res;
}

PyDoc_STRVAR(localeconv__doc__,
"() -> dict. Returns numeric and monetary locale-specific parameters.");

Expand Down Expand Up @@ -172,11 +248,10 @@ PyLocale_localeconv(PyObject* self, PyObject *Py_UNUSED(ignored))
RESULT(#i, x); \
} while (0)

/* Monetary information */
RESULT_STRING(int_curr_symbol);
RESULT_STRING(currency_symbol);
RESULT_STRING(mon_decimal_point);
RESULT_STRING(mon_thousands_sep);
/* Monetary information: LC_MONETARY encoding */
if (locale_decode_monetary(result, l) < 0) {
goto failed;
}
x = copy_grouping(l->mon_grouping);
RESULT("mon_grouping", x);

Expand All @@ -191,10 +266,10 @@ PyLocale_localeconv(PyObject* self, PyObject *Py_UNUSED(ignored))
RESULT_INT(p_sign_posn);
RESULT_INT(n_sign_posn);

/* Numeric information */
/* Numeric information: LC_NUMERIC encoding */
PyObject *decimal_point, *thousands_sep;
const char *grouping;
if (_Py_GetLocaleconvNumeric(&decimal_point,
if (_Py_GetLocaleconvNumeric(l, &decimal_point,
&thousands_sep,
&grouping) < 0) {
goto failed;
Expand All @@ -221,6 +296,10 @@ PyLocale_localeconv(PyObject* self, PyObject *Py_UNUSED(ignored))
failed:
Py_DECREF(result);
return NULL;

#undef RESULT
#undef RESULT_STRING
#undef RESULT_INT
}

#if defined(HAVE_WCSCOLL)
Expand Down
40 changes: 17 additions & 23 deletions Python/fileutils.c
< F438 /thead>
Original file line number Diff line number Diff line change
Expand Up @@ -1868,22 +1868,21 @@ _Py_set_blocking(int fd, int blocking)


int
_Py_GetLocaleconvNumeric(PyObject **decimal_point, PyObject **thousands_sep,
_Py_GetLocaleconvNumeric(struct lconv *lc,
PyObject **decimal_point, PyObject **thousands_sep,
const char **grouping)
{
int res = -1;
assert(decimal_point != NULL);
assert(thousands_sep != NULL);
assert(grouping != NULL);

struct lconv *lc = localeconv();
int res = -1;

int change_locale = 0;
if (decimal_point != NULL &&
(strlen(lc->decimal_point) > 1 || ((unsigned char)lc->decimal_point[0]) > 127))
{
if ((strlen(lc->decimal_point) > 1 || ((unsigned char)lc->decimal_point[0]) > 127)) {
change_locale = 1;
}
if (thousands_sep != NULL &&
(strlen(lc->thousands_sep) > 1 || ((unsigned char)lc->thousands_sep[0]) > 127))
{
if ((strlen(lc->thousands_sep) > 1 || ((unsigned char)lc->thousands_sep[0]) > 127)) {
change_locale = 1;
}

Expand All @@ -1908,31 +1907,26 @@ _Py_GetLocaleconvNumeric(PyObject **decimal_point, PyObject **thousands_sep,
}

if (loc != NULL) {
/* Only set the locale temporarilty the LC_CTYPE locale
/* Only set the locale temporarily the LC_CTYPE locale
if LC_NUMERIC locale is different than LC_CTYPE locale and
decimal_point and/or thousands_sep are non-ASCII or longer than
1 byte */
setlocale(LC_CTYPE, loc);
}
}

if (decimal_point != NULL) {
*decimal_point = PyUnicode_DecodeLocale(lc->decimal_point, NULL);
if (*decimal_point == NULL) {
goto error;
}
}
if (thousands_sep != NULL) {
*thousands_sep = PyUnicode_DecodeLocale(lc->thousands_sep, NULL);
if (*thousands_sep == NULL) {
goto error;
}
*decimal_point = PyUnicode_DecodeLocale(lc->decimal_point, NULL);
if (*decimal_point == NULL) {
goto error;
}

if (grouping != NULL) {
*grouping = lc->grouping;
*thousands_sep = PyUnicode_DecodeLocale(lc->thousands_sep, NULL);
if (*thousands_sep == NULL) {
goto error;
}

*grouping = lc->grouping;

res = 0;

error:
Expand Down
28 changes: 22 additions & 6 deletions Python/formatter_unicode.c
Original file line number Diff line number Diff line change
Expand Up @@ -3,6 +3,7 @@
of int.__float__, etc., that take and return unicode objects */

#include "Python.h"
#include "pycore_fileutils.h"
#include <locale.h>

/* Raises an exception about an unknown presentation type for this
Expand Down Expand Up @@ -396,9 +397,10 @@ typedef struct {
PyObject *decimal_point;
PyObject *thousands_sep;
const char *grouping;
char *grouping_buffer;
} LocaleInfo;

#define STATIC_LOCALE_INFO_INIT {0, 0, 0}
#define LOCALE_INFO_STATIC_INIT {0, 0, 0, 0}

/* describes the layout for an integer, see the comment in
calc_number_widths() for details */
Expand Down Expand Up @@ -705,11 +707,24 @@ get_locale_info(enum LocaleType type, LocaleInfo *locale_info)
{
switch (type) {
case LT_CURRENT_LOCALE: {
if (_Py_GetLocaleconvNumeric(&locale_info->decimal_point,
struct lconv *lc = localeconv();
const char *grouping;
if (_Py_GetLocaleconvNumeric(lc,
&locale_info->decimal_point,
&locale_info->thousands_sep,
&locale_info->grouping) < 0) {
&grouping) < 0) {
return -1;
}
/* bpo-28604: localeconv() grouping becomes a dangling pointer
and may point to a different string if another thread calls
localeconv() during the string formatting. Copy the string
to avoid this risk. */
locale_info->grouping_buffer = _PyMem_Strdup(grouping);
if (locale_info->grouping_buffer == NULL) {
PyErr_NoMemory();
return -1;
}
locale_info->grouping = locale_info->grouping_buffer;
break;
}
case LT_DEFAULT_LOCALE:
Expand Down Expand Up @@ -743,6 +758,7 @@ free_locale_info(LocaleInfo *locale_info)
{
Py_XDECREF(locale_info->decimal_point);
Py_XDECREF(locale_info->thousands_sep);
PyMem_Free(locale_info->grouping_buffer);
}

/************************************************************************/
Expand Down Expand Up @@ -855,7 +871,7 @@ format_long_internal(PyObject *value, const InternalFormatSpec *format,

/* Locale settings, either from the actual locale or
from a hard-code pseudo-locale */
LocaleInfo locale = STATIC_LOCALE_INFO_INIT;
LocaleInfo locale = LOCALE_INFO_STATIC_INIT;

/* no precision allowed on integers */
if (format->precision != -1) {
Expand Down Expand Up @@ -1027,7 +1043,7 @@ format_float_internal(PyObject *value,

/* Locale settings, either from the actual locale or
from a hard-code pseudo-locale */
LocaleInfo locale = STATIC_LOCALE_INFO_INIT;
LocaleInfo locale = LOCALE_INFO_STATIC_INIT;

if (format->precision > INT_MAX) {
PyErr_SetString(PyExc_ValueError, "precision too big");
Expand Down Expand Up @@ -1190,7 +1206,7 @@ format_complex_internal(PyObject *value,

/* Locale settings, either from the actual locale or
from a hard-code pseudo-locale */
LocaleInfo locale = STATIC_LOCALE_INFO_INIT;
LocaleInfo locale = LOCALE_INFO_STATIC_INIT;

if (format->precision > INT_MAX) {
PyErr_SetString(PyExc_ValueError, "precision too big");
Expand Down
0