1326 lines
48 KiB
Python
1326 lines
48 KiB
Python
|
"""
|
||
|
babel.numbers
|
||
|
~~~~~~~~~~~~~
|
||
|
|
||
|
Locale dependent formatting and parsing of numeric data.
|
||
|
|
||
|
The default locale for the functions in this module is determined by the
|
||
|
following environment variables, in that order:
|
||
|
|
||
|
* ``LC_NUMERIC``,
|
||
|
* ``LC_ALL``, and
|
||
|
* ``LANG``
|
||
|
|
||
|
:copyright: (c) 2013-2023 by the Babel Team.
|
||
|
:license: BSD, see LICENSE for more details.
|
||
|
"""
|
||
|
# TODO:
|
||
|
# Padding and rounding increments in pattern:
|
||
|
# - https://www.unicode.org/reports/tr35/ (Appendix G.6)
|
||
|
from __future__ import annotations
|
||
|
|
||
|
import datetime
|
||
|
import decimal
|
||
|
import re
|
||
|
import warnings
|
||
|
from typing import TYPE_CHECKING, Any, cast, overload
|
||
|
|
||
|
from babel.core import Locale, default_locale, get_global
|
||
|
from babel.localedata import LocaleDataDict
|
||
|
|
||
|
if TYPE_CHECKING:
|
||
|
from typing_extensions import Literal
|
||
|
|
||
|
LC_NUMERIC = default_locale('LC_NUMERIC')
|
||
|
|
||
|
|
||
|
class UnknownCurrencyError(Exception):
|
||
|
"""Exception thrown when a currency is requested for which no data is available.
|
||
|
"""
|
||
|
|
||
|
def __init__(self, identifier: str) -> None:
|
||
|
"""Create the exception.
|
||
|
:param identifier: the identifier string of the unsupported currency
|
||
|
"""
|
||
|
Exception.__init__(self, f"Unknown currency {identifier!r}.")
|
||
|
|
||
|
#: The identifier of the locale that could not be found.
|
||
|
self.identifier = identifier
|
||
|
|
||
|
|
||
|
def list_currencies(locale: Locale | str | None = None) -> set[str]:
|
||
|
""" Return a `set` of normalized currency codes.
|
||
|
|
||
|
.. versionadded:: 2.5.0
|
||
|
|
||
|
:param locale: filters returned currency codes by the provided locale.
|
||
|
Expected to be a locale instance or code. If no locale is
|
||
|
provided, returns the list of all currencies from all
|
||
|
locales.
|
||
|
"""
|
||
|
# Get locale-scoped currencies.
|
||
|
if locale:
|
||
|
return set(Locale.parse(locale).currencies)
|
||
|
return set(get_global('all_currencies'))
|
||
|
|
||
|
|
||
|
def validate_currency(currency: str, locale: Locale | str | None = None) -> None:
|
||
|
""" Check the currency code is recognized by Babel.
|
||
|
|
||
|
Accepts a ``locale`` parameter for fined-grained validation, working as
|
||
|
the one defined above in ``list_currencies()`` method.
|
||
|
|
||
|
Raises a `UnknownCurrencyError` exception if the currency is unknown to Babel.
|
||
|
"""
|
||
|
if currency not in list_currencies(locale):
|
||
|
raise UnknownCurrencyError(currency)
|
||
|
|
||
|
|
||
|
def is_currency(currency: str, locale: Locale | str | None = None) -> bool:
|
||
|
""" Returns `True` only if a currency is recognized by Babel.
|
||
|
|
||
|
This method always return a Boolean and never raise.
|
||
|
"""
|
||
|
if not currency or not isinstance(currency, str):
|
||
|
return False
|
||
|
try:
|
||
|
validate_currency(currency, locale)
|
||
|
except UnknownCurrencyError:
|
||
|
return False
|
||
|
return True
|
||
|
|
||
|
|
||
|
def normalize_currency(currency: str, locale: Locale | str | None = None) -> str | None:
|
||
|
"""Returns the normalized identifier of any currency code.
|
||
|
|
||
|
Accepts a ``locale`` parameter for fined-grained validation, working as
|
||
|
the one defined above in ``list_currencies()`` method.
|
||
|
|
||
|
Returns None if the currency is unknown to Babel.
|
||
|
"""
|
||
|
if isinstance(currency, str):
|
||
|
currency = currency.upper()
|
||
|
if not is_currency(currency, locale):
|
||
|
return None
|
||
|
return currency
|
||
|
|
||
|
|
||
|
def get_currency_name(
|
||
|
currency: str,
|
||
|
count: float | decimal.Decimal | None = None,
|
||
|
locale: Locale | str | None = LC_NUMERIC,
|
||
|
) -> str:
|
||
|
"""Return the name used by the locale for the specified currency.
|
||
|
|
||
|
>>> get_currency_name('USD', locale='en_US')
|
||
|
u'US Dollar'
|
||
|
|
||
|
.. versionadded:: 0.9.4
|
||
|
|
||
|
:param currency: the currency code.
|
||
|
:param count: the optional count. If provided the currency name
|
||
|
will be pluralized to that number if possible.
|
||
|
:param locale: the `Locale` object or locale identifier.
|
||
|
"""
|
||
|
loc = Locale.parse(locale)
|
||
|
if count is not None:
|
||
|
try:
|
||
|
plural_form = loc.plural_form(count)
|
||
|
except (OverflowError, ValueError):
|
||
|
plural_form = 'other'
|
||
|
plural_names = loc._data['currency_names_plural']
|
||
|
if currency in plural_names:
|
||
|
currency_plural_names = plural_names[currency]
|
||
|
if plural_form in currency_plural_names:
|
||
|
return currency_plural_names[plural_form]
|
||
|
if 'other' in currency_plural_names:
|
||
|
return currency_plural_names['other']
|
||
|
return loc.currencies.get(currency, currency)
|
||
|
|
||
|
|
||
|
def get_currency_symbol(currency: str, locale: Locale | str | None = LC_NUMERIC) -> str:
|
||
|
"""Return the symbol used by the locale for the specified currency.
|
||
|
|
||
|
>>> get_currency_symbol('USD', locale='en_US')
|
||
|
u'$'
|
||
|
|
||
|
:param currency: the currency code.
|
||
|
:param locale: the `Locale` object or locale identifier.
|
||
|
"""
|
||
|
return Locale.parse(locale).currency_symbols.get(currency, currency)
|
||
|
|
||
|
|
||
|
def get_currency_precision(currency: str) -> int:
|
||
|
"""Return currency's precision.
|
||
|
|
||
|
Precision is the number of decimals found after the decimal point in the
|
||
|
currency's format pattern.
|
||
|
|
||
|
.. versionadded:: 2.5.0
|
||
|
|
||
|
:param currency: the currency code.
|
||
|
"""
|
||
|
precisions = get_global('currency_fractions')
|
||
|
return precisions.get(currency, precisions['DEFAULT'])[0]
|
||
|
|
||
|
|
||
|
def get_currency_unit_pattern(
|
||
|
currency: str,
|
||
|
count: float | decimal.Decimal | None = None,
|
||
|
locale: Locale | str | None = LC_NUMERIC,
|
||
|
) -> str:
|
||
|
"""
|
||
|
Return the unit pattern used for long display of a currency value
|
||
|
for a given locale.
|
||
|
This is a string containing ``{0}`` where the numeric part
|
||
|
should be substituted and ``{1}`` where the currency long display
|
||
|
name should be substituted.
|
||
|
|
||
|
>>> get_currency_unit_pattern('USD', locale='en_US', count=10)
|
||
|
u'{0} {1}'
|
||
|
|
||
|
.. versionadded:: 2.7.0
|
||
|
|
||
|
:param currency: the currency code.
|
||
|
:param count: the optional count. If provided the unit
|
||
|
pattern for that number will be returned.
|
||
|
:param locale: the `Locale` object or locale identifier.
|
||
|
"""
|
||
|
loc = Locale.parse(locale)
|
||
|
if count is not None:
|
||
|
plural_form = loc.plural_form(count)
|
||
|
try:
|
||
|
return loc._data['currency_unit_patterns'][plural_form]
|
||
|
except LookupError:
|
||
|
# Fall back to 'other'
|
||
|
pass
|
||
|
|
||
|
return loc._data['currency_unit_patterns']['other']
|
||
|
|
||
|
|
||
|
@overload
|
||
|
def get_territory_currencies(
|
||
|
territory: str,
|
||
|
start_date: datetime.date | None = ...,
|
||
|
end_date: datetime.date | None = ...,
|
||
|
tender: bool = ...,
|
||
|
non_tender: bool = ...,
|
||
|
include_details: Literal[False] = ...,
|
||
|
) -> list[str]:
|
||
|
... # pragma: no cover
|
||
|
|
||
|
|
||
|
@overload
|
||
|
def get_territory_currencies(
|
||
|
territory: str,
|
||
|
start_date: datetime.date | None = ...,
|
||
|
end_date: datetime.date | None = ...,
|
||
|
tender: bool = ...,
|
||
|
non_tender: bool = ...,
|
||
|
include_details: Literal[True] = ...,
|
||
|
) -> list[dict[str, Any]]:
|
||
|
... # pragma: no cover
|
||
|
|
||
|
|
||
|
def get_territory_currencies(
|
||
|
territory: str,
|
||
|
start_date: datetime.date | None = None,
|
||
|
end_date: datetime.date | None = None,
|
||
|
tender: bool = True,
|
||
|
non_tender: bool = False,
|
||
|
include_details: bool = False,
|
||
|
) -> list[str] | list[dict[str, Any]]:
|
||
|
"""Returns the list of currencies for the given territory that are valid for
|
||
|
the given date range. In addition to that the currency database
|
||
|
distinguishes between tender and non-tender currencies. By default only
|
||
|
tender currencies are returned.
|
||
|
|
||
|
The return value is a list of all currencies roughly ordered by the time
|
||
|
of when the currency became active. The longer the currency is being in
|
||
|
use the more to the left of the list it will be.
|
||
|
|
||
|
The start date defaults to today. If no end date is given it will be the
|
||
|
same as the start date. Otherwise a range can be defined. For instance
|
||
|
this can be used to find the currencies in use in Austria between 1995 and
|
||
|
2011:
|
||
|
|
||
|
>>> from datetime import date
|
||
|
>>> get_territory_currencies('AT', date(1995, 1, 1), date(2011, 1, 1))
|
||
|
['ATS', 'EUR']
|
||
|
|
||
|
Likewise it's also possible to find all the currencies in use on a
|
||
|
single date:
|
||
|
|
||
|
>>> get_territory_currencies('AT', date(1995, 1, 1))
|
||
|
['ATS']
|
||
|
>>> get_territory_currencies('AT', date(2011, 1, 1))
|
||
|
['EUR']
|
||
|
|
||
|
By default the return value only includes tender currencies. This
|
||
|
however can be changed:
|
||
|
|
||
|
>>> get_territory_currencies('US')
|
||
|
['USD']
|
||
|
>>> get_territory_currencies('US', tender=False, non_tender=True,
|
||
|
... start_date=date(2014, 1, 1))
|
||
|
['USN', 'USS']
|
||
|
|
||
|
.. versionadded:: 2.0
|
||
|
|
||
|
:param territory: the name of the territory to find the currency for.
|
||
|
:param start_date: the start date. If not given today is assumed.
|
||
|
:param end_date: the end date. If not given the start date is assumed.
|
||
|
:param tender: controls whether tender currencies should be included.
|
||
|
:param non_tender: controls whether non-tender currencies should be
|
||
|
included.
|
||
|
:param include_details: if set to `True`, instead of returning currency
|
||
|
codes the return value will be dictionaries
|
||
|
with detail information. In that case each
|
||
|
dictionary will have the keys ``'currency'``,
|
||
|
``'from'``, ``'to'``, and ``'tender'``.
|
||
|
"""
|
||
|
currencies = get_global('territory_currencies')
|
||
|
if start_date is None:
|
||
|
start_date = datetime.date.today()
|
||
|
elif isinstance(start_date, datetime.datetime):
|
||
|
start_date = start_date.date()
|
||
|
if end_date is None:
|
||
|
end_date = start_date
|
||
|
elif isinstance(end_date, datetime.datetime):
|
||
|
end_date = end_date.date()
|
||
|
|
||
|
curs = currencies.get(territory.upper(), ())
|
||
|
# TODO: validate that the territory exists
|
||
|
|
||
|
def _is_active(start, end):
|
||
|
return (start is None or start <= end_date) and \
|
||
|
(end is None or end >= start_date)
|
||
|
|
||
|
result = []
|
||
|
for currency_code, start, end, is_tender in curs:
|
||
|
if start:
|
||
|
start = datetime.date(*start)
|
||
|
if end:
|
||
|
end = datetime.date(*end)
|
||
|
if ((is_tender and tender) or
|
||
|
(not is_tender and non_tender)) and _is_active(start, end):
|
||
|
if include_details:
|
||
|
result.append({
|
||
|
'currency': currency_code,
|
||
|
'from': start,
|
||
|
'to': end,
|
||
|
'tender': is_tender,
|
||
|
})
|
||
|
else:
|
||
|
result.append(currency_code)
|
||
|
|
||
|
return result
|
||
|
|
||
|
|
||
|
def get_decimal_symbol(locale: Locale | str | None = LC_NUMERIC) -> str:
|
||
|
"""Return the symbol used by the locale to separate decimal fractions.
|
||
|
|
||
|
>>> get_decimal_symbol('en_US')
|
||
|
u'.'
|
||
|
|
||
|
:param locale: the `Locale` object or locale identifier
|
||
|
"""
|
||
|
return Locale.parse(locale).number_symbols.get('decimal', '.')
|
||
|
|
||
|
|
||
|
def get_plus_sign_symbol(locale: Locale | str | None = LC_NUMERIC) -> str:
|
||
|
"""Return the plus sign symbol used by the current locale.
|
||
|
|
||
|
>>> get_plus_sign_symbol('en_US')
|
||
|
u'+'
|
||
|
|
||
|
:param locale: the `Locale` object or locale identifier
|
||
|
"""
|
||
|
return Locale.parse(locale).number_symbols.get('plusSign', '+')
|
||
|
|
||
|
|
||
|
def get_minus_sign_symbol(locale: Locale | str | None = LC_NUMERIC) -> str:
|
||
|
"""Return the plus sign symbol used by the current locale.
|
||
|
|
||
|
>>> get_minus_sign_symbol('en_US')
|
||
|
u'-'
|
||
|
|
||
|
:param locale: the `Locale` object or locale identifier
|
||
|
"""
|
||
|
return Locale.parse(locale).number_symbols.get('minusSign', '-')
|
||
|
|
||
|
|
||
|
def get_exponential_symbol(locale: Locale | str | None = LC_NUMERIC) -> str:
|
||
|
"""Return the symbol used by the locale to separate mantissa and exponent.
|
||
|
|
||
|
>>> get_exponential_symbol('en_US')
|
||
|
u'E'
|
||
|
|
||
|
:param locale: the `Locale` object or locale identifier
|
||
|
"""
|
||
|
return Locale.parse(locale).number_symbols.get('exponential', 'E')
|
||
|
|
||
|
|
||
|
def get_group_symbol(locale: Locale | str | None = LC_NUMERIC) -> str:
|
||
|
"""Return the symbol used by the locale to separate groups of thousands.
|
||
|
|
||
|
>>> get_group_symbol('en_US')
|
||
|
u','
|
||
|
|
||
|
:param locale: the `Locale` object or locale identifier
|
||
|
"""
|
||
|
return Locale.parse(locale).number_symbols.get('group', ',')
|
||
|
|
||
|
|
||
|
def get_infinity_symbol(locale: Locale | str | None = LC_NUMERIC) -> str:
|
||
|
"""Return the symbol used by the locale to represent infinity.
|
||
|
|
||
|
>>> get_infinity_symbol('en_US')
|
||
|
u'∞'
|
||
|
|
||
|
:param locale: the `Locale` object or locale identifier
|
||
|
"""
|
||
|
return Locale.parse(locale).number_symbols.get('infinity', '∞')
|
||
|
|
||
|
|
||
|
def format_number(number: float | decimal.Decimal | str, locale: Locale | str | None = LC_NUMERIC) -> str:
|
||
|
"""Return the given number formatted for a specific locale.
|
||
|
|
||
|
>>> format_number(1099, locale='en_US') # doctest: +SKIP
|
||
|
u'1,099'
|
||
|
>>> format_number(1099, locale='de_DE') # doctest: +SKIP
|
||
|
u'1.099'
|
||
|
|
||
|
.. deprecated:: 2.6.0
|
||
|
|
||
|
Use babel.numbers.format_decimal() instead.
|
||
|
|
||
|
:param number: the number to format
|
||
|
:param locale: the `Locale` object or locale identifier
|
||
|
|
||
|
|
||
|
"""
|
||
|
warnings.warn('Use babel.numbers.format_decimal() instead.', DeprecationWarning, stacklevel=2)
|
||
|
return format_decimal(number, locale=locale)
|
||
|
|
||
|
|
||
|
def get_decimal_precision(number: decimal.Decimal) -> int:
|
||
|
"""Return maximum precision of a decimal instance's fractional part.
|
||
|
|
||
|
Precision is extracted from the fractional part only.
|
||
|
"""
|
||
|
# Copied from: https://github.com/mahmoud/boltons/pull/59
|
||
|
assert isinstance(number, decimal.Decimal)
|
||
|
decimal_tuple = number.normalize().as_tuple()
|
||
|
# Note: DecimalTuple.exponent can be 'n' (qNaN), 'N' (sNaN), or 'F' (Infinity)
|
||
|
if not isinstance(decimal_tuple.exponent, int) or decimal_tuple.exponent >= 0:
|
||
|
return 0
|
||
|
return abs(decimal_tuple.exponent)
|
||
|
|
||
|
|
||
|
def get_decimal_quantum(precision: int | decimal.Decimal) -> decimal.Decimal:
|
||
|
"""Return minimal quantum of a number, as defined by precision."""
|
||
|
assert isinstance(precision, (int, decimal.Decimal))
|
||
|
return decimal.Decimal(10) ** (-precision)
|
||
|
|
||
|
|
||
|
def format_decimal(
|
||
|
number: float | decimal.Decimal | str,
|
||
|
format: str | NumberPattern | None = None,
|
||
|
locale: Locale | str | None = LC_NUMERIC,
|
||
|
decimal_quantization: bool = True,
|
||
|
group_separator: bool = True,
|
||
|
) -> str:
|
||
|
"""Return the given decimal number formatted for a specific locale.
|
||
|
|
||
|
>>> format_decimal(1.2345, locale='en_US')
|
||
|
u'1.234'
|
||
|
>>> format_decimal(1.2346, locale='en_US')
|
||
|
u'1.235'
|
||
|
>>> format_decimal(-1.2346, locale='en_US')
|
||
|
u'-1.235'
|
||
|
>>> format_decimal(1.2345, locale='sv_SE')
|
||
|
u'1,234'
|
||
|
>>> format_decimal(1.2345, locale='de')
|
||
|
u'1,234'
|
||
|
|
||
|
The appropriate thousands grouping and the decimal separator are used for
|
||
|
each locale:
|
||
|
|
||
|
>>> format_decimal(12345.5, locale='en_US')
|
||
|
u'12,345.5'
|
||
|
|
||
|
By default the locale is allowed to truncate and round a high-precision
|
||
|
number by forcing its format pattern onto the decimal part. You can bypass
|
||
|
this behavior with the `decimal_quantization` parameter:
|
||
|
|
||
|
>>> format_decimal(1.2346, locale='en_US')
|
||
|
u'1.235'
|
||
|
>>> format_decimal(1.2346, locale='en_US', decimal_quantization=False)
|
||
|
u'1.2346'
|
||
|
>>> format_decimal(12345.67, locale='fr_CA', group_separator=False)
|
||
|
u'12345,67'
|
||
|
>>> format_decimal(12345.67, locale='en_US', group_separator=True)
|
||
|
u'12,345.67'
|
||
|
|
||
|
:param number: the number to format
|
||
|
:param format:
|
||
|
:param locale: the `Locale` object or locale identifier
|
||
|
:param decimal_quantization: Truncate and round high-precision numbers to
|
||
|
the format pattern. Defaults to `True`.
|
||
|
:param group_separator: Boolean to switch group separator on/off in a locale's
|
||
|
number format.
|
||
|
"""
|
||
|
locale = Locale.parse(locale)
|
||
|
if format is None:
|
||
|
format = locale.decimal_formats[format]
|
||
|
pattern = parse_pattern(format)
|
||
|
return pattern.apply(
|
||
|
number, locale, decimal_quantization=decimal_quantization, group_separator=group_separator)
|
||
|
|
||
|
|
||
|
def format_compact_decimal(
|
||
|
number: float | decimal.Decimal | str,
|
||
|
*,
|
||
|
format_type: Literal["short", "long"] = "short",
|
||
|
locale: Locale | str | None = LC_NUMERIC,
|
||
|
fraction_digits: int = 0,
|
||
|
) -> str:
|
||
|
"""Return the given decimal number formatted for a specific locale in compact form.
|
||
|
|
||
|
>>> format_compact_decimal(12345, format_type="short", locale='en_US')
|
||
|
u'12K'
|
||
|
>>> format_compact_decimal(12345, format_type="long", locale='en_US')
|
||
|
u'12 thousand'
|
||
|
>>> format_compact_decimal(12345, format_type="short", locale='en_US', fraction_digits=2)
|
||
|
u'12.34K'
|
||
|
>>> format_compact_decimal(1234567, format_type="short", locale="ja_JP")
|
||
|
u'123万'
|
||
|
>>> format_compact_decimal(2345678, format_type="long", locale="mk")
|
||
|
u'2 милиони'
|
||
|
>>> format_compact_decimal(21000000, format_type="long", locale="mk")
|
||
|
u'21 милион'
|
||
|
|
||
|
:param number: the number to format
|
||
|
:param format_type: Compact format to use ("short" or "long")
|
||
|
:param locale: the `Locale` object or locale identifier
|
||
|
:param fraction_digits: Number of digits after the decimal point to use. Defaults to `0`.
|
||
|
"""
|
||
|
locale = Locale.parse(locale)
|
||
|
compact_format = locale.compact_decimal_formats[format_type]
|
||
|
number, format = _get_compact_format(number, compact_format, locale, fraction_digits)
|
||
|
# Did not find a format, fall back.
|
||
|
if format is None:
|
||
|
format = locale.decimal_formats[None]
|
||
|
pattern = parse_pattern(format)
|
||
|
return pattern.apply(number, locale, decimal_quantization=False)
|
||
|
|
||
|
|
||
|
def _get_compact_format(
|
||
|
number: float | decimal.Decimal | str,
|
||
|
compact_format: LocaleDataDict,
|
||
|
locale: Locale,
|
||
|
fraction_digits: int,
|
||
|
) -> tuple[decimal.Decimal, NumberPattern | None]:
|
||
|
"""Returns the number after dividing by the unit and the format pattern to use.
|
||
|
The algorithm is described here:
|
||
|
https://www.unicode.org/reports/tr35/tr35-45/tr35-numbers.html#Compact_Number_Formats.
|
||
|
"""
|
||
|
if not isinstance(number, decimal.Decimal):
|
||
|
number = decimal.Decimal(str(number))
|
||
|
if number.is_nan() or number.is_infinite():
|
||
|
return number, None
|
||
|
format = None
|
||
|
for magnitude in sorted([int(m) for m in compact_format["other"]], reverse=True):
|
||
|
if abs(number) >= magnitude:
|
||
|
# check the pattern using "other" as the amount
|
||
|
format = compact_format["other"][str(magnitude)]
|
||
|
pattern = parse_pattern(format).pattern
|
||
|
# if the pattern is "0", we do not divide the number
|
||
|
if pattern == "0":
|
||
|
break
|
||
|
# otherwise, we need to divide the number by the magnitude but remove zeros
|
||
|
# equal to the number of 0's in the pattern minus 1
|
||
|
number = cast(decimal.Decimal, number / (magnitude // (10 ** (pattern.count("0") - 1))))
|
||
|
# round to the number of fraction digits requested
|
||
|
rounded = round(number, fraction_digits)
|
||
|
# if the remaining number is singular, use the singular format
|
||
|
plural_form = locale.plural_form(abs(number))
|
||
|
if plural_form not in compact_format:
|
||
|
plural_form = "other"
|
||
|
if number == 1 and "1" in compact_format:
|
||
|
plural_form = "1"
|
||
|
format = compact_format[plural_form][str(magnitude)]
|
||
|
number = rounded
|
||
|
break
|
||
|
return number, format
|
||
|
|
||
|
|
||
|
class UnknownCurrencyFormatError(KeyError):
|
||
|
"""Exception raised when an unknown currency format is requested."""
|
||
|
|
||
|
|
||
|
def format_currency(
|
||
|
number: float | decimal.Decimal | str,
|
||
|
currency: str,
|
||
|
format: str | NumberPattern | None = None,
|
||
|
locale: Locale | str | None = LC_NUMERIC,
|
||
|
currency_digits: bool = True,
|
||
|
format_type: Literal["name", "standard", "accounting"] = "standard",
|
||
|
decimal_quantization: bool = True,
|
||
|
group_separator: bool = True,
|
||
|
) -> str:
|
||
|
"""Return formatted currency value.
|
||
|
|
||
|
>>> format_currency(1099.98, 'USD', locale='en_US')
|
||
|
'$1,099.98'
|
||
|
>>> format_currency(1099.98, 'USD', locale='es_CO')
|
||
|
u'US$1.099,98'
|
||
|
>>> format_currency(1099.98, 'EUR', locale='de_DE')
|
||
|
u'1.099,98\\xa0\\u20ac'
|
||
|
|
||
|
The format can also be specified explicitly. The currency is
|
||
|
placed with the '¤' sign. As the sign gets repeated the format
|
||
|
expands (¤ being the symbol, ¤¤ is the currency abbreviation and
|
||
|
¤¤¤ is the full name of the currency):
|
||
|
|
||
|
>>> format_currency(1099.98, 'EUR', u'\xa4\xa4 #,##0.00', locale='en_US')
|
||
|
u'EUR 1,099.98'
|
||
|
>>> format_currency(1099.98, 'EUR', u'#,##0.00 \xa4\xa4\xa4', locale='en_US')
|
||
|
u'1,099.98 euros'
|
||
|
|
||
|
Currencies usually have a specific number of decimal digits. This function
|
||
|
favours that information over the given format:
|
||
|
|
||
|
>>> format_currency(1099.98, 'JPY', locale='en_US')
|
||
|
u'\\xa51,100'
|
||
|
>>> format_currency(1099.98, 'COP', u'#,##0.00', locale='es_ES')
|
||
|
u'1.099,98'
|
||
|
|
||
|
However, the number of decimal digits can be overridden from the currency
|
||
|
information, by setting the last parameter to ``False``:
|
||
|
|
||
|
>>> format_currency(1099.98, 'JPY', locale='en_US', currency_digits=False)
|
||
|
u'\\xa51,099.98'
|
||
|
>>> format_currency(1099.98, 'COP', u'#,##0.00', locale='es_ES', currency_digits=False)
|
||
|
u'1.099,98'
|
||
|
|
||
|
If a format is not specified the type of currency format to use
|
||
|
from the locale can be specified:
|
||
|
|
||
|
>>> format_currency(1099.98, 'EUR', locale='en_US', format_type='standard')
|
||
|
u'\\u20ac1,099.98'
|
||
|
|
||
|
When the given currency format type is not available, an exception is
|
||
|
raised:
|
||
|
|
||
|
>>> format_currency('1099.98', 'EUR', locale='root', format_type='unknown')
|
||
|
Traceback (most recent call last):
|
||
|
...
|
||
|
UnknownCurrencyFormatError: "'unknown' is not a known currency format type"
|
||
|
|
||
|
>>> format_currency(101299.98, 'USD', locale='en_US', group_separator=False)
|
||
|
u'$101299.98'
|
||
|
|
||
|
>>> format_currency(101299.98, 'USD', locale='en_US', group_separator=True)
|
||
|
u'$101,299.98'
|
||
|
|
||
|
You can also pass format_type='name' to use long display names. The order of
|
||
|
the number and currency name, along with the correct localized plural form
|
||
|
of the currency name, is chosen according to locale:
|
||
|
|
||
|
>>> format_currency(1, 'USD', locale='en_US', format_type='name')
|
||
|
u'1.00 US dollar'
|
||
|
>>> format_currency(1099.98, 'USD', locale='en_US', format_type='name')
|
||
|
u'1,099.98 US dollars'
|
||
|
>>> format_currency(1099.98, 'USD', locale='ee', format_type='name')
|
||
|
u'us ga dollar 1,099.98'
|
||
|
|
||
|
By default the locale is allowed to truncate and round a high-precision
|
||
|
number by forcing its format pattern onto the decimal part. You can bypass
|
||
|
this behavior with the `decimal_quantization` parameter:
|
||
|
|
||
|
>>> format_currency(1099.9876, 'USD', locale='en_US')
|
||
|
u'$1,099.99'
|
||
|
>>> format_currency(1099.9876, 'USD', locale='en_US', decimal_quantization=False)
|
||
|
u'$1,099.9876'
|
||
|
|
||
|
:param number: the number to format
|
||
|
:param currency: the currency code
|
||
|
:param format: the format string to use
|
||
|
:param locale: the `Locale` object or locale identifier
|
||
|
:param currency_digits: use the currency's natural number of decimal digits
|
||
|
:param format_type: the currency format type to use
|
||
|
:param decimal_quantization: Truncate and round high-precision numbers to
|
||
|
the format pattern. Defaults to `True`.
|
||
|
:param group_separator: Boolean to switch group separator on/off in a locale's
|
||
|
number format.
|
||
|
|
||
|
"""
|
||
|
if format_type == 'name':
|
||
|
return _format_currency_long_name(number, currency, format=format,
|
||
|
locale=locale, currency_digits=currency_digits,
|
||
|
decimal_quantization=decimal_quantization, group_separator=group_separator)
|
||
|
locale = Locale.parse(locale)
|
||
|
if format:
|
||
|
pattern = parse_pattern(format)
|
||
|
else:
|
||
|
try:
|
||
|
pattern = locale.currency_formats[format_type]
|
||
|
except KeyError:
|
||
|
raise UnknownCurrencyFormatError(f"{format_type!r} is not a known currency format type") from None
|
||
|
|
||
|
return pattern.apply(
|
||
|
number, locale, currency=currency, currency_digits=currency_digits,
|
||
|
decimal_quantization=decimal_quantization, group_separator=group_separator)
|
||
|
|
||
|
|
||
|
def _format_currency_long_name(
|
||
|
number: float | decimal.Decimal | str,
|
||
|
currency: str,
|
||
|
format: str | NumberPattern | None = None,
|
||
|
locale: Locale | str | None = LC_NUMERIC,
|
||
|
currency_digits: bool = True,
|
||
|
format_type: Literal["name", "standard", "accounting"] = "standard",
|
||
|
decimal_quantization: bool = True,
|
||
|
group_separator: bool = True,
|
||
|
) -> str:
|
||
|
# Algorithm described here:
|
||
|
# https://www.unicode.org/reports/tr35/tr35-numbers.html#Currencies
|
||
|
locale = Locale.parse(locale)
|
||
|
# Step 1.
|
||
|
# There are no examples of items with explicit count (0 or 1) in current
|
||
|
# locale data. So there is no point implementing that.
|
||
|
# Step 2.
|
||
|
|
||
|
# Correct number to numeric type, important for looking up plural rules:
|
||
|
number_n = float(number) if isinstance(number, str) else number
|
||
|
|
||
|
# Step 3.
|
||
|
unit_pattern = get_currency_unit_pattern(currency, count=number_n, locale=locale)
|
||
|
|
||
|
# Step 4.
|
||
|
display_name = get_currency_name(currency, count=number_n, locale=locale)
|
||
|
|
||
|
# Step 5.
|
||
|
if not format:
|
||
|
format = locale.decimal_formats[None]
|
||
|
|
||
|
pattern = parse_pattern(format)
|
||
|
|
||
|
number_part = pattern.apply(
|
||
|
number, locale, currency=currency, currency_digits=currency_digits,
|
||
|
decimal_quantization=decimal_quantization, group_separator=group_separator)
|
||
|
|
||
|
return unit_pattern.format(number_part, display_name)
|
||
|
|
||
|
|
||
|
def format_compact_currency(
|
||
|
number: float | decimal.Decimal | str,
|
||
|
currency: str,
|
||
|
*,
|
||
|
format_type: Literal["short"] = "short",
|
||
|
locale: Locale | str | None = LC_NUMERIC,
|
||
|
fraction_digits: int = 0
|
||
|
) -> str:
|
||
|
"""Format a number as a currency value in compact form.
|
||
|
|
||
|
>>> format_compact_currency(12345, 'USD', locale='en_US')
|
||
|
u'$12K'
|
||
|
>>> format_compact_currency(123456789, 'USD', locale='en_US', fraction_digits=2)
|
||
|
u'$123.46M'
|
||
|
>>> format_compact_currency(123456789, 'EUR', locale='de_DE', fraction_digits=1)
|
||
|
'123,5\xa0Mio.\xa0€'
|
||
|
|
||
|
:param number: the number to format
|
||
|
:param currency: the currency code
|
||
|
:param format_type: the compact format type to use. Defaults to "short".
|
||
|
:param locale: the `Locale` object or locale identifier
|
||
|
:param fraction_digits: Number of digits after the decimal point to use. Defaults to `0`.
|
||
|
"""
|
||
|
locale = Locale.parse(locale)
|
||
|
try:
|
||
|
compact_format = locale.compact_currency_formats[format_type]
|
||
|
except KeyError as error:
|
||
|
raise UnknownCurrencyFormatError(f"{format_type!r} is not a known compact currency format type") from error
|
||
|
number, format = _get_compact_format(number, compact_format, locale, fraction_digits)
|
||
|
# Did not find a format, fall back.
|
||
|
if format is None or "¤" not in str(format):
|
||
|
# find first format that has a currency symbol
|
||
|
for magnitude in compact_format['other']:
|
||
|
format = compact_format['other'][magnitude].pattern
|
||
|
if '¤' not in format:
|
||
|
continue
|
||
|
# remove characters that are not the currency symbol, 0's or spaces
|
||
|
format = re.sub(r'[^0\s\¤]', '', format)
|
||
|
# compress adjacent spaces into one
|
||
|
format = re.sub(r'(\s)\s+', r'\1', format).strip()
|
||
|
break
|
||
|
if format is None:
|
||
|
raise ValueError('No compact currency format found for the given number and locale.')
|
||
|
pattern = parse_pattern(format)
|
||
|
return pattern.apply(number, locale, currency=currency, currency_digits=False, decimal_quantization=False)
|
||
|
|
||
|
|
||
|
def format_percent(
|
||
|
number: float | decimal.Decimal | str,
|
||
|
format: str | NumberPattern | None = None,
|
||
|
locale: Locale | str | None = LC_NUMERIC,
|
||
|
decimal_quantization: bool = True,
|
||
|
group_separator: bool = True,
|
||
|
) -> str:
|
||
|
"""Return formatted percent value for a specific locale.
|
||
|
|
||
|
>>> format_percent(0.34, locale='en_US')
|
||
|
u'34%'
|
||
|
>>> format_percent(25.1234, locale='en_US')
|
||
|
u'2,512%'
|
||
|
>>> format_percent(25.1234, locale='sv_SE')
|
||
|
u'2\\xa0512\\xa0%'
|
||
|
|
||
|
The format pattern can also be specified explicitly:
|
||
|
|
||
|
>>> format_percent(25.1234, u'#,##0\u2030', locale='en_US')
|
||
|
u'25,123\u2030'
|
||
|
|
||
|
By default the locale is allowed to truncate and round a high-precision
|
||
|
number by forcing its format pattern onto the decimal part. You can bypass
|
||
|
this behavior with the `decimal_quantization` parameter:
|
||
|
|
||
|
>>> format_percent(23.9876, locale='en_US')
|
||
|
u'2,399%'
|
||
|
>>> format_percent(23.9876, locale='en_US', decimal_quantization=False)
|
||
|
u'2,398.76%'
|
||
|
|
||
|
>>> format_percent(229291.1234, locale='pt_BR', group_separator=False)
|
||
|
u'22929112%'
|
||
|
|
||
|
>>> format_percent(229291.1234, locale='pt_BR', group_separator=True)
|
||
|
u'22.929.112%'
|
||
|
|
||
|
:param number: the percent number to format
|
||
|
:param format:
|
||
|
:param locale: the `Locale` object or locale identifier
|
||
|
:param decimal_quantization: Truncate and round high-precision numbers to
|
||
|
the format pattern. Defaults to `True`.
|
||
|
:param group_separator: Boolean to switch group separator on/off in a locale's
|
||
|
number format.
|
||
|
"""
|
||
|
locale = Locale.parse(locale)
|
||
|
if not format:
|
||
|
format = locale.percent_formats[None]
|
||
|
pattern = parse_pattern(format)
|
||
|
return pattern.apply(
|
||
|
number, locale, decimal_quantization=decimal_quantization, group_separator=group_separator)
|
||
|
|
||
|
|
||
|
def format_scientific(
|
||
|
number: float | decimal.Decimal | str,
|
||
|
format: str | NumberPattern | None = None,
|
||
|
locale: Locale | str | None = LC_NUMERIC,
|
||
|
decimal_quantization: bool = True,
|
||
|
) -> str:
|
||
|
"""Return value formatted in scientific notation for a specific locale.
|
||
|
|
||
|
>>> format_scientific(10000, locale='en_US')
|
||
|
u'1E4'
|
||
|
|
||
|
The format pattern can also be specified explicitly:
|
||
|
|
||
|
>>> format_scientific(1234567, u'##0.##E00', locale='en_US')
|
||
|
u'1.23E06'
|
||
|
|
||
|
By default the locale is allowed to truncate and round a high-precision
|
||
|
number by forcing its format pattern onto the decimal part. You can bypass
|
||
|
this behavior with the `decimal_quantization` parameter:
|
||
|
|
||
|
>>> format_scientific(1234.9876, u'#.##E0', locale='en_US')
|
||
|
u'1.23E3'
|
||
|
>>> format_scientific(1234.9876, u'#.##E0', locale='en_US', decimal_quantization=False)
|
||
|
u'1.2349876E3'
|
||
|
|
||
|
:param number: the number to format
|
||
|
:param format:
|
||
|
:param locale: the `Locale` object or locale identifier
|
||
|
:param decimal_quantization: Truncate and round high-precision numbers to
|
||
|
the format pattern. Defaults to `True`.
|
||
|
"""
|
||
|
locale = Locale.parse(locale)
|
||
|
if not format:
|
||
|
format = locale.scientific_formats[None]
|
||
|
pattern = parse_pattern(format)
|
||
|
return pattern.apply(
|
||
|
number, locale, decimal_quantization=decimal_quantization)
|
||
|
|
||
|
|
||
|
class NumberFormatError(ValueError):
|
||
|
"""Exception raised when a string cannot be parsed into a number."""
|
||
|
|
||
|
def __init__(self, message: str, suggestions: list[str] | None = None) -> None:
|
||
|
super().__init__(message)
|
||
|
#: a list of properly formatted numbers derived from the invalid input
|
||
|
self.suggestions = suggestions
|
||
|
|
||
|
|
||
|
def parse_number(string: str, locale: Locale | str | None = LC_NUMERIC) -> int:
|
||
|
"""Parse localized number string into an integer.
|
||
|
|
||
|
>>> parse_number('1,099', locale='en_US')
|
||
|
1099
|
||
|
>>> parse_number('1.099', locale='de_DE')
|
||
|
1099
|
||
|
|
||
|
When the given string cannot be parsed, an exception is raised:
|
||
|
|
||
|
>>> parse_number('1.099,98', locale='de')
|
||
|
Traceback (most recent call last):
|
||
|
...
|
||
|
NumberFormatError: '1.099,98' is not a valid number
|
||
|
|
||
|
:param string: the string to parse
|
||
|
:param locale: the `Locale` object or locale identifier
|
||
|
:return: the parsed number
|
||
|
:raise `NumberFormatError`: if the string can not be converted to a number
|
||
|
"""
|
||
|
try:
|
||
|
return int(string.replace(get_group_symbol(locale), ''))
|
||
|
except ValueError as ve:
|
||
|
raise NumberFormatError(f"{string!r} is not a valid number") from ve
|
||
|
|
||
|
|
||
|
def parse_decimal(string: str, locale: Locale | str | None = LC_NUMERIC, strict: bool = False) -> decimal.Decimal:
|
||
|
"""Parse localized decimal string into a decimal.
|
||
|
|
||
|
>>> parse_decimal('1,099.98', locale='en_US')
|
||
|
Decimal('1099.98')
|
||
|
>>> parse_decimal('1.099,98', locale='de')
|
||
|
Decimal('1099.98')
|
||
|
>>> parse_decimal('12 345,123', locale='ru')
|
||
|
Decimal('12345.123')
|
||
|
|
||
|
When the given string cannot be parsed, an exception is raised:
|
||
|
|
||
|
>>> parse_decimal('2,109,998', locale='de')
|
||
|
Traceback (most recent call last):
|
||
|
...
|
||
|
NumberFormatError: '2,109,998' is not a valid decimal number
|
||
|
|
||
|
If `strict` is set to `True` and the given string contains a number
|
||
|
formatted in an irregular way, an exception is raised:
|
||
|
|
||
|
>>> parse_decimal('30.00', locale='de', strict=True)
|
||
|
Traceback (most recent call last):
|
||
|
...
|
||
|
NumberFormatError: '30.00' is not a properly formatted decimal number. Did you mean '3.000'? Or maybe '30,00'?
|
||
|
|
||
|
>>> parse_decimal('0.00', locale='de', strict=True)
|
||
|
Traceback (most recent call last):
|
||
|
...
|
||
|
NumberFormatError: '0.00' is not a properly formatted decimal number. Did you mean '0'?
|
||
|
|
||
|
:param string: the string to parse
|
||
|
:param locale: the `Locale` object or locale identifier
|
||
|
:param strict: controls whether numbers formatted in a weird way are
|
||
|
accepted or rejected
|
||
|
:raise NumberFormatError: if the string can not be converted to a
|
||
|
decimal number
|
||
|
"""
|
||
|
locale = Locale.parse(locale)
|
||
|
group_symbol = get_group_symbol(locale)
|
||
|
decimal_symbol = get_decimal_symbol(locale)
|
||
|
|
||
|
if not strict and (
|
||
|
group_symbol == '\xa0' and # if the grouping symbol is U+00A0 NO-BREAK SPACE,
|
||
|
group_symbol not in string and # and the string to be parsed does not contain it,
|
||
|
' ' in string # but it does contain a space instead,
|
||
|
):
|
||
|
# ... it's reasonable to assume it is taking the place of the grouping symbol.
|
||
|
string = string.replace(' ', group_symbol)
|
||
|
|
||
|
try:
|
||
|
parsed = decimal.Decimal(string.replace(group_symbol, '')
|
||
|
.replace(decimal_symbol, '.'))
|
||
|
except decimal.InvalidOperation as exc:
|
||
|
raise NumberFormatError(f"{string!r} is not a valid decimal number") from exc
|
||
|
if strict and group_symbol in string:
|
||
|
proper = format_decimal(parsed, locale=locale, decimal_quantization=False)
|
||
|
if string != proper and string.rstrip('0') != (proper + decimal_symbol):
|
||
|
try:
|
||
|
parsed_alt = decimal.Decimal(string.replace(decimal_symbol, '')
|
||
|
.replace(group_symbol, '.'))
|
||
|
except decimal.InvalidOperation as exc:
|
||
|
raise NumberFormatError(
|
||
|
f"{string!r} is not a properly formatted decimal number. "
|
||
|
f"Did you mean {proper!r}?",
|
||
|
suggestions=[proper],
|
||
|
) from exc
|
||
|
else:
|
||
|
proper_alt = format_decimal(parsed_alt, locale=locale, decimal_quantization=False)
|
||
|
if proper_alt == proper:
|
||
|
raise NumberFormatError(
|
||
|
f"{string!r} is not a properly formatted decimal number. "
|
||
|
f"Did you mean {proper!r}?",
|
||
|
suggestions=[proper],
|
||
|
)
|
||
|
else:
|
||
|
raise NumberFormatError(
|
||
|
f"{string!r} is not a properly formatted decimal number. "
|
||
|
f"Did you mean {proper!r}? Or maybe {proper_alt!r}?",
|
||
|
suggestions=[proper, proper_alt],
|
||
|
)
|
||
|
return parsed
|
||
|
|
||
|
|
||
|
PREFIX_END = r'[^0-9@#.,]'
|
||
|
NUMBER_TOKEN = r'[0-9@#.,E+]'
|
||
|
|
||
|
PREFIX_PATTERN = r"(?P<prefix>(?:'[^']*'|%s)*)" % PREFIX_END
|
||
|
NUMBER_PATTERN = r"(?P<number>%s*)" % NUMBER_TOKEN
|
||
|
SUFFIX_PATTERN = r"(?P<suffix>.*)"
|
||
|
|
||
|
number_re = re.compile(f"{PREFIX_PATTERN}{NUMBER_PATTERN}{SUFFIX_PATTERN}")
|
||
|
|
||
|
|
||
|
def parse_grouping(p: str) -> tuple[int, int]:
|
||
|
"""Parse primary and secondary digit grouping
|
||
|
|
||
|
>>> parse_grouping('##')
|
||
|
(1000, 1000)
|
||
|
>>> parse_grouping('#,###')
|
||
|
(3, 3)
|
||
|
>>> parse_grouping('#,####,###')
|
||
|
(3, 4)
|
||
|
"""
|
||
|
width = len(p)
|
||
|
g1 = p.rfind(',')
|
||
|
if g1 == -1:
|
||
|
return 1000, 1000
|
||
|
g1 = width - g1 - 1
|
||
|
g2 = p[:-g1 - 1].rfind(',')
|
||
|
if g2 == -1:
|
||
|
return g1, g1
|
||
|
g2 = width - g1 - g2 - 2
|
||
|
return g1, g2
|
||
|
|
||
|
|
||
|
def parse_pattern(pattern: NumberPattern | str) -> NumberPattern:
|
||
|
"""Parse number format patterns"""
|
||
|
if isinstance(pattern, NumberPattern):
|
||
|
return pattern
|
||
|
|
||
|
def _match_number(pattern):
|
||
|
rv = number_re.search(pattern)
|
||
|
if rv is None:
|
||
|
raise ValueError(f"Invalid number pattern {pattern!r}")
|
||
|
return rv.groups()
|
||
|
|
||
|
pos_pattern = pattern
|
||
|
|
||
|
# Do we have a negative subpattern?
|
||
|
if ';' in pattern:
|
||
|
pos_pattern, neg_pattern = pattern.split(';', 1)
|
||
|
pos_prefix, number, pos_suffix = _match_number(pos_pattern)
|
||
|
neg_prefix, _, neg_suffix = _match_number(neg_pattern)
|
||
|
else:
|
||
|
pos_prefix, number, pos_suffix = _match_number(pos_pattern)
|
||
|
neg_prefix = f"-{pos_prefix}"
|
||
|
neg_suffix = pos_suffix
|
||
|
if 'E' in number:
|
||
|
number, exp = number.split('E', 1)
|
||
|
else:
|
||
|
exp = None
|
||
|
if '@' in number and '.' in number and '0' in number:
|
||
|
raise ValueError('Significant digit patterns can not contain "@" or "0"')
|
||
|
if '.' in number:
|
||
|
integer, fraction = number.rsplit('.', 1)
|
||
|
else:
|
||
|
integer = number
|
||
|
fraction = ''
|
||
|
|
||
|
def parse_precision(p):
|
||
|
"""Calculate the min and max allowed digits"""
|
||
|
min = max = 0
|
||
|
for c in p:
|
||
|
if c in '@0':
|
||
|
min += 1
|
||
|
max += 1
|
||
|
elif c == '#':
|
||
|
max += 1
|
||
|
elif c == ',':
|
||
|
continue
|
||
|
else:
|
||
|
break
|
||
|
return min, max
|
||
|
|
||
|
int_prec = parse_precision(integer)
|
||
|
frac_prec = parse_precision(fraction)
|
||
|
if exp:
|
||
|
exp_plus = exp.startswith('+')
|
||
|
exp = exp.lstrip('+')
|
||
|
exp_prec = parse_precision(exp)
|
||
|
else:
|
||
|
exp_plus = None
|
||
|
exp_prec = None
|
||
|
grouping = parse_grouping(integer)
|
||
|
return NumberPattern(pattern, (pos_prefix, neg_prefix),
|
||
|
(pos_suffix, neg_suffix), grouping,
|
||
|
int_prec, frac_prec,
|
||
|
exp_prec, exp_plus, number)
|
||
|
|
||
|
|
||
|
class NumberPattern:
|
||
|
|
||
|
def __init__(
|
||
|
self,
|
||
|
pattern: str,
|
||
|
prefix: tuple[str, str],
|
||
|
suffix: tuple[str, str],
|
||
|
grouping: tuple[int, int],
|
||
|
int_prec: tuple[int, int],
|
||
|
frac_prec: tuple[int, int],
|
||
|
exp_prec: tuple[int, int] | None,
|
||
|
exp_plus: bool | None,
|
||
|
number_pattern: str | None = None,
|
||
|
) -> None:
|
||
|
# Metadata of the decomposed parsed pattern.
|
||
|
self.pattern = pattern
|
||
|
self.prefix = prefix
|
||
|
self.suffix = suffix
|
||
|
self.number_pattern = number_pattern
|
||
|
self.grouping = grouping
|
||
|
self.int_prec = int_prec
|
||
|
self.frac_prec = frac_prec
|
||
|
self.exp_prec = exp_prec
|
||
|
self.exp_plus = exp_plus
|
||
|
self.scale = self.compute_scale()
|
||
|
|
||
|
def __repr__(self) -> str:
|
||
|
return f"<{type(self).__name__} {self.pattern!r}>"
|
||
|
|
||
|
def compute_scale(self) -> Literal[0, 2, 3]:
|
||
|
"""Return the scaling factor to apply to the number before rendering.
|
||
|
|
||
|
Auto-set to a factor of 2 or 3 if presence of a ``%`` or ``‰`` sign is
|
||
|
detected in the prefix or suffix of the pattern. Default is to not mess
|
||
|
with the scale at all and keep it to 0.
|
||
|
"""
|
||
|
scale = 0
|
||
|
if '%' in ''.join(self.prefix + self.suffix):
|
||
|
scale = 2
|
||
|
elif '‰' in ''.join(self.prefix + self.suffix):
|
||
|
scale = 3
|
||
|
return scale
|
||
|
|
||
|
def scientific_notation_elements(self, value: decimal.Decimal, locale: Locale | str | None) -> tuple[decimal.Decimal, int, str]:
|
||
|
""" Returns normalized scientific notation components of a value.
|
||
|
"""
|
||
|
# Normalize value to only have one lead digit.
|
||
|
exp = value.adjusted()
|
||
|
value = value * get_decimal_quantum(exp)
|
||
|
assert value.adjusted() == 0
|
||
|
|
||
|
# Shift exponent and value by the minimum number of leading digits
|
||
|
# imposed by the rendering pattern. And always make that number
|
||
|
# greater or equal to 1.
|
||
|
lead_shift = max([1, min(self.int_prec)]) - 1
|
||
|
exp = exp - lead_shift
|
||
|
value = value * get_decimal_quantum(-lead_shift)
|
||
|
|
||
|
# Get exponent sign symbol.
|
||
|
exp_sign = ''
|
||
|
if exp < 0:
|
||
|
exp_sign = get_minus_sign_symbol(locale)
|
||
|
elif self.exp_plus:
|
||
|
exp_sign = get_plus_sign_symbol(locale)
|
||
|
|
||
|
# Normalize exponent value now that we have the sign.
|
||
|
exp = abs(exp)
|
||
|
|
||
|
return value, exp, exp_sign
|
||
|
|
||
|
def apply(
|
||
|
self,
|
||
|
value: float | decimal.Decimal | str,
|
||
|
locale: Locale | str | None,
|
||
|
currency: str | None = None,
|
||
|
currency_digits: bool = True,
|
||
|
decimal_quantization: bool = True,
|
||
|
force_frac: tuple[int, int] | None = None,
|
||
|
group_separator: bool = True,
|
||
|
):
|
||
|
"""Renders into a string a number following the defined pattern.
|
||
|
|
||
|
Forced decimal quantization is active by default so we'll produce a
|
||
|
number string that is strictly following CLDR pattern definitions.
|
||
|
|
||
|
:param value: The value to format. If this is not a Decimal object,
|
||
|
it will be cast to one.
|
||
|
:type value: decimal.Decimal|float|int
|
||
|
:param locale: The locale to use for formatting.
|
||
|
:type locale: str|babel.core.Locale
|
||
|
:param currency: Which currency, if any, to format as.
|
||
|
:type currency: str|None
|
||
|
:param currency_digits: Whether or not to use the currency's precision.
|
||
|
If false, the pattern's precision is used.
|
||
|
:type currency_digits: bool
|
||
|
:param decimal_quantization: Whether decimal numbers should be forcibly
|
||
|
quantized to produce a formatted output
|
||
|
strictly matching the CLDR definition for
|
||
|
the locale.
|
||
|
:type decimal_quantization: bool
|
||
|
:param force_frac: DEPRECATED - a forced override for `self.frac_prec`
|
||
|
for a single formatting invocation.
|
||
|
:return: Formatted decimal string.
|
||
|
:rtype: str
|
||
|
"""
|
||
|
if not isinstance(value, decimal.Decimal):
|
||
|
value = decimal.Decimal(str(value))
|
||
|
|
||
|
value = value.scaleb(self.scale)
|
||
|
|
||
|
# Separate the absolute value from its sign.
|
||
|
is_negative = int(value.is_signed())
|
||
|
value = abs(value).normalize()
|
||
|
|
||
|
# Prepare scientific notation metadata.
|
||
|
if self.exp_prec:
|
||
|
value, exp, exp_sign = self.scientific_notation_elements(value, locale)
|
||
|
|
||
|
# Adjust the precision of the fractional part and force it to the
|
||
|
# currency's if necessary.
|
||
|
if force_frac:
|
||
|
# TODO (3.x?): Remove this parameter
|
||
|
warnings.warn(
|
||
|
'The force_frac parameter to NumberPattern.apply() is deprecated.',
|
||
|
DeprecationWarning,
|
||
|
stacklevel=2,
|
||
|
)
|
||
|
frac_prec = force_frac
|
||
|
elif currency and currency_digits:
|
||
|
frac_prec = (get_currency_precision(currency), ) * 2
|
||
|
else:
|
||
|
frac_prec = self.frac_prec
|
||
|
|
||
|
# Bump decimal precision to the natural precision of the number if it
|
||
|
# exceeds the one we're about to use. This adaptative precision is only
|
||
|
# triggered if the decimal quantization is disabled or if a scientific
|
||
|
# notation pattern has a missing mandatory fractional part (as in the
|
||
|
# default '#E0' pattern). This special case has been extensively
|
||
|
# discussed at https://github.com/python-babel/babel/pull/494#issuecomment-307649969 .
|
||
|
if not decimal_quantization or (self.exp_prec and frac_prec == (0, 0)):
|
||
|
frac_prec = (frac_prec[0], max([frac_prec[1], get_decimal_precision(value)]))
|
||
|
|
||
|
# Render scientific notation.
|
||
|
if self.exp_prec:
|
||
|
number = ''.join([
|
||
|
self._quantize_value(value, locale, frac_prec, group_separator),
|
||
|
get_exponential_symbol(locale),
|
||
|
exp_sign, # type: ignore # exp_sign is always defined here
|
||
|
self._format_int(str(exp), self.exp_prec[0], self.exp_prec[1], locale) # type: ignore # exp is always defined here
|
||
|
])
|
||
|
|
||
|
# Is it a significant digits pattern?
|
||
|
elif '@' in self.pattern:
|
||
|
text = self._format_significant(value,
|
||
|
self.int_prec[0],
|
||
|
self.int_prec[1])
|
||
|
a, sep, b = text.partition(".")
|
||
|
number = self._format_int(a, 0, 1000, locale)
|
||
|
if sep:
|
||
|
number += get_decimal_symbol(locale) + b
|
||
|
|
||
|
# A normal number pattern.
|
||
|
else:
|
||
|
number = self._quantize_value(value, locale, frac_prec, group_separator)
|
||
|
|
||
|
retval = ''.join([
|
||
|
self.prefix[is_negative],
|
||
|
number if self.number_pattern != '' else '',
|
||
|
self.suffix[is_negative]])
|
||
|
|
||
|
if '¤' in retval and currency is not None:
|
||
|
retval = retval.replace('¤¤¤', get_currency_name(currency, value, locale))
|
||
|
retval = retval.replace('¤¤', currency.upper())
|
||
|
retval = retval.replace('¤', get_currency_symbol(currency, locale))
|
||
|
|
||
|
# remove single quotes around text, except for doubled single quotes
|
||
|
# which are replaced with a single quote
|
||
|
retval = re.sub(r"'([^']*)'", lambda m: m.group(1) or "'", retval)
|
||
|
|
||
|
return retval
|
||
|
|
||
|
#
|
||
|
# This is one tricky piece of code. The idea is to rely as much as possible
|
||
|
# on the decimal module to minimize the amount of code.
|
||
|
#
|
||
|
# Conceptually, the implementation of this method can be summarized in the
|
||
|
# following steps:
|
||
|
#
|
||
|
# - Move or shift the decimal point (i.e. the exponent) so the maximum
|
||
|
# amount of significant digits fall into the integer part (i.e. to the
|
||
|
# left of the decimal point)
|
||
|
#
|
||
|
# - Round the number to the nearest integer, discarding all the fractional
|
||
|
# part which contained extra digits to be eliminated
|
||
|
#
|
||
|
# - Convert the rounded integer to a string, that will contain the final
|
||
|
# sequence of significant digits already trimmed to the maximum
|
||
|
#
|
||
|
# - Restore the original position of the decimal point, potentially
|
||
|
# padding with zeroes on either side
|
||
|
#
|
||
|
def _format_significant(self, value: decimal.Decimal, minimum: int, maximum: int) -> str:
|
||
|
exp = value.adjusted()
|
||
|
scale = maximum - 1 - exp
|
||
|
digits = str(value.scaleb(scale).quantize(decimal.Decimal(1)))
|
||
|
if scale <= 0:
|
||
|
result = digits + '0' * -scale
|
||
|
else:
|
||
|
intpart = digits[:-scale]
|
||
|
i = len(intpart)
|
||
|
j = i + max(minimum - i, 0)
|
||
|
result = "{intpart}.{pad:0<{fill}}{fracpart}{fracextra}".format(
|
||
|
intpart=intpart or '0',
|
||
|
pad='',
|
||
|
fill=-min(exp + 1, 0),
|
||
|
fracpart=digits[i:j],
|
||
|
fracextra=digits[j:].rstrip('0'),
|
||
|
).rstrip('.')
|
||
|
return result
|
||
|
|
||
|
def _format_int(self, value: str, min: int, max: int, locale: Locale | str | None) -> str:
|
||
|
width = len(value)
|
||
|
if width < min:
|
||
|
value = '0' * (min - width) + value
|
||
|
gsize = self.grouping[0]
|
||
|
ret = ''
|
||
|
symbol = get_group_symbol(locale)
|
||
|
while len(value) > gsize:
|
||
|
ret = symbol + value[-gsize:] + ret
|
||
|
value = value[:-gsize]
|
||
|
gsize = self.grouping[1]
|
||
|
return value + ret
|
||
|
|
||
|
def _quantize_value(self, value: decimal.Decimal, locale: Locale | str | None, frac_prec: tuple[int, int], group_separator: bool) -> str:
|
||
|
# If the number is +/-Infinity, we can't quantize it
|
||
|
if value.is_infinite():
|
||
|
return get_infinity_symbol(locale)
|
||
|
quantum = get_decimal_quantum(frac_prec[1])
|
||
|
rounded = value.quantize(quantum)
|
||
|
a, sep, b = f"{rounded:f}".partition(".")
|
||
|
integer_part = a
|
||
|
if group_separator:
|
||
|
integer_part = self._format_int(a, self.int_prec[0], self.int_prec[1], locale)
|
||
|
number = integer_part + self._format_frac(b or '0', locale, frac_prec)
|
||
|
return number
|
||
|
|
||
|
def _format_frac(self, value: str, locale: Locale | str | None, force_frac: tuple[int, int] | None = None) -> str:
|
||
|
min, max = force_frac or self.frac_prec
|
||
|
if len(value) < min:
|
||
|
value += ('0' * (min - len(value)))
|
||
|
if max == 0 or (min == 0 and int(value) == 0):
|
||
|
return ''
|
||
|
while len(value) > min and value[-1] == '0':
|
||
|
value = value[:-1]
|
||
|
return get_decimal_symbol(locale) + value
|