Skip to content

Commit

Permalink
Added support for Esperanto numbers.
Browse files Browse the repository at this point in the history
  • Loading branch information
OpesMentis authored and KommuSoft committed Aug 18, 2022
1 parent 44a2b7c commit 75eec68
Show file tree
Hide file tree
Showing 3 changed files with 321 additions and 0 deletions.
1 change: 1 addition & 0 deletions num2words/__init__.py
Original file line number Diff line number Diff line change
Expand Up @@ -38,6 +38,7 @@
'fr_DZ': lang_FR_DZ.Num2Word_FR_DZ(),
'de': lang_DE.Num2Word_DE(),
'fi': lang_FI.Num2Word_FI(),
'eo': lang_EO.Num2Word_EO(),
'es': lang_ES.Num2Word_ES(),
'es_CO': lang_ES_CO.Num2Word_ES_CO(),
'es_NI': lang_ES_NI.Num2Word_ES_NI(),
Expand Down
130 changes: 130 additions & 0 deletions num2words/lang_EO.py
Original file line number Diff line number Diff line change
@@ -0,0 +1,130 @@
# -*- coding: utf-8 -*-
# Copyright (c) 2021, Savoir-faire Linux inc. All Rights Reserved.

# This library is free software; you can redistribute it and/or
# modify it under the terms of the GNU Lesser General Public
# License as published by the Free Software Foundation; either
# version 2.1 of the License, or (at your option) any later version.
# This library is distributed in the hope that it will be useful,
# but WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
# Lesser General Public License for more details.
# You should have received a copy of the GNU Lesser General Public
# License along with this library; if not, write to the Free Software
# Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston,
# MA 02110-1301 USA

from __future__ import print_function, unicode_literals

from .base import Num2Word_Base


class Num2Word_EO(Num2Word_Base):
CURRENCY_FORMS = {
"EUR": (("eŭro", "eŭroj"), ("centimo", "centimoj")),
"USD": (("dolaro", "dolaroj"), ("cendo", "cendoj")),
"FRF": (("franko", "frankoj"), ("centimo", "centimoj")),
"GBP": (("pundo", "pundoj"), ("penco", "pencoj")),
"CNY": (("juano", "juanoj"), ("feno", "fenoj")),
}

GIGA_SUFFIX = "iliardo"
MEGA_SUFFIX = "iliono"

def set_high_numwords(self, high):
cap = 3 + 6 * len(high)

for word, n in zip(high, range(cap, 3, -6)):
if self.GIGA_SUFFIX:
self.cards[10 ** n] = word + self.GIGA_SUFFIX

if self.MEGA_SUFFIX:
self.cards[10 ** (n - 3)] = word + self.MEGA_SUFFIX

def gen_high_numwords(self, units, tens, lows):
out = [u + t for t in tens for u in units]
out.reverse()
return out + lows

def setup(self):
lows = ["naŭ", "ok", "sep", "ses", "kvin", "kvar", "tr", "b", "m"]
units = ["", "un", "duo", "tre", "kvatuor",
"kvin", "seks", "septen", "okto", "novem"]
tens = ["dek", "vigint", "trigint", "kvadragint", "kvinkvagint",
"seksagint", "septuagint", "oktogint", "nonagint"]

self.high_numwords = ["cent"] + self.gen_high_numwords(units, tens,
lows)

self.negword = "minus "
self.pointword = "komo"
self.errmsg_nonnum = u"Sole nombroj povas esti konvertita en vortojn."
self.errmsg_toobig = (
u"Tro granda nombro por esti konvertita en vortojn."
)
self.exclude_title = ["kaj", "komo", "minus"]
self.mid_numwords = [(1000, "mil"), (100, "cent"), (90, "naŭdek"),
(80, "okdek"), (70, "sepdek"), (60, "sesdek"),
(50, "kvindek"), (40, "kvardek"), (30, "tridek")]
self.low_numwords = ["dudek", "dek naŭ", "dek ok", "dek sep",
"dek ses", "dek kvin", "dek kvar", "dek tri",
"dek du", "dek unu", "dek", "naŭ", "ok", "sep",
"ses", "kvin", "kvar", "tri", "du", "unu", "nul"]
self.ords = {
"unu": "unua",
"du": "dua",
"tri": "tria",
"kvar": "kvara",
"kvin": "kvina",
"ses": "sesa",
"sep": "sepa",
"ok": "oka",
"naŭ": "naŭa",
"dek": "deka"
}

def merge(self, curr, next):
ctext, cnum, ntext, nnum = curr + next
if cnum == 1 and nnum < 1000000:
return next

if nnum >= 10**6 and cnum > 1:
return ("%s %sj" % (ctext, ntext), cnum + nnum)

if nnum == 100:
return ("%s%s" % (ctext, ntext), cnum + nnum)

return ("%s %s" % (ctext, ntext), cnum + nnum)

def to_ordinal(self, value):
self.verify_ordinal(value)
word = self.to_cardinal(value)
for src, repl in self.ords.items():
if word.endswith(src):
word = word[:-len(src)] + repl
return word

if word.endswith("o"):
word = word[:-1] + "a"
elif word.endswith("oj"):
word = word[:-2] + "a"
else:
word = word + "a"
return word

def to_ordinal_num(self, value):
self.verify_ordinal(value)
out = str(value)
out += "a"
return out

def to_currency(self, val, currency="EUR", cents=True, separator=" kaj",
adjective=False):
result = super(Num2Word_EO, self).to_currency(
val, currency=currency, cents=cents, separator=separator,
adjective=adjective)
return result

def pluralize(self, n, forms):
form = 0 if n <= 1 else 1
return forms[form]
190 changes: 190 additions & 0 deletions tests/test_eo.py
Original file line number Diff line number Diff line change
@@ -0,0 +1,190 @@
# -*- coding: utf-8 -*-
# Copyright (c) 2021, Savoir-faire Linux inc. All Rights Reserved.

# This library is free software; you can redistribute it and/or
# modify it under the terms of the GNU Lesser General Public
# License as published by the Free Software Foundation; either
# version 2.1 of the License, or (at your option) any later version.
# This library is distributed in the hope that it will be useful,
# but WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
# Lesser General Public License for more details.
# You should have received a copy of the GNU Lesser General Public
# License along with this library; if not, write to the Free Software
# Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston,
# MA 02110-1301 USA

from __future__ import unicode_literals

from unittest import TestCase

from num2words import num2words

TEST_CASES_CARDINAL = (
(1, "unu"),
(2, "du"),
(3, "tri"),
(5.5, "kvin komo kvin"),
(11, "dek unu"),
(12, "dek du"),
(16, "dek ses"),
(17.42, "dek sep komo kvar du"),
(19, "dek naŭ"),
(20, "dudek"),
(21, "dudek unu"),
(26, "dudek ses"),
(27.312, "dudek sep komo tri unu du"),
(28, "dudek ok"),
(30, "tridek"),
(31, "tridek unu"),
(40, "kvardek"),
(44, "kvardek kvar"),
(50, "kvindek"),
(53.486, "kvindek tri komo kvar ok ses"),
(55, "kvindek kvin"),
(60, "sesdek"),
(67, "sesdek sep"),
(70, "sepdek"),
(79, "sepdek naŭ"),
(89, "okdek naŭ"),
(95, "naŭdek kvin"),
(100, "cent"),
(101, "cent unu"),
(199, "cent naŭdek naŭ"),
(203, "ducent tri"),
(287, "ducent okdek sep"),
(300.42, "tricent komo kvar du"),
(356, "tricent kvindek ses"),
(400, "kvarcent"),
(434, "kvarcent tridek kvar"),
(578, "kvincent sepdek ok"),
(689, "sescent okdek naŭ"),
(729, "sepcent dudek naŭ"),
(894, "okcent naŭdek kvar"),
(999, "naŭcent naŭdek naŭ"),
(1000, "mil"),
(1001, "mil unu"),
(1097, "mil naŭdek sep"),
(1104, "mil cent kvar"),
(1243, "mil ducent kvardek tri"),
(2385, "du mil tricent okdek kvin"),
(3766, "tri mil sepcent sesdek ses"),
(4196, "kvar mil cent naŭdek ses"),
(4196.42, "kvar mil cent naŭdek ses komo kvar du"),
(5846, "kvin mil okcent kvardek ses"),
(6459, "ses mil kvarcent kvindek naŭ"),
(7232, "sep mil ducent tridek du"),
(8569, "ok mil kvincent sesdek naŭ"),
(9539, "naŭ mil kvincent tridek naŭ"),
(1000000, "unu miliono"),
(1000001, "unu miliono unu"),
(4000000, "kvar milionoj"),
(4000004, "kvar milionoj kvar"),
(4300000, "kvar milionoj tricent mil"),
(80000000, "okdek milionoj"),
(300000000, "tricent milionoj"),
(10000000000000, "dek bilionoj"),
(10000000000010, "dek bilionoj dek"),
(100000000000000, "cent bilionoj"),
(1000000000000000000, "unu triliono"),
(1000000000000000000000, "unu triliardo"),
(10000000000000000000000000, "dek kvarilionoj")
)

TEST_CASES_ORDINAL = (
(1, "unua"),
(8, "oka"),
(12, "dek dua"),
(14, "dek kvara"),
(28, "dudek oka"),
(100, "centa"),
(1000, "mila"),
(1000000, "unu miliona"),
(1000000000000000, "unu biliarda"),
(1000000000000000000, "unu triliona")
)

TEST_CASES_ORDINAL_NUM = (
(1, "1a"),
(8, "8a"),
(11, "11a"),
(12, "12a"),
(14, "14a"),
(21, "21a"),
(28, "28a"),
(100, "100a"),
(101, "101a"),
(1000, "1000a"),
(1000000, "1000000a")
)

TEST_CASES_TO_CURRENCY_EUR = (
(1.00, "unu eŭro kaj nul centimo"),
(2.01, "du eŭroj kaj unu centimo"),
(8.10, "ok eŭroj kaj dek centimoj"),
(12.26, "dek du eŭroj kaj dudek ses centimoj"),
(21.29, "dudek unu eŭroj kaj dudek naŭ centimoj"),
(81.25, "okdek unu eŭroj kaj dudek kvin centimoj"),
(100.00, "cent eŭroj kaj nul centimo"),
)

TEST_CASES_TO_CURRENCY_FRF = (
(1.00, "unu franko kaj nul centimo"),
(2.01, "du frankoj kaj unu centimo"),
(8.10, "ok frankoj kaj dek centimoj"),
(12.27, "dek du frankoj kaj dudek sep centimoj"),
(21.29, "dudek unu frankoj kaj dudek naŭ centimoj"),
(81.25, "okdek unu frankoj kaj dudek kvin centimoj"),
(100.00, "cent frankoj kaj nul centimo"),
)

TEST_CASES_TO_CURRENCY_USD = (
(1.00, "unu dolaro kaj nul cendo"),
(2.01, "du dolaroj kaj unu cendo"),
(8.10, "ok dolaroj kaj dek cendoj"),
(12.26, "dek du dolaroj kaj dudek ses cendoj"),
(21.29, "dudek unu dolaroj kaj dudek naŭ cendoj"),
(81.25, "okdek unu dolaroj kaj dudek kvin cendoj"),
(100.00, "cent dolaroj kaj nul cendo"),
)


class Num2WordsEOTest(TestCase):
def test_number(self):
for test in TEST_CASES_CARDINAL:
self.assertEqual(num2words(test[0], lang="eo"), test[1])

def test_ordinal(self):
for test in TEST_CASES_ORDINAL:
self.assertEqual(
num2words(test[0], lang="eo", ordinal=True),
test[1]
)

def test_ordinal_num(self):
for test in TEST_CASES_ORDINAL_NUM:
self.assertEqual(
num2words(test[0], lang="eo", to="ordinal_num"),
test[1]
)

def test_currency_eur(self):
for test in TEST_CASES_TO_CURRENCY_EUR:
self.assertEqual(
num2words(test[0], lang="eo", to="currency", currency="EUR"),
test[1]
)

def test_currency_frf(self):
for test in TEST_CASES_TO_CURRENCY_FRF:
self.assertEqual(
num2words(test[0], lang="eo", to="currency", currency="FRF"),
test[1]
)

def test_currency_usd(self):
for test in TEST_CASES_TO_CURRENCY_USD:
self.assertEqual(
num2words(test[0], lang="eo", to="currency", currency="USD"),
test[1]
)

0 comments on commit 75eec68

Please sign in to comment.