diff --git a/numbers/src/main/resources/config/sl-si/and.word b/numbers/src/main/resources/config/sl-si/and.word new file mode 100644 index 0000000..f087d89 --- /dev/null +++ b/numbers/src/main/resources/config/sl-si/and.word @@ -0,0 +1 @@ +in \ No newline at end of file diff --git a/numbers/src/main/resources/config/sl-si/date_time.json b/numbers/src/main/resources/config/sl-si/date_time.json new file mode 100644 index 0000000..9da33e4 --- /dev/null +++ b/numbers/src/main/resources/config/sl-si/date_time.json @@ -0,0 +1,123 @@ +{ + "decade_format": { + "1": {"match": "^0$", "format": ""}, + "2": {"match": "^\\d$", "format": "{x}"}, + "3": {"match": "^1\\d$", "format": "{xx}"}, + "4": {"match": "^\\d0$", "format": "{x0}"}, + "5": {"match": "^[2-9]\\d$", "format": "{x}in{x0}"}, + "default": "{number}" + }, + "hundreds_format": { + "1": {"match": "^\\d{1,2}$", "format": "{formatted_decade}"}, + "2": {"match": "^1\\d{2}$", "format": "sto {formatted_decade}"}, + "3": {"match": "^2\\d{2}$", "format": "dvesto {formatted_decade}"}, + "4": {"match": "^\\d{3}$", "format": "{x_in_x00}sto {formatted_decade}"}, + "default": "{formatted_decade}" + }, + "thousand_format": { + "1": {"match": "^\\d{1,3}$", "format": "{formatted_hundreds}"}, + "2": {"match": "^1\\d{3}$", "format": "tisoč {formatted_hundreds}"}, + "default": "{x_in_x000} tisoč {formatted_hundreds}" + }, + "year_format": { + "default": "{formatted_thousand} {bc}", + "bc": "pr. n. št." 
+ }, + "date_format": { + "date_full": "{weekday}, {day} {month} {formatted_year}", + "date_full_no_year": "{weekday}, {day} {month}", + "date_full_no_year_month": "{weekday}, {day}", + "today": "danes", + "tomorrow": "jutri", + "yesterday": "včeraj" + }, + "date_time_format": { + "date_time": "{formatted_date}, ob {formatted_time}" + }, + "weekday": { + "0": "ponedeljek", + "1": "torek", + "2": "sreda", + "3": "četrtek", + "4": "petek", + "5": "sobota", + "6": "nedelja" + }, + "date": { + "1": "prvi", + "2": "drugi", + "3": "tretji", + "4": "četrti", + "5": "peti", + "6": "šesti", + "7": "sedmi", + "8": "osmi", + "9": "deveti", + "10": "deseti", + "11": "enajsti", + "12": "dvanajsti", + "13": "trinajsti", + "14": "štirinajsti", + "15": "petnajsti", + "16": "šestnajsti", + "17": "sedemnajsti", + "18": "osemnajsti", + "19": "devetnajsti", + "20": "dvajseti", + "21": "enaindvajseti", + "22": "dvaindvajseti", + "23": "triindvajseti", + "24": "štiriindvajseti", + "25": "petindvajseti", + "26": "šestindvajseti", + "27": "sedemindvajseti", + "28": "osemindvajseti", + "29": "devetindvajseti", + "30": "trideseti", + "31": "enaintrideseti" + }, + "month": { + "1": "januar", + "2": "februar", + "3": "marec", + "4": "april", + "5": "maj", + "6": "junij", + "7": "julij", + "8": "avgust", + "9": "september", + "10": "oktober", + "11": "november", + "12": "december" + }, + "number": { + "0": "nič", + "1": "ena", + "2": "dva", + "3": "tri", + "4": "štiri", + "5": "pet", + "6": "šest", + "7": "sedem", + "8": "osem", + "9": "devet", + "10": "deset", + "11": "enajst", + "12": "dvanajst", + "13": "trinajst", + "14": "štirinajst", + "15": "petnajst", + "16": "šestnajst", + "17": "sedemnajst", + "18": "osemnajst", + "19": "devetnajst", + "20": "dvajset", + "30": "trideset", + "40": "štirideset", + "50": "petdeset", + "60": "šestdeset", + "70": "sedemdeset", + "80": "osemdeset", + "90": "devetdeset" + } +} diff --git a/numbers/src/main/resources/config/sl-si/date_time_test.json 
b/numbers/src/main/resources/config/sl-si/date_time_test.json new file mode 100644 index 0000000..7bebae0 --- /dev/null +++ b/numbers/src/main/resources/config/sl-si/date_time_test.json @@ -0,0 +1,43 @@ +{ + "test_nice_year": { + "1": {"datetime_param": "1, 1, 31, 13, 22, 3", "bc": "True", "assertEqual": "ena pr. n. št." }, + "2": {"datetime_param": "10, 1, 31, 13, 22, 3", "bc": "True", "assertEqual": "deset pr. n. št." }, + "3": {"datetime_param": "92, 1, 31, 13, 22, 3", "bc": "True", "assertEqual": "dvaindevetdeset pr. n. št." }, + "4": {"datetime_param": "803, 1, 31, 13, 22, 3", "bc": "None", "assertEqual": "osemsto tri" }, + "5": {"datetime_param": "811, 1, 31, 13, 22, 3", "bc": "None", "assertEqual": "osemsto enajst" }, + "6": {"datetime_param": "454, 1, 31, 13, 22, 3", "bc": "None", "assertEqual": "štiristo štiriinpetdeset" }, + "7": {"datetime_param": "1005, 1, 31, 13, 22, 3", "bc": "False", "assertEqual": "tisoč pet" }, + "8": {"datetime_param": "1012, 1, 31, 13, 22, 3", "bc": "False", "assertEqual": "tisoč dvanajst" }, + "9": {"datetime_param": "1046, 1, 31, 13, 22, 3", "bc": "False", "assertEqual": "tisoč šestinštirideset" }, + "10": {"datetime_param": "1807, 1, 31, 13, 22, 3", "bc": "None", "assertEqual": "tisoč osemsto sedem" }, + "11": {"datetime_param": "1717, 1, 31, 13, 22, 3", "bc": "None", "assertEqual": "tisoč sedemsto sedemnajst" }, + "12": {"datetime_param": "1988, 1, 31, 13, 22, 3", "bc": "None", "assertEqual": "tisoč devetsto oseminosemdeset"}, + "13": {"datetime_param": "2009, 1, 31, 13, 22, 3", "bc": "None", "assertEqual": "dva tisoč devet"}, + "14": {"datetime_param": "2018, 1, 31, 13, 22, 3", "bc": "None", "assertEqual": "dva tisoč osemnajst"}, + "15": {"datetime_param": "2021, 1, 31, 13, 22, 3", "bc": "None", "assertEqual": "dva tisoč enaindvajset"}, + "16": {"datetime_param": "2030, 1, 31, 13, 22, 3", "bc": "None", "assertEqual": "dva tisoč trideset"}, + "17": {"datetime_param": "2100, 1, 31, 13, 22, 3", "bc": "False", "assertEqual": 
"dva tisoč sto" }, + "18": {"datetime_param": "1000, 1, 31, 13, 22, 3", "bc": "None", "assertEqual": "tisoč" }, + "19": {"datetime_param": "2000, 1, 31, 13, 22, 3", "bc": "None", "assertEqual": "dva tisoč" }, + "20": {"datetime_param": "3120, 1, 31, 13, 22, 3", "bc": "True", "assertEqual": "tri tisoč sto dvajset pr. n. št." }, + "21": {"datetime_param": "3241, 1, 31, 13, 22, 3", "bc": "True", "assertEqual": "tri tisoč dvesto enainštirideset pr. n. št." }, + "22": {"datetime_param": "5200, 1, 31, 13, 22, 3", "bc": "False", "assertEqual": "pet tisoč dvesto" }, + "23": {"datetime_param": "1100, 1, 31, 13, 22, 3", "bc": "False", "assertEqual": "tisoč sto" }, + "24": {"datetime_param": "2100, 1, 31, 13, 22, 3", "bc": "False", "assertEqual": "dva tisoč sto" } + }, + "test_nice_date": { + "1": {"datetime_param": "2017, 1, 31, 0, 2, 3", "now": "None", "assertEqual": "torek, enaintrideseti januar dva tisoč sedemnajst"}, + "2": {"datetime_param": "2018, 2, 4, 0, 2, 3", "now": "2017, 1, 1, 0, 2, 3", "assertEqual": "nedelja, četrti februar dva tisoč osemnajst"}, + "3": {"datetime_param": "2018, 2, 4, 0, 2, 3", "now": "2018, 1, 1, 0, 2, 3", "assertEqual": "nedelja, četrti februar"}, + "4": {"datetime_param": "2018, 2, 4, 0, 2, 3", "now": "2018, 2, 1, 0, 2, 3", "assertEqual": "nedelja, četrti"}, + "5": {"datetime_param": "2018, 2, 4, 0, 2, 3", "now": "2018, 2, 3, 0, 2, 3", "assertEqual": "jutri"}, + "6": {"datetime_param": "2018, 2, 4, 0, 2, 3", "now": "2018, 2, 4, 0, 2, 3", "assertEqual": "danes"}, + "7": {"datetime_param": "2018, 2, 4, 0, 2, 3", "now": "2018, 2, 5, 0, 2, 3", "assertEqual": "včeraj"}, + "8": {"datetime_param": "2018, 2, 4, 0, 2, 3", "now": "2018, 2, 6, 0, 2, 3", "assertEqual": "nedelja, četrti februar"}, + "9": {"datetime_param": "2018, 2, 4, 0, 2, 3", "now": "2019, 2, 6, 0, 2, 3", "assertEqual": "nedelja, četrti februar dva tisoč osemnajst"} + }, + "test_nice_date_time": { + "1": {"datetime_param": "2017, 1, 31, 13, 22, 3", "now": "None", "use_24hour": 
"False", "use_ampm": "True", "assertEqual": "torek, enaintrideseti januar dva tisoč sedemnajst, ob dvaindvajset čez ena p.m."}, + "2": {"datetime_param": "2017, 1, 31, 13, 22, 3", "now": "None", "use_24hour": "True", "use_ampm": "False", "assertEqual": "torek, enaintrideseti januar dva tisoč sedemnajst, ob trinajst dvaindvajset"} + } +} diff --git a/numbers/src/main/resources/config/sl-si/day.word b/numbers/src/main/resources/config/sl-si/day.word new file mode 100644 index 0000000..dc816d9 --- /dev/null +++ b/numbers/src/main/resources/config/sl-si/day.word @@ -0,0 +1 @@ +dan \ No newline at end of file diff --git a/numbers/src/main/resources/config/sl-si/days.word b/numbers/src/main/resources/config/sl-si/days.word new file mode 100644 index 0000000..7b0e614 --- /dev/null +++ b/numbers/src/main/resources/config/sl-si/days.word @@ -0,0 +1 @@ +dni \ No newline at end of file diff --git a/numbers/src/main/resources/config/sl-si/hour.word b/numbers/src/main/resources/config/sl-si/hour.word new file mode 100644 index 0000000..fa6c4e1 --- /dev/null +++ b/numbers/src/main/resources/config/sl-si/hour.word @@ -0,0 +1 @@ +ura \ No newline at end of file diff --git a/numbers/src/main/resources/config/sl-si/hours.word b/numbers/src/main/resources/config/sl-si/hours.word new file mode 100644 index 0000000..873003f --- /dev/null +++ b/numbers/src/main/resources/config/sl-si/hours.word @@ -0,0 +1 @@ +ur \ No newline at end of file diff --git a/numbers/src/main/resources/config/sl-si/minute.word b/numbers/src/main/resources/config/sl-si/minute.word new file mode 100644 index 0000000..02810df --- /dev/null +++ b/numbers/src/main/resources/config/sl-si/minute.word @@ -0,0 +1 @@ +minuta \ No newline at end of file diff --git a/numbers/src/main/resources/config/sl-si/minutes.word b/numbers/src/main/resources/config/sl-si/minutes.word new file mode 100644 index 0000000..4b98366 --- /dev/null +++ b/numbers/src/main/resources/config/sl-si/minutes.word @@ -0,0 +1 @@ +minut \ No newline 
at end of file diff --git a/numbers/src/main/resources/config/sl-si/normalize.json b/numbers/src/main/resources/config/sl-si/normalize.json new file mode 100644 index 0000000..a0892fd --- /dev/null +++ b/numbers/src/main/resources/config/sl-si/normalize.json @@ -0,0 +1,44 @@ +{ + "lowercase": false, + "numbers_to_digits": true, + "expand_contractions": false, + "remove_symbols": false, + "remove_accents": false, + "remove_articles": false, + "remove_stopwords": false, + "contractions": {}, + "word_replacements": {}, + "number_replacements": { + "nič": "0", + "ena": "1", + "dve": "2", + "dva": "2", + "tri": "3", + "štiri": "4", + "pet": "5", + "šest": "6", + "sedem": "7", + "osem": "8", + "devet": "9", + "deset": "10", + "enajst": "11", + "dvanajst": "12", + "trinajst": "13", + "štirinajst": "14", + "petnajst": "15", + "šestnajst": "16", + "sedemnajst": "17", + "osemnajst": "18", + "devetnajst": "19", + "dvajset": "20", + "trideset": "30", + "štirideset": "40", + "petdeset": "50", + "šestdeset": "60", + "sedemdeset": "70", + "osemdeset": "80", + "devetdeset": "90" + }, + "stopwords": [], + "articles": [] +} \ No newline at end of file diff --git a/numbers/src/main/resources/config/sl-si/or.word b/numbers/src/main/resources/config/sl-si/or.word new file mode 100644 index 0000000..784f900 --- /dev/null +++ b/numbers/src/main/resources/config/sl-si/or.word @@ -0,0 +1 @@ +ali \ No newline at end of file diff --git a/numbers/src/main/resources/config/sl-si/second.word b/numbers/src/main/resources/config/sl-si/second.word new file mode 100644 index 0000000..ef210e2 --- /dev/null +++ b/numbers/src/main/resources/config/sl-si/second.word @@ -0,0 +1 @@ +sekunda \ No newline at end of file diff --git a/numbers/src/main/resources/config/sl-si/seconds.word b/numbers/src/main/resources/config/sl-si/seconds.word new file mode 100644 index 0000000..300f8e5 --- /dev/null +++ b/numbers/src/main/resources/config/sl-si/seconds.word @@ -0,0 +1 @@ +sekund \ No newline at end of file