|
""" |
|
Convert time to words |
|
TODO: fix zeros eg. 22:00 |
|
""" |
|
|
|
import re |
|
|
|
PATTERNS = [ |
|
r"(\d{1,2})([apm]{2})", |
|
r"(\d{1,2}):(\d{2})", |
|
] |
|
|
|
|
|
def extract_time(match): |
|
""" |
|
Extract hour and minute from a string in HH:MM or AM/PM format |
|
and return as integers. |
|
""" |
|
time_str = match.group(0).lower().strip() |
|
|
|
|
|
match = re.match(r"(\d{1,2}):(\d{2})", time_str) |
|
if match: |
|
h = int(match.group(1)) |
|
m = int(match.group(2)) |
|
return f"{convert_to_word(h, m)}" |
|
|
|
|
|
match = re.match(r"(\d{1,2})([apm]{2})", time_str) |
|
if match: |
|
h = int(match.group(1)) |
|
period = match.group(2) |
|
|
|
|
|
if period == "am" and h == 12: |
|
h = 0 |
|
elif period == "pm" and h != 12: |
|
h += 12 |
|
return f"{convert_to_word(h, 0)}" |
|
|
|
return match.group(0) |
|
|
|
|
|
def convert_to_word(h, m): |
|
hours = [ |
|
"אֶפֶס", |
|
"אַחַת", |
|
"שְׁנַיִם", |
|
"שָׁלוֹשׁ", |
|
"אַרְבַּע", |
|
"חָמֵשׁ", |
|
"שֵׁשׁ", |
|
"שֶׁבַע", |
|
"שְׁמוֹנֵה", |
|
"תֵּשַׁע", |
|
"עֵשֵׂר", |
|
"אַחַת עֶשְׂרֵה", |
|
"שְׁתֵּים עֶשְׂרֵה", |
|
] |
|
|
|
tens = ["", "עֵשֵׂר", "עֶשְׂרִים", "שְׁלוֹשִׁים", "אַרְבָּעִים", "חֲמִשִּׁים"] |
|
|
|
ten_to_twenty = [ |
|
"עֵשֵׂר", |
|
"אַחַת עֶשְׂרֵה", |
|
"שְׁתֵּים עֶשְׂרֵה", |
|
"שְׁלוֹשׁ עֶשְׂרֵה", |
|
"אַרְבַּע עֶשְׂרֵה", |
|
"חֲמֵשׁ עֶשְׂרֵה", |
|
"שֵׁשׁ עֶשְׂרֵה", |
|
"שְׁבַע עֶשְׂרֵה", |
|
"שְׁמוֹנֶה עֶשְׂרֵה", |
|
"תְּשַׁע עֶשְׂרֵה", |
|
] |
|
|
|
vocab = {"minutes": "דַּקּוֹת", "and": "וֵ", "shtey": "שְׁתֵּי"} |
|
|
|
|
|
if h == 0: |
|
h = 12 |
|
|
|
elif h > 12: |
|
h -= 12 |
|
|
|
if m == 0: |
|
return f"{hours[h]}" |
|
|
|
elif 1 <= m <= 9: |
|
minute_word = ( |
|
vocab["shtey"] if m == 2 else hours[m] |
|
) |
|
return f"{hours[h]} {vocab['and']}{minute_word} {vocab['minutes']}" |
|
|
|
elif 10 <= m <= 19: |
|
return f"{hours[h]} {vocab['and']}{ten_to_twenty[m - 10]} {vocab['minutes']}" |
|
|
|
else: |
|
tens_part = f"{vocab['and']}{tens[m // 10]}" |
|
units_part = f"{vocab['and']}{hours[m % 10]}" if m % 10 != 0 else "" |
|
return f"{hours[h]} {tens_part} {units_part} {vocab['minutes']}".strip() |
|
|
|
|
|
def time_to_word(text: str): |
|
return re.sub("|".join(PATTERNS), extract_time, text) |
|
|