# Scraped from https://huggingface.co/Helsinki-NLP | |
# Scrape code: | |
# console.log(Array.from(document.getElementsByClassName("text-md truncate font-mono text-black dark:group-hover/repo:text-yellow-500 group-hover/repo:text-indigo-600 text-smd")).map(element => element.innerHTML)); | |
helsinki_models = [ | |
"Helsinki-NLP/opus-mt-euq-en", | |
"Helsinki-NLP/opus-mt-eu-ru", | |
"Helsinki-NLP/opus-mt-eu-es", | |
"Helsinki-NLP/opus-mt-eu-en", | |
"Helsinki-NLP/opus-mt-eu-de", | |
"Helsinki-NLP/opus-mt-en-euq", | |
"Helsinki-NLP/opus-mt-en-euq", | |
"Helsinki-NLP/opus-mt-en-eu", | |
"Helsinki-NLP/opus-mt-de-eu", | |
"Helsinki-NLP/opus-mt-ru-eu", | |
"Helsinki-NLP/opus-mt-es-eu" | |
] | |
def get_clearly_formatted_langauge_directions(): | |
# Clearly formatted language directions only | |
# Helsinki-NLP/opus-mt-tc-base-bat-zle is ignored | |
# Helsinki-NLP/opus-mt-tc-fr-en is accepted due to clarity of source language being fr and target language being en | |
language_directions = [model.split("Helsinki-NLP/opus-mt-")[1] for model in helsinki_models | |
if (len(model.split("-"))<6 and | |
"opus-mt" in model and | |
len(model.split("_")) == 1) | |
and len(model) < len("Helsinki-NLP/opus-mt-src-trg")] | |
return language_directions |