diff --git a/src/lighteval/tasks/templates/utils/translation_literals.py b/src/lighteval/tasks/templates/utils/translation_literals.py
index 7537c38f..b00957ac 100644
--- a/src/lighteval/tasks/templates/utils/translation_literals.py
+++ b/src/lighteval/tasks/templates/utils/translation_literals.py
@@ -865,6 +865,29 @@ def __getattribute__(self, name: str) -> str:
         colon=":",
     ),
     Language.TURKMEN: TranslationLiterals(language=Language.TURKMEN),
+    Language.UDMURT: TranslationLiterals(
+        language=Language.UDMURT,
+        question_word="юан",
+        answer="валэктон",
+        confirmation_word="озьы-а",
+        yes="бен",
+        no="ӧвӧл",
+        also="озьы ик",
+        cause_word="малы ке шуоно",
+        effect_word="соин ик",
+        true="шонерлык",
+        false="пӧяськон",
+        neither="мукет",
+        or_word="яке",
+        full_stop=".",
+        comma=",",
+        question_mark="?",
+        exclamation_mark="!",
+        word_space=" ",
+        sentence_space=" ",
+        colon=":",
+        indices=["А", "Б", "В", "Г", "Д", "Е"],
+    ),
     Language.UKRAINIAN: TranslationLiterals(
         language=Language.UKRAINIAN,
         question_word="питання",
diff --git a/src/lighteval/utils/language.py b/src/lighteval/utils/language.py
index 1e9707a3..e6e53984 100644
--- a/src/lighteval/utils/language.py
+++ b/src/lighteval/utils/language.py
@@ -121,6 +121,7 @@ class Language(Enum):
     CEBUANO = "ceb"
     WAR = "war"
     SHAN = "shn"
+    UDMURT = "udm"
 
 
 # This mapping was created for beleble, it converts iso_639_3 individual codes to iso_639_3 macro codes
@@ -232,6 +233,7 @@ class Language(Enum):
     "ars": Language.ARABIC,
     "bul": Language.BULGARIAN,
     "est": Language.ESTONIAN,
+    "udm": Language.UDMURT,
     # 'hau': Language.HAUSA,
     "ind": Language.INDONESIAN,
     # 'kea': Language.KABUVERDIANU,