Skip to content

Commit

Permalink
Add Udmurt (udm) translation literals (#381)
Browse files Browse the repository at this point in the history
  • Loading branch information
codemurt authored Nov 8, 2024
1 parent a53bba6 commit 39a68da
Show file tree
Hide file tree
Showing 2 changed files with 25 additions and 0 deletions.
23 changes: 23 additions & 0 deletions src/lighteval/tasks/templates/utils/translation_literals.py
Original file line number Diff line number Diff line change
Expand Up @@ -865,6 +865,29 @@ def __getattribute__(self, name: str) -> str:
colon=":",
),
Language.TURKMEN: TranslationLiterals(language=Language.TURKMEN),
# Udmurt (udm) translation literals.
Language.UDMURT: TranslationLiterals(
language=Language.UDMURT,
question_word="юан",
answer="валэктон",
confirmation_word="озьы-а",
yes="бен",
no="ӧвӧл",
also="озьы ик",
cause_word="малы ке шуоно",
effect_word="соин ик",
true="шонерлык",
false="пӧяськон",
neither="мукет",
or_word="яке",
# Punctuation and spacing: ASCII marks, with a single space between words and sentences.
full_stop=".",
comma=",",
question_mark="?",
exclamation_mark="!",
word_space=" ",
sentence_space=" ",
colon=":",
# Answer-option labels follow Cyrillic alphabet order (not Latin A-F).
indices=["А", "Б", "В", "Г", "Д", "Е"],
),
Language.UKRAINIAN: TranslationLiterals(
language=Language.UKRAINIAN,
question_word="питання",
Expand Down
2 changes: 2 additions & 0 deletions src/lighteval/utils/language.py
Original file line number Diff line number Diff line change
Expand Up @@ -121,6 +121,7 @@ class Language(Enum):
CEBUANO = "ceb"
WAR = "war"
SHAN = "shn"
UDMURT = "udm"


# This mapping was created for Belebele; it converts iso_639_3 individual codes to iso_639_3 macro codes
Expand Down Expand Up @@ -232,6 +233,7 @@ class Language(Enum):
"ars": Language.ARABIC,
"bul": Language.BULGARIAN,
"est": Language.ESTONIAN,
"udm": Language.UDMURT,
# 'hau': Language.HAUSA,
"ind": Language.INDONESIAN,
# 'kea': Language.KABUVERDIANU,
Expand Down

0 comments on commit 39a68da

Please sign in to comment.