! Morphological Transducer for Yiddish
!
! This header declares every multi-character symbol used by the lexicons
! further down: grammatical tags, the morpheme boundary, archiphonemes
! written as %{...%}, matched-feature flags written as %[...%], and Yiddish
! letters that are spelled with more than one code point.
!
! NOTE(review): in this copy each tag entry shows only a bare % escape
! followed by its description; the tag name itself is not visible here.
! Confirm the entries against the canonical file before compiling.

Multichar_Symbols

! Part of speech categories
% ! Noun
% ! Verb
% ! Auxiliary
% ! Determiner
% ! Pronoun
% ! Preposition
% ! Determiner
! NOTE(review): "Determiner" is described twice in this group - confirm
! whether the second entry is a duplicate or a different tag.
% ! Adverb
% ! Adjective
% ! Preadverb
% ! Coordinating conjunction
% ! Subordinating conjunction
% ! Proper noun

! types of pronouns, determiners, and adjectives
% ! personal
% ! personal possessive
% ! reflexive
% ! attributive ("prepositive")
% ! predicative ("postpositive", nominalised)
% ! interrogative
% ! Comparative
% ! Superlative

! number: for nouns, verbs, adjectives, determiners, etc.
% ! Plural
% ! Singular

! definiteness
% ! Definite
% ! Indefinite

! gender: for nouns, determiners, adjectives, etc.
% ! masculine
% ! feminine
% ! neuter
% ! masculine/feminine/neuter

! person
% ! 1st person
% ! 2nd person
% ! 3rd person
% ! impersonal

! cases: for determiners, pronouns, etc.
% ! nominative
% ! accusative
% ! dative

! verb forms
% ! infinitive
% ! present
% ! past participle
% ! present participle
% ! imperative

! Proper noun types
% ! topographic (places)
% ! anthroponyms (given names)
% ! cognomens (family names)
% ! organisations

! Punctuation
% ! Percent
% ! Sentence marker
% ! Hyphen
% ! Comma
% ! Apostrophe
% ! Quote marker (right hand side)
% ! Quote marker (left hand side)
% ! Parenthetical marker (right hand side)
% ! Parenthetical marker (left hand side)
% ! Letter

! Escaped characters
%> ! morpheme boundary
%.
%,

! Archiphonemes: placeholders written on the surface side of lexicon entries.
%{ь%} ! used for umlaut of ~previous vowel for verbs
%{ь2%} ! used for umlaut of ~previous vowel for adjectives
%{ױ%} ! for ױ to ײ umlaut correspondence
%{ע%} ! ע or empty; in -{ע}ן is empty except after נ and ל
%{ס%} ! ס in סט superlative, deletes after other ס

! matched features
! NOTE(review): both flags carry the same description. In the lexicons
! below, %[%-pp%] is paired with the גע prefix in VerbRoot, while %[%+pp%]
! sits on endings in V-REG, V-STRONG-7, V-ZAYN-VE, V-HOBN-HA and
! VAux-HOBN-HA - confirm the intended wording for each.
%[%+pp%] ! past participle
%[%-pp%] ! past participle

! Regular umlaut correspondences:
! ו - י
! אָ - ע
! ױ - ײ/ײַ
! אַ - ע

! Letters written with more than one code point, declared as single symbols.
אַ אָ ײַ יִ וּ בּ בֿ כּ כֿ ךֿ פֿ פּ יי וו וי

!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!
!!! M O R P H O T A C T I C S !!!
!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!

! Each LEXICON below is a list of entries of the form
!     lexical:surface Continuation ;
! where "#" as the continuation ends the word.
!
! NOTE(review): in this copy the tag symbols on the lexical side appear only
! as bare % escapes; their names are not visible here. They are reproduced
! verbatim - confirm against the canonical file before compiling.

! Entry point: one continuation per top-level word class.
LEXICON Root

NounRoot ;
DetRoot ;
VerbRoot ;
Conjunctions ;
Prepositions ;
Pronouns ;
Punctuation ;
Adverbs ;
Adjectives ;
ProperNouns ;

!!! Format for noun lexica is N-[gender]-[class]
!!!   gender: M, F, N
!!!   class: UML, UML-ER, S, N, NULL, HEB

! --- Nouns: second form via the %{ь%} umlaut trigger only -------------------

LEXICON N-M-UML

%%%: # ;
%%%:%{ь%} # ;

LEXICON N-F-UML

%%%: # ;
%%%:%{ь%} # ;

! --- Nouns: second form via umlaut trigger plus ער --------------------------

LEXICON N-M-UML-ER

%%%: # ;
%%%:%>%{ь%}ער # ;

LEXICON N-F-UML-ER

%%%: # ;
%%%:%>%{ь%}ער # ;

LEXICON N-N-UML-ER

%%%: # ;
%%%:%>%{ь%}ער # ;

! --- Nouns: second form in ס -------------------------------------------------

LEXICON N-M-S

%%%: # ;
%%%:%>ס # ;

LEXICON N-F-S

%%%: # ;
%%%:%>ס # ;

LEXICON N-N-S

%%%: # ;
%%%:%>ס # ;

! --- Nouns: second form in %{ע%}ן -------------------------------------------

LEXICON N-M-N

%%%: # ;
%%%:%>%{ע%}ן # ;

! NOTE(review): the %> morpheme boundary was added in N-F-N and N-N-N so that
! they match N-M-N and every other %{ע%}ן suffix in this file (V-COMMON,
! V-STRONG-7, PREP-EN, ADJ-INFL-ENDINGS, DET-PERS-AGREEMENT). Confirm that the
! two-level rules for %{ע%} expect the boundary here as well.
LEXICON N-F-N

%%%: # ;
%%%:%>%{ע%}ן # ;

LEXICON N-N-N

%%%: # ;
%%%:%>%{ע%}ן # ;

! --- Nouns: a single entry with no ending ------------------------------------

LEXICON N-M-NULL

%%%: # ;

LEXICON N-F-NULL

%%%: # ;

LEXICON N-N-NULL

%%%: # ;

LEXICON N-M-HEB

%%%: # ;

LEXICON N-F-HEB

%%%: # ;

! --- Definite determiner endings; the stem ד comes from DetRoot -------------

LEXICON DET-DEF-M

%%%%:ער # ;
%%%%:עם # ;
%%%%:עם # ;

LEXICON DET-DEF-F

%%%%:י # ;
%%%%:י # ;
%%%%:ער # ;

LEXICON DET-DEF-N

%%%%:אָס # ;
%%%%:אָס # ;
%%%%:עם # ;

LEXICON DET-DEF-PL

%%%%:י # ;
%%%%:י # ;
%%%%:י # ;

LEXICON DET-INDEF

%%%: # ;            ! FIXME: deal with alternate אַן

! --- Verbs --------------------------------------------------------------------

! Endings shared by the verb classes that continue here, plus links to the
! infinitive, imperative and present-participle sub-lexicons.
LEXICON V-COMMON

%%%%: # ;
%%%%:%>סט # ;
%%%%:%>ט # ;
%%%%:%>%{ע%}ן # ;
%%%%:%>ט # ;
%%%%:%>%{ע%}ן # ;
%: V-COMMON-INF ;
%: V-COMMON-IMP ;
%: V-COMMON-PPRS ;

! NOTE(review): this ending is plain ן, whereas the ן endings in V-COMMON are
! written %{ע%}ן - confirm the difference is intended.
LEXICON V-COMMON-INF

%:%>ן # ;

LEXICON V-COMMON-PPRS

%:%>%{ע%}נדיק # ;

LEXICON V-COMMON-IMP

V-COMMON-IMP-SG ;
V-COMMON-IMP-PL ;

LEXICON V-COMMON-IMP-SG

%%: # ;

LEXICON V-COMMON-IMP-PL

%%:%>ט # ;

LEXICON V-REG ! Plain old weak verbs

V-COMMON ;
%%%[%+pp%]:%>ט # ;

LEXICON V-REG-NOPREF ! Weak verbs that take no prefix

V-COMMON ;
%%:%>ט # ;

LEXICON V-STRONG-7 ! class 7 strong verbs

V-COMMON ;
%%%[%+pp%]:%>%{ע%}ן # ;

! --- Irregular verb זײַן: one lexicon per stem listed in IrregularVerbs ------

LEXICON V-ZAYN-ZE

%%%%:%>נען # ;
%%%%:%>נען # ;

LEXICON V-ZAYN-ZAY

%%%%:%>נען # ;
%%%%:%>ט # ;
%%%%:%>נען # ;
%: V-COMMON-INF ;
%: V-COMMON-IMP ;
%: V-COMMON-PPRS ;

LEXICON V-ZAYN-BI

%%%%:%>ן # ;
%%%%:%>סט # ;

LEXICON V-ZAYN-IZ

%%%%: # ;

LEXICON V-ZAYN-VE

%%%[%+pp%]:ן # ;
%%%[%+pp%]:זן # ;   ! Dir/LR

! --- Irregular verb האָבן: one lexicon per stem listed in IrregularVerbs -----

LEXICON V-HOBN-HOB

%: V-COMMON-INF ;
%: V-COMMON-PPRS ;
%: V-COMMON-IMP-SG ;
%%%%: # ;
%%%%:%>ן # ;
%%%%:%>ן # ;

LEXICON V-HOBN-HO

%%%%:%>סט # ;
%%%%:%>ט # ;
%%%%:%>ט # ;
%: V-COMMON-IMP-PL ;

LEXICON V-HOBN-HA

%%%[%+pp%]:ט # ;

! --- Auxiliaries --------------------------------------------------------------

! Endings used with the shorter stems האָ and װע (see Auxiliaries).
LEXICON VAux-COMMON-DEL

%%%:%>סט # ;
%%%:%>ט # ;
%%%:%>ט # ;

! Endings used with the full stems האָב and װעל (see Auxiliaries).
LEXICON VAux-COMMON-NODEL

%%%: # ;
%%%:%>ן # ;
%%%:%>ן # ;

LEXICON VAux-HOBN-HOB

%: V-COMMON-INF ;
%: VAux-COMMON-NODEL ;

LEXICON VAux-HOBN-HO

%: VAux-COMMON-DEL ;

LEXICON VAux-HOBN-HA

%%%[%+pp%]:ט # ;

LEXICON VAux-VEL-VEL

%: VAux-COMMON-NODEL ;

LEXICON VAux-VEL-VE

%: VAux-COMMON-DEL ;

! --- Conjunctions and prepositions -------------------------------------------

LEXICON CC

%: # ;

! Prepositions that, besides the plain form from PREP, also have forms
! combined with דער / דאָס.
LEXICON PREP-EN

PREP ;
%%+דער%%%:%>%{ע%}ן # ;
%%+דער%%%:%>%{ע%}ן # ;
%%+דאָס%%%:%>%{ע%}ן # ;

LEXICON PREP

%: # ;

! --- Personal pronouns: three entries per lemma ------------------------------

LEXICON PRON-P1-SG

איך%%%%%:איך # ;
איך%%%%%:מיך # ;
איך%%%%%:מיר # ;

LEXICON PRON-P2-SG

דו%%%%%:דו # ;
דו%%%%%:דיך # ;
דו%%%%%:דיר # ;

LEXICON PRON-P3-SG

ער%%%%%%:ער # ;
ער%%%%%%:אים # ;
ער%%%%%%:אים # ;
זי%%%%%%:זי # ;
זי%%%%%%:זי # ;
זי%%%%%%:איר # ;
עס%%%%%%:עס # ;
עס%%%%%%:עס # ;
עס%%%%%%:אים # ;

LEXICON PRON-P1-PL

מיר%%%%%:מיר # ;
מיר%%%%%:אונדז # ;
מיר%%%%%:אונדז # ;

LEXICON PRON-P2-PL

איר%%%%%:איר # ;
איר%%%%%:אײַך # ;
איר%%%%%:אײַך # ;

LEXICON PRON-P3-PL

זײ%%%%%:זײ # ;
זײ%%%%%:זײ # ;
זײ%%%%%:זײ # ;

! --- Adjectives ---------------------------------------------------------------

! Either the bare form, or one of the endings in ADJ-INFL-ENDINGS.
LEXICON ADJ-COMMON

%: # ;
%: ADJ-INFL-ENDINGS ;

LEXICON ADJ-INFL-ENDINGS

%%%:%>ער # ;
%%%:%>%{ע%}ן # ;
%%%:%>%{ע%}ן # ;
%%%:%>ע # ;
%%%:%>ע # ;
%%%:%>ער # ;
%%%%:%>ע # ;
%%%%:%>ע # ;
%%%%:%>%{ע%}ן # ;
%%%%: # ;
%%%%: # ;
%%%%: # ;
! FIXME: figure out how to deal with "postpositive/nominalised" neuter forms,
!        e.g. at https://en.wiktionary.org/wiki/%D7%92%D7%A8%D7%95%D7%99%D7%A1
!        or https://en.wiktionary.org/wiki/%D7%A9%D7%98%D7%90%D6%B7%D7%A8%D7%A7
!        and how they're different from predicative forms
%%%:%>ע # ;
%%%:%>ע # ;
%%%:%>ע # ;

! ער and %{ס%}ט forms carry the adjective umlaut trigger %{ь2%}.
LEXICON ADJ-UML

%%:%>%{ь2%}ער ADJ-COMMON ;
%%:%>%{ь2%}%{ס%}ט ADJ-COMMON ;
%: ADJ-COMMON ;

! ער and %{ס%}ט forms without an umlaut trigger.
LEXICON ADJ

%%:%>ער ADJ-COMMON ;
%%:%>%{ס%}ט ADJ-COMMON ;
%: ADJ-COMMON ;

! Base form only.
LEXICON ADJ-NO-COMP

%: ADJ-COMMON ;

! ער and %{ס%}ט forms only; used with the stems בעס and ערג in Adjectives.
LEXICON ADJ-IRREG-COMP

%%:%>ער ADJ-COMMON ;
%%:%>%{ס%}ט ADJ-COMMON ;

! --- Possessive determiners ---------------------------------------------------

LEXICON DET-PERS-AGREEMENT

%%%%: # ;
%%%%: # ;
%%%%: # ;
%%%%: # ;
%%%%: # ;
%%%%: # ;
%%%%: # ;
%%%%: # ;
%%%%: # ;
%%%%:%>ע # ;
%%%%:%>ע # ;
%%%%:%>ע # ;
%%%%:%>ער # ;
%%%%:%>%{ע%}ן # ;
%%%%:%>%{ע%}ן # ;
%%%%:%>ע # ;
%%%%:%>ע # ;
%%%%:%>ער # ;
%%%%:%>ס # ;
%%%%:%>ס # ;
%%%%:%>%{ע%}ן # ;
%%%%:%>ע # ;
%%%%:%>ע # ;
%%%%:%>ע # ;

LEXICON DET-PERS-P1SG

%%: DET-PERS-AGREEMENT ;

LEXICON DET-PERS-P2SG

%%: DET-PERS-AGREEMENT ;

LEXICON DET-PERS-P3SGMN

%%: DET-PERS-AGREEMENT ;

LEXICON DET-PERS-P3SGF

%%: DET-PERS-AGREEMENT ;

LEXICON DET-PERS-P1PL

%%: DET-PERS-AGREEMENT ;

LEXICON DET-PERS-P2PL

%%: DET-PERS-AGREEMENT ;

LEXICON DET-PERS-P3PL

%%: DET-PERS-AGREEMENT ;

! --- Interrogatives, adverbs, subordinators, proper nouns --------------------

LEXICON DET-ITG

%%: ADJ-INFL-ENDINGS ;

LEXICON PRON-ITG

%%: # ;

LEXICON ADV-ITG

%%: # ;

LEXICON ADV

%: # ;

LEXICON CNJSUB

%: # ;

LEXICON PREADV

%: # ;

LEXICON NP-TOP

%%: # ;

LEXICON NP-ANT-M

%%%: # ;

LEXICON NP-ANT-F

%%%: # ;

!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!
!!! L E X I C O N !!!
!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!

! Stem lexicons: each entry is lemma:stem followed by the continuation
! lexicon that supplies its tags and endings.

LEXICON Conjunctions

און:און CC ;                ! "and"
אָדער:אָדער CC ;            ! "or"
אָבער:אָבער CC ;            ! "but"
אַז:אַז CNJSUB ;            ! "that"
אױב:אױב CNJSUB ;            ! "if"
װי:װי CNJSUB ;              ! "how"
װען:װען CNJSUB ;            ! "when"
װײַל:װײַל CNJSUB ;          ! "because"

LEXICON Adverbs

אַרױס:אַרױס ADV ;           ! "out"
אַרײַן:אַרײַן ADV ;         ! "in, inside"
אױך:אױך ADV ;               ! "also"
אױס:אױס ADV ;               ! "over (finished)"
הײַנט:הײַנט ADV ;           ! "today"
מער:מער ADV ;               ! "more"
נאָך:נאָך ADV ;             ! "still"
נאָך:נאָך PREADV ;          ! "still" ! FIXME: CHECK
נאָר:נאָר PREADV ;          ! "only"
נישט:ניט ADV ;              ! "not" ! Dir/LR
נישט:נישט ADV ;             ! "not"
פֿאַראַן:פֿאַראַן ADV ;     ! "there"
צוריק:צוריק ADV ;           ! "back"
שױן:שױן ADV ;               ! "already, yet"
װי:װי ADV-ITG ;             ! "how"
װי:װי PREADV ;              ! "how"
װען:װען ADV-ITG ;           ! "when"

LEXICON Prepositions

אַרום:אַרום PREP ;          ! "around"
אונטער:אונטער PREP ;        ! "under"
איבער:איבער PREP ;          ! "over, above; about"
אין:אין PREP-EN ;           ! "in"
אױף:אױף PREP-EN ;           ! "on, by"
ביז:ביז PREP ;              ! "up to, until"
בײַ:בײַ PREP-EN ;           ! "at, by" (gloss translated from Russian)
דורך:דורך PREP ;            ! "through"
מיט:מיט PREP ;              ! "with"
נאָך:נאָך PREP-EN ;         ! "after"
פֿאַר:פֿאַר PREP-EN ;       ! "for"
פֿון:פֿון PREP-EN ;         ! "of, from"
צו:צו PREP-EN ;             ! "to"
צװישן:צװישן PREP ;          ! "between"
קעגן:קעגן PREP ;            ! "against"
קײן:קײן PREP ;              ! "to (+place)"
װי:װי PREP ;                ! "like"
װעגן:װעגן PREP ;            ! "about"

LEXICON DetRoot

דער:ד DET-DEF-M ;           ! "the"
די:ד DET-DEF-F ;            ! "the"
דאָס:ד DET-DEF-N ;          ! "the"
די:ד DET-DEF-PL ;           ! "the"
אַ:אַ DET-INDEF ;           ! "a"
אַ:אַן DET-INDEF ;          ! "an" ! Dir/LR
קײן:קײן DET-INDEF ;         ! "a/an, no, any"
מײַן:מײַן DET-PERS-P1SG ;
דײַן:דײַן DET-PERS-P2SG ;
זײַן:זײַן DET-PERS-P3SGMN ;
איר:איר DET-PERS-P3SGF ;
אונדזער:אונדזער DET-PERS-P1PL ;
אײַער:אײַער DET-PERS-P2PL ;
זײער:זײער DET-PERS-P3PL ;
װעלך:װעלך DET-ITG ;         ! "which"

LEXICON Pronouns

PRON-P1-SG ;
PRON-P2-SG ;
PRON-P3-SG ;
PRON-P1-PL ;
PRON-P2-PL ;
PRON-P3-PL ;
מען%%%%:מען # ;
מען%%%%:מע # ;              ! Dir/LR
װאָס%%%:װאָס # ;
װאָס%%%:װאָס # ;
װאָס%%%:װאָס # ;
זיך%%:זיך # ;
װעלך:װעלך PRON-ITG ;        ! "which one (?)" FIXME: CHECK

LEXICON NounRoot

אַרבעט:אַרבעט N-F-S ;       ! "work"
בּאַרג:בּאַרג N-M-UML ;     ! "mountain"
בּױם:בּ%{ױ%}ם N-M-UML-ER ;  ! "tree" plural with ײ
בוך:בוך N-N-UML-ER ;        ! "book"
הימל:הימל N-M-N ;           ! "heaven"
הױז:הױז N-N-UML-ER ;        ! "house" plural with ײַ
זון:זון N-F-N ;             ! "sun"
זון:זון N-M-UML ;           ! "son"
טאָג:טאָג N-M-UML ;         ! "day"
יאָר:יאָר N-M-N ;           ! "year"
לאַן:לאַן N-M-N ;           ! "meadow"
לאַנד:לאַנד N-N-UML-ER ;    ! "country, land"
צײַט:צײַט N-F-N ;           ! "time"
קינד:קינד N-N-UML-ER ;      ! "child" (technically no umlaut)
װעלט:װעלט N-F-N ;           ! "world"

! Verb stems are reachable twice: once behind the גע prefix, which carries
! the %[%-pp%] flag on the lexical side, and once with no prefix.
LEXICON VerbRoot

%[%-pp%]:גע VerbStems ;     ! past participle
VerbStems ;                 ! other forms

LEXICON IrregularVerbs

זײַן:זײַ V-ZAYN-ZAY ;
זײַן:בי V-ZAYN-BI ;
זײַן:איז V-ZAYN-IZ ;
זײַן:װע V-ZAYN-VE ;
זײַן:זע V-ZAYN-ZE ;         ! Dir/LR
האָבן:האָב V-HOBN-HOB ;
האָבן:האָ V-HOBN-HO ;
האָבן:האַ V-HOBN-HA ;

LEXICON Auxiliaries

האָבן:האָב VAux-HOBN-HOB ;
האָבן:האָ VAux-HOBN-HO ;
האָבן:האַ VAux-HOBN-HA ;
װעל:װעל VAux-VEL-VEL ;
װעל:װע VAux-VEL-VE ;

LEXICON VerbStems

IrregularVerbs ;
Auxiliaries ;
בּעטן:בּעט V-STRONG-7 ;     ! "ask"
זאָגן:זאָג V-REG ;          ! "say"
מאַכן:מאַך V-REG ;          ! "make"
פֿאַרלירן:פֿאַרליר V-REG-NOPREF ; ! "lose"
קומען:קום V-STRONG-7 ;      ! "come"
קױפֿן:קױפֿ V-REG ;          ! "buy"

LEXICON Adjectives

אַלט:אַלט ADJ-UML ;         ! "old"
אַנדער:אַנדער ADJ-NO-COMP ; ! "different"
גוט:בעס ADJ-IRREG-COMP ;    ! "better/best"
גוט:גוט ADJ-NO-COMP ;       ! "good"
גרױס:גרױס ADJ-UML ;         ! "big"
יונג:יונג ADJ-UML ;         ! "young"
שטאַרק:שטאַרק ADJ ;         ! "strong"
שלעכט:ערג ADJ-IRREG-COMP ;  ! "worse/worst"
שלעכט:שלעכט ADJ-NO-COMP ;   ! "bad"
שײן:שײן ADJ-UML ;           ! "beautiful"

LEXICON ProperNouns

אַמעריקע:אַמעריקע NP-TOP ;  ! "America"
דײַטשלאַנד:דײַטשלאַנד NP-TOP ; ! "Germany"
ישראל:ישראל NP-TOP ;        ! "Israel"
דוד:דוד NP-ANT-M ;          ! "Dovid"
ישראל:ישראל NP-ANT-M ;      ! "Yisroel"

LEXICON Punctuation

%.%:%. # ;
,%:%, # ;

! Resources:
! http://wiki.apertium.org/wiki/Starting_a_new_language_with_HFST#Lexicon
! http://wiki.apertium.org/wiki/Lttoolbox_and_lexc
! http://wiki.apertium.org/wiki/Apertium-specific_conventions_for_lexc
! https://kitwiki.csc.fi/twiki/bin/view/KitWiki/HfstHome
! http://hfst.sourceforge.net/
! http://www.cis.upenn.edu/~cis639/docs/lexc.html
! http://wiki.apertium.org/wiki/Hfst