niobures's picture
XPF
4a08ba7 verified
# Nepali Rule Set
# Written by: Becky Mathew
# Last updated: 2020-02-27
type,sfrom,sto,weight,precede,follow,comment
# Zero Width Joiners
# Both rows leave the `sto` column empty, so the matched invisible character
# is replaced with nothing.
sub,‌,,1,,,"removing zero width non-joiner",
sub,‍,,1,,,"removing zero width joiner",
# Class Rules
# IPA-side classes. They are referenced as {vowels} / {consonants} by the
# ipasub rules (nasalisation and gemination), so every member has to be spelled
# exactly as the sub rules emit it.
# /o/ is left out of `vowels` on purpose: it has its own NASAL rule.
class,vowels,(ʌ|a|i|u|e),,,,
# The voiced velar stops are written with the IPA letter ɡ (U+0261), the same
# character the {GUH} and {GHUH} sub rules output. An ASCII "g" here would
# never match, and velar geminates would be skipped by the gemination rules.
class,consonants,(k|kʰ|ɡ|ɡʱ|ŋ|ts|tsʰ|dz|dzʱ|ɲ|ʈ|ʈʰ|ɖ|ɖʱ|ɳ|t̪|t̪ʰ|d̪|d̪ʱ|n̪|p|pʰ|b|bʱ|m|r|l|s),,,,
## Consonants
# Orthographic classes: each name stands for the Devanagari letter(s) in the
# third column and is referenced as {NAME} in the `sfrom` column of the
# consonant sub rules.
class,KUH,क,,,,
class,KHUH,ख,,,,
class,GUH,ग,,,,
class,GHUH,घ,,,,
class,NGUH,ङ,,,,
class,TSUH,च,,,,
class,TSHUH,छ,,,,
class,DZUH,ज,,,,
class,DZHUH,झ,,,,
class,RETROFLEXTUH,ट,,,,
class,RETROFLEXTHUH,ठ,,,,
class,RETROFLEXDUH,ड,,,,
class,RETROFLEXDHUH,ढ,,,,
class,DENTALTUH,त,,,,
class,DENTALTHUH,थ,,,,
class,DENTALDUH,द,,,,
class,DENTALDHUH,ध,,,,
# Three nasal letters share one class, so a single sub rule transcribes all of them.
class,DENTALNUH,(न|ञ|ण),,,,
class,PUH,प,,,,
class,PHUH,फ,,,,
class,BUH,ब,,,,
class,BHUH,भ,,,,
class,MUH,म,,,,
class,YUH,य,,,,
class,RUH,र,,,,
class,LUH,ल,,,,
class,WUH,व,,,,
# Three sibilant letters share one class, so a single sub rule transcribes all of them.
class,SUH,(स|ष|श),,,,
class,HUH,ह,,,,
## Independent Characters
# Classes for the independent vowel letters. Each is referenced as {NAME} by
# the sub rules for independent characters.
class,UH,अ,,,,
class,A,आ,,,,
class,I,(इ|ई),,,,"includes short and long form, since vowel length is not contrastive",
class,U,(उ|ऊ),,,,"includes short and long form, since vowel length is not contrastive",
class,RI,ऋ,,,,
class,E,ए,,,,
class,AI,ऐ,,,,
class,O,ओ,,,,
class,AU,औ,,,,
## Diacritics
# Classes for the combining marks. Each is referenced as {NAME} by the sub
# rules for diacritics.
class,DIACRITICA,ा,,,,
# The short and long signs are grouped, as in the I and U classes.
class,DIACRITICI,(ि|ी),,,,
class,DIACRITICU,(ु|ू),,,,
class,DIACRITICRI,ृ,,,,
class,DIACRITICE,े,,,,
class,DIACRITICAI,ै,,,,
class,DIACRITICO,ो,,,,
class,DIACRITICAU,ौ,,,,
# The remaining marks are rewritten by the sub rules to ERASE, NASAL and n̪ respectively.
class,VIRAMA,्,,,,
class,CANDRABINDU,ँ,,,,
class,SIRBINDU,ं,,,,
# Sub Rules
## Consonants
# Every consonant class is rewritten as its consonant symbol followed by the
# inherent vowel ʌ, as two space-separated symbols. The ipasub rule for
# "ʌ ERASE" later drops that ʌ when a diacritic or virama follows.
sub,{KUH},k ʌ,1,,,
sub,{KHUH},kʰ ʌ,1,,,
sub,{GUH},ɡ ʌ,1,,,
sub,{GHUH},ɡʱ ʌ,1,,,
sub,{NGUH},ŋ ʌ,1,,,
sub,{TSUH},ts ʌ,1,,,
sub,{TSHUH},tsʰ ʌ,1,,,
sub,{DZUH},dz ʌ,1,,,
sub,{DZHUH},dzʱ ʌ,1,,,
sub,{RETROFLEXTUH},ʈ ʌ,1,,,
sub,{RETROFLEXTHUH},ʈʰ ʌ,1,,,
sub,{RETROFLEXDUH},ɖ ʌ,1,,,
sub,{RETROFLEXDHUH},ɖʱ ʌ,1,,,
sub,{DENTALTUH},t̪ ʌ,1,,,
sub,{DENTALTHUH},t̪ʰ ʌ,1,,,
sub,{DENTALDUH},d̪ ʌ,1,,,
sub,{DENTALDHUH},d̪ʱ ʌ,1,,,
# All letters in the DENTALNUH class come out as n̪.
sub,{DENTALNUH},n̪ ʌ,1,,,
sub,{PUH},p ʌ,1,,,
sub,{PHUH},pʰ ʌ,1,,,
sub,{BUH},b ʌ,1,,,
sub,{BHUH},bʱ ʌ,1,,,
sub,{MUH},m ʌ,1,,,
sub,{YUH},j ʌ,1,,,
sub,{RUH},r ʌ,1,,,
sub,{LUH},l ʌ,1,,,
sub,{WUH},w ʌ,1,,,
# All letters in the SUH class come out as s.
sub,{SUH},s ʌ,1,,,
sub,{HUH},ɦ ʌ,1,,,
## Independent Characters
# Independent vowel letters map straight to a vowel symbol, with no ERASE marker.
# {RI} yields the two-symbol sequence "r i"; "ai" and "au" are written without
# an internal space.
sub,{UH},ʌ,1,,,
sub,{A},a,1,,,
sub,{I},i,1,,,
sub,{U},u,1,,,
sub,{RI},r i,1,,,
sub,{E},e,1,,,
sub,{AI},ai,1,,,
sub,{O},o,1,,,
sub,{AU},au,1,,,
## Diacritics
# ERASE and NASAL are placeholder symbols, not phonemes: the ipasub rules
# consume them, and the Misc. rules turn any leftover placeholder into @.
# Each vowel sign emits ERASE followed by its own vowel, so the preceding
# inherent ʌ can be removed by the "ʌ ERASE" ipasub rule.
sub,{DIACRITICA},ERASE a,1,,,
sub,{DIACRITICI},ERASE i,1,,,
sub,{DIACRITICU},ERASE u,1,,,
sub,{DIACRITICRI},ERASE r i,1,,,
sub,{DIACRITICE},ERASE e,1,,,
sub,{DIACRITICAI},ERASE ai,1,,,
sub,{DIACRITICO},ERASE o,1,,,
sub,{DIACRITICAU},ERASE au,1,,,
sub,{VIRAMA},ERASE,1,,,"removes inherent vowel",
sub,{CANDRABINDU},NASAL,1,,,"makes previous vowel nasal",
# SIRBINDU is transcribed directly as the consonant n̪, without a placeholder.
sub,{SIRBINDU},n̪,1,,,
# ipasub Rules
# These rules rewrite the symbol sequences produced by the sub rules and
# consume the ERASE and NASAL placeholders.
# NOTE(review): the weights only make sense if higher-weighted rules run first
# (9.5 before 9 before 8, and 7 before 6) — confirm against the XPF translator.
ipasub,ʌ ERASE,,8,,,"removes the inherent vowel when there's a diacritic after",
# NOTE(review): the `sto` field below starts with a space before \1 — presumably harmless; confirm.
ipasub,({vowels}) NASAL, \1̃,6,,,"candrabindu makes previous vowel nasal",
# The diphthongs get their own rules, since "ai" and "au" are not members of
# {vowels}; without them the generic rule would match only the trailing "i"/"u".
ipasub,ai NASAL,ãĩ,7,,,
ipasub,au NASAL,ãũ,7,,,
ipasub,o NASAL,o,6,,,"/o/ doesn't have a contrastive nasal variant, but they may vary freely (this rule excludes that nasal variation)",
# Gemination: a consonant, its inherent ʌ and an ERASE, followed by the same
# consonant again, collapses to that consonant plus the length mark ː.
ipasub,({consonants}) ʌ ERASE \1,\1 ː,9,,,"consonant gemination",
# The two 9.5 rules cover a plain consonant followed by its aspirated or
# breathy counterpart; the weight-9 rule alone would leave a stray ʰ/ʱ after the ː.
ipasub,({consonants}) ʌ ERASE \1ʰ,\1ʰ ː,9.5,,,"fixes gemination rule",
ipasub,({consonants}) ʌ ERASE \1ʱ,\1ʱ ː,9.5,,,"fixes gemination rule",
# Misc. Rules
# Fallbacks: any NASAL or ERASE placeholder that no ipasub rule above consumed
# is replaced with @.
# NOTE(review): @ presumably marks output that could not be transcribed — confirm against the XPF translator.
ipasub,NASAL,@,1,,,"accounts for unattested combos (one occurrence of a nasal consonant)",
ipasub,ERASE,@,1,,,"accounts for unattested combos",