Module:Ko-translit/data and Module:Ko-translit/data/sandbox: Difference between pages

(Difference between pages)
Jump to navigation Jump to search
Page 1
Page 2
imported>Grapesurgeon
more detailed comment and also sandhi -> resyllabification
 
maybe this is sufficient
 
Line 23: Line 23:
{"_", " "},
{"_", " "},


-- Convert Compatibility Jamo (U+31xx) to Hangul Jamo (U+11xx) for linguistic contexts.
-- Because decomposed Compatibility Jamo do not differentiate between initial and final
-- consonants, only the few jamo for which the initial/final distinction is relevant
-- are converted.
{"ㄴ([ᄀ-ᄒ])", "ᆫ%1"}, -- -ㄴ다
{"ㄴ([ᄀ-ᄒ])", "ᆫ%1"}, -- -ㄴ다
{"ㄹ([ᄀ-ᄒ])", "ᆯ%1"}, -- -ㄹ까, -ㄹ래
{"ㄹ([ᄀ-ᄒ])", "ᆯ%1"}, -- -ㄹ까, -ㄹ래
Line 115: Line 113:
{"([ᆨ-ᇂ])@ᄋ([ᅣᅤᅧᅨᅭᅲᅵ])", "%1ᄂ%2"}, -- 색연필 [생년필], 물엿 [물렫]
{"([ᆨ-ᇂ])@ᄋ([ᅣᅤᅧᅨᅭᅲᅵ])", "%1ᄂ%2"}, -- 색연필 [생년필], 물엿 [물렫]


-- for null-init consonant ㅇ (resyllabification; 연음)
-- for null-init consonant ㅇ (연음)
{"ᆨᄋ", "ᄀ"},
{"ᆩᄋ", "ᄁ"},
{"ᆩᄋ", "ᄁ"},
{"ᆪᄋ", "ᆨᄉ"},
{"ᆪᄋ", "ᆨᄉ"},
{"ᆬᄋ", "ᆫᄌ"},
{"ᆬᄋ", "ᆫᄌ"},
{"ᆮᄋ", "ᄃ"},
{"[ᆯᆶ]ᄋ", "ᄅ"},
{"ᆰᄋ", "ᆯᄀ"},
{"ᆰᄋ", "ᆯᄀ"},
{"ᆱᄋ", "ᆯᄆ"},
{"ᆱᄋ", "ᆯᄆ"},
Line 128: Line 123:
{"ᆴᄋ", "ᆯᄐ"},
{"ᆴᄋ", "ᆯᄐ"},
{"ᆵᄋ", "ᆯᄑ"},
{"ᆵᄋ", "ᆯᄑ"},
{"ᆸᄋ", "ᄇ"},
{"ᆹᄋ", "ᆸᄉ"},
{"ᆹᄋ", "ᆸᄉ"},
{"ᆺᄋ", "ᄉ"},
{"ᆺᄋ", "ᄉ"},
Line 161: Line 155:
{"[ᆲᆴᆶ]ᄉ", "ᆯᄊ"},
{"[ᆲᆴᆶ]ᄉ", "ᆯᄊ"},
{"ᇂᄉ", "ᄊ"},
{"ᇂᄉ", "ᄊ"},
-- @ for written epenthetic ㅅ + ㄱ/ㅂ
-- @ for written 사이시옷 + ㄱ/ㅂ
{"ᆺ@ᄀ", "ᄁ"},
{"ᆺ@ᄀ", "ᄁ"},
{"ᆺ@ᄇ", "ᄈ"}
{"ᆺ@ᄇ", "ᄈ"}
Line 180: Line 174:
p.at_dollar_irregularities = {
p.at_dollar_irregularities = {
{"ᆫ@ᄅ", "ᆫᄂ"}, -- 음운론 [으문논]
{"ᆫ@ᄅ", "ᆫᄂ"}, -- 음운론 [으문논]
{"ᆨ%$ᄋ", "ᄀ"},
{"ᆨ%$?ᄋ", "ᄀ"},
{"ᆮ%$ᄋ", "ᄃ"}, -- 웃어른 [우더른]
{"ᆮ%$?ᄋ", "ᄃ"}, -- 웃어른 [우더른]
{"ᆯ%$ᄋ", "ᄅ"},
{"ᆯ%$?ᄋ", "ᄅ"},
{"ᆸ%$ᄋ", "ᄇ"},
{"ᆸ%$?ᄋ", "ᄇ"},
{"%$", ""}
{"%$", ""}
}
}
Line 362: Line 356:
{"[ᄑㅍ]", "p'"},
{"[ᄑㅍ]", "p'"},
{"[ᄒㅎ]", "h"}
{"[ᄒㅎ]", "h"}
}
-- ISO/TR 11941, common in methods 1 & 2
-- Each entry is a two-element table: the first string is a pattern (a single
-- jamo, or a bracketed set of jamo that are all treated alike) and the second
-- string is the Latin text that pattern maps to.
-- Most sets list the Hangul Jamo (U+11xx) form(s) of a letter together with
-- its Compatibility Jamo (U+31xx) form.
-- NOTE(review): how, and in what order, these pairs are applied is decided by
-- the consuming module, which is not visible here -- confirm before reordering.
p.iso_common = {
-- consonants
{"[ᄂᆫㄴ]", "n"},
{"[ᆭㄶ]", "nh"},
{"[ᄅㄹ]", "r"},
-- ᆯ on its own maps to "l", unlike the ᄅ/ㄹ forms above, which map to "r"
{"ᆯ", "l"},
{"[ᆱㄻ]", "lm"},
{"[ᆳㄽ]", "ls"},
{"[ᆶㅀ]", "lh"},
{"[ᄆᆷㅁ]", "m"},
{"[ᄉᆺㅅ]", "s"},
{"[ᄊᆻㅆ]", "ss"},
-- ᄋ/ㅇ map to the empty string (nothing is emitted for them) ...
{"[ᄋㅇ]", ""},
-- ... whereas ᆼ maps to "ng"
{"ᆼ", "ng"},
{"[ᄒᇂㅎ]", "h"},
-- vowels: each set pairs the Hangul Jamo form with its Compatibility Jamo form
{"[ᅡㅏ]", "a"},
{"[ᅢㅐ]", "ae"},
{"[ᅣㅑ]", "ya"},
{"[ᅤㅒ]", "yae"},
{"[ᅥㅓ]", "eo"},
{"[ᅦㅔ]", "e"},
{"[ᅧㅕ]", "yeo"},
{"[ᅨㅖ]", "ye"},
{"[ᅩㅗ]", "o"},
{"[ᅪㅘ]", "wa"},
{"[ᅫㅙ]", "wae"},
{"[ᅬㅚ]", "oe"},
{"[ᅭㅛ]", "yo"},
{"[ᅮㅜ]", "u"},
{"[ᅯㅝ]", "weo"},
{"[ᅰㅞ]", "we"},
{"[ᅱㅟ]", "wi"},
{"[ᅲㅠ]", "yu"},
{"[ᅳㅡ]", "eu"},
{"[ᅴㅢ]", "yi"},
{"[ᅵㅣ]", "i"}
}
}