summaryrefslogtreecommitdiff
path: root/icu/translit_Latin_Coptic.txt
blob: 5f40008d7ed001310534c634216d24ebabd697c5 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
//--------------------------------------------------------------------
// Copyright 2001, CrossWire Bible Society (http://www.crosswire.org)
// Use freely.
//--------------------------------------------------------------------
// Based upon SBL standard Coptic transliteration system from
// The SBL Handbook of Style p. 30
//--------------------------------------------------------------------

// Latin-Coptic

// Resource holding the Latin <-> Coptic transliteration rules.
//
// The rule text is the concatenation of the quoted strings in the Rule
// table. In ICU transform-rule syntax:
//   a > b    applies only in the forward direction (Latin to Coptic)
//   a < b    applies only in the reverse direction (Coptic to Latin)
//   a <> b   applies in both directions
//   x } ctx  matches x only when followed by ctx (ctx is not replaced)
//   |        marks where the cursor is left after a replacement
// Rules are tried in the order listed and the first match wins, so the
// longer patterns (digraphs, letter + combining mark) must stay ahead of
// the single-letter rules they overlap with.
translit_Latin_Coptic {
  Rule {
    // Forward: decompose first, so that base letters and combining marks
    // are separate code points for the rules below.
    // Reverse: NFC is applied as the last step.
    ":: NFD (NFC) ;" 
    
    // Combining marks used by the transliteration scheme
    // (U+0304 combining macron, U+030C combining caron).
    "$macron = \u0304;"
    "$caron = \u030C;"

    // Completeness mappings for Latin letters that have no rule of their
    // own (forward only). Each one rewrites the letter to one that does;
    // the leading '|' leaves the cursor in front of the replacement so
    // the rules further down are applied to it.
    // A bare C/c (not already followed by a caron) is treated as C/c + caron.
    "C}[^$caron]>|C $caron;"
    "c}[^$caron]>|c $caron;"
    "Q>|K;"
    "q>|k;"
    "V>|U;"
    "v>|u;"
    "W>|U;"
    "w>|u;"
    "X>|KS;"
    "x>|ks;"
    "Y>|U;"
    "y>|u;"

    // Titlecase digraphs. The lowercase-letter context is written on the
    // Coptic side, so it constrains the reverse direction: a capital
    // followed by a lowercase letter becomes a titlecase digraph ("Th")
    // instead of the all-caps form produced by the rules further down.
    "Th<>\u0398}[:LowercaseLetter:];"
    "Ks<>\u039E}[:LowercaseLetter:];"
    "Ph<>\u03A6}[:LowercaseLetter:];"
    "Kh<>\u03A7}[:LowercaseLetter:];"
    "Ps<>\u03A8}[:LowercaseLetter:];"

    // Coptic-unique letter (no Greek counterpart), titlecase digraph.
    "Ti<>\u03EE}[:LowercaseLetter:];"

    // Uppercase digraphs. In the reverse direction these are the fallback
    // for capitals that did not match the titlecase rules above.
    "TH<>\u0398;"
    "KS<>\u039E;"
    "PH<>\u03A6;"
    "KH<>\u03A7;"
    "PS<>\u03A8;"

    // Coptic-unique letter, uppercase digraph.
    "TI<>\u03EE;"

    // Uppercase letter + macron. Must precede the plain E and O rules.
    "E $macron<>\u0397;"
    "O $macron<>\u03A9;"

    // Coptic-unique letters written as uppercase letter + caron.
    "S $caron<>\u03E2;"
    "C $caron<>\u03EC;"

    // Uppercase single letters.
    "A<>\u0391;"
    "B<>\u0392;"
    "G<>\u0393;"
    "D<>\u0394;"
    "E<>\u0395;"
    "Z<>\u0396;"
    "I<>\u0399;"
    "K<>\u039A;"
    "L<>\u039B;"
    "M<>\u039C;"
    "N<>\u039D;"
    "O<>\u039F;"
    "P<>\u03A0;"
    "R<>\u03A1;"
    "S<>\u03A3;"
    "T<>\u03A4;"
    "U<>\u03A5;"

    // Coptic-unique uppercase single letters.
    "F<>\u03E4;"
    "H<>\u03E8;"
    "J<>\u03EA;"

    // Lowercase digraphs.
    "th<>\u03B8;"
    "ks<>\u03BE;"
    "ph<>\u03C6;"
    "kh<>\u03C7;"
    "ps<>\u03C8;"

    // Coptic-unique letter, lowercase digraph.
    "ti<>\u03EF;"

    // Lowercase letter + macron. Must precede the plain e and o rules.
    "e $macron<>\u03B7;"
    "o $macron<>\u03C9;"

    // Coptic-unique letters written as lowercase letter + caron.
    "s $caron<>\u03E3;"
    "c $caron<>\u03ED;"

    // Lowercase single letters.
    "a<>\u03B1;"
    "b<>\u03B2;"
    "g<>\u03B3;"
    "d<>\u03B4;"
    "e<>\u03B5;"
    "z<>\u03B6;"
    "i<>\u03B9;"
    "k<>\u03BA;"
    "l<>\u03BB;"
    "m<>\u03BC;"
    "n<>\u03BD;"
    "o<>\u03BF;"
    "p<>\u03C0;"
    "r<>\u03C1;"
    // Reverse only: final sigma (U+03C2) also maps back to s. In the
    // forward direction s always produces U+03C3 via the next rule.
    "s<\u03C2;"
    "s<>\u03C3;"
    "t<>\u03C4;"
    "u<>\u03C5;"

    // Coptic-unique lowercase single letters.
    "f<>\u03E5;"
    "h<>\u03E9;"
    "j<>\u03EB;"

    // Remove whatever was not transliterated by the rules above:
    // reverse direction drops any remaining Greek-script character,
    // forward direction drops any remaining Latin-script character.
    "<[:GREEK:];"
    "[:LATIN:]>;"    

    // Forward: recompose the output as the last step.
    // Reverse: decompose the input before the rules above are applied.
    ":: NFC (NFD) ;"    
  }
}