Bug fixes. Plus, now 99% in sync with the new EWTS draft. Search for 'DLC' to find a few open issues.
Re-added the line for reversed dza; it should never have been deleted, as that breaks TM<->TMW. I tested the whole mapping by hand once; this incident shows that automation is very helpful. '{' and '}' were swapped... The Unicode for something was "", not "none". +R, +W, +Y, R+ now in use (though more testing is needed).
This commit is contained in:
parent
216c5b0d54
commit
08c676c186
1 changed files with 114 additions and 95 deletions
|
@ -10,12 +10,22 @@
|
|||
// ACIP->Unicode conversion. So keep ACIPRules in sync with this, and be
|
||||
// sure to run 'ant clean check' after your change.
|
||||
//
|
||||
// Note that some glyphs have EWTS in the range \uF021-\uF0FF inclusive. These do
|
||||
// not have anything in the Unicode column, though, because this is just
|
||||
// the EWTS -- if someone wants to convert TMSkt3.183->Unicode and get
|
||||
// \uF021, let them do that, but our *->Unicode converters shouldn't
|
||||
// output codes in the PUA without explicit user authorization.
|
||||
//
|
||||
// Note that 0F00, 0F02, 0F03, and 0F0E are made by using multiple
|
||||
// glyphs from TMW. 0F6A is not listed here (DLC FIXME: should it be?),
|
||||
// but the glyph for it is the glyph for 0F62.
|
||||
//
|
||||
// DuffPaneTest ensures that the na-ro column truly contains na-ros,
|
||||
// by the way.
|
||||
|
||||
<?Input:Punctuation?>
|
||||
//_~32,1~0,32
|
||||
// ~45,1~0,45~~~~~~~0F0B
|
||||
// ~45,1~0,45~~~~~~~0FB0
|
||||
// DLC 0020 or a wider space, perhaps a couple of EM spaces (2003,2003)? Than couldn't say, but he had also thought of U+2003.
|
||||
_~32,1~~1,32~~~~~~~0020
|
||||
~45,1~~1,45~~~~~~~0F0B
|
||||
|
@ -67,19 +77,19 @@ M~~~8,91~~~~~~~0F7E
|
|||
// virama:
|
||||
?~252,1~~8,105~~~~~~~0F84
|
||||
// rgya.gram.shad:
|
||||
]~48,5~~9,51~~~~~~~0F12
|
||||
\u0F12~48,5~~9,51~~~~~~~0F12
|
||||
// shad + single ornament:
|
||||
[~43,5~~9,47~~~~~~~0F10
|
||||
\u0F10~43,5~~9,47~~~~~~~0F10
|
||||
// gug.rtags.gyon:
|
||||
<~95,5~~9,95~~~~~~~0F3A
|
||||
// gug.rtags.gyas:
|
||||
>~96,5~~9,96~~~~~~~0F3B
|
||||
// yar.tshes.rtags:
|
||||
{~134,5~~10,39~~~~~~~0F3E
|
||||
}~134,5~~10,39~~~~~~~0F3E
|
||||
// mar.tshes.rtags:
|
||||
}~135,5~~10,40~~~~~~~0F3F
|
||||
{~135,5~~10,40~~~~~~~0F3F
|
||||
// dzud.rtags.me.long.can:
|
||||
`~94,5~~9,92~~~~~~~0F13
|
||||
\u0F13~94,5~~9,92~~~~~~~0F13
|
||||
// hard tsheg:
|
||||
*~205,1~~1,108~~~~~~~0F0C
|
||||
|
||||
|
@ -216,9 +226,11 @@ au~237,1~~8,89~~~~~~~0F7D~~8,104
|
|||
// DLC FIXME: need -I as well
|
||||
|
||||
<?Input:Sanskrit?>
|
||||
|
||||
// 0F5F,0F39 might work, but the OpenType font's author must've had
|
||||
// Dza in mind if it does. Note that the bottommost horizontal stroke
|
||||
// goes upward on U+0F5F and downward on U+0F5B.
|
||||
// the TMSkt4.146 glyph in mind if it does. Note that the bottommost
|
||||
// horizontal stroke goes upward on U+0F5F and downward on U+0F5B.
|
||||
\uF031~146,5~~10,42~~~~~~~none
|
||||
f~153,5~~10,58~1,110~1,118~1,124~1,126~10,114~10,123~0F55,0F39
|
||||
v~154,5~~10,59~1,110~1,118~1,124~1,126~10,114~10,123~0F56,f39
|
||||
T~170,1~~1,64~1,109~1,120~1,123~1,125~10,115~10,124~0F4A
|
||||
|
@ -812,12 +824,12 @@ ts~224,5~~10,95~1,110~~1,125~1,126~~~0FA9
|
|||
tsh~225,5~~10,96~1,110~~1,125~1,126~~~0FAA
|
||||
dz~226,5~~10,97~1,110~~1,125~1,126~~~0FAB
|
||||
dz+h~227,5~~10,98~1,110~~1,125~1,126~~~0FAC
|
||||
w~228,5~~10,99~1,109~~1,123~1,125~~~0FBA
|
||||
W~228,5~~10,99~1,109~~1,123~1,125~~~0FBA
|
||||
zh~229,5~~10,100~1,109~~1,123~1,125~~~0FAE
|
||||
z~230,5~~10,101~1,109~~1,123~1,125~~~0FAF
|
||||
'~231,5~~10,102~1,109~~1,123~1,125~~~0FB0
|
||||
y~232,5~~10,103~1,109~~1,123~1,125~~~0FBB
|
||||
r~233,5~~10,104~1,109~~1,123~1,125~~~0FBC
|
||||
Y~232,5~~10,103~1,109~~1,123~1,125~~~0FBB
|
||||
R~233,5~~10,104~1,109~~1,123~1,125~~~0FBC
|
||||
l~234,5~~10,105~1,109~~1,123~1,125~~~0FB3
|
||||
sh~235,5~~10,106~1,109~~1,123~1,125~~~0FB4
|
||||
Sh~236,5~~10,107~1,109~~1,123~1,125~~~0FB5
|
||||
|
@ -945,32 +957,32 @@ r~176,4~~8,71~~~~~~~0FB2
|
|||
<?Ignore?>
|
||||
|
||||
// DLC EWTS doesn't give mappings for these half numerals...
|
||||
\tmw8073~70,5~~9,73~~~~~~~0F33
|
||||
\tmw8074~71,5~~9,74~~~~~~~0F2A
|
||||
\tmw8075~72,5~~9,75~~~~~~~0F2B
|
||||
\tmw8076~73,5~~9,76~~~~~~~0F2C
|
||||
\tmw8077~74,5~~9,77~~~~~~~0F2D
|
||||
\tmw8078~75,5~~9,78~~~~~~~0F2E
|
||||
\tmw8079~76,5~~9,79~~~~~~~0F2F
|
||||
\tmw8080~77,5~~9,80~~~~~~~0F30
|
||||
\tmw8081~78,5~~9,81~~~~~~~0F31
|
||||
\tmw8082~79,5~~9,82~~~~~~~0F32
|
||||
\u0F33~70,5~~9,73~~~~~~~0F33
|
||||
\u0F2A~71,5~~9,74~~~~~~~0F2A
|
||||
\u0F2B~72,5~~9,75~~~~~~~0F2B
|
||||
\u0F2C~73,5~~9,76~~~~~~~0F2C
|
||||
\u0F2D~74,5~~9,77~~~~~~~0F2D
|
||||
\u0F2E~75,5~~9,78~~~~~~~0F2E
|
||||
\u0F2F~76,5~~9,79~~~~~~~0F2F
|
||||
\u0F30~77,5~~9,80~~~~~~~0F30
|
||||
\u0F31~78,5~~9,81~~~~~~~0F31
|
||||
\u0F32~79,5~~9,82~~~~~~~0F32
|
||||
|
||||
// cantillation sign,heavy beat:
|
||||
\tmw8083~80,5~~9,83~~~~~~~0FC0
|
||||
\u0FC0~80,5~~9,83~~~~~~~0FC0
|
||||
// cantillation sign,light beat:
|
||||
\tmw8084~81,5~~9,84~~~~~~~0FC1
|
||||
\u0FC1~81,5~~9,84~~~~~~~0FC1
|
||||
// cantillation sign,cang.te-u:
|
||||
\tmw8085~82,5~~9,85~~~~~~~0FC2
|
||||
\u0FC2~82,5~~9,85~~~~~~~0FC2
|
||||
// cantillation sign sbub.chal:
|
||||
\tmw8086~83,5~~9,86~~~~~~~0FC3
|
||||
\u0FC3~83,5~~9,86~~~~~~~0FC3
|
||||
// zhi.rol.btags:
|
||||
\tmw8087~84,5~~9,87~~~~~~~none
|
||||
\uF03B~84,5~~9,87~~~~~~~none
|
||||
|
||||
// sher.bu:
|
||||
\tmw8088~90,5~~9,88~~~~~~~none
|
||||
\uF039~90,5~~9,88~~~~~~~none
|
||||
// kuruka:
|
||||
\tmw8090~92,5~~9,90~~~~~~~none
|
||||
\uF035~92,5~~9,90~~~~~~~none
|
||||
|
||||
// yungs.drung (reversed):
|
||||
\tmw8097~97,5~~9,97~~~~~~~5350
|
||||
|
@ -978,61 +990,61 @@ r~176,4~~8,71~~~~~~~0FB2
|
|||
\tmw8098~98,5~~9,98~~~~~~~534D
|
||||
|
||||
// mchan rtags trailing:
|
||||
\tmw8099~99,5~~9,99~~~~~~~none
|
||||
\uF038~99,5~~9,99~~~~~~~none
|
||||
// mchan rtags leading:
|
||||
\tmw8100~100,5~~9,100~~~~~~~none
|
||||
\uF037~100,5~~9,100~~~~~~~none
|
||||
|
||||
// che.mgo:
|
||||
\tmw8103~103,5~~9,103~~~~~~~0F38
|
||||
\u0F38~103,5~~9,103~~~~~~~0F38
|
||||
// kuruka:
|
||||
\tmw8104~104,5~~9,104~~~~~~~0FBE
|
||||
\u0FBE~104,5~~9,104~~~~~~~0FBE
|
||||
// Kuruka.mig.lda:
|
||||
\tmw8105~105,5~~9,105~~~~~~~0FBF
|
||||
\u0FBF~105,5~~9,105~~~~~~~0FBF
|
||||
// ornament:
|
||||
\tmw8106~106,5~~9,106~~~~~~~0F36
|
||||
\u0F36~106,5~~9,106~~~~~~~0F36
|
||||
// yang.rtags:
|
||||
\tmw8107~107,5~~9,107~~~~~~~0F87
|
||||
\u0F87~107,5~~9,107~~~~~~~0F87
|
||||
// lci.rtags:
|
||||
\tmw8108~108,5~~9,108~~~~~~~0F86
|
||||
\u0F86~108,5~~9,108~~~~~~~0F86
|
||||
// mchu.can:
|
||||
\tmw8109~109,5~~9,109~~~~~~~0F89
|
||||
\u0F89~109,5~~9,109~~~~~~~0F89
|
||||
// gru.can.rgyings:
|
||||
\tmw8110~110,5~~9,110~~~~~~~0F8A
|
||||
\u0F8A~110,5~~9,110~~~~~~~0F8A
|
||||
// gru.med.gyings:
|
||||
\tmw8111~111,5~~9,111~~~~~~~0F8B
|
||||
\u0F8B~111,5~~9,111~~~~~~~0F8B
|
||||
|
||||
// single white pebble:
|
||||
\tmw8115~115,5~~9,115~~~~~~~0F1A
|
||||
\u0F1A~115,5~~9,115~~~~~~~0F1A
|
||||
// single black pebble:
|
||||
\tmw8116~116,5~~9,116~~~~~~~0F1D
|
||||
\u0F1D~116,5~~9,116~~~~~~~0F1D
|
||||
// double white pebble:
|
||||
\tmw8117~117,5~~9,117~~~~~~~0F1B
|
||||
\u0F1B~117,5~~9,117~~~~~~~0F1B
|
||||
// double black pebble:
|
||||
\tmw8118~118,5~~9,118~~~~~~~0F1E
|
||||
\u0F1E~118,5~~9,118~~~~~~~0F1E
|
||||
// white and black pebble:
|
||||
\tmw8119~119,5~~9,119~~~~~~~0F1F
|
||||
\u0F1F~119,5~~9,119~~~~~~~0F1F
|
||||
// triple white pebble:
|
||||
\tmw8120~120,5~~9,120~~~~~~~0F1C
|
||||
\u0F1C~120,5~~9,120~~~~~~~0F1C
|
||||
// triple black pebble:
|
||||
\tmw8121~121,5~~9,121~~~~~~~0FCF
|
||||
\u0FCF~121,5~~9,121~~~~~~~0FCF
|
||||
|
||||
\tmw8122~122,5~~9,122~~~~~~~none
|
||||
\tmw8123~123,5~~9,123~~~~~~~none
|
||||
\tmw8124~124,5~~9,124~~~~~~~none
|
||||
\tmw8125~125,5~~9,125~~~~~~~none
|
||||
\tmw8126~126,5~~9,126~~~~~~~none
|
||||
\tmw9033~128,5~~10,33~~~~~~~none
|
||||
\uF03C~122,5~~9,122~~~~~~~none
|
||||
\uF03D~123,5~~9,123~~~~~~~none
|
||||
\uF03E~124,5~~9,124~~~~~~~none
|
||||
\uF03F~125,5~~9,125~~~~~~~none
|
||||
\uF040~126,5~~9,126~~~~~~~none
|
||||
\uF041~128,5~~10,33~~~~~~~none
|
||||
|
||||
// logo sign chad.rtags:
|
||||
\tmw9034~129,5~~10,34~~~~~~~0F15
|
||||
\u0F15~129,5~~10,34~~~~~~~0F15
|
||||
// logo sign lhag.rtags:
|
||||
\tmw9035~130,5~~10,35~~~~~~~0F16
|
||||
\u0F16~130,5~~10,35~~~~~~~0F16
|
||||
// sgra.gcan.char.rtags:
|
||||
\tmw9036~131,5~~10,36~~~~~~~0F17
|
||||
\u0F17~131,5~~10,36~~~~~~~0F17
|
||||
// khyud.pa:
|
||||
\tmw9037~132,5~~10,37~~~~~~~0F18
|
||||
\u0F18~132,5~~10,37~~~~~~~0F18
|
||||
// sdong.tshugs:
|
||||
\tmw9038~133,5~~10,38~~~~~~~0F19
|
||||
\u0F19~133,5~~10,38~~~~~~~0F19
|
||||
|
||||
// utsama ka:
|
||||
\tmw2059~57,2~~3,59~1,109~4,120~1,125~1,123~4,106~4,113~f88,f90
|
||||
|
@ -1040,92 +1052,99 @@ r~176,4~~8,71~~~~~~~0FB2
|
|||
\tmw2060~58,2~~3,60~1,109~4,120~1,125~1,123~4,106~4,113~f88,f91
|
||||
|
||||
// tza.'phru:
|
||||
\tmw7067~174,4~~8,67~~~~~~~0F39
|
||||
^~174,4~~8,67~~~~~~~0F39
|
||||
// reversed tza.'phru: (non-reversed is in Unicode, but not this)
|
||||
\tmw7068~145,5~~8,68~~~~~~~
|
||||
\uF034~145,5~~8,68~~~~~~~none
|
||||
// damaru.rtags:
|
||||
\tmw7072~178,4~~8,72~~~~~~~0F88
|
||||
\u0F88~178,4~~8,72~~~~~~~0F88
|
||||
// half a.chen:
|
||||
\tmw7073~179,4~~8,73~~~~~~~0F01
|
||||
\u0F01~179,4~~8,73~~~~~~~0F01
|
||||
|
||||
// ITHI secret sign:
|
||||
//
|
||||
// f68,fa0,f80,f72 comes close, but fa0 might be larger. The OpenType
|
||||
// font will probably have had this very glyph in mind!
|
||||
// font will probably have had this very glyph in mind if that works!
|
||||
// DLC FIXME: No way this is Unicode f68,fa0,f80,f72, though: tha is
|
||||
// small, and gi-gu plus reversed gi-gu together is ill-defined.
|
||||
//
|
||||
// DLC FIXME: WHAT'S THE EWTS?
|
||||
//
|
||||
// ITHI secret sign:
|
||||
\tmw7074~180,4~~8,74~~~~~~~f68,fa0,f80,f72
|
||||
\tmw7074~180,4~~8,74~~~~~~~none
|
||||
|
||||
// Terton's mark:
|
||||
\tmw7075~181,4~~8,75~~~~~~~none
|
||||
\uF023~181,4~~8,75~~~~~~~none
|
||||
// Terton's mark:
|
||||
\tmw7076~182,4~~8,76~~~~~~~none
|
||||
\uF022~182,4~~8,76~~~~~~~none
|
||||
// Terton's mark:
|
||||
\tmw7077~183,4~~8,77~~~~~~~none
|
||||
\uF021~183,4~~8,77~~~~~~~none
|
||||
// Note that this is close to 0f11:
|
||||
// Terton's mark:
|
||||
\tmw7078~149,5~~8,78~~~~~~~none
|
||||
\uF027~149,5~~8,78~~~~~~~none
|
||||
// Terma mark:
|
||||
\tmw7079~184,4~~8,79~~~~~~~none
|
||||
\uF02D~184,4~~8,79~~~~~~~none
|
||||
// Terma mark:
|
||||
\tmw7080~185,4~~8,80~~~~~~~none
|
||||
\uF02E~185,4~~8,80~~~~~~~none
|
||||
// Terma mark:
|
||||
\tmw7081~186,4~~8,81~~~~~~~none
|
||||
\uF02F~186,4~~8,81~~~~~~~none
|
||||
// Mark:
|
||||
\tmw7082~187,4~~8,82~~~~~~~none
|
||||
\uF030~187,4~~8,82~~~~~~~none
|
||||
|
||||
// DLC see Chinese Unicode:
|
||||
// Chinese letter:
|
||||
\tmw9060~155,5~~10,60~~~~~~~none
|
||||
|
||||
// dril.bu:
|
||||
\tmw9062~190,5~~10,62~~~~~~~0FC4
|
||||
\u0FC4~190,5~~10,62~~~~~~~0FC4
|
||||
// rdo.rje:
|
||||
\tmw9063~191,5~~10,63~~~~~~~0FC5
|
||||
\u0FC5~191,5~~10,63~~~~~~~0FC5
|
||||
// padma.gdan:
|
||||
\tmw9064~192,5~~10,64~~~~~~~0FC6
|
||||
\u0FC6~192,5~~10,64~~~~~~~0FC6
|
||||
// rdo.rje.rgya.gram:
|
||||
\tmw9065~193,5~~10,65~~~~~~~0FC7
|
||||
\u0FC7~193,5~~10,65~~~~~~~0FC7
|
||||
// phur.ba:
|
||||
\tmw9066~194,5~~10,66~~~~~~~0FC8
|
||||
\u0FC8~194,5~~10,66~~~~~~~0FC8
|
||||
// nor.bu:
|
||||
\tmw9067~195,5~~10,67~~~~~~~0FC9
|
||||
\u0FC9~195,5~~10,67~~~~~~~0FC9
|
||||
// nor.bu.gnyis.khyil:
|
||||
\tmw9068~196,5~~10,68~~~~~~~0FCA
|
||||
\u0FCA~196,5~~10,68~~~~~~~0FCA
|
||||
// nor.bu.gsum.khyil:
|
||||
\tmw9069~197,5~~10,69~~~~~~~0FCB
|
||||
\u0FCB~197,5~~10,69~~~~~~~0FCB
|
||||
// nor.bu.bzhi.khyil:
|
||||
\tmw9070~198,5~~10,70~~~~~~~0FCC
|
||||
\u0FCC~198,5~~10,70~~~~~~~0FCC
|
||||
|
||||
// bindu + datse + thigle:
|
||||
// bindu + datse + thigle: DLC NOW 0f82 or not? 91,5 is a candidate too
|
||||
// DLC NOW: \uF03A or not? Awaiting Than's reply...
|
||||
\tmw7095~242,1~~8,95~~~~~~~none
|
||||
|
||||
// zhu.yig.mgo.rgyan:
|
||||
\tmw8033~33,5~~9,33~~~~~~~0F0A
|
||||
\u0F0A~33,5~~9,33~~~~~~~0F0A
|
||||
// bka'.shog.mgo.rgyan:
|
||||
\tmw8034~34,5~~9,34~~~~~~~none
|
||||
\uF024~34,5~~9,34~~~~~~~none
|
||||
// mnyam.yig.mgo.rgyan:
|
||||
\tmw8035~35,5~~9,35~~~~~~~none
|
||||
\uF025~35,5~~9,35~~~~~~~none
|
||||
// mnyam.yig.mgo.rgyan:
|
||||
\tmw8036~36,5~~9,36~~~~~~~0F09
|
||||
\u0F09~36,5~~9,36~~~~~~~0F09
|
||||
// nameless sign:
|
||||
\tmw8037~37,5~~9,37~~~~~~~none
|
||||
\uF026~37,5~~9,37~~~~~~~none
|
||||
|
||||
// shad (hooked) + single tsheg:
|
||||
\tmw8044~41,5~~9,44~~~~~~~none
|
||||
\uF02B~41,5~~9,44~~~~~~~none
|
||||
// shad + double tsheg:
|
||||
\tmw8046~42,5~~9,46~~~~~~~none
|
||||
\uF02C~42,5~~9,46~~~~~~~none
|
||||
// sbrul.shad + single ornament:
|
||||
\tmw8048~44,5~~9,48~~~~~~~none
|
||||
\uF028~44,5~~9,48~~~~~~~none
|
||||
// sbrul.shad + double ornament:
|
||||
\tmw8049~46,5~~9,49~~~~~~~none
|
||||
\uF02A~46,5~~9,49~~~~~~~none
|
||||
// sbrul.shad variant form:
|
||||
\tmw8050~47,5~~9,50~~~~~~~none
|
||||
\uF029~47,5~~9,50~~~~~~~none
|
||||
|
||||
// reversed hu:
|
||||
\tmw9043~147,5~~10,43~~~~~~~none
|
||||
\uF032~147,5~~10,43~~~~~~~none
|
||||
// Inverted ha:
|
||||
\tmw9044~148,5~~10,44~~~~~~~none
|
||||
\uF033~148,5~~10,44~~~~~~~none
|
||||
|
||||
// no name:
|
||||
\tmw8091~93,5~~9,91~~~~~~~none
|
||||
\uF036~93,5~~9,91~~~~~~~none
|
||||
// nyi.zla:
|
||||
\tmw8089~91,5~~9,89~~~~~~~0F82
|
||||
\u0F82~91,5~~9,89~~~~~~~0F82
|
||||
|
|
Loading…
Reference in a new issue