Bug fixes. Plus, now 99% in sync with the new EWTS draft. Search for 'DLC' to find a few open issues.

Readded the line for reversed dza; it should never have been deleted, as that breaks TM<->TMW.  I tested the whole mapping by hand once; this incident shows that automation is very helpful.

'{' and '}' were swapped...

The Unicode column for reversed tza.'phru (\tmw7068, now \uF034) was "" (empty), not "none".

+R, +W, +Y, R+ now in use (though more testing is needed)
This commit is contained in:
dchandler 2003-11-24 02:40:40 +00:00
parent 216c5b0d54
commit 08c676c186

View file

@ -10,12 +10,22 @@
// ACIP->Unicode conversion. So keep ACIPRules in sync with this, and be
// sure to run 'ant clean check' after your change.
//
// Note that some glyphs have EWTS \uF021-\uF0FF inclusive. These do
// not have anything in the Unicode column, though, because that code
// is just the EWTS -- if someone wants to convert TMSkt3.183->Unicode
// and get \uF021, let them do that, but our *->Unicode converters
// shouldn't output codes in the PUA without explicit user authorization.
//
// Note that 0F00, 0F02, 0F03, and 0F0E are made by using multiple
// glyphs from TMW. 0F6A is not listed here (DLC FIXME: should it be?),
// but the glyph for it is the glyph for 0F62.
//
// DuffPaneTest ensures that the na-ro column truly contains na-ros,
// by the way.
<?Input:Punctuation?>
//_~32,1~0,32
// ~45,1~0,45~~~~~~~0F0B
// ~45,1~0,45~~~~~~~0FB0
// DLC 0020 or a wider space, perhaps a couple of EM spaces (2003,2003)? Than couldn't say, but he also had thought of U+2003.
_~32,1~~1,32~~~~~~~0020
~45,1~~1,45~~~~~~~0F0B
@ -67,19 +77,19 @@ M~~~8,91~~~~~~~0F7E
// virama:
?~252,1~~8,105~~~~~~~0F84
// rgya.gram.shad:
]~48,5~~9,51~~~~~~~0F12
\u0F12~48,5~~9,51~~~~~~~0F12
// shad + single ornament:
[~43,5~~9,47~~~~~~~0F10
\u0F10~43,5~~9,47~~~~~~~0F10
// gug.rtags.gyon:
<~95,5~~9,95~~~~~~~0F3A
// gug.rtags.gyas:
>~96,5~~9,96~~~~~~~0F3B
// yar.tshes.rtags:
{~134,5~~10,39~~~~~~~0F3E
}~134,5~~10,39~~~~~~~0F3E
// mar.tshes.rtags:
}~135,5~~10,40~~~~~~~0F3F
{~135,5~~10,40~~~~~~~0F3F
// dzud.rtags.me.long.can:
`~94,5~~9,92~~~~~~~0F13
\u0F13~94,5~~9,92~~~~~~~0F13
// hard tsheg:
*~205,1~~1,108~~~~~~~0F0C
@ -216,9 +226,11 @@ au~237,1~~8,89~~~~~~~0F7D~~8,104
// DLC FIXME: need -I as well
<?Input:Sanskrit?>
// 0F5F,0F39 might work, but the OpenType font's author must've had
// Dza in mind if it does. Note that the bottommost horizontal stroke
// goes upward on U+0F5F and downward on U+0F5B.
// the TMSkt4.146 glyph in mind if it does. Note that the bottommost
// horizontal stroke goes upward on U+0F5F and downward on U+0F5B.
\uF031~146,5~~10,42~~~~~~~none
f~153,5~~10,58~1,110~1,118~1,124~1,126~10,114~10,123~0F55,0F39
v~154,5~~10,59~1,110~1,118~1,124~1,126~10,114~10,123~0F56,f39
T~170,1~~1,64~1,109~1,120~1,123~1,125~10,115~10,124~0F4A
@ -812,12 +824,12 @@ ts~224,5~~10,95~1,110~~1,125~1,126~~~0FA9
tsh~225,5~~10,96~1,110~~1,125~1,126~~~0FAA
dz~226,5~~10,97~1,110~~1,125~1,126~~~0FAB
dz+h~227,5~~10,98~1,110~~1,125~1,126~~~0FAC
w~228,5~~10,99~1,109~~1,123~1,125~~~0FBA
W~228,5~~10,99~1,109~~1,123~1,125~~~0FBA
zh~229,5~~10,100~1,109~~1,123~1,125~~~0FAE
z~230,5~~10,101~1,109~~1,123~1,125~~~0FAF
'~231,5~~10,102~1,109~~1,123~1,125~~~0FB0
y~232,5~~10,103~1,109~~1,123~1,125~~~0FBB
r~233,5~~10,104~1,109~~1,123~1,125~~~0FBC
Y~232,5~~10,103~1,109~~1,123~1,125~~~0FBB
R~233,5~~10,104~1,109~~1,123~1,125~~~0FBC
l~234,5~~10,105~1,109~~1,123~1,125~~~0FB3
sh~235,5~~10,106~1,109~~1,123~1,125~~~0FB4
Sh~236,5~~10,107~1,109~~1,123~1,125~~~0FB5
@ -945,32 +957,32 @@ r~176,4~~8,71~~~~~~~0FB2
<?Ignore?>
// DLC EWTS doesn't give mappings for these half numerals...
\tmw8073~70,5~~9,73~~~~~~~0F33
\tmw8074~71,5~~9,74~~~~~~~0F2A
\tmw8075~72,5~~9,75~~~~~~~0F2B
\tmw8076~73,5~~9,76~~~~~~~0F2C
\tmw8077~74,5~~9,77~~~~~~~0F2D
\tmw8078~75,5~~9,78~~~~~~~0F2E
\tmw8079~76,5~~9,79~~~~~~~0F2F
\tmw8080~77,5~~9,80~~~~~~~0F30
\tmw8081~78,5~~9,81~~~~~~~0F31
\tmw8082~79,5~~9,82~~~~~~~0F32
\u0F33~70,5~~9,73~~~~~~~0F33
\u0F2A~71,5~~9,74~~~~~~~0F2A
\u0F2B~72,5~~9,75~~~~~~~0F2B
\u0F2C~73,5~~9,76~~~~~~~0F2C
\u0F2D~74,5~~9,77~~~~~~~0F2D
\u0F2E~75,5~~9,78~~~~~~~0F2E
\u0F2F~76,5~~9,79~~~~~~~0F2F
\u0F30~77,5~~9,80~~~~~~~0F30
\u0F31~78,5~~9,81~~~~~~~0F31
\u0F32~79,5~~9,82~~~~~~~0F32
// cantillation sign,heavy beat:
\tmw8083~80,5~~9,83~~~~~~~0FC0
\u0FC0~80,5~~9,83~~~~~~~0FC0
// cantillation sign,light beat:
\tmw8084~81,5~~9,84~~~~~~~0FC1
\u0FC1~81,5~~9,84~~~~~~~0FC1
// cantillation sign,cang.te-u:
\tmw8085~82,5~~9,85~~~~~~~0FC2
\u0FC2~82,5~~9,85~~~~~~~0FC2
// cantillation sign,sbub.chal:
\tmw8086~83,5~~9,86~~~~~~~0FC3
\u0FC3~83,5~~9,86~~~~~~~0FC3
// zhi.rol.btags:
\tmw8087~84,5~~9,87~~~~~~~none
\uF03B~84,5~~9,87~~~~~~~none
// sher.bu:
\tmw8088~90,5~~9,88~~~~~~~none
\uF039~90,5~~9,88~~~~~~~none
// kuruka:
\tmw8090~92,5~~9,90~~~~~~~none
\uF035~92,5~~9,90~~~~~~~none
// yungs.drung (reversed):
\tmw8097~97,5~~9,97~~~~~~~5350
@ -978,61 +990,61 @@ r~176,4~~8,71~~~~~~~0FB2
\tmw8098~98,5~~9,98~~~~~~~534D
// mchan rtags trailing:
\tmw8099~99,5~~9,99~~~~~~~none
\uF038~99,5~~9,99~~~~~~~none
// mchan rtags leading:
\tmw8100~100,5~~9,100~~~~~~~none
\uF037~100,5~~9,100~~~~~~~none
// che.mgo:
\tmw8103~103,5~~9,103~~~~~~~0F38
\u0F38~103,5~~9,103~~~~~~~0F38
// kuruka:
\tmw8104~104,5~~9,104~~~~~~~0FBE
\u0FBE~104,5~~9,104~~~~~~~0FBE
// Kuruka.mig.lda:
\tmw8105~105,5~~9,105~~~~~~~0FBF
\u0FBF~105,5~~9,105~~~~~~~0FBF
// ornament:
\tmw8106~106,5~~9,106~~~~~~~0F36
\u0F36~106,5~~9,106~~~~~~~0F36
// yang.rtags:
\tmw8107~107,5~~9,107~~~~~~~0F87
\u0F87~107,5~~9,107~~~~~~~0F87
// lci.rtags:
\tmw8108~108,5~~9,108~~~~~~~0F86
\u0F86~108,5~~9,108~~~~~~~0F86
// mchu.can:
\tmw8109~109,5~~9,109~~~~~~~0F89
\u0F89~109,5~~9,109~~~~~~~0F89
// gru.can.rgyings:
\tmw8110~110,5~~9,110~~~~~~~0F8A
\u0F8A~110,5~~9,110~~~~~~~0F8A
// gru.med.rgyings:
\tmw8111~111,5~~9,111~~~~~~~0F8B
\u0F8B~111,5~~9,111~~~~~~~0F8B
// single white pebble:
\tmw8115~115,5~~9,115~~~~~~~0F1A
\u0F1A~115,5~~9,115~~~~~~~0F1A
// single black pebble:
\tmw8116~116,5~~9,116~~~~~~~0F1D
\u0F1D~116,5~~9,116~~~~~~~0F1D
// double white pebble:
\tmw8117~117,5~~9,117~~~~~~~0F1B
\u0F1B~117,5~~9,117~~~~~~~0F1B
// double black pebble:
\tmw8118~118,5~~9,118~~~~~~~0F1E
\u0F1E~118,5~~9,118~~~~~~~0F1E
// white and black pebble:
\tmw8119~119,5~~9,119~~~~~~~0F1F
\u0F1F~119,5~~9,119~~~~~~~0F1F
// triple white pebble:
\tmw8120~120,5~~9,120~~~~~~~0F1C
\u0F1C~120,5~~9,120~~~~~~~0F1C
// triple black pebble:
\tmw8121~121,5~~9,121~~~~~~~0FCF
\u0FCF~121,5~~9,121~~~~~~~0FCF
\tmw8122~122,5~~9,122~~~~~~~none
\tmw8123~123,5~~9,123~~~~~~~none
\tmw8124~124,5~~9,124~~~~~~~none
\tmw8125~125,5~~9,125~~~~~~~none
\tmw8126~126,5~~9,126~~~~~~~none
\tmw9033~128,5~~10,33~~~~~~~none
\uF03C~122,5~~9,122~~~~~~~none
\uF03D~123,5~~9,123~~~~~~~none
\uF03E~124,5~~9,124~~~~~~~none
\uF03F~125,5~~9,125~~~~~~~none
\uF040~126,5~~9,126~~~~~~~none
\uF041~128,5~~10,33~~~~~~~none
// logo sign chad.rtags:
\tmw9034~129,5~~10,34~~~~~~~0F15
\u0F15~129,5~~10,34~~~~~~~0F15
// logo sign lhag.rtags:
\tmw9035~130,5~~10,35~~~~~~~0F16
\u0F16~130,5~~10,35~~~~~~~0F16
// sgra.gcan.char.rtags:
\tmw9036~131,5~~10,36~~~~~~~0F17
\u0F17~131,5~~10,36~~~~~~~0F17
// khyud.pa:
\tmw9037~132,5~~10,37~~~~~~~0F18
\u0F18~132,5~~10,37~~~~~~~0F18
// sdong.tshugs:
\tmw9038~133,5~~10,38~~~~~~~0F19
\u0F19~133,5~~10,38~~~~~~~0F19
// utsama ka:
\tmw2059~57,2~~3,59~1,109~4,120~1,125~1,123~4,106~4,113~f88,f90
@ -1040,92 +1052,99 @@ r~176,4~~8,71~~~~~~~0FB2
\tmw2060~58,2~~3,60~1,109~4,120~1,125~1,123~4,106~4,113~f88,f91
// tza.'phru:
\tmw7067~174,4~~8,67~~~~~~~0F39
^~174,4~~8,67~~~~~~~0F39
// reversed tza.'phru: (non-reversed is in Unicode, but not this)
\tmw7068~145,5~~8,68~~~~~~~
\uF034~145,5~~8,68~~~~~~~none
// damaru.rtags:
\tmw7072~178,4~~8,72~~~~~~~0F88
\u0F88~178,4~~8,72~~~~~~~0F88
// half a.chen:
\tmw7073~179,4~~8,73~~~~~~~0F01
\u0F01~179,4~~8,73~~~~~~~0F01
// ITHI secret sign:
//
// f68,fa0,f80,f72 comes close, but fa0 might be larger. The OpenType
// font will probably have had this very glyph in mind!
// font will probably have had this very glyph in mind if that works!
// DLC FIXME: No way this is Unicode f68,fa0,f80,f72, though: tha is
// small, and gi-gu plus reversed gi-gu together is ill-defined.
//
// DLC FIXME: WHAT'S THE EWTS?
//
// ITHI secret sign:
\tmw7074~180,4~~8,74~~~~~~~f68,fa0,f80,f72
\tmw7074~180,4~~8,74~~~~~~~none
// Terton's mark:
\tmw7075~181,4~~8,75~~~~~~~none
\uF023~181,4~~8,75~~~~~~~none
// Terton's mark:
\tmw7076~182,4~~8,76~~~~~~~none
\uF022~182,4~~8,76~~~~~~~none
// Terton's mark:
\tmw7077~183,4~~8,77~~~~~~~none
\uF021~183,4~~8,77~~~~~~~none
// Note that this is close to 0f11:
// Terton's mark:
\tmw7078~149,5~~8,78~~~~~~~none
\uF027~149,5~~8,78~~~~~~~none
// Terma mark:
\tmw7079~184,4~~8,79~~~~~~~none
\uF02D~184,4~~8,79~~~~~~~none
// Terma mark:
\tmw7080~185,4~~8,80~~~~~~~none
\uF02E~185,4~~8,80~~~~~~~none
// Terma mark:
\tmw7081~186,4~~8,81~~~~~~~none
\uF02F~186,4~~8,81~~~~~~~none
// Mark:
\tmw7082~187,4~~8,82~~~~~~~none
\uF030~187,4~~8,82~~~~~~~none
// DLC see chinese unicode:
// Chinese letter:
\tmw9060~155,5~~10,60~~~~~~~none
// dril.bu:
\tmw9062~190,5~~10,62~~~~~~~0FC4
\u0FC4~190,5~~10,62~~~~~~~0FC4
// rdo.rje:
\tmw9063~191,5~~10,63~~~~~~~0FC5
\u0FC5~191,5~~10,63~~~~~~~0FC5
// padma.gdan:
\tmw9064~192,5~~10,64~~~~~~~0FC6
\u0FC6~192,5~~10,64~~~~~~~0FC6
// rdo.rje.rgya.gram:
\tmw9065~193,5~~10,65~~~~~~~0FC7
\u0FC7~193,5~~10,65~~~~~~~0FC7
// phur.ba:
\tmw9066~194,5~~10,66~~~~~~~0FC8
\u0FC8~194,5~~10,66~~~~~~~0FC8
// nor.bu:
\tmw9067~195,5~~10,67~~~~~~~0FC9
\u0FC9~195,5~~10,67~~~~~~~0FC9
// nor.bu.gnyis.khyil:
\tmw9068~196,5~~10,68~~~~~~~0FCA
\u0FCA~196,5~~10,68~~~~~~~0FCA
// nor.bu.gsum.khyil:
\tmw9069~197,5~~10,69~~~~~~~0FCB
\u0FCB~197,5~~10,69~~~~~~~0FCB
// nor.bu.bzhi.khyil:
\tmw9070~198,5~~10,70~~~~~~~0FCC
\u0FCC~198,5~~10,70~~~~~~~0FCC
// bindu + datse + thigle:
// bindu + datse + thigle: DLC NOW 0f82 or not? 91,5 is a candidate too
// DLC NOW: \uF03A or not? Awaiting Than's reply...
\tmw7095~242,1~~8,95~~~~~~~none
// zhu.yig.mgo.rgyan:
\tmw8033~33,5~~9,33~~~~~~~0F0A
\u0F0A~33,5~~9,33~~~~~~~0F0A
// bka'.shog.mgo.rgyan:
\tmw8034~34,5~~9,34~~~~~~~none
\uF024~34,5~~9,34~~~~~~~none
// mnyam.yig.mgo.rgyan:
\tmw8035~35,5~~9,35~~~~~~~none
\uF025~35,5~~9,35~~~~~~~none
// mnyam.yig.mgo.rgyan:
\tmw8036~36,5~~9,36~~~~~~~0F09
\u0F09~36,5~~9,36~~~~~~~0F09
// nameless sign:
\tmw8037~37,5~~9,37~~~~~~~none
\uF026~37,5~~9,37~~~~~~~none
// shad (hooked) + single tsheg:
\tmw8044~41,5~~9,44~~~~~~~none
\uF02B~41,5~~9,44~~~~~~~none
// shad + double tsheg:
\tmw8046~42,5~~9,46~~~~~~~none
\uF02C~42,5~~9,46~~~~~~~none
// sbrul.shad + single ornament:
\tmw8048~44,5~~9,48~~~~~~~none
\uF028~44,5~~9,48~~~~~~~none
// sbrul.shad + double ornament:
\tmw8049~46,5~~9,49~~~~~~~none
\uF02A~46,5~~9,49~~~~~~~none
// sbrul.shad variant form:
\tmw8050~47,5~~9,50~~~~~~~none
\uF029~47,5~~9,50~~~~~~~none
// reversed hu:
\tmw9043~147,5~~10,43~~~~~~~none
\uF032~147,5~~10,43~~~~~~~none
// Inverted ha:
\tmw9044~148,5~~10,44~~~~~~~none
\uF033~148,5~~10,44~~~~~~~none
// no name:
\tmw8091~93,5~~9,91~~~~~~~none
\uF036~93,5~~9,91~~~~~~~none
// nyi.zla:
\tmw8089~91,5~~9,89~~~~~~~0F82
\u0F82~91,5~~9,89~~~~~~~0F82