Bug fixes. Plus, now 99% in sync with the new EWTS draft. Search for 'DLC' to find a few open issues.

Re-added the line for reversed dza; it should never have been deleted, as deleting it breaks TM<->TMW.  I tested the whole mapping by hand once; this incident shows that automation is very helpful.

'{' and '}' were swapped...

The Unicode column for reversed tza.'phru (\tmw7068, now \uF034) was "", not "none".

+R, +W, +Y, R+ now in use (though more testing is needed)
This commit is contained in:
dchandler 2003-11-24 02:40:40 +00:00
parent 216c5b0d54
commit 08c676c186

View file

@ -10,12 +10,22 @@
// ACIP->Unicode conversion. So keep ACIPRules in sync with this, and be // ACIP->Unicode conversion. So keep ACIPRules in sync with this, and be
// sure to run 'ant clean check' after your change. // sure to run 'ant clean check' after your change.
// //
// Note that some glyphs have EWTS \uF021-\uF0FF inclusive. These do
// not have anything in the Unicode column, though, because this is just
// the EWTS -- if someone wants to convert TMSkt3.183->Unicode and get
// \uF021, let them do that, but our *->Unicode converters shouldn't
// output codes in the PUA without explicit user authorization.
//
// Note that 0F00, 0F02, 0F03, and 0F0E are made by using multiple
// glyphs from TMW. 0F6A is not listed here (DLC FIXME: should it be?),
// but the glyph for it is the glyph for 0F62.
//
// DuffPaneTest ensures that the na-ro column truly contains na-ros, // DuffPaneTest ensures that the na-ro column truly contains na-ros,
// by the way. // by the way.
<?Input:Punctuation?> <?Input:Punctuation?>
//_~32,1~0,32 //_~32,1~0,32
// ~45,1~0,45~~~~~~~0F0B // ~45,1~0,45~~~~~~~0F0B
// DLC 0020 or a wider space, perhaps a couple of EM spaces (2003,2003)? Than couldn't say, but he also had thought of U+2003. // DLC 0020 or a wider space, perhaps a couple of EM spaces (2003,2003)? Than couldn't say, but he also had thought of U+2003.
_~32,1~~1,32~~~~~~~0020 _~32,1~~1,32~~~~~~~0020
~45,1~~1,45~~~~~~~0F0B ~45,1~~1,45~~~~~~~0F0B
@ -67,19 +77,19 @@ M~~~8,91~~~~~~~0F7E
// virama: // virama:
?~252,1~~8,105~~~~~~~0F84 ?~252,1~~8,105~~~~~~~0F84
// rgya.gram.shad: // rgya.gram.shad:
]~48,5~~9,51~~~~~~~0F12 \u0F12~48,5~~9,51~~~~~~~0F12
// shad + single ornament: // shad + single ornament:
[~43,5~~9,47~~~~~~~0F10 \u0F10~43,5~~9,47~~~~~~~0F10
// gug.rtags.gyon: // gug.rtags.gyon:
<~95,5~~9,95~~~~~~~0F3A <~95,5~~9,95~~~~~~~0F3A
// gug.rtags.gyas: // gug.rtags.gyas:
>~96,5~~9,96~~~~~~~0F3B >~96,5~~9,96~~~~~~~0F3B
// yar.tshes.rtags: // yar.tshes.rtags:
{~134,5~~10,39~~~~~~~0F3E }~134,5~~10,39~~~~~~~0F3E
// mar.tshes.rtags // mar.tshes.rtags
}~135,5~~10,40~~~~~~~0F3F {~135,5~~10,40~~~~~~~0F3F
// dzud.rtags.me.long.can: // dzud.rtags.me.long.can:
`~94,5~~9,92~~~~~~~0F13 \u0F13~94,5~~9,92~~~~~~~0F13
// hard tsheg: // hard tsheg:
*~205,1~~1,108~~~~~~~0F0C *~205,1~~1,108~~~~~~~0F0C
@ -216,9 +226,11 @@ au~237,1~~8,89~~~~~~~0F7D~~8,104
// DLC FIXME: need -I as well // DLC FIXME: need -I as well
<?Input:Sanskrit?> <?Input:Sanskrit?>
// 0F5F,0F39 might work, but the OpenType font's author must've had // 0F5F,0F39 might work, but the OpenType font's author must've had
// Dza in mind if it does. Note that the bottommost horizontal stroke // the TMSkt4.146 glyph in mind if it does. Note that the bottommost
// goes upward on U+0F5F and downward on U+0F5B. // horizontal stroke goes upward on U+0F5F and downward on U+0F5B.
\uF031~146,5~~10,42~~~~~~~none
f~153,5~~10,58~1,110~1,118~1,124~1,126~10,114~10,123~0F55,0F39 f~153,5~~10,58~1,110~1,118~1,124~1,126~10,114~10,123~0F55,0F39
v~154,5~~10,59~1,110~1,118~1,124~1,126~10,114~10,123~0F56,f39 v~154,5~~10,59~1,110~1,118~1,124~1,126~10,114~10,123~0F56,f39
T~170,1~~1,64~1,109~1,120~1,123~1,125~10,115~10,124~0F4A T~170,1~~1,64~1,109~1,120~1,123~1,125~10,115~10,124~0F4A
@ -812,12 +824,12 @@ ts~224,5~~10,95~1,110~~1,125~1,126~~~0FA9
tsh~225,5~~10,96~1,110~~1,125~1,126~~~0FAA tsh~225,5~~10,96~1,110~~1,125~1,126~~~0FAA
dz~226,5~~10,97~1,110~~1,125~1,126~~~0FAB dz~226,5~~10,97~1,110~~1,125~1,126~~~0FAB
dz+h~227,5~~10,98~1,110~~1,125~1,126~~~0FAC dz+h~227,5~~10,98~1,110~~1,125~1,126~~~0FAC
w~228,5~~10,99~1,109~~1,123~1,125~~~0FBA W~228,5~~10,99~1,109~~1,123~1,125~~~0FBA
zh~229,5~~10,100~1,109~~1,123~1,125~~~0FAE zh~229,5~~10,100~1,109~~1,123~1,125~~~0FAE
z~230,5~~10,101~1,109~~1,123~1,125~~~0FAF z~230,5~~10,101~1,109~~1,123~1,125~~~0FAF
'~231,5~~10,102~1,109~~1,123~1,125~~~0FB0 '~231,5~~10,102~1,109~~1,123~1,125~~~0FB0
y~232,5~~10,103~1,109~~1,123~1,125~~~0FBB Y~232,5~~10,103~1,109~~1,123~1,125~~~0FBB
r~233,5~~10,104~1,109~~1,123~1,125~~~0FBC R~233,5~~10,104~1,109~~1,123~1,125~~~0FBC
l~234,5~~10,105~1,109~~1,123~1,125~~~0FB3 l~234,5~~10,105~1,109~~1,123~1,125~~~0FB3
sh~235,5~~10,106~1,109~~1,123~1,125~~~0FB4 sh~235,5~~10,106~1,109~~1,123~1,125~~~0FB4
Sh~236,5~~10,107~1,109~~1,123~1,125~~~0FB5 Sh~236,5~~10,107~1,109~~1,123~1,125~~~0FB5
@ -945,32 +957,32 @@ r~176,4~~8,71~~~~~~~0FB2
<?Ignore?> <?Ignore?>
// DLC EWTS doesn't give mappings for these half numerals... // DLC EWTS doesn't give mappings for these half numerals...
\tmw8073~70,5~~9,73~~~~~~~0F33 \u0F33~70,5~~9,73~~~~~~~0F33
\tmw8074~71,5~~9,74~~~~~~~0F2A \u0F2A~71,5~~9,74~~~~~~~0F2A
\tmw8075~72,5~~9,75~~~~~~~0F2B \u0F2B~72,5~~9,75~~~~~~~0F2B
\tmw8076~73,5~~9,76~~~~~~~0F2C \u0F2C~73,5~~9,76~~~~~~~0F2C
\tmw8077~74,5~~9,77~~~~~~~0F2D \u0F2D~74,5~~9,77~~~~~~~0F2D
\tmw8078~75,5~~9,78~~~~~~~0F2E \u0F2E~75,5~~9,78~~~~~~~0F2E
\tmw8079~76,5~~9,79~~~~~~~0F2F \u0F2F~76,5~~9,79~~~~~~~0F2F
\tmw8080~77,5~~9,80~~~~~~~0F30 \u0F30~77,5~~9,80~~~~~~~0F30
\tmw8081~78,5~~9,81~~~~~~~0F31 \u0F31~78,5~~9,81~~~~~~~0F31
\tmw8082~79,5~~9,82~~~~~~~0F32 \u0F32~79,5~~9,82~~~~~~~0F32
// cantillation sign,heavy beat: // cantillation sign,heavy beat:
\tmw8083~80,5~~9,83~~~~~~~0FC0 \u0FC0~80,5~~9,83~~~~~~~0FC0
// cantillation sign,light beat: // cantillation sign,light beat:
\tmw8084~81,5~~9,84~~~~~~~0FC1 \u0FC1~81,5~~9,84~~~~~~~0FC1
// cantillation sign,cang.te-u: // cantillation sign,cang.te-u:
\tmw8085~82,5~~9,85~~~~~~~0FC2 \u0FC2~82,5~~9,85~~~~~~~0FC2
// cantillation sign sbub.chal: // cantillation sign sbub.chal:
\tmw8086~83,5~~9,86~~~~~~~0FC3 \u0FC3~83,5~~9,86~~~~~~~0FC3
// zhi.rol.btags: // zhi.rol.btags:
\tmw8087~84,5~~9,87~~~~~~~none \uF03B~84,5~~9,87~~~~~~~none
// sher.bu: // sher.bu:
\tmw8088~90,5~~9,88~~~~~~~none \uF039~90,5~~9,88~~~~~~~none
// kuruka: // kuruka:
\tmw8090~92,5~~9,90~~~~~~~none \uF035~92,5~~9,90~~~~~~~none
// yungs.drung (reversed): // yungs.drung (reversed):
\tmw8097~97,5~~9,97~~~~~~~5350 \tmw8097~97,5~~9,97~~~~~~~5350
@ -978,61 +990,61 @@ r~176,4~~8,71~~~~~~~0FB2
\tmw8098~98,5~~9,98~~~~~~~534D \tmw8098~98,5~~9,98~~~~~~~534D
// mchan rtags trailing: // mchan rtags trailing:
\tmw8099~99,5~~9,99~~~~~~~none \uF038~99,5~~9,99~~~~~~~none
// mchan rtags leading: // mchan rtags leading:
\tmw8100~100,5~~9,100~~~~~~~none \uF037~100,5~~9,100~~~~~~~none
// che.mgo: // che.mgo:
\tmw8103~103,5~~9,103~~~~~~~0F38 \u0F38~103,5~~9,103~~~~~~~0F38
// kuruka: // kuruka:
\tmw8104~104,5~~9,104~~~~~~~0FBE \u0FBE~104,5~~9,104~~~~~~~0FBE
// Kuruka.mig.lda: // Kuruka.mig.lda:
\tmw8105~105,5~~9,105~~~~~~~0FBF \u0FBF~105,5~~9,105~~~~~~~0FBF
// ornament: // ornament:
\tmw8106~106,5~~9,106~~~~~~~0F36 \u0F36~106,5~~9,106~~~~~~~0F36
// yang.rtags: // yang.rtags:
\tmw8107~107,5~~9,107~~~~~~~0F87 \u0F87~107,5~~9,107~~~~~~~0F87
// lci.rtags: // lci.rtags:
\tmw8108~108,5~~9,108~~~~~~~0F86 \u0F86~108,5~~9,108~~~~~~~0F86
// mchu.can: // mchu.can:
\tmw8109~109,5~~9,109~~~~~~~0F89 \u0F89~109,5~~9,109~~~~~~~0F89
// gru.can.rgyings: // gru.can.rgyings:
\tmw8110~110,5~~9,110~~~~~~~0F8A \u0F8A~110,5~~9,110~~~~~~~0F8A
// gru.med.gyings: // gru.med.gyings:
\tmw8111~111,5~~9,111~~~~~~~0F8B \u0F8B~111,5~~9,111~~~~~~~0F8B
// single white pebble: // single white pebble:
\tmw8115~115,5~~9,115~~~~~~~0F1A \u0F1A~115,5~~9,115~~~~~~~0F1A
// single black pebble: // single black pebble:
\tmw8116~116,5~~9,116~~~~~~~0F1D \u0F1D~116,5~~9,116~~~~~~~0F1D
// double white pebble: // double white pebble:
\tmw8117~117,5~~9,117~~~~~~~0F1B \u0F1B~117,5~~9,117~~~~~~~0F1B
// double black pebble: // double black pebble:
\tmw8118~118,5~~9,118~~~~~~~0F1E \u0F1E~118,5~~9,118~~~~~~~0F1E
// white and black pebble: // white and black pebble:
\tmw8119~119,5~~9,119~~~~~~~0F1F \u0F1F~119,5~~9,119~~~~~~~0F1F
// triple white pebble: // triple white pebble:
\tmw8120~120,5~~9,120~~~~~~~0F1C \u0F1C~120,5~~9,120~~~~~~~0F1C
// triple black pebble: // triple black pebble:
\tmw8121~121,5~~9,121~~~~~~~0FCF \u0FCF~121,5~~9,121~~~~~~~0FCF
\tmw8122~122,5~~9,122~~~~~~~none \uF03C~122,5~~9,122~~~~~~~none
\tmw8123~123,5~~9,123~~~~~~~none \uF03D~123,5~~9,123~~~~~~~none
\tmw8124~124,5~~9,124~~~~~~~none \uF03E~124,5~~9,124~~~~~~~none
\tmw8125~125,5~~9,125~~~~~~~none \uF03F~125,5~~9,125~~~~~~~none
\tmw8126~126,5~~9,126~~~~~~~none \uF040~126,5~~9,126~~~~~~~none
\tmw9033~128,5~~10,33~~~~~~~none \uF041~128,5~~10,33~~~~~~~none
// logo sign chad.rtags: // logo sign chad.rtags:
\tmw9034~129,5~~10,34~~~~~~~0F15 \u0F15~129,5~~10,34~~~~~~~0F15
// logo sign lhag.rtags: // logo sign lhag.rtags:
\tmw9035~130,5~~10,35~~~~~~~0F16 \u0F16~130,5~~10,35~~~~~~~0F16
// sgra.gcan.char.rtags: // sgra.gcan.char.rtags:
\tmw9036~131,5~~10,36~~~~~~~0F17 \u0F17~131,5~~10,36~~~~~~~0F17
// khyud.pa: // khyud.pa:
\tmw9037~132,5~~10,37~~~~~~~0F18 \u0F18~132,5~~10,37~~~~~~~0F18
// sdong.tshugs: // sdong.tshugs:
\tmw9038~133,5~~10,38~~~~~~~0F19 \u0F19~133,5~~10,38~~~~~~~0F19
// utsama ka: // utsama ka:
\tmw2059~57,2~~3,59~1,109~4,120~1,125~1,123~4,106~4,113~f88,f90 \tmw2059~57,2~~3,59~1,109~4,120~1,125~1,123~4,106~4,113~f88,f90
@ -1040,92 +1052,99 @@ r~176,4~~8,71~~~~~~~0FB2
\tmw2060~58,2~~3,60~1,109~4,120~1,125~1,123~4,106~4,113~f88,f91 \tmw2060~58,2~~3,60~1,109~4,120~1,125~1,123~4,106~4,113~f88,f91
// tza.'phru: // tza.'phru:
\tmw7067~174,4~~8,67~~~~~~~0F39 ^~174,4~~8,67~~~~~~~0F39
// reversed tza.'phru: (non-reversed is in Unicode, but not this) // reversed tza.'phru: (non-reversed is in Unicode, but not this)
\tmw7068~145,5~~8,68~~~~~~~ \uF034~145,5~~8,68~~~~~~~none
// damaru.rtags: // damaru.rtags:
\tmw7072~178,4~~8,72~~~~~~~0F88 \u0F88~178,4~~8,72~~~~~~~0F88
// half a.chen: // half a.chen:
\tmw7073~179,4~~8,73~~~~~~~0F01 \u0F01~179,4~~8,73~~~~~~~0F01
// ITHI secret sign:
//
// f68,fa0,f80,f72 comes close, but fa0 might be larger. The OpenType // f68,fa0,f80,f72 comes close, but fa0 might be larger. The OpenType
// font will probably have had this very glyph in mind! // font will probably have had this very glyph in mind if that works!
// DLC FIXME: No way this is Unicode f68,fa0,f80,f72, though: tha is
// small, and gi-gu plus reversed gi-gu together is ill-defined.
//
// DLC FIXME: WHAT'S THE EWTS?
// //
// ITHI secret sign: // ITHI secret sign:
\tmw7074~180,4~~8,74~~~~~~~f68,fa0,f80,f72 \tmw7074~180,4~~8,74~~~~~~~none
// Terton's mark: // Terton's mark:
\tmw7075~181,4~~8,75~~~~~~~none \uF023~181,4~~8,75~~~~~~~none
// Terton's mark: // Terton's mark:
\tmw7076~182,4~~8,76~~~~~~~none \uF022~182,4~~8,76~~~~~~~none
// Terton's mark: // Terton's mark:
\tmw7077~183,4~~8,77~~~~~~~none \uF021~183,4~~8,77~~~~~~~none
// Note that this is close to 0f11: // Note that this is close to 0f11:
// Terton's mark: // Terton's mark:
\tmw7078~149,5~~8,78~~~~~~~none \uF027~149,5~~8,78~~~~~~~none
// Terma mark: // Terma mark:
\tmw7079~184,4~~8,79~~~~~~~none \uF02D~184,4~~8,79~~~~~~~none
// Terma mark: // Terma mark:
\tmw7080~185,4~~8,80~~~~~~~none \uF02E~185,4~~8,80~~~~~~~none
// Terma mark: // Terma mark:
\tmw7081~186,4~~8,81~~~~~~~none \uF02F~186,4~~8,81~~~~~~~none
// Mark: // Mark:
\tmw7082~187,4~~8,82~~~~~~~none \uF030~187,4~~8,82~~~~~~~none
// DLC see chinese unicode: // DLC see chinese unicode:
// Chinese letter: // Chinese letter:
\tmw9060~155,5~~10,60~~~~~~~none \tmw9060~155,5~~10,60~~~~~~~none
// dril.bu: // dril.bu:
\tmw9062~190,5~~10,62~~~~~~~0FC4 \u0FC4~190,5~~10,62~~~~~~~0FC4
// rdo.rje: // rdo.rje:
\tmw9063~191,5~~10,63~~~~~~~0FC5 \u0FC5~191,5~~10,63~~~~~~~0FC5
// padma.gdan: // padma.gdan:
\tmw9064~192,5~~10,64~~~~~~~0FC6 \u0FC6~192,5~~10,64~~~~~~~0FC6
// rdo.rje.rgya.gram: // rdo.rje.rgya.gram:
\tmw9065~193,5~~10,65~~~~~~~0FC7 \u0FC7~193,5~~10,65~~~~~~~0FC7
// phur.ba: // phur.ba:
\tmw9066~194,5~~10,66~~~~~~~0FC8 \u0FC8~194,5~~10,66~~~~~~~0FC8
// nor.bu: // nor.bu:
\tmw9067~195,5~~10,67~~~~~~~0FC9 \u0FC9~195,5~~10,67~~~~~~~0FC9
// nor.bu.gnyis.khyil: // nor.bu.gnyis.khyil:
\tmw9068~196,5~~10,68~~~~~~~0FCA \u0FCA~196,5~~10,68~~~~~~~0FCA
// nor.bu.gsum.khyil: // nor.bu.gsum.khyil:
\tmw9069~197,5~~10,69~~~~~~~0FCB \u0FCB~197,5~~10,69~~~~~~~0FCB
// nor.bu.bzhi.khyil: // nor.bu.bzhi.khyil:
\tmw9070~198,5~~10,70~~~~~~~0FCC \u0FCC~198,5~~10,70~~~~~~~0FCC
// bindu + datse + thigle: // bindu + datse + thigle: DLC NOW 0f82 or not? 91,5 is a candidate too
// DLC NOW: \uF03A or not? Awaiting Than's reply...
\tmw7095~242,1~~8,95~~~~~~~none \tmw7095~242,1~~8,95~~~~~~~none
// zhu.yig.mgo.rgyan: // zhu.yig.mgo.rgyan:
\tmw8033~33,5~~9,33~~~~~~~0F0A \u0F0A~33,5~~9,33~~~~~~~0F0A
// bka'.shog.mgo.rgyan: // bka'.shog.mgo.rgyan:
\tmw8034~34,5~~9,34~~~~~~~none \uF024~34,5~~9,34~~~~~~~none
// mnyam.yig.mgo.rgyan: // mnyam.yig.mgo.rgyan:
\tmw8035~35,5~~9,35~~~~~~~none \uF025~35,5~~9,35~~~~~~~none
// mnyam.yig.mgo.rgyan: // mnyam.yig.mgo.rgyan:
\tmw8036~36,5~~9,36~~~~~~~0F09 \u0F09~36,5~~9,36~~~~~~~0F09
// nameless sign: // nameless sign:
\tmw8037~37,5~~9,37~~~~~~~none \uF026~37,5~~9,37~~~~~~~none
// shad (hooked) + single tsheg: // shad (hooked) + single tsheg:
\tmw8044~41,5~~9,44~~~~~~~none \uF02B~41,5~~9,44~~~~~~~none
// shad + double tsheg: // shad + double tsheg:
\tmw8046~42,5~~9,46~~~~~~~none \uF02C~42,5~~9,46~~~~~~~none
// sbrul.shad + single ornament: // sbrul.shad + single ornament:
\tmw8048~44,5~~9,48~~~~~~~none \uF028~44,5~~9,48~~~~~~~none
// sbrul.shad + double ornament: // sbrul.shad + double ornament:
\tmw8049~46,5~~9,49~~~~~~~none \uF02A~46,5~~9,49~~~~~~~none
// sbrul.shad variant form: // sbrul.shad variant form:
\tmw8050~47,5~~9,50~~~~~~~none \uF029~47,5~~9,50~~~~~~~none
// reversed hu: // reversed hu:
\tmw9043~147,5~~10,43~~~~~~~none \uF032~147,5~~10,43~~~~~~~none
// Inverted ha: // Inverted ha:
\tmw9044~148,5~~10,44~~~~~~~none \uF033~148,5~~10,44~~~~~~~none
// no name: // no name:
\tmw8091~93,5~~9,91~~~~~~~none \uF036~93,5~~9,91~~~~~~~none
// nyi.zla: // nyi.zla:
\tmw8089~91,5~~9,89~~~~~~~0F82 \u0F82~91,5~~9,89~~~~~~~0F82