ACIP->Unicode, without going through TMW, is now possible, so long as
\, the Sanskrit virama, is not used. Of the 1370-odd ACIP texts I've got here, about 57% make it through the gauntlet (fewer if you demand a vowel or disambiguator on every stack of a non-Tibetan tsheg bar).
This commit is contained in:
parent
245aac4911
commit
1afb3a0fdd
12 changed files with 646 additions and 40 deletions
|
@ -167,4 +167,19 @@ class TPair {
|
|||
if (null == rightWylie) rightWylie = "";
|
||||
return leftWylie + rightWylie;
|
||||
}
|
||||
|
||||
/** Appends legal Unicode corresponding to this (possible
|
||||
* subscribed) pair to sb. DLC FIXME: which normalization form,
|
||||
* if any? */
|
||||
void getUnicode(StringBuffer sb, boolean subscribed) {
|
||||
if (null != getLeft()) {
|
||||
String x = ACIPRules.getUnicodeFor(getLeft(), subscribed);
|
||||
if (null != x) sb.append(x);
|
||||
}
|
||||
if (null != getRight()
|
||||
&& !("-".equals(getRight()) || "A".equals(getRight()))) {
|
||||
String x = ACIPRules.getUnicodeFor(getRight(), subscribed);
|
||||
if (null != x) sb.append(x);
|
||||
}
|
||||
}
|
||||
}
|
||||
|
|
Loading…
Add table
Add a link
Reference in a new issue