Better error messages in TMW->Wylie conversions. The user is now told
when a glyph has no corresponding Wylie.
This commit is contained in:
parent
3113a4b8de
commit
a48ec641d5
8 changed files with 211 additions and 132 deletions
|
@ -297,6 +297,12 @@ public class TibTextUtils implements THDLWylieConstants {
|
|||
return s;
|
||||
}
|
||||
|
||||
/** An array containing one boolean value. Pass this to
|
||||
TibetanMachineWeb.getWylieForGlyph(..) if you don't care if a
|
||||
certain glyph has corresponding Wylie or not. */
|
||||
public static final boolean[] weDoNotCareIfThereIsCorrespondingWylieOrNot
|
||||
= new boolean[] { false };
|
||||
|
||||
/**
|
||||
* Converts a string of Extended Wylie into {@link DuffData DuffData}.
|
||||
* @param wylie the Wylie you want to convert
|
||||
|
@ -371,7 +377,7 @@ public class TibTextUtils implements THDLWylieConstants {
|
|||
vowel_block: {
|
||||
if (size > 1) {
|
||||
dc = (DuffCode)glyphs.get(glyphs.size()-1);
|
||||
if (!TibetanMachineWeb.isWyliePunc(TibetanMachineWeb.getWylieForGlyph(dc))) {
|
||||
if (!TibetanMachineWeb.isWyliePunc(TibetanMachineWeb.getWylieForGlyph(dc, weDoNotCareIfThereIsCorrespondingWylieOrNot))) {
|
||||
DuffCode dc_2 = (DuffCode)glyphs.removeLast();
|
||||
DuffCode dc_1 = (DuffCode)glyphs.removeLast();
|
||||
glyphs.addAll(getVowel(dc_1, dc_2, next));
|
||||
|
@ -805,9 +811,12 @@ public class TibTextUtils implements THDLWylieConstants {
|
|||
* @param glyphList a list of TibetanMachineWeb glyphs, i.e. {@link
|
||||
* org.thdl.tib.text.DuffCode DuffCodes}. Pass in an ArrayList if you
|
||||
* care at all for speed.
|
||||
* @return the Wylie string corresponding to this glyph list, with 'a' inserted.
|
||||
*/
|
||||
public static String withA(java.util.List glyphList) {
|
||||
* @param noSuchWylie an array which will not be touched if this is
|
||||
* successful; however, if there is no THDL Extended Wylie
|
||||
* corresponding to these glyphs, then noSuchWylie[0] will be set to
|
||||
* true
|
||||
* @return the Wylie string corresponding to this glyph list, with 'a' inserted. */
|
||||
public static String withA(java.util.List glyphList, boolean noSuchWylie[]) {
|
||||
StringBuffer sb = new StringBuffer();
|
||||
int size = glyphList.size();
|
||||
String wylie;
|
||||
|
@ -818,16 +827,16 @@ public class TibTextUtils implements THDLWylieConstants {
|
|||
return "";
|
||||
|
||||
case 1: //only one glyph: 'a' goes after it
|
||||
wylie = TibetanMachineWeb.getWylieForGlyph((DuffCode)glyphList.get(0));
|
||||
wylie = TibetanMachineWeb.getWylieForGlyph((DuffCode)glyphList.get(0), noSuchWylie);
|
||||
sb.append(wylie);
|
||||
sb.append(aVowelToUseAfter(wylie));
|
||||
|
||||
return sb.toString();
|
||||
|
||||
case 2: //two glyphs: 'a' either goes after first or after both
|
||||
lastWylie = TibetanMachineWeb.getWylieForGlyph((DuffCode)glyphList.get(0));
|
||||
lastWylie = TibetanMachineWeb.getWylieForGlyph((DuffCode)glyphList.get(0), noSuchWylie);
|
||||
sb.append(lastWylie);
|
||||
wylie = TibetanMachineWeb.getWylieForGlyph((DuffCode)glyphList.get(1));
|
||||
wylie = TibetanMachineWeb.getWylieForGlyph((DuffCode)glyphList.get(1), noSuchWylie);
|
||||
if (TibetanMachineWeb.isWylieRight(wylie)) {
|
||||
sb.append(aVowelToUseAfter(lastWylie));
|
||||
sb.append(wylie);
|
||||
|
@ -870,17 +879,17 @@ public class TibTextUtils implements THDLWylieConstants {
|
|||
StringBuffer tailEndWylie = null;
|
||||
int effectiveSize = size - 2;
|
||||
while (effectiveSize >= 0
|
||||
&& TibetanMachineWeb.getWylieForGlyph((DuffCode)glyphList.get(effectiveSize)).equals(ACHUNG)) {
|
||||
&& TibetanMachineWeb.getWylieForGlyph((DuffCode)glyphList.get(effectiveSize), noSuchWylie).equals(ACHUNG)) {
|
||||
if (null == tailEndWylie) tailEndWylie = new StringBuffer();
|
||||
// prepend:
|
||||
tailEndWylie.insert(0,
|
||||
ACHUNG
|
||||
+ aVowelToUseAfter(ACHUNG)
|
||||
+ TibetanMachineWeb.getWylieForGlyph((DuffCode)glyphList.get(effectiveSize + 1)));
|
||||
+ TibetanMachineWeb.getWylieForGlyph((DuffCode)glyphList.get(effectiveSize + 1), noSuchWylie));
|
||||
effectiveSize -= 2;
|
||||
}
|
||||
if (null != tailEndWylie) {
|
||||
return (withA(glyphList.subList(0, effectiveSize + 2))
|
||||
return (withA(glyphList.subList(0, effectiveSize + 2), noSuchWylie)
|
||||
+ tailEndWylie.toString());
|
||||
}
|
||||
}
|
||||
|
@ -890,17 +899,17 @@ public class TibTextUtils implements THDLWylieConstants {
|
|||
// this is illegal because it doesn't begin
|
||||
// with a prefix:
|
||||
|| (size == 4
|
||||
&& (!TibetanMachineWeb.isWylieLeft(TibetanMachineWeb.getWylieForGlyph((DuffCode)glyphList.get(0)))
|
||||
&& (!TibetanMachineWeb.isWylieLeft(TibetanMachineWeb.getWylieForGlyph((DuffCode)glyphList.get(0), weDoNotCareIfThereIsCorrespondingWylieOrNot))
|
||||
// this is illegal because it doesn't have a
|
||||
// suffix in the proper place, e.g. mjskad:
|
||||
|| !TibetanMachineWeb.isWylieRight(TibetanMachineWeb.getWylieForGlyph((DuffCode)glyphList.get(size - 2)))
|
||||
|| !TibetanMachineWeb.isWylieRight(TibetanMachineWeb.getWylieForGlyph((DuffCode)glyphList.get(size - 2), weDoNotCareIfThereIsCorrespondingWylieOrNot))
|
||||
// this is illegal because it doesn't have a
|
||||
// postsuffix in the proper place,
|
||||
// e.g. 'lan.g, which would otherwise become
|
||||
// 'lang (with nga, not na and then ga):
|
||||
|| !TibetanMachineWeb.isWylieFarRight(TibetanMachineWeb.getWylieForGlyph((DuffCode)glyphList.get(size - 1))))))) {
|
||||
|| !TibetanMachineWeb.isWylieFarRight(TibetanMachineWeb.getWylieForGlyph((DuffCode)glyphList.get(size - 1), weDoNotCareIfThereIsCorrespondingWylieOrNot)))))) {
|
||||
for (int i = 0; i < size; i++) {
|
||||
wylie = TibetanMachineWeb.getWylieForGlyph((DuffCode)glyphList.get(i));
|
||||
wylie = TibetanMachineWeb.getWylieForGlyph((DuffCode)glyphList.get(i), noSuchWylie);
|
||||
if (TibetanMachineWeb.isAmbiguousWylie(lastWylie, wylie)
|
||||
|| (i != 0 && wylie.equals(ACHEN)))
|
||||
sb.append(WYLIE_DISAMBIGUATING_KEY);
|
||||
|
@ -914,7 +923,7 @@ public class TibTextUtils implements THDLWylieConstants {
|
|||
/* Else, chew up all the glyphs except for the last two. Then decide. */
|
||||
int i = 0;
|
||||
while (i+2 < size) {
|
||||
wylie = TibetanMachineWeb.getWylieForGlyph((DuffCode)glyphList.get(i));
|
||||
wylie = TibetanMachineWeb.getWylieForGlyph((DuffCode)glyphList.get(i), noSuchWylie);
|
||||
if (TibetanMachineWeb.isAmbiguousWylie(lastWylie, wylie)
|
||||
|| (i != 0 && wylie.equals(ACHEN)))
|
||||
sb.append(WYLIE_DISAMBIGUATING_KEY);
|
||||
|
@ -925,9 +934,9 @@ public class TibTextUtils implements THDLWylieConstants {
|
|||
}
|
||||
|
||||
String wylie1
|
||||
= TibetanMachineWeb.getWylieForGlyph((DuffCode)glyphList.get(i));
|
||||
= TibetanMachineWeb.getWylieForGlyph((DuffCode)glyphList.get(i), noSuchWylie);
|
||||
String wylie2
|
||||
= TibetanMachineWeb.getWylieForGlyph((DuffCode)glyphList.get(i + 1));
|
||||
= TibetanMachineWeb.getWylieForGlyph((DuffCode)glyphList.get(i + 1), noSuchWylie);
|
||||
|
||||
if (size == 3) {
|
||||
String wylie0 = lastWylie;
|
||||
|
@ -1047,9 +1056,12 @@ public class TibTextUtils implements THDLWylieConstants {
|
|||
* org.thdl.tib.text.DuffCode DuffCodes}
|
||||
* @param isBeforeVowel true if these glyphs occur before a vowel,
|
||||
* false if these glyphs occur after a vowel
|
||||
* @return the Wylie string corresponding to this glyph list
|
||||
*/
|
||||
public static String withoutA(java.util.ArrayList glyphList, boolean isBeforeVowel) {
|
||||
* @param noSuchWylie an array which will not be touched if this is
|
||||
* successful; however, if there is no THDL Extended Wylie
|
||||
* corresponding to these glyphs, then noSuchWylie[0] will be set to
|
||||
* true
|
||||
* @return the Wylie string corresponding to this glyph list */
|
||||
public static String withoutA(java.util.ArrayList glyphList, boolean isBeforeVowel, boolean noSuchWylie[]) {
|
||||
StringBuffer sb = new StringBuffer();
|
||||
Iterator iter = glyphList.iterator();
|
||||
DuffCode dc;
|
||||
|
@ -1058,7 +1070,7 @@ public class TibTextUtils implements THDLWylieConstants {
|
|||
|
||||
while (iter.hasNext()) {
|
||||
dc = (DuffCode)iter.next();
|
||||
currWylie = TibetanMachineWeb.getWylieForGlyph(dc);
|
||||
currWylie = TibetanMachineWeb.getWylieForGlyph(dc, noSuchWylie);
|
||||
|
||||
if (TibetanMachineWeb.isAmbiguousWylie(lastWylie, currWylie)
|
||||
|| (!lastWylie.equals("")
|
||||
|
@ -1084,9 +1096,12 @@ public class TibTextUtils implements THDLWylieConstants {
|
|||
/**
|
||||
* Gets the Extended Wylie for a sequence of glyphs.
|
||||
* @param dcs an array of glyphs
|
||||
* @return the Extended Wylie corresponding to these glyphs
|
||||
*/
|
||||
public static String getWylie(DuffCode[] dcs) {
|
||||
* @param noSuchWylie an array which will not be touched if this is
|
||||
* successful; however, if there is no THDL Extended Wylie
|
||||
* corresponding to these glyphs, then noSuchWylie[0] will be set to
|
||||
* true
|
||||
* @return the Extended Wylie corresponding to these glyphs */
|
||||
public static String getWylie(DuffCode[] dcs, boolean noSuchWylie[]) {
|
||||
if (dcs.length == 0)
|
||||
return null;
|
||||
|
||||
|
@ -1108,9 +1123,9 @@ public class TibTextUtils implements THDLWylieConstants {
|
|||
if (wylieBuffer.length() > 0 || !glyphList.isEmpty()) {
|
||||
String thisPart;
|
||||
if (needsVowel)
|
||||
thisPart = withA(glyphList);
|
||||
thisPart = withA(glyphList, noSuchWylie);
|
||||
else
|
||||
thisPart = withoutA(glyphList, false);
|
||||
thisPart = withoutA(glyphList, false, noSuchWylie);
|
||||
wylieBuffer.append(thisPart);
|
||||
|
||||
glyphList.clear();
|
||||
|
@ -1120,7 +1135,7 @@ public class TibTextUtils implements THDLWylieConstants {
|
|||
|
||||
wylieBuffer.append(ch);
|
||||
} else {
|
||||
wylie = TibetanMachineWeb.getWylieForGlyph(dcs[i]);
|
||||
wylie = TibetanMachineWeb.getWylieForGlyph(dcs[i], noSuchWylie);
|
||||
|
||||
boolean containsBindu = false;
|
||||
if (wylie.length() > 1 && wylie.charAt(wylie.length()-1) == BINDU) {
|
||||
|
@ -1138,9 +1153,9 @@ public class TibTextUtils implements THDLWylieConstants {
|
|||
} else {
|
||||
String thisPart;
|
||||
if (needsVowel)
|
||||
thisPart = withA(glyphList);
|
||||
thisPart = withA(glyphList, noSuchWylie);
|
||||
else
|
||||
thisPart = withoutA(glyphList, false);
|
||||
thisPart = withoutA(glyphList, false, noSuchWylie);
|
||||
wylieBuffer.append(thisPart);
|
||||
|
||||
wylieBuffer.append(wylie); //append the punctuation
|
||||
|
@ -1185,7 +1200,7 @@ public class TibTextUtils implements THDLWylieConstants {
|
|||
|
||||
if (0 != glyphCount) {
|
||||
DuffCode top_dc = (DuffCode)glyphList.get(glyphCount-1);
|
||||
String top_wylie = TibetanMachineWeb.getWylieForGlyph(top_dc);
|
||||
String top_wylie = TibetanMachineWeb.getWylieForGlyph(top_dc, noSuchWylie);
|
||||
|
||||
if (top_wylie.equals(ACHEN)) {
|
||||
glyphList.remove(glyphCount-1);
|
||||
|
@ -1198,15 +1213,15 @@ public class TibTextUtils implements THDLWylieConstants {
|
|||
}
|
||||
}
|
||||
|
||||
if (top_dc == null || !TibetanMachineWeb.getWylieForGlyph(top_dc).equals(ACHUNG)) {
|
||||
String thisPart = withoutA(glyphList, true);
|
||||
if (top_dc == null || !TibetanMachineWeb.getWylieForGlyph(top_dc, noSuchWylie).equals(ACHUNG)) {
|
||||
String thisPart = withoutA(glyphList, true, noSuchWylie);
|
||||
wylieBuffer.append(thisPart); //append consonants in glyphList
|
||||
} else {
|
||||
glyphCount = glyphList.size();
|
||||
glyphList.remove(glyphCount-1);
|
||||
|
||||
if (glyphCount-1 != 0) {
|
||||
String thisPart = withA(glyphList);
|
||||
String thisPart = withA(glyphList, noSuchWylie);
|
||||
wylieBuffer.append(thisPart);
|
||||
}
|
||||
|
||||
|
@ -1231,7 +1246,7 @@ public class TibTextUtils implements THDLWylieConstants {
|
|||
|
||||
if (containsBindu) {
|
||||
isLastVowel = false;
|
||||
wylieBuffer.append(withoutA(glyphList, false));
|
||||
wylieBuffer.append(withoutA(glyphList, false, noSuchWylie));
|
||||
wylieBuffer.append(BINDU); //append the bindu
|
||||
glyphList.clear();
|
||||
}
|
||||
|
@ -1243,9 +1258,9 @@ public class TibTextUtils implements THDLWylieConstants {
|
|||
if (!glyphList.isEmpty()) {
|
||||
String thisPart;
|
||||
if (needsVowel)
|
||||
thisPart = withA(glyphList);
|
||||
thisPart = withA(glyphList, noSuchWylie);
|
||||
else
|
||||
thisPart = withoutA(glyphList, false);
|
||||
thisPart = withoutA(glyphList, false, noSuchWylie);
|
||||
wylieBuffer.append(thisPart);
|
||||
}
|
||||
|
||||
|
|
|
@ -246,10 +246,13 @@ public class TibetanDocument extends DefaultStyledDocument {
|
|||
* If the document consists of both Tibetan and
|
||||
* non-Tibetan fonts, however, the conversion stops
|
||||
* at the first non-Tibetan font.
|
||||
* @return the string of Wylie corresponding to this document
|
||||
*/
|
||||
public String getWylie() {
|
||||
return getWylie(0, getLength());
|
||||
* @param noSuchWylie an array which will not be touched if this is
|
||||
* successful; however, if there is no THDL Extended Wylie
|
||||
* corresponding to one of these glyphs, then noSuchWylie[0] will be
|
||||
* set to true
|
||||
* @return the string of Wylie corresponding to this document */
|
||||
public String getWylie(boolean noSuchWylie[]) {
|
||||
return getWylie(0, getLength(), noSuchWylie);
|
||||
}
|
||||
|
||||
/**
|
||||
|
@ -259,9 +262,12 @@ public class TibetanDocument extends DefaultStyledDocument {
|
|||
* at the first non-Tibetan font.
|
||||
* @param begin the beginning of the region to convert
|
||||
* @param end the end of the region to convert
|
||||
* @return the string of Wylie corresponding to this document
|
||||
*/
|
||||
public String getWylie(int begin, int end) {
|
||||
* @param noSuchWylie an array which will not be touched if this is
|
||||
* successful; however, if there is no THDL Extended Wylie
|
||||
* corresponding to one of these glyphs, then noSuchWylie[0] will be
|
||||
* set to true
|
||||
* @return the string of Wylie corresponding to this document */
|
||||
public String getWylie(int begin, int end, boolean noSuchWylie[]) {
|
||||
AttributeSet attr;
|
||||
String fontName;
|
||||
int fontNum;
|
||||
|
@ -287,7 +293,7 @@ public class TibetanDocument extends DefaultStyledDocument {
|
|||
if (dcs.size() > 0) {
|
||||
DuffCode[] dc_array = new DuffCode[0];
|
||||
dc_array = (DuffCode[])dcs.toArray(dc_array);
|
||||
wylieBuffer.append(TibTextUtils.getWylie(dc_array));
|
||||
wylieBuffer.append(TibTextUtils.getWylie(dc_array, noSuchWylie));
|
||||
dcs.clear();
|
||||
}
|
||||
wylieBuffer.append(ch);
|
||||
|
@ -298,7 +304,7 @@ public class TibetanDocument extends DefaultStyledDocument {
|
|||
if (dcs.size() > 0) {
|
||||
DuffCode[] dc_array = new DuffCode[0];
|
||||
dc_array = (DuffCode[])dcs.toArray(dc_array);
|
||||
wylieBuffer.append(TibTextUtils.getWylie(dc_array));
|
||||
wylieBuffer.append(TibTextUtils.getWylie(dc_array, noSuchWylie));
|
||||
dcs.clear();
|
||||
}
|
||||
}
|
||||
|
@ -313,7 +319,7 @@ public class TibetanDocument extends DefaultStyledDocument {
|
|||
if (dcs.size() > 0) {
|
||||
DuffCode[] dc_array = new DuffCode[0];
|
||||
dc_array = (DuffCode[])dcs.toArray(dc_array);
|
||||
wylieBuffer.append(TibTextUtils.getWylie(dc_array));
|
||||
wylieBuffer.append(TibTextUtils.getWylie(dc_array, noSuchWylie));
|
||||
}
|
||||
return wylieBuffer.toString();
|
||||
}
|
||||
|
@ -761,66 +767,6 @@ public class TibetanDocument extends DefaultStyledDocument {
|
|||
return ceh.errorReturn;
|
||||
}
|
||||
|
||||
/** Appends to sb a text representation of the characters (glyphs)
|
||||
in this document in the range [begin, end). In this
|
||||
representation, \tmwXYYY and \tmXYYY are used for TMW and TM
|
||||
glyphs, respectively. \otherYYY is used for all other
|
||||
characters. X is zero-based; Y is the decimal glyph number.
|
||||
After every 10 characters, '\n' is added. Note well that some
|
||||
TM oddballs (see TibetanMachineWeb.getUnusualTMtoTMW(int,
|
||||
int)) are not handled well, so you may get \tm08222 etc. */
|
||||
public void getTextRepresentation(int begin, int end, StringBuffer sb) {
|
||||
if (end < 0)
|
||||
end = getLength();
|
||||
if (begin >= end)
|
||||
return; // nothing to do
|
||||
|
||||
// For speed, do as few replaces as possible. To preserve
|
||||
// formatting, we'll try to replace one paragraph at a time.
|
||||
// But we *must* replace when we hit a different font (TMW3 as
|
||||
// opposed to TMW2, e.g.), so we'll likely replace many times
|
||||
// per paragraph. One very important optimization is that we
|
||||
// don't have to treat TMW3.45 or TMW3.32 as a different font
|
||||
// than TMW.33 -- that's because each of the ten TMW fonts has
|
||||
// the same glyph at position 32 (space) and the same glyph at
|
||||
// position 45 (tsheg). Note that we're building up a big
|
||||
// StringBuffer; we're trading space for time.
|
||||
try {
|
||||
int i = begin;
|
||||
int tenCount = 0;
|
||||
while (i < end) {
|
||||
AttributeSet attr = getCharacterElement(i).getAttributes();
|
||||
String fontName = StyleConstants.getFontFamily(attr);
|
||||
int tmwFontNum
|
||||
= TibetanMachineWeb.getTMWFontNumber(fontName);
|
||||
int tmFontNum;
|
||||
if (tmwFontNum != 0) {
|
||||
sb.append("\\tmw" + (tmwFontNum - 1));
|
||||
} else if ((tmFontNum
|
||||
= TibetanMachineWeb.getTMFontNumber(fontName))
|
||||
!= 0) {
|
||||
sb.append("\\tm" + (tmFontNum - 1));
|
||||
} else {
|
||||
// non-tmw, non-tm character:
|
||||
sb.append("\\other");
|
||||
}
|
||||
int ordinal = (int)getText(i,1).charAt(0);
|
||||
if (ordinal < 100)
|
||||
sb.append('0');
|
||||
if (ordinal < 10)
|
||||
sb.append('0');
|
||||
sb.append("" + ordinal);
|
||||
if ((++tenCount) % 10 == 0) {
|
||||
tenCount = 0;
|
||||
sb.append('\n');
|
||||
}
|
||||
i++;
|
||||
}
|
||||
} catch (BadLocationException e) {
|
||||
throw new ThdlLazyException(e);
|
||||
}
|
||||
}
|
||||
|
||||
/** See the sole caller, convertHelper. */
|
||||
private void convertHelperHelper(int begin, int end, boolean toTM,
|
||||
boolean toUnicode, StringBuffer errors,
|
||||
|
@ -1101,13 +1047,17 @@ public class TibetanDocument extends DefaultStyledDocument {
|
|||
* @param end the point at which to stop converting to Wylie
|
||||
* @param numAttemptedReplacements an array that contains one element;
|
||||
* this first element will be, upon exit, incremented by the number of
|
||||
* TMW glyphs that we encountered and attempted to convert to Wylie */
|
||||
public void toWylie(int start, int end,
|
||||
long numAttemptedReplacements[]) {
|
||||
* TMW glyphs that we encountered and attempted to convert to Wylie
|
||||
* @return true if entirely successful, false if we put some
|
||||
* "<<[[JSKAD_TMW_TO_WYLIE_ERROR_NO_SUCH_WYLIE: Cannot convert
|
||||
* DuffCode..." text into the document */
|
||||
public boolean toWylie(int start, int end,
|
||||
long numAttemptedReplacements[]) {
|
||||
if (start >= end)
|
||||
return;
|
||||
return true;
|
||||
|
||||
try {
|
||||
boolean noSuchWylie[] = new boolean[] { false };
|
||||
DuffCode[] any_dc_array = new DuffCode[0];
|
||||
DuffCode[] dc_array;
|
||||
Position endPos = createPosition(end);
|
||||
|
@ -1124,8 +1074,9 @@ public class TibetanDocument extends DefaultStyledDocument {
|
|||
if (i != start) {
|
||||
dc_array = (DuffCode[])dcs.toArray(any_dc_array);
|
||||
remove(start, i-start);
|
||||
ThdlDebug.verify(getRomanAttributeSet() != null);
|
||||
insertString(start,
|
||||
TibTextUtils.getWylie(dc_array),
|
||||
TibTextUtils.getWylie(dc_array, noSuchWylie),
|
||||
getRomanAttributeSet());
|
||||
dcs.clear();
|
||||
}
|
||||
|
@ -1138,9 +1089,11 @@ public class TibetanDocument extends DefaultStyledDocument {
|
|||
|
||||
i++;
|
||||
}
|
||||
return !noSuchWylie[0];
|
||||
} catch (BadLocationException ble) {
|
||||
ble.printStackTrace();
|
||||
ThdlDebug.noteIffyCode();
|
||||
return false;
|
||||
}
|
||||
}
|
||||
|
||||
|
@ -1172,6 +1125,66 @@ public class TibetanDocument extends DefaultStyledDocument {
|
|||
return (Element[])v.toArray(arrayType);
|
||||
}
|
||||
|
||||
/** Appends to sb a text representation of the characters (glyphs)
|
||||
in this document in the range [begin, end). In this
|
||||
representation, \tmwXYYY and \tmXYYY are used for TMW and TM
|
||||
glyphs, respectively. \otherYYY is used for all other
|
||||
characters. X is zero-based; Y is the decimal glyph number.
|
||||
After every 10 characters, '\n' is added. Note well that some
|
||||
TM oddballs (see TibetanMachineWeb.getUnusualTMtoTMW(int,
|
||||
int)) are not handled well, so you may get \tm08222 etc. */
|
||||
public void getTextRepresentation(int begin, int end, StringBuffer sb) {
|
||||
if (end < 0)
|
||||
end = getLength();
|
||||
if (begin >= end)
|
||||
return; // nothing to do
|
||||
|
||||
// For speed, do as few replaces as possible. To preserve
|
||||
// formatting, we'll try to replace one paragraph at a time.
|
||||
// But we *must* replace when we hit a different font (TMW3 as
|
||||
// opposed to TMW2, e.g.), so we'll likely replace many times
|
||||
// per paragraph. One very important optimization is that we
|
||||
// don't have to treat TMW3.45 or TMW3.32 as a different font
|
||||
// than TMW.33 -- that's because each of the ten TMW fonts has
|
||||
// the same glyph at position 32 (space) and the same glyph at
|
||||
// position 45 (tsheg). Note that we're building up a big
|
||||
// StringBuffer; we're trading space for time.
|
||||
try {
|
||||
int i = begin;
|
||||
int tenCount = 0;
|
||||
while (i < end) {
|
||||
AttributeSet attr = getCharacterElement(i).getAttributes();
|
||||
String fontName = StyleConstants.getFontFamily(attr);
|
||||
int tmwFontNum
|
||||
= TibetanMachineWeb.getTMWFontNumber(fontName);
|
||||
int tmFontNum;
|
||||
if (tmwFontNum != 0) {
|
||||
sb.append("\\tmw" + (tmwFontNum - 1));
|
||||
} else if ((tmFontNum
|
||||
= TibetanMachineWeb.getTMFontNumber(fontName))
|
||||
!= 0) {
|
||||
sb.append("\\tm" + (tmFontNum - 1));
|
||||
} else {
|
||||
// non-tmw, non-tm character:
|
||||
sb.append("\\other");
|
||||
}
|
||||
int ordinal = (int)getText(i,1).charAt(0);
|
||||
if (ordinal < 100)
|
||||
sb.append('0');
|
||||
if (ordinal < 10)
|
||||
sb.append('0');
|
||||
sb.append("" + ordinal);
|
||||
if ((++tenCount) % 10 == 0) {
|
||||
tenCount = 0;
|
||||
sb.append('\n');
|
||||
}
|
||||
i++;
|
||||
}
|
||||
} catch (BadLocationException e) {
|
||||
throw new ThdlLazyException(e);
|
||||
}
|
||||
}
|
||||
|
||||
/** For debugging only. Start with an empty document, and call
|
||||
this on it. You'll get all the TibetanMachine glyphs
|
||||
inserted, in order, into your document. */
|
||||
|
|
|
@ -71,7 +71,7 @@ public class TibetanHTML {
|
|||
break;
|
||||
}
|
||||
htmlBuffer.append("</span>");
|
||||
String wylie = TibetanMachineWeb.getWylieForGlyph(duffData[i].font, c[k]);
|
||||
String wylie = TibetanMachineWeb.getWylieForGlyph(duffData[i].font, c[k], TibTextUtils.weDoNotCareIfThereIsCorrespondingWylieOrNot);
|
||||
if (TibetanMachineWeb.isWyliePunc(wylie))
|
||||
htmlBuffer.append("<wbr/>");
|
||||
} else {
|
||||
|
@ -138,7 +138,7 @@ public class TibetanHTML {
|
|||
htmlBuffer.append(c[k]);
|
||||
break;
|
||||
}
|
||||
String wylie = TibetanMachineWeb.getWylieForGlyph(duffData[i].font, c[k]);
|
||||
String wylie = TibetanMachineWeb.getWylieForGlyph(duffData[i].font, c[k], TibTextUtils.weDoNotCareIfThereIsCorrespondingWylieOrNot);
|
||||
if (TibetanMachineWeb.isWyliePunc(wylie))
|
||||
htmlBuffer.append("<wbr/>");
|
||||
} else {
|
||||
|
@ -209,7 +209,7 @@ public class TibetanHTML {
|
|||
htmlBuffer.append(c[k]);
|
||||
break;
|
||||
}
|
||||
String wylie = TibetanMachineWeb.getWylieForGlyph(duffData[i].font, c[k]);
|
||||
String wylie = TibetanMachineWeb.getWylieForGlyph(duffData[i].font, c[k], TibTextUtils.weDoNotCareIfThereIsCorrespondingWylieOrNot);
|
||||
if (TibetanMachineWeb.isWyliePunc(wylie))
|
||||
htmlBuffer.append("<wbr>");
|
||||
} else {
|
||||
|
|
|
@ -1414,12 +1414,17 @@ private static String getTMWToWylieErrorString(DuffCode dc) {
|
|||
* glyph you want the Wylie of
|
||||
* @param code the ordinal, minus 32, of the TibetanMachineWeb glyph
|
||||
* you want the Wylie of
|
||||
* @param noSuchWylie an array which will not be touched if this is
|
||||
* successful; however, if there is no THDL Extended Wylie
|
||||
* corresponding to the glyph, then noSuchWylie[0] will be set to true
|
||||
* @return the Wylie value corresponding to the
|
||||
* glyph denoted by font, code
|
||||
*/
|
||||
public static String getWylieForGlyph(int font, int code) {
|
||||
public static String getWylieForGlyph(int font, int code,
|
||||
boolean noSuchWylie[]) {
|
||||
String hashKey = getHashKeyForGlyph(font, code);
|
||||
if (hashKey == null) {
|
||||
noSuchWylie[0] = true;
|
||||
return getTMWToWylieErrorString(new DuffCode(font, (char)code));
|
||||
}
|
||||
return wylieForGlyph(hashKey);
|
||||
|
@ -1429,12 +1434,15 @@ public static String getWylieForGlyph(int font, int code) {
|
|||
* Gets the Extended Wylie value for this glyph.
|
||||
* @param dc the DuffCode of the glyph you want
|
||||
* the Wylie of
|
||||
* @param noSuchWylie an array which will not be touched if this is
|
||||
* successful; however, if there is no THDL Extended Wylie
|
||||
* corresponding to the glyph, then noSuchWylie[0] will be set to true
|
||||
* @return the Wylie value corresponding to the
|
||||
* glyph denoted by dc
|
||||
*/
|
||||
public static String getWylieForGlyph(DuffCode dc) {
|
||||
* glyph denoted by dc */
|
||||
public static String getWylieForGlyph(DuffCode dc, boolean noSuchWylie[]) {
|
||||
String hashKey = getHashKeyForGlyph(dc);
|
||||
if (hashKey == null) {
|
||||
noSuchWylie[0] = true;
|
||||
return getTMWToWylieErrorString(dc);
|
||||
}
|
||||
return wylieForGlyph(hashKey);
|
||||
|
@ -1637,7 +1645,9 @@ public static String getAVowel() {
|
|||
* @return true if the glyph is a top-hanging (superscript) vowel (i,
|
||||
* u, e, o, ai, or ao) and false if not */
|
||||
public static boolean isTopVowel(DuffCode dc) {
|
||||
String wylie = getWylieForGlyph(dc);
|
||||
String wylie
|
||||
= getWylieForGlyph(dc,
|
||||
TibTextUtils.weDoNotCareIfThereIsCorrespondingWylieOrNot);
|
||||
if (top_vowels.contains(wylie))
|
||||
return true;
|
||||
|
||||
|
|
Loading…
Add table
Add a link
Reference in a new issue