I've undone the SNYAM'AM == SNYAMA'AM hack. According to Robert Chilton, the only occurrence of SNYAM'AM in the ACIP texts I have is likely a typo.
The code would be cleaner if I could bear to delete my terrible hack. Maybe in a month, when I don't feel so dumb for coding it up in the first place. The correct solution for such things is to give the ACIP->Tibetan converters a pre-filter mechanism. It would run before the lexer, or as part of the lexer (maybe you only want to filter tsheg bars), and it would allow the end user to specify substitutions such as "s/SNYAM'AM/S+NYAMA'AMA/g".
This commit is contained in:
parent
4b1395e0ba
commit
5aab4acc93
3 changed files with 34 additions and 18 deletions
|
@@ -94,7 +94,7 @@ public class PackageTest extends TestCase {
|
|||
String[] expectedLegalParses,
|
||||
String expectedBestParse,
|
||||
int pairListToUse) {
|
||||
TPairList[] la = TPairListFactory.breakACIPIntoChunks(acip);
|
||||
TPairList[] la = TPairListFactory.breakACIPIntoChunks(acip, true);
|
||||
TPairList l = la[(pairListToUse == -1) ? 0 : ((pairListToUse >= 1) ? 1 : pairListToUse)];
|
||||
if (sdebug || debug)
|
||||
System.out.println("ACIP=" + acip + " and l'=" + l);
|
||||
|
@@ -268,8 +268,8 @@ public class PackageTest extends TestCase {
|
|||
tstHelper("9012345678901234567890123456789012345678901234567890123456789012345678901234567890123456789012345678901234567890123456789012345678901234567890123456789012345678901234567890123456789012345678901234567890123456789012345678901234567890123456789012345678901234567890123456789012345678901234567890123456789012345678901234567890123456789012345678901234567890123456789012345678901234567890123456789012345678901234567890123456789012345678901234567890123456789012345678901234567890123456789012345678901234567890123456789012345678901234567890123456789012345678901234567890123456789012345678901234567890123456789012345678901234567890123456789012345678901234567890123456789012345678901234567890123456789012345678901234567890123456789012345678901234567890123456789012345678901234567890123456789012345678901234567890123456789012345678901234567890123456789012345678901234567890123456789012345678901234567890123456789012345678901234567890123456789012345678901234567890123456789012345678901234567890123456789012345678");
|
||||
}
|
||||
|
||||
/** Tests {@link TPairListFactory#breakACIPIntoChunks(String)},
|
||||
* {@link TPairList#getACIPError()}, and {@link
|
||||
/** Tests {@link TPairListFactory#breakACIPIntoChunks(String,
|
||||
* boolean)}, {@link TPairList#getACIPError()}, and {@link
|
||||
* TPairList#recoverACIP()}. */
|
||||
public void testBreakACIPIntoChunks() {
|
||||
tstHelper("GASN"); // ambiguous with regard to prefix rules
|
||||
|
|
Loading…
Add table
Add a link
Reference in a new issue