good solution for g suffix problem in the acip dictionary. Perhaps solves 90% of the ambiguous cases!

This commit is contained in:
amontano 2002-10-14 21:08:19 +00:00
parent cfa4ba4fdb
commit 32c9c95129

View file

@ -104,7 +104,7 @@ public class BinaryFileGenerator extends LinkedList
int marker, len, marker2, n=0, total=0, currentPage=0, currentLine=1; int marker, len, marker2, n=0, total=0, currentPage=0, currentLine=1;
char ch; char ch;
BufferedReader br = new BufferedReader(new InputStreamReader(new FileInputStream(archivo))); BufferedReader br = new BufferedReader(new InputStreamReader(new FileInputStream(archivo)));
String entrada="", s1="", s2="", currentLetter="", temp=""; String entrada="", s1="", s2="", currentLetter="", temp="", lastWeirdDefiniendum="";
boolean markerNotFound; boolean markerNotFound;
// used for acip dict // used for acip dict
@ -234,8 +234,13 @@ public class BinaryFileGenerator extends LinkedList
case 'g': // verify "g " case 'g': // verify "g "
if (marker+1<len && Manipulate.isVowel(entrada.charAt(marker-1)) && entrada.charAt(marker+1)==' ') if (marker+1<len && Manipulate.isVowel(entrada.charAt(marker-1)) && entrada.charAt(marker+1)==' ')
{ {
markerNotFound=false; temp = entrada.substring(0, marker+1);
marker2=++marker; if (!lastWeirdDefiniendum.startsWith(temp))
{
markerNotFound=false;
marker2=++marker;
lastWeirdDefiniendum=temp;
}
} }
break; break;
case ' ': // verify " " case ' ': // verify " "
@ -517,11 +522,15 @@ public class BinaryFileGenerator extends LinkedList
System.out.println("Stores multiple dictionaries into a binary tree file."); System.out.println("Stores multiple dictionaries into a binary tree file.");
System.out.println("Sintaxis:"); System.out.println("Sintaxis:");
System.out.println("-For multiple dictionary sources:"); System.out.println("-For multiple dictionary sources:");
System.out.println(" java BinaryFileGenerator arch-dest [-delimiter1] arch-dict1 [[-delimiter2] arch-dict2 ...]"); System.out.println(" java BinaryFileGenerator arch-dest [-delimiter1] arch-dict1");
System.out.println(" [[-delimiter2] arch-dict2 ...]");
System.out.println("-For one dictionary"); System.out.println("-For one dictionary");
System.out.println(" java BinaryFileGenerator [-delimiter] arch-dict"); System.out.println(" java BinaryFileGenerator [-delimiter] arch-dict");
System.out.println("Dictionary files are assumed to be .txt. Don't include extensions!"); System.out.println("Dictionary files are assumed to be .txt. Don't include extensions!");
System.out.println(" -delimiter: default value is \'-\'. -tab takes \'\\t\' as delimiter."); System.out.println(" -delimiter: default value is \'-\'. -tab takes \'\\t\' as delimiter.");
System.out.println(" -acip: use this to process dictionaries entered using the ACIP standard");
System.out.println(" to mark page numbers, comments, etc. Make sure to convert it to");
System.out.println(" THDL's extended Wylie scheme first using the AcipToWylie class.");
} }
public static void main(String args[]) throws Exception public static void main(String args[]) throws Exception