/*
The contents of this file are subject to the AMP Open Community License
Version 1.0 (the "License"); you may not use this file except in compliance
with the License. You may obtain a copy of the License on the AMP web site
(http://www.tibet.iteso.mx/Guatemala/).

Software distributed under the License is distributed on an "AS IS" basis,
WITHOUT WARRANTY OF ANY KIND, either express or implied. See the
License for the specific terms governing rights and limitations under the
License.

The Initial Developer of this software is Andres Montano Pellegrini. Portions
created by Andres Montano Pellegrini are Copyright 2001 Andres Montano
Pellegrini. All Rights Reserved.

Contributor(s): ______________________________________.
*/
|
|
|
|
package org.thdl.tib.scanner;
|
|
|
|
|
|
|
|
import java.io.*;
|
2003-04-01 13:08:38 +00:00
|
|
|
import org.thdl.util.*;
|
2002-10-03 19:28:09 +00:00
|
|
|
|
2002-11-03 08:56:11 +00:00
|
|
|
/** Provides recommended implementation of the {@link SyllableListTree}
|
2002-10-03 19:28:09 +00:00
|
|
|
(currently most efficient memory-speed combination) loading
|
2002-11-03 08:56:11 +00:00
|
|
|
from file into memory only the "trunk" of the tree,
|
|
|
|
and resorting to the disk when searching the rest of the tree.
|
2002-10-03 19:28:09 +00:00
|
|
|
|
|
|
|
<p>The words must be stored in a binary file tree structure format.
|
2002-11-03 08:56:11 +00:00
|
|
|
This can be done using the {@link BinaryFileGenerator}.</p>
|
2002-10-03 19:28:09 +00:00
|
|
|
|
|
|
|
@author Andrés Montano Pellegrini
|
|
|
|
@see TibetanScanner
|
|
|
|
@see BinaryFileGenerator
|
|
|
|
*/
|
|
|
|
public class CachedSyllableListTree implements SyllableListTree
|
|
|
|
{
|
|
|
|
SyllableListTree syllables[];
|
2005-01-23 00:57:02 +00:00
|
|
|
|
2002-10-03 19:28:09 +00:00
|
|
|
public CachedSyllableListTree(String archivo) throws Exception
|
2005-01-23 00:57:02 +00:00
|
|
|
{
|
|
|
|
this (archivo, true);
|
|
|
|
}
|
|
|
|
|
|
|
|
public CachedSyllableListTree(String archivo, boolean backwardCompatible) throws Exception
|
2002-10-03 19:28:09 +00:00
|
|
|
{
|
|
|
|
String sil;
|
|
|
|
long pos, defSources[];
|
|
|
|
DictionarySource sourceDef;
|
|
|
|
int i;
|
2004-08-13 04:47:35 +00:00
|
|
|
|
2005-01-23 00:57:02 +00:00
|
|
|
FileSyllableListTree.openFiles(archivo, backwardCompatible);
|
2004-08-13 04:47:35 +00:00
|
|
|
|
|
|
|
SimplifiedLinkedList syllables = new SimplifiedLinkedList();
|
2002-10-03 19:28:09 +00:00
|
|
|
do
|
|
|
|
{
|
2004-08-13 04:47:35 +00:00
|
|
|
// get "link" to children
|
2002-10-03 19:28:09 +00:00
|
|
|
pos = (long) FileSyllableListTree.wordRaf.readInt();
|
2004-08-13 04:47:35 +00:00
|
|
|
// get syllable
|
2002-10-03 19:28:09 +00:00
|
|
|
sil = FileSyllableListTree.wordRaf.readUTF();
|
2004-08-13 04:47:35 +00:00
|
|
|
// get dictionary information for each definition
|
|
|
|
if (FileSyllableListTree.versionNumber==2) sourceDef = new BitDictionarySource();
|
|
|
|
else sourceDef = new ByteDictionarySource();
|
|
|
|
sourceDef.read(FileSyllableListTree.wordRaf);
|
|
|
|
|
2002-10-03 19:28:09 +00:00
|
|
|
if (sourceDef.isEmpty()) defSources = null;
|
|
|
|
else
|
|
|
|
{
|
|
|
|
defSources = new long[sourceDef.countDefs()];
|
|
|
|
for (i=0; i<defSources.length; i++)
|
|
|
|
{
|
|
|
|
defSources[i] = (long) FileSyllableListTree.wordRaf.readInt();
|
|
|
|
}
|
|
|
|
}
|
|
|
|
syllables.addLast(new FileSyllableListTree(sil, defSources, sourceDef, pos));
|
|
|
|
}while(sourceDef.hasBrothers());
|
|
|
|
|
|
|
|
int n = syllables.size();
|
|
|
|
this.syllables = new SyllableListTree[n];
|
2003-04-01 13:08:38 +00:00
|
|
|
SimplifiedListIterator li = syllables.listIterator();
|
2002-10-03 19:28:09 +00:00
|
|
|
while (li.hasNext())
|
|
|
|
{
|
|
|
|
n--;
|
|
|
|
this.syllables[n] = (SyllableListTree) li.next();
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
public String getDef()
|
|
|
|
{
|
|
|
|
return null;
|
|
|
|
}
|
|
|
|
|
|
|
|
public Definitions getDefs()
|
|
|
|
{
|
|
|
|
return null;
|
|
|
|
}
|
|
|
|
|
|
|
|
public DictionarySource getDictionarySource()
|
2004-08-13 04:47:35 +00:00
|
|
|
{
|
|
|
|
return null;
|
|
|
|
}
|
|
|
|
|
|
|
|
public BitDictionarySource getDictionarySourcesWanted()
|
2002-10-03 19:28:09 +00:00
|
|
|
{
|
|
|
|
return FileSyllableListTree.defSourcesWanted;
|
|
|
|
}
|
|
|
|
|
|
|
|
public boolean hasDef()
|
|
|
|
{
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
|
|
|
|
public SyllableListTree lookUp(String silStr)
|
|
|
|
{
|
|
|
|
int principio=0, medio, fin=syllables.length-1, comp;
|
|
|
|
if (silStr==null) return null;
|
|
|
|
while (principio<=fin)
|
|
|
|
{
|
|
|
|
medio = (principio+fin)/2;
|
|
|
|
comp = syllables[medio].toString().compareTo(silStr);
|
|
|
|
if (comp==0) return syllables[medio];
|
|
|
|
else
|
|
|
|
if (comp<0) principio = medio+1;
|
|
|
|
else fin = medio-1;
|
|
|
|
}
|
|
|
|
return null;
|
|
|
|
}
|
|
|
|
}
|