X-Git-Url: https://git.mdrn.pl/pylucene.git/blobdiff_plain/a2e61f0c04805cfcb8706176758d1283c7e3a55c..aaeed5504b982cf3545252ab528713250aa33eed:/lucene-java-3.5.0/lucene/contrib/analyzers/stempel/src/java/org/egothor/stemmer/Reduce.java diff --git a/lucene-java-3.5.0/lucene/contrib/analyzers/stempel/src/java/org/egothor/stemmer/Reduce.java b/lucene-java-3.5.0/lucene/contrib/analyzers/stempel/src/java/org/egothor/stemmer/Reduce.java new file mode 100644 index 0000000..6ebb595 --- /dev/null +++ b/lucene-java-3.5.0/lucene/contrib/analyzers/stempel/src/java/org/egothor/stemmer/Reduce.java @@ -0,0 +1,134 @@ +/* + Egothor Software License version 1.00 + Copyright (C) 1997-2004 Leo Galambos. + Copyright (C) 2002-2004 "Egothor developers" + on behalf of the Egothor Project. + All rights reserved. + + This software is copyrighted by the "Egothor developers". If this + license applies to a single file or document, the "Egothor developers" + are the people or entities mentioned as copyright holders in that file + or document. If this license applies to the Egothor project as a + whole, the copyright holders are the people or entities mentioned in + the file CREDITS. This file can be found in the same location as this + license in the distribution. + + Redistribution and use in source and binary forms, with or without + modification, are permitted provided that the following conditions are + met: + 1. Redistributions of source code must retain the above copyright + notice, the list of contributors, this list of conditions, and the + following disclaimer. + 2. Redistributions in binary form must reproduce the above copyright + notice, the list of contributors, this list of conditions, and the + disclaimer that follows these conditions in the documentation + and/or other materials provided with the distribution. + 3. The name "Egothor" must not be used to endorse or promote products + derived from this software without prior written permission. For + written permission, please contact Leo.G@seznam.cz + 4. Products derived from this software may not be called "Egothor", + nor may "Egothor" appear in their name, without prior written + permission from Leo.G@seznam.cz. + + In addition, we request that you include in the end-user documentation + provided with the redistribution and/or in the software itself an + acknowledgement equivalent to the following: + "This product includes software developed by the Egothor Project. + http://egothor.sf.net/" + + THIS SOFTWARE IS PROVIDED ``AS IS'' AND ANY EXPRESSED OR IMPLIED + WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF + MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED. + IN NO EVENT SHALL THE EGOTHOR PROJECT OR ITS CONTRIBUTORS BE LIABLE + FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR + CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF + SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR + BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, + WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE + OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN + IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. + + This software consists of voluntary contributions made by many + individuals on behalf of the Egothor Project and was originally + created by Leo Galambos (Leo.G@seznam.cz). + */ +package org.egothor.stemmer; + +import java.util.ArrayList; +import java.util.Arrays; +import java.util.Iterator; +import java.util.List; + +/** + * The Reduce object is used to remove gaps in a Trie which stores a dictionary. + */ +public class Reduce { + + /** + * Constructor for the Reduce object. + */ + public Reduce() {} + + /** + * Optimize (remove holes in the rows) the given Trie and return the + * restructured Trie. + * + * @param orig the Trie to optimize + * @return the restructured Trie + */ + public Trie optimize(Trie orig) { + List cmds = orig.cmds; + List rows = new ArrayList(); + List orows = orig.rows; + int remap[] = new int[orows.size()]; + + Arrays.fill(remap, -1); + rows = removeGaps(orig.root, rows, new ArrayList(), remap); + + return new Trie(orig.forward, remap[orig.root], cmds, rows); + } + + List removeGaps(int ind, List old, List to, int remap[]) { + remap[ind] = to.size(); + + Row now = old.get(ind); + to.add(now); + Iterator i = now.cells.values().iterator(); + for (; i.hasNext();) { + Cell c = i.next(); + if (c.ref >= 0 && remap[c.ref] < 0) { + removeGaps(c.ref, old, to, remap); + } + } + to.set(remap[ind], new Remap(now, remap)); + return to; + } + + /** + * This class is part of the Egothor Project + */ + class Remap extends Row { + /** + * Constructor for the Remap object + * + * @param old Description of the Parameter + * @param remap Description of the Parameter + */ + public Remap(Row old, int remap[]) { + super(); + Iterator i = old.cells.keySet().iterator(); + for (; i.hasNext();) { + Character ch = i.next(); + Cell c = old.at(ch); + Cell nc; + if (c.ref >= 0) { + nc = new Cell(c); + nc.ref = remap[nc.ref]; + } else { + nc = new Cell(c); + } + cells.put(ch, nc); + } + } + } +}