+++ /dev/null
-package org.apache.lucene.util.collections;
-
-import java.util.Arrays;
-
-/**
- * Licensed to the Apache Software Foundation (ASF) under one or more
- * contributor license agreements. See the NOTICE file distributed with
- * this work for additional information regarding copyright ownership.
- * The ASF licenses this file to You under the Apache License, Version 2.0
- * (the "License"); you may not use this file except in compliance with
- * the License. You may obtain a copy of the License at
- *
- * http://www.apache.org/licenses/LICENSE-2.0
- *
- * Unless required by applicable law or agreed to in writing, software
- * distributed under the License is distributed on an "AS IS" BASIS,
- * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
- * See the License for the specific language governing permissions and
- * limitations under the License.
- */
-
-/**
- * A Set or primitive int. Implemented as a HashMap of int->int. *
- *
- * @lucene.experimental
- */
-public class IntHashSet {
-
- // TODO (Facet): This is wasteful as the "values" are actually the "keys" and
- // we could spare this amount of space (capacity * sizeof(int)). Perhaps even
- // though it is not OOP, we should re-implement the hash for just that cause.
-
- /**
- * Implements an IntIterator which iterates over all the allocated indexes.
- */
- private final class IndexIterator implements IntIterator {
- /**
- * The last used baseHashIndex. Needed for "jumping" from one hash entry
- * to another.
- */
- private int baseHashIndex = 0;
-
- /**
- * The next not-yet-visited index.
- */
- private int index = 0;
-
- /**
- * Index of the last visited pair. Used in {@link #remove()}.
- */
- private int lastIndex = 0;
-
- /**
- * Create the Iterator, make <code>index</code> point to the "first"
- * index which is not empty. If such does not exist (eg. the map is
- * empty) it would be zero.
- */
- public IndexIterator() {
- for (baseHashIndex = 0; baseHashIndex < baseHash.length; ++baseHashIndex) {
- index = baseHash[baseHashIndex];
- if (index != 0) {
- break;
- }
- }
- }
-
- public boolean hasNext() {
- return (index != 0);
- }
-
- public int next() {
- // Save the last index visited
- lastIndex = index;
-
- // next the index
- index = next[index];
-
- // if the next index points to the 'Ground' it means we're done with
- // the current hash entry and we need to jump to the next one. This
- // is done until all the hash entries had been visited.
- while (index == 0 && ++baseHashIndex < baseHash.length) {
- index = baseHash[baseHashIndex];
- }
-
- return lastIndex;
- }
-
- public void remove() {
- IntHashSet.this.remove(keys[lastIndex]);
- }
-
- }
-
- /**
- * Implements an IntIterator, used for iteration over the map's keys.
- */
- private final class KeyIterator implements IntIterator {
- private IntIterator iterator = new IndexIterator();
-
- KeyIterator() { }
-
- public boolean hasNext() {
- return iterator.hasNext();
- }
-
- public int next() {
- return keys[iterator.next()];
- }
-
- public void remove() {
- iterator.remove();
- }
- }
-
- /**
- * Default capacity - in case no capacity was specified in the constructor
- */
- private static int defaultCapacity = 16;
-
- /**
- * Holds the base hash entries. if the capacity is 2^N, than the base hash
- * holds 2^(N+1). It can hold
- */
- int[] baseHash;
-
- /**
- * The current capacity of the map. Always 2^N and never less than 16. We
- * never use the zero index. It is needed to improve performance and is also
- * used as "ground".
- */
- private int capacity;
-
- /**
- * All objects are being allocated at map creation. Those objects are "free"
- * or empty. Whenever a new pair comes along, a pair is being "allocated" or
- * taken from the free-linked list. as this is just a free list.
- */
- private int firstEmpty;
-
- /**
- * hashFactor is always (2^(N+1)) - 1. Used for faster hashing.
- */
- private int hashFactor;
-
- /**
- * This array holds the unique keys
- */
- int[] keys;
-
- /**
- * In case of collisions, we implement a double linked list of the colliding
- * hash's with the following next[] and prev[]. Those are also used to store
- * the "empty" list.
- */
- int[] next;
-
- private int prev;
-
- /**
- * Number of currently objects in the map.
- */
- private int size;
-
- /**
- * Constructs a map with default capacity.
- */
- public IntHashSet() {
- this(defaultCapacity);
- }
-
- /**
- * Constructs a map with given capacity. Capacity is adjusted to a native
- * power of 2, with minimum of 16.
- *
- * @param capacity
- * minimum capacity for the map.
- */
- public IntHashSet(int capacity) {
- this.capacity = 16;
- // Minimum capacity is 16..
- while (this.capacity < capacity) {
- // Multiply by 2 as long as we're still under the requested capacity
- this.capacity <<= 1;
- }
-
- // As mentioned, we use the first index (0) as 'Ground', so we need the
- // length of the arrays to be one more than the capacity
- int arrayLength = this.capacity + 1;
-
- this.keys = new int[arrayLength];
- this.next = new int[arrayLength];
-
- // Hash entries are twice as big as the capacity.
- int baseHashSize = this.capacity << 1;
-
- this.baseHash = new int[baseHashSize];
-
- // The has factor is 2^M - 1 which is used as an "AND" hashing operator.
- // {@link #calcBaseHash()}
- this.hashFactor = baseHashSize - 1;
-
- this.size = 0;
-
- clear();
- }
-
- /**
- * Adds a pair to the map. Takes the first empty position from the
- * empty-linked-list's head - {@link firstEmpty}.
- *
- * New pairs are always inserted to baseHash, and are followed by the old
- * colliding pair.
- *
- * @param key
- * integer which maps the given value
- * @param e
- * value which is being mapped using the given key
- */
- private void prvt_add(int key) {
- // Hash entry to which the new pair would be inserted
- int hashIndex = calcBaseHashIndex(key);
-
- // 'Allocating' a pair from the "Empty" list.
- int objectIndex = firstEmpty;
-
- // Setting data
- firstEmpty = next[firstEmpty];
- keys[objectIndex] = key;
-
- // Inserting the new pair as the first node in the specific hash entry
- next[objectIndex] = baseHash[hashIndex];
- baseHash[hashIndex] = objectIndex;
-
- // Announcing a new pair was added!
- ++size;
- }
-
- /**
- * Calculating the baseHash index using the internal <code>hashFactor</code>
- * .
- *
- * @param key
- */
- protected int calcBaseHashIndex(int key) {
- return key & hashFactor;
- }
-
- /**
- * Empties the map. Generates the "Empty" space list for later allocation.
- */
- public void clear() {
- // Clears the hash entries
- Arrays.fill(this.baseHash, 0);
-
- // Set size to zero
- size = 0;
-
- // Mark all array entries as empty. This is done with
- // <code>firstEmpty</code> pointing to the first valid index (1 as 0 is
- // used as 'Ground').
- firstEmpty = 1;
-
- // And setting all the <code>next[i]</code> to point at
- // <code>i+1</code>.
- for (int i = 1; i < this.capacity;) {
- next[i] = ++i;
- }
-
- // Surly, the last one should point to the 'Ground'.
- next[this.capacity] = 0;
- }
-
- /**
- * Checks if a given key exists in the map.
- *
- * @param value
- * that is checked against the map data.
- * @return true if the key exists in the map. false otherwise.
- */
- public boolean contains(int value) {
- return find(value) != 0;
- }
-
- /**
- * Find the actual index of a given key.
- *
- * @param key
- * @return index of the key. zero if the key wasn't found.
- */
- protected int find(int key) {
- // Calculate the hash entry.
- int baseHashIndex = calcBaseHashIndex(key);
-
- // Start from the hash entry.
- int localIndex = baseHash[baseHashIndex];
-
- // while the index does not point to the 'Ground'
- while (localIndex != 0) {
- // returns the index found in case of of a matching key.
- if (keys[localIndex] == key) {
- return localIndex;
- }
-
- // next the local index
- localIndex = next[localIndex];
- }
-
- // If we got this far, it could only mean we did not find the key we
- // were asked for. return 'Ground' index.
- return 0;
- }
-
- /**
- * Find the actual index of a given key with it's baseHashIndex.<br>
- * Some methods use the baseHashIndex. If those call {@link #find()} there's
- * no need to re-calculate that hash.
- *
- * @param key
- * @param baseHashIndex
- * @return the index of the given key, or 0 as 'Ground' if the key wasn't
- * found.
- */
- private int findForRemove(int key, int baseHashIndex) {
- // Start from the hash entry.
- this.prev = 0;
- int index = baseHash[baseHashIndex];
-
- // while the index does not point to the 'Ground'
- while (index != 0) {
- // returns the index found in case of of a matching key.
- if (keys[index] == key) {
- return index;
- }
-
- // next the local index
- prev = index;
- index = next[index];
- }
-
- // If we got this far, it could only mean we did not find the key we
- // were asked for. return 'Ground' index.
- this.prev = 0;
- return 0;
- }
-
- /**
- * Grows the map. Allocates a new map of double the capacity, and
- * fast-insert the old key-value pairs.
- */
- protected void grow() {
- IntHashSet that = new IntHashSet(this.capacity * 2);
-
- // Iterates fast over the collection. Any valid pair is put into the new
- // map without checking for duplicates or if there's enough space for
- // it.
- for (IndexIterator iterator = new IndexIterator(); iterator.hasNext();) {
- int index = iterator.next();
- that.prvt_add(this.keys[index]);
- }
- // for (int i = capacity; i > 0; --i) {
- //
- // that._add(this.keys[i]);
- //
- // }
-
- // Copy that's data into this.
- this.capacity = that.capacity;
- this.size = that.size;
- this.firstEmpty = that.firstEmpty;
- this.keys = that.keys;
- this.next = that.next;
- this.baseHash = that.baseHash;
- this.hashFactor = that.hashFactor;
- }
-
- /**
- *
- * @return true if the map is empty. false otherwise.
- */
- public boolean isEmpty() {
- return size == 0;
- }
-
- /**
- * Returns a new iterator for the mapped objects.
- */
- public IntIterator iterator() {
- return new KeyIterator();
- }
-
- /**
- * Prints the baseHash array, used for debug purposes.
- */
- public void printBaseHash() {
- for (int i = 0; i < this.baseHash.length; i++) {
- if (baseHash[i] != 0) {
- System.out.println(i + ".\t" + baseHash[i]);
- }
- }
- }
-
- /**
- * Add a mapping int key -> int value.
- * <p>
- * If the key was already inside just
- * updating the value it refers to as the given object.
- * <p>
- * Otherwise if the map is full, first {@link #grow()} the map.
- *
- * @param value
- * integer which maps the given value
- * @return true always.
- */
- public boolean add(int value) {
- // Does key exists?
- int index = find(value);
-
- // Yes!
- if (index != 0) {
- return true;
- }
-
- // Is there enough room for a new pair?
- if (size == capacity) {
- // No? Than grow up!
- grow();
- }
-
- // Now that everything is set, the pair can be just put inside with no
- // worries.
- prvt_add(value);
-
- return true;
- }
-
- /**
- * Remove a pair from the map, specified by it's key.
- *
- * @param value
- * specify the value to be removed
- *
- * @return true if the map was changed (the key was found and removed).
- * false otherwise.
- */
- public boolean remove(int value) {
- int baseHashIndex = calcBaseHashIndex(value);
- int index = findForRemove(value, baseHashIndex);
- if (index != 0) {
- // If it is the first in the collision list, we should promote its
- // next colliding element.
- if (prev == 0) {
- baseHash[baseHashIndex] = next[index];
- }
-
- next[prev] = next[index];
- next[index] = firstEmpty;
- firstEmpty = index;
- --size;
- return true;
- }
-
- return false;
- }
-
- /**
- * @return number of pairs currently in the map
- */
- public int size() {
- return this.size;
- }
-
- /**
- * Translates the mapped pairs' values into an array of Objects
- *
- * @return an object array of all the values currently in the map.
- */
- public int[] toArray() {
- int j = -1;
- int[] array = new int[size];
-
- // Iterates over the values, adding them to the array.
- for (IntIterator iterator = iterator(); iterator.hasNext();) {
- array[++j] = iterator.next();
- }
- return array;
- }
-
- /**
- * Translates the mapped pairs' values into an array of ints
- *
- * @param a
- * the array into which the elements of the map are to be stored,
- * if it is big enough; otherwise, a new array of the same
- * runtime type is allocated for this purpose.
- *
- * @return an array containing the values stored in the map
- *
- */
- public int[] toArray(int[] a) {
- int j = 0;
- if (a.length < size) {
- a = new int[size];
- }
- // Iterates over the values, adding them to the array.
- for (IntIterator iterator = iterator(); j < a.length
- && iterator.hasNext(); ++j) {
- a[j] = iterator.next();
- }
- return a;
- }
-
- /**
- * I have no idea why would anyone call it - but for debug purposes.<br>
- * Prints the entire map, including the index, key, object, next and prev.
- */
- @Override
- public String toString() {
- StringBuffer sb = new StringBuffer();
- sb.append('{');
- IntIterator iterator = iterator();
- while (iterator.hasNext()) {
- sb.append(iterator.next());
- if (iterator.hasNext()) {
- sb.append(',');
- sb.append(' ');
- }
- }
- sb.append('}');
- return sb.toString();
- }
-
- public String toHashString() {
- String string = "\n";
- StringBuffer sb = new StringBuffer();
-
- for (int i = 0; i < this.baseHash.length; i++) {
- StringBuffer sb2 = new StringBuffer();
- boolean shouldAppend = false;
- sb2.append(i + ".\t");
- for (int index = baseHash[i]; index != 0; index = next[index]) {
- sb2.append(" -> " + keys[index] + "@" + index);
- shouldAppend = true;
- }
- if (shouldAppend) {
- sb.append(sb2);
- sb.append(string);
- }
- }
-
- return sb.toString();
- }
-}
\ No newline at end of file