--- /dev/null
+package org.apache.lucene.util.encoding;
+
+import java.io.IOException;
+import java.io.OutputStream;
+
+/**
+ * Licensed to the Apache Software Foundation (ASF) under one or more
+ * contributor license agreements. See the NOTICE file distributed with
+ * this work for additional information regarding copyright ownership.
+ * The ASF licenses this file to You under the Apache License, Version 2.0
+ * (the "License"); you may not use this file except in compliance with
+ * the License. You may obtain a copy of the License at
+ *
+ * http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+/**
+ * A variation of {@link FourFlagsIntEncoder} which translates the data as
+ * follows:
+ * <ul>
+ * <li>Values ≥ 2 are trnalsated to <code>value+1</code> (2 ⇒ 3, 3
+ * ⇒ 4 and so forth).
+ * <li>Any <code>N</code> occurrences of 1 are encoded as a single 2.
+ * <li>Otherwise, each 1 is encoded as 1.
+ * </ul>
+ * <p>
+ * Encoding examples:
+ * <ul>
+ * <li>N = 4: the data 1,1,1,1,1 is translated to: 2, 1
+ * <li>N = 3: the data 1,2,3,4,1,1,1,1,5 is translated to 1,3,4,5,2,1,6
+ * </ul>
+ * <b>NOTE:</b> this encoder does not support values ≤ 0 and
+ * {@link Integer#MAX_VALUE}. 0 is not supported because it's not supported by
+ * {@link FourFlagsIntEncoder} and {@link Integer#MAX_VALUE} because this
+ * encoder translates N to N+1, which will cause an overflow and
+ * {@link Integer#MAX_VALUE} will become a negative number, which is not
+ * supported as well.<br>
+ * This does not mean you cannot encode {@link Integer#MAX_VALUE}. If it is not
+ * the first value to encode, and you wrap this encoder with
+ * {@link DGapIntEncoder}, then the value that will be sent to this encoder will
+ * be <code>MAX_VAL - prev</code>.
+ *
+ * @lucene.experimental
+ */
+public class NOnesIntEncoder extends FourFlagsIntEncoder {
+
+ /** Number of consecutive '1's to be translated into single target value '2'. */
+ private int n;
+
+ /** Counts the number of consecutive ones seen. */
+ private int onesCounter = 0;
+
+ /**
+ * Constructs an encoder with a given value of N (N: Number of consecutive
+ * '1's to be translated into single target value '2').
+ */
+ public NOnesIntEncoder(int n) {
+ this.n = n;
+ }
+
+ @Override
+ public void close() throws IOException {
+ // We might have ones in our buffer, encode them as neccesary.
+ while (onesCounter-- > 0) {
+ super.encode(1);
+ }
+
+ super.close();
+ }
+
+ @Override
+ public void encode(int value) throws IOException {
+ if (value == 1) {
+ // Increment the number of consecutive ones seen so far
+ if (++onesCounter == n) {
+ super.encode(2);
+ onesCounter = 0;
+ }
+ return;
+ }
+
+ // If it's not one - there might have been ones we had to encode prior to
+ // this value
+ while (onesCounter > 0) {
+ --onesCounter;
+ super.encode(1);
+ }
+
+ // encode value + 1 --> the translation.
+ super.encode(value + 1);
+ }
+
+ @Override
+ public IntDecoder createMatchingDecoder() {
+ return new NOnesIntDecoder(n);
+ }
+
+ @Override
+ public void reInit(OutputStream out) {
+ super.reInit(out);
+ onesCounter = 0;
+ }
+
+ @Override
+ public String toString() {
+ return "NOnes (" + n + ") (" + super.toString() + ")";
+ }
+
+}