/* * Copyright Elasticsearch B.V. and/or licensed to Elasticsearch B.V. under one * or more contributor license agreements. Licensed under the "Elastic License * 2.0", the "GNU Affero General Public License v3.0 only", and the "Server Side * Public License v 1"; you may not use this file except in compliance with, at * your election, the "Elastic License 2.0", the "GNU Affero General Public * License v3.0 only", or the "Server Side Public License, v 1". */ package org.elasticsearch.index.codec.tsdb; import org.apache.lucene.store.DataInput; import org.apache.lucene.store.DataOutput; import org.apache.lucene.util.MathUtil; import org.apache.lucene.util.packed.PackedInts; import java.io.IOException; import java.util.Arrays; /** * This class provides encoding and decoding of doc values using the following schemes: *

* delta encoding: encodes numeric fields by storing the initial value and the difference between each value and the one
* preceding it. Delta values normally require far fewer bits than the original 32 or 64 bits.
*
* offset encoding: encodes numeric fields by storing values in the range [0, max - min] instead of [min, max]. Reducing the
* range makes delta encoding much more effective since numbers in the range [0, max - min] require fewer bits than values in
* the range [min, max].
*
* gcd encoding: encodes numeric fields by storing values divided by their Greatest Common Divisor. Dividing values by their
* GCD reduces their magnitude, which makes delta encoding much more effective because smaller numbers require fewer bits to
* represent.
*
* (f)or encoding: computes the bitwise OR of all values in the block to determine how many bits the widest value needs and then
* bit-packs every value using that number of bits. Values whose higher bits are all zero after the previous steps therefore
* require fewer bits.
*

*
* Notice that encoding and decoding are written in a nested way, for instance {@link TSDBDocValuesEncoder#deltaEncode} calling
* {@link TSDBDocValuesEncoder#removeOffset} and so on. This allows us to easily introduce new encoding schemes or remove existing
* (non-effective) encoding schemes in a backward-compatible way.
*
* A token is used as a bitmask to represent which encoding is applied and allows us to detect the applied encoding scheme at decoding time.
* This encoding and decoding scheme is meant to work on blocks of 128 values. Larger block sizes incur a decoding penalty when random
* access to doc values is required since a full block must be decoded.
*
* Of course, decoding follows the opposite order with respect to encoding.
*/
public class TSDBDocValuesEncoder {
    private final DocValuesForUtil forUtil;
    private final int numericBlockSize;

    /**
     * Creates an encoder that works on blocks of exactly {@code numericBlockSize} values.
     *
     * @param numericBlockSize number of values in every block handed to the encode and decode methods
     */
    public TSDBDocValuesEncoder(int numericBlockSize) {
        this.forUtil = new DocValuesForUtil(numericBlockSize);
        this.numericBlockSize = numericBlockSize;
    }

    /**
     * Delta-encode monotonic fields. This is typically helpful with near-primary sort fields or
     * SORTED_NUMERIC/SORTED_SET doc values with many values per document.
     * <p>
     * Delta compression is only applied when the block never decreases and increases at least twice, or never
     * increases and decreases at least twice. The stage appends one flag bit to {@code token}, delegates to
     * {@link #removeOffset} and, when delta compression was applied, writes its metadata after the nested call returns.
     *
     * @param token     flag bits accumulated by the previous stages
     * @param tokenBits number of flag bits already stored in {@code token}
     * @param in        block of values; modified in place
     * @param out       destination of the encoded block
     * @throws IOException if writing to {@code out} fails
     */
    private void deltaEncode(int token, int tokenBits, long[] in, DataOutput out) throws IOException {
        int gts = 0;
        int lts = 0;
        for (int i = 1; i < numericBlockSize; ++i) {
            if (in[i] > in[i - 1]) {
                gts++;
            } else if (in[i] < in[i - 1]) {
                lts++;
            }
        }

        final boolean doDeltaCompression = (gts == 0 && lts >= 2) || (lts == 0 && gts >= 2);
        long first = 0;
        if (doDeltaCompression) {
            // iterate backwards so that in[i - 1] still holds the original value when it is subtracted
            for (int i = numericBlockSize - 1; i > 0; --i) {
                in[i] -= in[i - 1];
            }
            // Avoid setting in[0] to 0 in case there is a minimum interval between
            // consecutive values. This might later help compress data using fewer
            // bits per value.
            // in[0] takes the value of the first delta; the decoder adds `first` back to recover the original in[0].
            first = in[0] - in[1];
            in[0] = in[1];
            token = (token << 1) | 0x01;
        } else {
            token <<= 1;
        }
        removeOffset(token, tokenBits + 1, in, out);
        if (doDeltaCompression) {
            out.writeZLong(first);
        }
    }

    /**
     * Subtracts the block minimum from every value when doing so is expected to save bits, appends one flag bit to
     * {@code token}, delegates to {@link #gcdEncode} and, when an offset was removed, writes it after the nested call returns.
     *
     * @param token     flag bits accumulated by the previous stages
     * @param tokenBits number of flag bits already stored in {@code token}
     * @param in        block of values; modified in place
     * @param out       destination of the encoded block
     * @throws IOException if writing to {@code out} fails
     */
    private void removeOffset(int token, int tokenBits, long[] in, DataOutput out) throws IOException {
        long min = Long.MAX_VALUE;
        long max = Long.MIN_VALUE;
        for (long l : in) {
            min = Math.min(l, min);
            max = Math.max(l, max);
        }

        if (max - min < 0) {
            // overflow
            min = 0;
        } else if (min > 0 && min < (max >>> 2)) {
            // removing the offset is unlikely going to help save bits per value, yet it makes decoding
            // slower
            min = 0;
        }

        // from here on, min == 0 means "no offset removed"
        if (min != 0) {
            for (int i = 0; i < numericBlockSize; ++i) {
                in[i] -= min;
            }
            token = (token << 1) | 0x01;
        } else {
            token <<= 1;
        }
        gcdEncode(token, tokenBits + 1, in, out);
        if (min != 0) {
            out.writeZLong(min);
        }
    }

    /**
     * See if numbers have a common divisor. This is typically helpful for integer values in
     * floats/doubles or dates that don't have millisecond accuracy.
     * <p>
     * Appends one flag bit to {@code token}, delegates to {@link #forEncode} and, when a divisor was factored out,
     * writes {@code gcd - 2} after the nested call returns.
     *
     * @param token     flag bits accumulated by the previous stages
     * @param tokenBits number of flag bits already stored in {@code token}
     * @param in        block of values; modified in place
     * @param out       destination of the encoded block
     * @throws IOException if writing to {@code out} fails
     */
    private void gcdEncode(int token, int tokenBits, long[] in, DataOutput out) throws IOException {
        long gcd = 0;
        for (long l : in) {
            gcd = MathUtil.gcd(gcd, l);
            if (gcd == 1) {
                // no common divisor can be found anymore
                break;
            }
        }
        // NOTE(review): the unsigned comparison presumably guards against a negative result from MathUtil.gcd - confirm
        final boolean doGcdCompression = Long.compareUnsigned(gcd, 1) > 0;
        if (doGcdCompression) {
            for (int i = 0; i < numericBlockSize; ++i) {
                in[i] /= gcd;
            }
            token = (token << 1) | 0x01;
        } else {
            token <<= 1;
        }

        forEncode(token, tokenBits + 1, in, out);
        if (doGcdCompression) {
            // a gcd of 0 or 1 is never written, so the stored value is shifted down by 2; the decoder adds 2 back
            out.writeVLong(gcd - 2);
        }
    }

    /**
     * Writes the block header followed by the values packed by {@link DocValuesForUtil}.
     * <p>
     * The header is a vint holding the number of bits per value in its upper bits and {@code token} in its lowest
     * {@code tokenBits} bits. When every value is zero the number of bits per value is 0 and nothing but the header is written.
     *
     * @param token     flag bits accumulated by the previous stages
     * @param tokenBits number of flag bits stored in {@code token}
     * @param in        block of values to write
     * @param out       destination of the encoded block
     * @throws IOException if writing to {@code out} fails
     */
    private void forEncode(int token, int tokenBits, long[] in, DataOutput out) throws IOException {
        // OR-ing all values yields a number whose highest set bit is the highest set bit of any value
        long or = 0;
        for (long l : in) {
            or |= l;
        }

        int bitsPerValue = or == 0 ? 0 : DocValuesForUtil.roundBits(PackedInts.unsignedBitsRequired(or));
        out.writeVInt((bitsPerValue << tokenBits) | token);
        if (bitsPerValue > 0) {
            forUtil.encode(in, bitsPerValue, out);
        }
    }

    /**
     * Encode the given longs using a combination of delta-coding, GCD factorization and bit packing.
     *
     * @param in  block of values, expected to hold exactly the configured block size; modified in place
     * @param out destination of the encoded block
     * @throws IOException if writing to {@code out} fails
     */
    public void encode(long[] in, DataOutput out) throws IOException {
        assert in.length == numericBlockSize;

        deltaEncode(0, 0, in, out);
    }

    /**
     * Optimizes for encoding sorted fields where we expect a block to mostly either be the same value
     * or to make a transition from one value to a second one.
     * <p>
     * The header is a vlong where the number of trailing ones defines the encoding strategy:
     * <ul>
     *   <li>0: single run</li>
     *   <li>1: two runs</li>
     *   <li>2: bit-packed</li>
     *   <li>3: cycle</li>
     * </ul>
     *
     * @param in         block of ordinals, expected to hold exactly the configured block size
     * @param out        destination of the encoded block
     * @param bitsPerOrd number of bits used per ordinal when the block is bit-packed; also decides whether the
     *                   first ordinal can share the header vlong with the strategy bits
     * @throws IOException if writing to {@code out} fails
     */
    public void encodeOrdinals(long[] in, DataOutput out, int bitsPerOrd) throws IOException {
        assert in.length == numericBlockSize;
        int numRuns = 1;
        long firstValue = in[0];
        long previousValue = firstValue;
        boolean cyclic = false;
        // 0: no candidate yet, -1: cycles ruled out, otherwise the candidate cycle length
        int cycleLength = 0;
        for (int i = 1; i < in.length; ++i) {
            long currentValue = in[i];
            if (previousValue != currentValue) {
                numRuns++;
            }
            if (currentValue == firstValue && cycleLength != -1) {
                if (cycleLength == 0) {
                    // first candidate cycle detected
                    cycleLength = i;
                } else if (cycleLength == 1 || i % cycleLength != 0) {
                    // if the first two values are the same this isn't a cycle, it might be a run, though
                    // this also isn't a cycle if the index of the next occurrence of the first value
                    // isn't a multiple of the candidate cycle length
                    // we can stop looking for cycles now
                    cycleLength = -1;
                }
            }
            previousValue = currentValue;
        }
        // if the cycle is too long, bit-packing may be more space efficient
        int maxCycleLength = in.length / 4;
        if (numRuns > 2 && cycleLength > 1 && cycleLength <= maxCycleLength) {
            // the scan above only looked at occurrences of the first value; verify the whole block repeats
            cyclic = true;
            for (int i = cycleLength; i < in.length; ++i) {
                if (in[i] != in[i - cycleLength]) {
                    cyclic = false;
                    break;
                }
            }
        }
        if (numRuns == 1 && bitsPerOrd < 63) {
            long value = in[0];
            // unset first bit (0 trailing ones) to indicate the block has a single run
            out.writeVLong(value << 1);
        } else if (numRuns == 2 && bitsPerOrd < 62) {
            // set 1 trailing bit to indicate the block has two runs
            out.writeVLong((in[0] << 2) | 0b01);
            int firstRunLen = in.length;
            for (int i = 1; i < in.length; ++i) {
                if (in[i] != in[0]) {
                    firstRunLen = i;
                    break;
                }
            }
            out.writeVInt(firstRunLen);
            // the second run is stored as its difference to the first one
            out.writeZLong(in[in.length - 1] - in[0]);
        } else if (cyclic) {
            // set 3 trailing bits to indicate the block cycles through the same values
            long headerAndCycleLength = ((long) cycleLength << 4) | 0b0111;
            out.writeVLong(headerAndCycleLength);
            for (int i = 0; i < cycleLength; i++) {
                out.writeVLong(in[i]);
            }
        } else {
            // set 2 trailing bits to indicate the block is bit-packed
            out.writeVLong(0b11);
            forUtil.encode(in, bitsPerOrd, out);
        }
    }

    /**
     * Decode ordinals that have been encoded with {@link #encodeOrdinals}.
     *
     * @param in         source positioned at the start of an encoded block
     * @param out        receives the decoded ordinals; expected to hold exactly the configured block size
     * @param bitsPerOrd number of bits per ordinal, used when the block is bit-packed
     * @throws IOException if reading from {@code in} fails, or if the header carries an unknown encoding or a cycle
     *                     length outside of {@code [1, out.length]}
     */
    public void decodeOrdinals(DataInput in, long[] out, int bitsPerOrd) throws IOException {
        assert out.length == numericBlockSize : out.length;

        long v1 = in.readVLong();
        // the number of trailing ones selects the strategy
        int encoding = Long.numberOfTrailingZeros(~v1);
        // drop the trailing ones and the zero bit terminating them
        v1 >>>= encoding + 1;
        if (encoding == 0) {
            // single run
            Arrays.fill(out, v1);
        } else if (encoding == 1) {
            // two runs
            int runLen = in.readVInt();
            long v2 = v1 + in.readZLong();
            Arrays.fill(out, 0, runLen, v1);
            Arrays.fill(out, runLen, out.length, v2);
        } else if (encoding == 2) {
            // bit-packed
            forUtil.decode(bitsPerOrd, in, out);
        } else if (encoding == 3) {
            // cycle encoding
            // a cycle length of 0 would make the doubling loop below spin forever, reject it up front together
            // with lengths that do not fit in the block
            if (v1 < 1 || v1 > out.length) {
                throw new IOException("invalid cycle length [" + v1 + "] for a block of [" + out.length + "] ordinals");
            }
            int cycleLength = (int) v1;
            for (int i = 0; i < cycleLength; i++) {
                out[i] = in.readVLong();
            }
            // replicate the decoded prefix, doubling the filled region on every iteration
            int length = cycleLength;
            while (length < out.length) {
                int copyLength = Math.min(length, out.length - length);
                System.arraycopy(out, 0, out, length, copyLength);
                length += copyLength;
            }
        } else {
            // the encoder never writes more than three trailing ones; fail instead of returning stale data
            throw new IOException("unknown ordinal block encoding [" + encoding + "]");
        }
    }

    /**
     * Decode longs that have been encoded with {@link #encode}.
     *
     * @param in  source positioned at the start of an encoded block
     * @param out receives the decoded values; expected to hold exactly the configured block size
     * @throws IOException if reading from {@code in} fails
     */
    public void decode(DataInput in, long[] out) throws IOException {
        assert out.length == numericBlockSize : out.length;

        final int token = in.readVInt();
        // the three lowest bits are the flags set by the gcd, offset and delta stages
        final int bitsPerValue = token >>> 3;

        if (bitsPerValue != 0) {
            forUtil.decode(bitsPerValue, in, out);
        } else {
            Arrays.fill(out, 0L);
        }

        // simple blocks that only perform bit packing exit early here
        // this is typical for SORTED(_SET) ordinals
        if ((token & 0x07) != 0) {

            // the transforms are undone in the reverse order of their application
            final boolean doGcdCompression = (token & 0x01) != 0;
            if (doGcdCompression) {
                final long gcd = 2 + in.readVLong();
                mul(out, gcd);
            }

            final boolean hasOffset = (token & 0x02) != 0;
            if (hasOffset) {
                final long min = in.readZLong();
                add(out, min);
            }

            final boolean doDeltaCompression = (token & 0x04) != 0;
            if (doDeltaCompression) {
                final long first = in.readZLong();
                out[0] += first;
                deltaDecode(out);
            }
        }
    }

    /** Multiplies every value of the block by {@code m}. */
    // this loop should auto-vectorize
    private void mul(long[] arr, long m) {
        for (int i = 0; i < numericBlockSize; ++i) {
            arr[i] *= m;
        }
    }

    /** Adds {@code min} to every value of the block. */
    // this loop should auto-vectorize
    private void add(long[] arr, long min) {
        for (int i = 0; i < numericBlockSize; ++i) {
            arr[i] += min;
        }
    }

    /** Replaces every value of the block with the running sum of the values up to and including it. */
    private void deltaDecode(long[] arr) {
        for (int i = 1; i < numericBlockSize; ++i) {
            arr[i] += arr[i - 1];
        }
    }
}