/* * Copyright (c) 2017, 2025, Oracle and/or its affiliates. All rights reserved. * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. * * This code is free software; you can redistribute it and/or modify it * under the terms of the GNU General Public License version 2 only, as * published by the Free Software Foundation. Oracle designates this * particular file as subject to the "Classpath" exception as provided * by Oracle in the LICENSE file that accompanied this code. * * This code is distributed in the hope that it will be useful, but WITHOUT * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License * version 2 for more details (a copy is included in the LICENSE file that * accompanied this code). * * You should have received a copy of the GNU General Public License version * 2 along with this work; if not, write to the Free Software Foundation, * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA. * * Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA * or visit www.oracle.com if you need additional information or have any * questions. */ package jdk.incubator.vector; import java.lang.foreign.MemorySegment; import java.lang.foreign.ValueLayout; import java.nio.ByteOrder; import java.util.Arrays; import java.util.Objects; import java.util.function.Function; import jdk.internal.foreign.AbstractMemorySegmentImpl; import jdk.internal.misc.ScopedMemoryAccess; import jdk.internal.misc.Unsafe; import jdk.internal.vm.annotation.ForceInline; import jdk.internal.vm.vector.VectorSupport; import static jdk.internal.vm.vector.VectorSupport.*; import static jdk.incubator.vector.VectorIntrinsics.*; import static jdk.incubator.vector.VectorOperators.*; // -- This file was mechanically generated: Do not edit! -- // /** * A specialized {@link Vector} representing an ordered immutable sequence of * {@code byte} values. 
*/
@SuppressWarnings("cast")  // warning: redundant cast
public abstract class ByteVector extends AbstractVector {

    // Hands the backing lane array to the superclass constructor.
    ByteVector(byte[] vec) {
        super(vec);
    }

    // Operator-kind bits passed to VectorOperators.opCode as the
    // "forbidden" kind by both opCode overloads below.
    static final int FORBID_OPCODE_KIND = VO_ONLYFP;

    // JAVA_BYTE layout with byte alignment 1.
    static final ValueLayout.OfByte ELEMENT_LAYOUT = ValueLayout.JAVA_BYTE.withByteAlignment(1);

    // Resolves the opcode for op, requiring VO_OPCODE_VALID and
    // forbidding FORBID_OPCODE_KIND.
    @ForceInline
    static int opCode(Operator op) {
        return VectorOperators.opCode(op, VO_OPCODE_VALID, FORBID_OPCODE_KIND);
    }

    // Same as opCode(op), but the caller's requireKind bits are
    // OR-ed with VO_OPCODE_VALID before the lookup.
    @ForceInline
    static int opCode(Operator op, int requireKind) {
        requireKind |= VO_OPCODE_VALID;
        return VectorOperators.opCode(op, requireKind, FORBID_OPCODE_KIND);
    }

    // Thin forwarder to VectorOperators.opKind(op, bit).
    @ForceInline
    static boolean opKind(Operator op, int bit) {
        return VectorOperators.opKind(op, bit);
    }

    // Virtualized factories and operators,
    // coded with portable definitions.
    // These are all @ForceInline in case
    // they need to be used performantly.
    // The various shape-specific subclasses
    // also specialize them by wrapping
    // them in a call like this:
    //    return (Byte128Vector)
    //       super.bOp((Byte128Vector) o);
    // The purpose of that is to forcibly inline
    // the generic definition from this file
    // into a sharply-typed and size-specific
    // wrapper in the subclass file, so that
    // the JIT can specialize the code.
    // The code is only inlined and expanded
    // if it gets hot.  Think of it as a cheap
    // and lazy version of C++ templates.

    // Virtualized getter

    /*package-private*/
    abstract byte[] vec();

    // Virtualized constructors

    /**
     * Build a vector directly using my own constructor.
     * It is an error if the array is aliased elsewhere.
     */
    /*package-private*/
    abstract ByteVector vectorFactory(byte[] vec);

    /**
     * Build a mask directly using my species.
     * It is an error if the array is aliased elsewhere.
*/
    /*package-private*/
    @ForceInline
    final
    AbstractMask maskFactory(boolean[] bits) {
        return vspecies().maskFactory(bits);
    }

    // Constant loader (takes dummy as vector arg)
    interface FVOp {
        byte apply(int i);
    }

    // Builds a new vector whose lane i holds f.apply(i).
    /*package-private*/
    @ForceInline
    final
    ByteVector vOp(FVOp f) {
        byte[] res = new byte[length()];
        for (int i = 0; i < res.length; i++) {
            res[i] = f.apply(i);
        }
        return vectorFactory(res);
    }

    // Masked variant: f is applied only for set lanes; unset lanes
    // keep the zero default of the freshly allocated array.
    @ForceInline
    final
    ByteVector vOp(VectorMask m, FVOp f) {
        byte[] res = new byte[length()];
        boolean[] mbits = ((AbstractMask)m).getBits();
        for (int i = 0; i < res.length; i++) {
            if (mbits[i]) {
                res[i] = f.apply(i);
            }
        }
        return vectorFactory(res);
    }

    // Unary operator

    /*package-private*/
    interface FUnOp {
        byte apply(int i, byte a);
    }

    /*package-private*/
    abstract
    ByteVector uOp(FUnOp f);

    // Lane i of the result is f.apply(i, vec[i]).
    @ForceInline
    final
    ByteVector uOpTemplate(FUnOp f) {
        byte[] vec = vec();
        byte[] res = new byte[length()];
        for (int i = 0; i < res.length; i++) {
            res[i] = f.apply(i, vec[i]);
        }
        return vectorFactory(res);
    }

    /*package-private*/
    abstract
    ByteVector uOp(VectorMask m,
                             FUnOp f);

    // Masked variant: a null mask means "unmasked"; unset lanes are
    // copied through from this vector unchanged.
    @ForceInline
    final
    ByteVector uOpTemplate(VectorMask m,
                                     FUnOp f) {
        if (m == null) {
            return uOpTemplate(f);
        }
        byte[] vec = vec();
        byte[] res = new byte[length()];
        boolean[] mbits = ((AbstractMask)m).getBits();
        for (int i = 0; i < res.length; i++) {
            res[i] = mbits[i] ? f.apply(i, vec[i]) : vec[i];
        }
        return vectorFactory(res);
    }

    // Binary operator

    /*package-private*/
    interface FBinOp {
        byte apply(int i, byte a, byte b);
    }

    /*package-private*/
    abstract
    ByteVector bOp(Vector o,
                             FBinOp f);

    // Lane i of the result is f.apply(i, this[i], o[i]).
    @ForceInline
    final
    ByteVector bOpTemplate(Vector o,
                                     FBinOp f) {
        byte[] res = new byte[length()];
        byte[] vec1 = this.vec();
        byte[] vec2 = ((ByteVector)o).vec();
        for (int i = 0; i < res.length; i++) {
            res[i] = f.apply(i, vec1[i], vec2[i]);
        }
        return vectorFactory(res);
    }

    /*package-private*/
    abstract
    ByteVector bOp(Vector o,
                             VectorMask m,
                             FBinOp f);

    // Masked variant: a null mask means "unmasked"; unset lanes keep
    // the lane value of this vector (the first operand).
    @ForceInline
    final
    ByteVector bOpTemplate(Vector o,
                                     VectorMask m,
                                     FBinOp f) {
        if (m == null) {
            return bOpTemplate(o, f);
        }
        byte[] res = new byte[length()];
        byte[] vec1 = this.vec();
        byte[] vec2 = ((ByteVector)o).vec();
        boolean[] mbits = ((AbstractMask)m).getBits();
        for (int i = 0; i < res.length; i++) {
            res[i] = mbits[i] ? f.apply(i, vec1[i], vec2[i]) : vec1[i];
        }
        return vectorFactory(res);
    }

    // Ternary operator

    /*package-private*/
    interface FTriOp {
        byte apply(int i, byte a, byte b, byte c);
    }

    /*package-private*/
    abstract
    ByteVector tOp(Vector o1,
                             Vector o2,
                             FTriOp f);

    // Lane i of the result is f.apply(i, this[i], o1[i], o2[i]).
    @ForceInline
    final
    ByteVector tOpTemplate(Vector o1,
                                     Vector o2,
                                     FTriOp f) {
        byte[] res = new byte[length()];
        byte[] vec1 = this.vec();
        byte[] vec2 = ((ByteVector)o1).vec();
        byte[] vec3 = ((ByteVector)o2).vec();
        for (int i = 0; i < res.length; i++) {
            res[i] = f.apply(i, vec1[i], vec2[i], vec3[i]);
        }
        return vectorFactory(res);
    }

    /*package-private*/
    abstract
    ByteVector tOp(Vector o1,
                             Vector o2,
                             VectorMask m,
                             FTriOp f);

    // Masked variant: a null mask means "unmasked"; unset lanes keep
    // the lane value of this vector (the first operand).
    @ForceInline
    final
    ByteVector tOpTemplate(Vector o1,
                                     Vector o2,
                                     VectorMask m,
                                     FTriOp f) {
        if (m == null) {
            return tOpTemplate(o1, o2, f);
        }
        byte[] res = new byte[length()];
        byte[] vec1 = this.vec();
        byte[] vec2 = ((ByteVector)o1).vec();
        byte[] vec3 = ((ByteVector)o2).vec();
        boolean[] mbits = ((AbstractMask)m).getBits();
        for (int i = 0; i < res.length; i++) {
            res[i] = mbits[i] ? f.apply(i, vec1[i], vec2[i], vec3[i]) : vec1[i];
        }
        return vectorFactory(res);
    }

    // Reduction operator

    /*package-private*/
    abstract
    byte rOp(byte v, VectorMask m, FBinOp f);

    // Folds the set lanes into v in ascending lane order; unset lanes
    // leave the accumulator untouched. A null mask means "unmasked".
    @ForceInline
    final
    byte rOpTemplate(byte v, VectorMask m, FBinOp f) {
        if (m == null) {
            return rOpTemplate(v, f);
        }
        byte[] vec = vec();
        boolean[] mbits = ((AbstractMask)m).getBits();
        for (int i = 0; i < vec.length; i++) {
            v = mbits[i] ? f.apply(i, v, vec[i]) : v;
        }
        return v;
    }

    // Folds every lane into v in ascending lane order.
    @ForceInline
    final
    byte rOpTemplate(byte v, FBinOp f) {
        byte[] vec = vec();
        for (int i = 0; i < vec.length; i++) {
            v = f.apply(i, v, vec[i]);
        }
        return v;
    }

    // Memory reference

    // M is the type of the memory object the lane values are read from.
    // The type parameter has to be declared here: without it the name M
    // used in apply() does not resolve.
    /*package-private*/
    interface FLdOp<M> {
        byte apply(M memory, int offset, int i);
    }

    // Builds a new vector whose lane i holds f.apply(memory, offset, i).
    /*package-private*/
    @ForceInline
    final
    <M> ByteVector ldOp(M memory, int offset,
                                  FLdOp<M> f) {
        //dummy; no vec = vec();
        byte[] res = new byte[length()];
        for (int i = 0; i < res.length; i++) {
            res[i] = f.apply(memory, offset, i);
        }
        return vectorFactory(res);
    }

    // Masked variant: f is invoked only for set lanes, so memory is not
    // touched for unset lanes; those lanes stay zero.
    /*package-private*/
    @ForceInline
    final
    <M> ByteVector ldOp(M memory, int offset,
                                  VectorMask m,
                                  FLdOp<M> f) {
        //byte[] vec = vec();
        byte[] res = new byte[length()];
        boolean[] mbits = ((AbstractMask)m).getBits();
        for (int i = 0; i < res.length; i++) {
            if (mbits[i]) {
                res[i] = f.apply(memory, offset, i);
            }
        }
        return vectorFactory(res);
    }

    /*package-private*/
    interface FLdLongOp {
        byte apply(MemorySegment memory, long offset, int i);
    }

    // MemorySegment/long-offset counterpart of ldOp.
    /*package-private*/
    @ForceInline
    final
    ByteVector ldLongOp(MemorySegment memory, long offset,
                                  FLdLongOp f) {
        //dummy; no vec = vec();
        byte[] res = new byte[length()];
        for (int i = 0; i < res.length; i++) {
            res[i] = f.apply(memory, offset, i);
        }
        return vectorFactory(res);
    }

    // Masked MemorySegment load: f is invoked only for set lanes.
    /*package-private*/
    @ForceInline
    final
    ByteVector ldLongOp(MemorySegment memory, long offset,
                                  VectorMask m,
                                  FLdLongOp f) {
        //byte[] vec = vec();
        byte[] res = new byte[length()];
        boolean[] mbits = ((AbstractMask)m).getBits();
        for (int i = 0; i < res.length; i++) {
            if (mbits[i]) {
                res[i] = f.apply(memory, offset, i);
            }
        }
        return vectorFactory(res);
    }

    // Reads the byte at offset o + i from ms using ELEMENT_LAYOUT.
    static byte memorySegmentGet(MemorySegment ms, long o, int i) {
        return ms.get(ELEMENT_LAYOUT, o + i * 1L);
    }

    // M is the type of the memory object the lane values are written to;
    // as with FLdOp, the type parameter must be declared for M to resolve.
    interface FStOp<M> {
        void apply(M memory, int offset, int i, byte a);
    }

    // Calls f.apply(memory, offset, i, vec[i]) for every lane i.
    /*package-private*/
    @ForceInline
    final
    <M> void stOp(M memory, int offset,
                  FStOp<M> f) {
        byte[] vec = vec();
        for (int i = 0; i < vec.length; i++) {
            f.apply(memory, offset, i, vec[i]);
        }
    }

    // Masked variant: f is invoked only for set lanes.
    /*package-private*/
    @ForceInline
    final
    <M> void stOp(M memory, int offset,
                  VectorMask m,
                  FStOp<M> f) {
        byte[] vec = vec();
        boolean[] mbits = ((AbstractMask)m).getBits();
        for (int i = 0; i < vec.length; i++) {
            if (mbits[i]) {
                f.apply(memory, offset, i, vec[i]);
            }
        }
    }

    interface FStLongOp {
        void apply(MemorySegment memory, long offset, int i, byte a);
    }

    // MemorySegment/long-offset counterpart of stOp.
    /*package-private*/
    @ForceInline
    final
    void stLongOp(MemorySegment memory, long offset,
                  FStLongOp f) {
        byte[] vec = vec();
        for (int i = 0; i < vec.length; i++) {
            f.apply(memory, offset, i, vec[i]);
        }
    }

    // Masked MemorySegment store: f is invoked only for set lanes.
    /*package-private*/
    @ForceInline
    final
    void stLongOp(MemorySegment memory, long offset,
                  VectorMask m,
                  FStLongOp f) {
        byte[] vec = vec();
        boolean[] mbits = ((AbstractMask)m).getBits();
        for (int i = 0; i < vec.length; i++) {
            if (mbits[i]) {
                f.apply(memory, offset, i, vec[i]);
            }
        }
    }

    // Writes e at offset o + i of ms using ELEMENT_LAYOUT.
    static void memorySegmentSet(MemorySegment ms, long o, int i, byte e) {
        ms.set(ELEMENT_LAYOUT, o + i * 1L, e);
    }

    // Binary test

    /*package-private*/
    interface FBinTest {
        boolean apply(int cond, int i, byte a, byte b);
    }

    // Builds a mask whose lane i is f.apply(cond, i, this[i], o[i]).
    /*package-private*/
    @ForceInline
    final
    AbstractMask bTest(int cond,
                                  Vector o,
                                  FBinTest f) {
        byte[] vec1 = vec();
        byte[] vec2 = ((ByteVector)o).vec();
        boolean[] bits = new boolean[length()];
        for (int i = 0; i < length(); i++){
            bits[i] = f.apply(cond, i, vec1[i], vec2[i]);
        }
        return maskFactory(bits);
    }

    // Rotates the 8 bits of a left by n; only the low three bits of n
    // are used (n & (Byte.SIZE - 1)). The lane is zero-extended first
    // so that sign bits cannot leak into the rotated result.
    /*package-private*/
    @ForceInline
    static byte rotateLeft(byte a, int n) {
        return (byte)(((((byte)a) & Byte.toUnsignedInt((byte)-1)) << (n & Byte.SIZE-1))
                | ((((byte)a) & Byte.toUnsignedInt((byte)-1)) >>> (Byte.SIZE - (n & Byte.SIZE-1))));
    }

    /*package-private*/
@ForceInline
    static byte rotateRight(byte a, int n) {
        // Zero-extend the lane and reduce the distance modulo the lane width.
        int laneBits = a & Byte.toUnsignedInt((byte) -1);
        int distance = n & (Byte.SIZE - 1);
        int low = laneBits >>> distance;
        int high = laneBits << (Byte.SIZE - distance);
        return (byte) (low | high);
    }

    /*package-private*/
    @Override
    abstract ByteSpecies vspecies();

    // Widens a lane value to long (sign-extending).
    /*package-private*/
    @ForceInline
    static long toBits(byte e) {
        long widened = e;
        return widened;
    }

    // Narrows a long back to a lane value, keeping the low 8 bits.
    /*package-private*/
    @ForceInline
    static byte fromBits(long bits) {
        byte narrowed = (byte) bits;
        return narrowed;
    }

    // Scatters the leading lanes of v, in order, into the lanes
    // selected by m; every other lane of the result is zero.
    static ByteVector expandHelper(Vector v, VectorMask m) {
        VectorSpecies species = m.vectorSpecies();
        ByteVector expanded = (ByteVector) species.zero();
        ByteVector source = (ByteVector) v;
        if (m.allTrue()) {
            return source;
        }
        int next = 0;  // next unconsumed source lane
        for (int lane = 0; lane < species.length(); lane++) {
            if (!m.laneIsSet(lane)) {
                continue;
            }
            expanded = expanded.withLane(lane, source.lane(next));
            next++;
        }
        return expanded;
    }

    // Gathers the lanes of v selected by m into the leading lanes
    // of the result, in order; the remaining lanes are zero.
    static ByteVector compressHelper(Vector v, VectorMask m) {
        VectorSpecies species = m.vectorSpecies();
        ByteVector compressed = (ByteVector) species.zero();
        ByteVector source = (ByteVector) v;
        if (m.allTrue()) {
            return source;
        }
        int next = 0;  // next free destination lane
        for (int lane = 0; lane < species.length(); lane++) {
            if (!m.laneIsSet(lane)) {
                continue;
            }
            compressed = compressed.withLane(next, source.lane(lane));
            next++;
        }
        return compressed;
    }

    // Each index lane is wrapped into [0, 2 * vlen) and then picks a
    // lane from src1 (wrapped index < vlen) or from src2 (otherwise).
    static ByteVector selectFromTwoVectorHelper(Vector indexes, Vector src1, Vector src2) {
        int vlen = indexes.length();
        byte[] selected = new byte[vlen];
        byte[] indexLanes = ((ByteVector) indexes).vec();
        byte[] firstLanes = ((ByteVector) src1).vec();
        byte[] secondLanes = ((ByteVector) src2).vec();
        for (int lane = 0; lane < vlen; lane++) {
            int wrapped = VectorIntrinsics.wrapToRange((int) indexLanes[lane], 2 * vlen);
            if (wrapped >= vlen) {
                selected[lane] = secondLanes[wrapped - vlen];
            } else {
                selected[lane] = firstLanes[wrapped];
            }
        }
        return ((ByteVector) src1).vectorFactory(selected);
    }

    // Static factories (other than memory operations)

    // Note: A surprising behavior in javadoc
    // sometimes makes a lone /** {@inheritDoc} */
    // comment drop the method altogether,
    // apparently if the method mentions a
    // parameter or return type of Vector<Byte>
    // instead of Vector<E> as originally specified.
// Adding an empty HTML fragment appears to
    // nudge javadoc into providing the desired
    // inherited documentation.  We use the HTML
    // comment for this.

    /**
     * Returns a vector of the given species
     * where all lane elements are set to
     * zero, the default primitive value.
     *
     * @param species species of the desired zero vector
     * @return a zero vector
     */
    @ForceInline
    public static ByteVector zero(VectorSpecies species) {
        ByteSpecies vsp = (ByteSpecies) species;
        // The bit pattern 0 is passed with MODE_BROADCAST; the trailing
        // lambda builds the same vector through rvOp, returning the
        // given bits for every lane.
        return VectorSupport.fromBitsCoerced(vsp.vectorType(), byte.class, species.length(),
                                0, MODE_BROADCAST, vsp,
                                ((bits_, s_) -> s_.rvOp(i -> bits_)));
    }

    /**
     * Returns a vector of the same species as this one
     * where all lane elements are set to
     * the primitive value {@code e}.
     *
     * The contents of the current vector are discarded;
     * only the species is relevant to this operation.
     *
     * <p> This method returns the value of this expression:
     * {@code ByteVector.broadcast(this.species(), e)}.
     *
     * @apiNote
     * Unlike the similar method named {@code broadcast()}
     * in the supertype {@code Vector}, this method does not
     * need to validate its argument, and cannot throw
     * {@code IllegalArgumentException}.  This method is
     * therefore preferable to the supertype method.
     *
     * @param e the value to broadcast
     * @return a vector where all lane elements are set to
     *         the primitive value {@code e}
     * @see #broadcast(VectorSpecies,long)
     * @see Vector#broadcast(long)
     * @see VectorSpecies#broadcast(long)
     */
    public abstract ByteVector broadcast(byte e);

    /**
     * Returns a vector of the given species
     * where all lane elements are set to
     * the primitive value {@code e}.
     *
     * @param species species of the desired vector
     * @param e the value to broadcast
     * @return a vector where all lane elements are set to
     *         the primitive value {@code e}
     * @see #broadcast(long)
     * @see Vector#broadcast(long)
     * @see VectorSpecies#broadcast(long)
     */
    @ForceInline
    public static ByteVector broadcast(VectorSpecies species, byte e) {
        ByteSpecies vsp = (ByteSpecies) species;
        return vsp.broadcast(e);
    }

    // Shared body for broadcast(byte): forwards to this vector's own
    // species.
    /*package-private*/
    @ForceInline
    final ByteVector broadcastTemplate(byte e) {
        ByteSpecies vsp = vspecies();
        return vsp.broadcast(e);
    }

    /**
     * {@inheritDoc}
     * @apiNote
     * When working with vector subtypes like {@code ByteVector},
     * {@linkplain #broadcast(byte) the more strongly typed method}
     * is typically selected.  It can be explicitly selected
     * using a cast: {@code v.broadcast((byte)e)}.
     * The two expressions will produce numerically identical results.
     */
    @Override
    public abstract ByteVector broadcast(long e);

    /**
     * Returns a vector of the given species
     * where all lane elements are set to
     * the primitive value {@code e}.
     *
     * The {@code long} value must be accurately representable
     * by the {@code ETYPE} of the vector species, so that
     * {@code e==(long)(ETYPE)e}.
* * @param species species of the desired vector * @param e the value to broadcast * @return a vector where all lane elements are set to * the primitive value {@code e} * @throws IllegalArgumentException * if the given {@code long} value cannot * be represented by the vector's {@code ETYPE} * @see #broadcast(VectorSpecies,byte) * @see VectorSpecies#checkValue(long) */ @ForceInline public static ByteVector broadcast(VectorSpecies species, long e) { ByteSpecies vsp = (ByteSpecies) species; return vsp.broadcast(e); } /*package-private*/ @ForceInline final ByteVector broadcastTemplate(long e) { return vspecies().broadcast(e); } // Unary lanewise support /** * {@inheritDoc} */ public abstract ByteVector lanewise(VectorOperators.Unary op); @ForceInline final ByteVector lanewiseTemplate(VectorOperators.Unary op) { if (opKind(op, VO_SPECIAL)) { if (op == ZOMO) { return blend(broadcast(-1), compare(NE, 0)); } else if (op == NOT) { return broadcast(-1).lanewise(XOR, this); } } int opc = opCode(op); return VectorSupport.unaryOp( opc, getClass(), null, byte.class, length(), this, null, UN_IMPL.find(op, opc, ByteVector::unaryOperations)); } /** * {@inheritDoc} */ @Override public abstract ByteVector lanewise(VectorOperators.Unary op, VectorMask m); @ForceInline final ByteVector lanewiseTemplate(VectorOperators.Unary op, Class> maskClass, VectorMask m) { m.check(maskClass, this); if (opKind(op, VO_SPECIAL)) { if (op == ZOMO) { return blend(broadcast(-1), compare(NE, 0, m)); } else if (op == NOT) { return lanewise(XOR, broadcast(-1), m); } } int opc = opCode(op); return VectorSupport.unaryOp( opc, getClass(), maskClass, byte.class, length(), this, m, UN_IMPL.find(op, opc, ByteVector::unaryOperations)); } private static final ImplCache>> UN_IMPL = new ImplCache<>(Unary.class, ByteVector.class); private static UnaryOperation> unaryOperations(int opc_) { switch (opc_) { case VECTOR_OP_NEG: return (v0, m) -> v0.uOp(m, (i, a) -> (byte) -a); case VECTOR_OP_ABS: return (v0, m) -> 
v0.uOp(m, (i, a) -> (byte) Math.abs(a)); case VECTOR_OP_BIT_COUNT: return (v0, m) -> v0.uOp(m, (i, a) -> (byte) bitCount(a)); case VECTOR_OP_TZ_COUNT: return (v0, m) -> v0.uOp(m, (i, a) -> (byte) numberOfTrailingZeros(a)); case VECTOR_OP_LZ_COUNT: return (v0, m) -> v0.uOp(m, (i, a) -> (byte) numberOfLeadingZeros(a)); case VECTOR_OP_REVERSE: return (v0, m) -> v0.uOp(m, (i, a) -> reverse(a)); case VECTOR_OP_REVERSE_BYTES: return (v0, m) -> v0.uOp(m, (i, a) -> a); default: return null; } } // Binary lanewise support /** * {@inheritDoc} * @see #lanewise(VectorOperators.Binary,byte) * @see #lanewise(VectorOperators.Binary,byte,VectorMask) */ @Override public abstract ByteVector lanewise(VectorOperators.Binary op, Vector v); @ForceInline final ByteVector lanewiseTemplate(VectorOperators.Binary op, Vector v) { ByteVector that = (ByteVector) v; that.check(this); if (opKind(op, VO_SPECIAL | VO_SHIFT)) { if (op == FIRST_NONZERO) { VectorMask mask = this.compare(EQ, (byte) 0); return this.blend(that, mask); } if (opKind(op, VO_SHIFT)) { // As per shift specification for Java, mask the shift count. // This allows the JIT to ignore some ISA details. that = that.lanewise(AND, SHIFT_MASK); } if (op == AND_NOT) { // FIXME: Support this in the JIT. 
that = that.lanewise(NOT); op = AND; } else if (op == DIV) { VectorMask eqz = that.eq((byte) 0); if (eqz.anyTrue()) { throw that.divZeroException(); } } } int opc = opCode(op); return VectorSupport.binaryOp( opc, getClass(), null, byte.class, length(), this, that, null, BIN_IMPL.find(op, opc, ByteVector::binaryOperations)); } /** * {@inheritDoc} * @see #lanewise(VectorOperators.Binary,byte,VectorMask) */ @Override public abstract ByteVector lanewise(VectorOperators.Binary op, Vector v, VectorMask m); @ForceInline final ByteVector lanewiseTemplate(VectorOperators.Binary op, Class> maskClass, Vector v, VectorMask m) { ByteVector that = (ByteVector) v; that.check(this); m.check(maskClass, this); if (opKind(op, VO_SPECIAL | VO_SHIFT)) { if (op == FIRST_NONZERO) { VectorMask mask = this.compare(EQ, (byte) 0, m); return this.blend(that, mask); } if (opKind(op, VO_SHIFT)) { // As per shift specification for Java, mask the shift count. // This allows the JIT to ignore some ISA details. that = that.lanewise(AND, SHIFT_MASK); } if (op == AND_NOT) { // FIXME: Support this in the JIT. 
that = that.lanewise(NOT); op = AND; } else if (op == DIV) { VectorMask eqz = that.eq((byte)0); if (eqz.and(m).anyTrue()) { throw that.divZeroException(); } // suppress div/0 exceptions in unset lanes that = that.lanewise(NOT, eqz); } } int opc = opCode(op); return VectorSupport.binaryOp( opc, getClass(), maskClass, byte.class, length(), this, that, m, BIN_IMPL.find(op, opc, ByteVector::binaryOperations)); } private static final ImplCache>> BIN_IMPL = new ImplCache<>(Binary.class, ByteVector.class); private static BinaryOperation> binaryOperations(int opc_) { switch (opc_) { case VECTOR_OP_ADD: return (v0, v1, vm) -> v0.bOp(v1, vm, (i, a, b) -> (byte)(a + b)); case VECTOR_OP_SUB: return (v0, v1, vm) -> v0.bOp(v1, vm, (i, a, b) -> (byte)(a - b)); case VECTOR_OP_MUL: return (v0, v1, vm) -> v0.bOp(v1, vm, (i, a, b) -> (byte)(a * b)); case VECTOR_OP_DIV: return (v0, v1, vm) -> v0.bOp(v1, vm, (i, a, b) -> (byte)(a / b)); case VECTOR_OP_MAX: return (v0, v1, vm) -> v0.bOp(v1, vm, (i, a, b) -> (byte)Math.max(a, b)); case VECTOR_OP_MIN: return (v0, v1, vm) -> v0.bOp(v1, vm, (i, a, b) -> (byte)Math.min(a, b)); case VECTOR_OP_AND: return (v0, v1, vm) -> v0.bOp(v1, vm, (i, a, b) -> (byte)(a & b)); case VECTOR_OP_OR: return (v0, v1, vm) -> v0.bOp(v1, vm, (i, a, b) -> (byte)(a | b)); case VECTOR_OP_XOR: return (v0, v1, vm) -> v0.bOp(v1, vm, (i, a, b) -> (byte)(a ^ b)); case VECTOR_OP_LSHIFT: return (v0, v1, vm) -> v0.bOp(v1, vm, (i, a, n) -> (byte)(a << n)); case VECTOR_OP_RSHIFT: return (v0, v1, vm) -> v0.bOp(v1, vm, (i, a, n) -> (byte)(a >> n)); case VECTOR_OP_URSHIFT: return (v0, v1, vm) -> v0.bOp(v1, vm, (i, a, n) -> (byte)((a & LSHR_SETUP_MASK) >>> n)); case VECTOR_OP_LROTATE: return (v0, v1, vm) -> v0.bOp(v1, vm, (i, a, n) -> rotateLeft(a, (int)n)); case VECTOR_OP_RROTATE: return (v0, v1, vm) -> v0.bOp(v1, vm, (i, a, n) -> rotateRight(a, (int)n)); case VECTOR_OP_UMAX: return (v0, v1, vm) -> v0.bOp(v1, vm, (i, a, b) -> (byte)VectorMath.maxUnsigned(a, b)); case 
VECTOR_OP_UMIN: return (v0, v1, vm) -> v0.bOp(v1, vm, (i, a, b) -> (byte)VectorMath.minUnsigned(a, b)); case VECTOR_OP_SADD: return (v0, v1, vm) -> v0.bOp(v1, vm, (i, a, b) -> (byte)(VectorMath.addSaturating(a, b))); case VECTOR_OP_SSUB: return (v0, v1, vm) -> v0.bOp(v1, vm, (i, a, b) -> (byte)(VectorMath.subSaturating(a, b))); case VECTOR_OP_SUADD: return (v0, v1, vm) -> v0.bOp(v1, vm, (i, a, b) -> (byte)(VectorMath.addSaturatingUnsigned(a, b))); case VECTOR_OP_SUSUB: return (v0, v1, vm) -> v0.bOp(v1, vm, (i, a, b) -> (byte)(VectorMath.subSaturatingUnsigned(a, b))); default: return null; } } // FIXME: Maybe all of the public final methods in this file (the // simple ones that just call lanewise) should be pushed down to // the X-VectorBits template. They can't optimize properly at // this level, and must rely on inlining. Does it work? // (If it works, of course keep the code here.) /** * Combines the lane values of this vector * with the value of a broadcast scalar. * * This is a lane-wise binary operation which applies * the selected operation to each lane. * The return value will be equal to this expression: * {@code this.lanewise(op, this.broadcast(e))}. * * @param op the operation used to process lane values * @param e the input scalar * @return the result of applying the operation lane-wise * to the two input vectors * @throws UnsupportedOperationException if this vector does * not support the requested operation * @see #lanewise(VectorOperators.Binary,Vector) * @see #lanewise(VectorOperators.Binary,byte,VectorMask) */ @ForceInline public final ByteVector lanewise(VectorOperators.Binary op, byte e) { if (opKind(op, VO_SHIFT) && (byte)(int)e == e) { return lanewiseShift(op, (int) e); } if (op == AND_NOT) { op = AND; e = (byte) ~e; } return lanewise(op, broadcast(e)); } /** * Combines the lane values of this vector * with the value of a broadcast scalar, * with selection of lane elements controlled by a mask. 
* * This is a masked lane-wise binary operation which applies * the selected operation to each lane. * The return value will be equal to this expression: * {@code this.lanewise(op, this.broadcast(e), m)}. * * @param op the operation used to process lane values * @param e the input scalar * @param m the mask controlling lane selection * @return the result of applying the operation lane-wise * to the input vector and the scalar * @throws UnsupportedOperationException if this vector does * not support the requested operation * @see #lanewise(VectorOperators.Binary,Vector,VectorMask) * @see #lanewise(VectorOperators.Binary,byte) */ @ForceInline public final ByteVector lanewise(VectorOperators.Binary op, byte e, VectorMask m) { if (opKind(op, VO_SHIFT) && (byte)(int)e == e) { return lanewiseShift(op, (int) e, m); } if (op == AND_NOT) { op = AND; e = (byte) ~e; } return lanewise(op, broadcast(e), m); } /** * {@inheritDoc} * @apiNote * When working with vector subtypes like {@code ByteVector}, * {@linkplain #lanewise(VectorOperators.Binary,byte) * the more strongly typed method} * is typically selected. It can be explicitly selected * using a cast: {@code v.lanewise(op,(byte)e)}. * The two expressions will produce numerically identical results. */ @ForceInline public final ByteVector lanewise(VectorOperators.Binary op, long e) { byte e1 = (byte) e; if ((long)e1 != e // allow shift ops to clip down their int parameters && !(opKind(op, VO_SHIFT) && (int)e1 == e)) { vspecies().checkValue(e); // for exception } return lanewise(op, e1); } /** * {@inheritDoc} * @apiNote * When working with vector subtypes like {@code ByteVector}, * {@linkplain #lanewise(VectorOperators.Binary,byte,VectorMask) * the more strongly typed method} * is typically selected. It can be explicitly selected * using a cast: {@code v.lanewise(op,(byte)e,m)}. * The two expressions will produce numerically identical results. 
*/
    @ForceInline
    public final
    ByteVector lanewise(VectorOperators.Binary op,
                                  long e, VectorMask m) {
        byte e1 = (byte) e;
        if ((long)e1 != e
            // allow shift ops to clip down their int parameters;
            // the int-range test has to look at e itself, because
            // (int)e1 == e can never hold once (long)e1 != e
            && !(opKind(op, VO_SHIFT) && (int)e == e)) {
            vspecies().checkValue(e);  // for exception
        }
        return lanewise(op, e1, m);
    }

    /*package-private*/
    abstract ByteVector
    lanewiseShift(VectorOperators.Binary op, int e);

    // Unmasked shift/rotate by a scalar count: the count is masked
    // with SHIFT_MASK and the operation is handed to
    // VectorSupport.broadcastInt with the lambda cached in BIN_INT_IMPL.
    /*package-private*/
    @ForceInline
    final ByteVector
    lanewiseShiftTemplate(VectorOperators.Binary op, int e) {
        // Special handling for these.  FIXME: Refactor?
        assert(opKind(op, VO_SHIFT));
        // As per shift specification for Java, mask the shift count.
        e &= SHIFT_MASK;
        int opc = opCode(op);
        return VectorSupport.broadcastInt(
            opc, getClass(), null, byte.class, length(),
            this, e, null,
            BIN_INT_IMPL.find(op, opc, ByteVector::broadcastIntOperations));
    }

    /*package-private*/
    abstract ByteVector
    lanewiseShift(VectorOperators.Binary op, int e, VectorMask m);

    // Masked counterpart of the template above; the mask is checked
    // against maskClass and this vector first.
    /*package-private*/
    @ForceInline
    final ByteVector
    lanewiseShiftTemplate(VectorOperators.Binary op,
                          Class<? extends VectorMask<Byte>> maskClass,
                          int e, VectorMask m) {
        m.check(maskClass, this);
        assert(opKind(op, VO_SHIFT));
        // As per shift specification for Java, mask the shift count.
        e &= SHIFT_MASK;
        int opc = opCode(op);
        return VectorSupport.broadcastInt(
            opc, getClass(), maskClass, byte.class, length(),
            this, e, m,
            BIN_INT_IMPL.find(op, opc, ByteVector::broadcastIntOperations));
    }

    // Cache of the per-opcode lambdas produced by broadcastIntOperations.
    private static final
    ImplCache<Binary, VectorBroadcastIntOp<ByteVector, VectorMask<Byte>>> BIN_INT_IMPL
        = new ImplCache<>(Binary.class, ByteVector.class);

    // Maps a shift/rotate opcode to its lane-at-a-time implementation
    // built on uOp; returns null for opcodes that are not handled here.
    private static VectorBroadcastIntOp<ByteVector, VectorMask<Byte>> broadcastIntOperations(int opc_) {
        switch (opc_) {
            case VECTOR_OP_LSHIFT: return (v, n, m) ->
                    v.uOp(m, (i, a) -> (byte)(a << n));
            case VECTOR_OP_RSHIFT: return (v, n, m) ->
                    v.uOp(m, (i, a) -> (byte)(a >> n));
            case VECTOR_OP_URSHIFT: return (v, n, m) ->
                    v.uOp(m, (i, a) -> (byte)((a & LSHR_SETUP_MASK) >>> n));
            case VECTOR_OP_LROTATE: return (v, n, m) ->
                    v.uOp(m, (i, a) -> rotateLeft(a, (int)n));
            case VECTOR_OP_RROTATE: return (v, n, m) ->
                    v.uOp(m, (i, a) -> rotateRight(a, (int)n));
            default: return null;
        }
    }

    // As per shift specification for Java, mask the shift count.
    // We mask 0X3F (long), 0X1F (int), 0x0F (short), 0x7 (byte).
    // The latter two maskings go beyond the JLS, but seem reasonable
    // since our lane types are first-class types, not just dressed
    // up ints.
    private static final int SHIFT_MASK = (Byte.SIZE - 1);
    // Also simulate >>> on sub-word variables with a mask.
    private static final int LSHR_SETUP_MASK = ((1 << Byte.SIZE) - 1);

    // Ternary lanewise support

    // Ternary operators come in eight variations:
    //   lanewise(op, [broadcast(e1)|v1], [broadcast(e2)|v2])
    //   lanewise(op, [broadcast(e1)|v1], [broadcast(e2)|v2], mask)

    // It is annoying to support all of these variations of masking
    // and broadcast, but it would be more surprising not to continue
    // the obvious pattern started by unary and binary.
/** * {@inheritDoc} * @see #lanewise(VectorOperators.Ternary,byte,byte,VectorMask) * @see #lanewise(VectorOperators.Ternary,Vector,byte,VectorMask) * @see #lanewise(VectorOperators.Ternary,byte,Vector,VectorMask) * @see #lanewise(VectorOperators.Ternary,byte,byte) * @see #lanewise(VectorOperators.Ternary,Vector,byte) * @see #lanewise(VectorOperators.Ternary,byte,Vector) */ @Override public abstract ByteVector lanewise(VectorOperators.Ternary op, Vector v1, Vector v2); @ForceInline final ByteVector lanewiseTemplate(VectorOperators.Ternary op, Vector v1, Vector v2) { ByteVector that = (ByteVector) v1; ByteVector tother = (ByteVector) v2; // It's a word: https://www.dictionary.com/browse/tother // See also Chapter 11 of Dickens, Our Mutual Friend: // "Totherest Governor," replied Mr Riderhood... that.check(this); tother.check(this); if (op == BITWISE_BLEND) { // FIXME: Support this in the JIT. that = this.lanewise(XOR, that).lanewise(AND, tother); return this.lanewise(XOR, that); } int opc = opCode(op); return VectorSupport.ternaryOp( opc, getClass(), null, byte.class, length(), this, that, tother, null, TERN_IMPL.find(op, opc, ByteVector::ternaryOperations)); } /** * {@inheritDoc} * @see #lanewise(VectorOperators.Ternary,byte,byte,VectorMask) * @see #lanewise(VectorOperators.Ternary,Vector,byte,VectorMask) * @see #lanewise(VectorOperators.Ternary,byte,Vector,VectorMask) */ @Override public abstract ByteVector lanewise(VectorOperators.Ternary op, Vector v1, Vector v2, VectorMask m); @ForceInline final ByteVector lanewiseTemplate(VectorOperators.Ternary op, Class> maskClass, Vector v1, Vector v2, VectorMask m) { ByteVector that = (ByteVector) v1; ByteVector tother = (ByteVector) v2; // It's a word: https://www.dictionary.com/browse/tother // See also Chapter 11 of Dickens, Our Mutual Friend: // "Totherest Governor," replied Mr Riderhood... that.check(this); tother.check(this); m.check(maskClass, this); if (op == BITWISE_BLEND) { // FIXME: Support this in the JIT. 
that = this.lanewise(XOR, that).lanewise(AND, tother); return this.lanewise(XOR, that, m); } int opc = opCode(op); return VectorSupport.ternaryOp( opc, getClass(), maskClass, byte.class, length(), this, that, tother, m, TERN_IMPL.find(op, opc, ByteVector::ternaryOperations)); } private static final ImplCache>> TERN_IMPL = new ImplCache<>(Ternary.class, ByteVector.class); private static TernaryOperation> ternaryOperations(int opc_) { switch (opc_) { default: return null; } } /** * Combines the lane values of this vector * with the values of two broadcast scalars. * * This is a lane-wise ternary operation which applies * the selected operation to each lane. * The return value will be equal to this expression: * {@code this.lanewise(op, this.broadcast(e1), this.broadcast(e2))}. * * @param op the operation used to combine lane values * @param e1 the first input scalar * @param e2 the second input scalar * @return the result of applying the operation lane-wise * to the input vector and the scalars * @throws UnsupportedOperationException if this vector does * not support the requested operation * @see #lanewise(VectorOperators.Ternary,Vector,Vector) * @see #lanewise(VectorOperators.Ternary,byte,byte,VectorMask) */ @ForceInline public final ByteVector lanewise(VectorOperators.Ternary op, //(op,e1,e2) byte e1, byte e2) { return lanewise(op, broadcast(e1), broadcast(e2)); } /** * Combines the lane values of this vector * with the values of two broadcast scalars, * with selection of lane elements controlled by a mask. * * This is a masked lane-wise ternary operation which applies * the selected operation to each lane. * The return value will be equal to this expression: * {@code this.lanewise(op, this.broadcast(e1), this.broadcast(e2), m)}. 
* * @param op the operation used to combine lane values * @param e1 the first input scalar * @param e2 the second input scalar * @param m the mask controlling lane selection * @return the result of applying the operation lane-wise * to the input vector and the scalars * @throws UnsupportedOperationException if this vector does * not support the requested operation * @see #lanewise(VectorOperators.Ternary,Vector,Vector,VectorMask) * @see #lanewise(VectorOperators.Ternary,byte,byte) */ @ForceInline public final ByteVector lanewise(VectorOperators.Ternary op, //(op,e1,e2,m) byte e1, byte e2, VectorMask m) { return lanewise(op, broadcast(e1), broadcast(e2), m); } /** * Combines the lane values of this vector * with the values of another vector and a broadcast scalar. * * This is a lane-wise ternary operation which applies * the selected operation to each lane. * The return value will be equal to this expression: * {@code this.lanewise(op, v1, this.broadcast(e2))}. * * @param op the operation used to combine lane values * @param v1 the other input vector * @param e2 the input scalar * @return the result of applying the operation lane-wise * to the input vectors and the scalar * @throws UnsupportedOperationException if this vector does * not support the requested operation * @see #lanewise(VectorOperators.Ternary,byte,byte) * @see #lanewise(VectorOperators.Ternary,Vector,byte,VectorMask) */ @ForceInline public final ByteVector lanewise(VectorOperators.Ternary op, //(op,v1,e2) Vector v1, byte e2) { return lanewise(op, v1, broadcast(e2)); } /** * Combines the lane values of this vector * with the values of another vector and a broadcast scalar, * with selection of lane elements controlled by a mask. * * This is a masked lane-wise ternary operation which applies * the selected operation to each lane. * The return value will be equal to this expression: * {@code this.lanewise(op, v1, this.broadcast(e2), m)}. 
* * @param op the operation used to combine lane values * @param v1 the other input vector * @param e2 the input scalar * @param m the mask controlling lane selection * @return the result of applying the operation lane-wise * to the input vectors and the scalar * @throws UnsupportedOperationException if this vector does * not support the requested operation * @see #lanewise(VectorOperators.Ternary,Vector,Vector) * @see #lanewise(VectorOperators.Ternary,byte,byte,VectorMask) * @see #lanewise(VectorOperators.Ternary,Vector,byte) */ @ForceInline public final ByteVector lanewise(VectorOperators.Ternary op, //(op,v1,e2,m) Vector v1, byte e2, VectorMask m) { return lanewise(op, v1, broadcast(e2), m); } /** * Combines the lane values of this vector * with the values of another vector and a broadcast scalar. * * This is a lane-wise ternary operation which applies * the selected operation to each lane. * The return value will be equal to this expression: * {@code this.lanewise(op, this.broadcast(e1), v2)}. * * @param op the operation used to combine lane values * @param e1 the input scalar * @param v2 the other input vector * @return the result of applying the operation lane-wise * to the input vectors and the scalar * @throws UnsupportedOperationException if this vector does * not support the requested operation * @see #lanewise(VectorOperators.Ternary,Vector,Vector) * @see #lanewise(VectorOperators.Ternary,byte,Vector,VectorMask) */ @ForceInline public final ByteVector lanewise(VectorOperators.Ternary op, //(op,e1,v2) byte e1, Vector v2) { return lanewise(op, broadcast(e1), v2); } /** * Combines the lane values of this vector * with the values of another vector and a broadcast scalar, * with selection of lane elements controlled by a mask. * * This is a masked lane-wise ternary operation which applies * the selected operation to each lane. * The return value will be equal to this expression: * {@code this.lanewise(op, this.broadcast(e1), v2, m)}. 
* * @param op the operation used to combine lane values * @param e1 the input scalar * @param v2 the other input vector * @param m the mask controlling lane selection * @return the result of applying the operation lane-wise * to the input vectors and the scalar * @throws UnsupportedOperationException if this vector does * not support the requested operation * @see #lanewise(VectorOperators.Ternary,Vector,Vector,VectorMask) * @see #lanewise(VectorOperators.Ternary,byte,Vector) */ @ForceInline public final ByteVector lanewise(VectorOperators.Ternary op, //(op,e1,v2,m) byte e1, Vector v2, VectorMask m) { return lanewise(op, broadcast(e1), v2, m); } // (Thus endeth the Great and Mighty Ternary Ogdoad.) // https://en.wikipedia.org/wiki/Ogdoad /// FULL-SERVICE BINARY METHODS: ADD, SUB, MUL, DIV // // These include masked and non-masked versions. // This subclass adds broadcast (masked or not). /** * {@inheritDoc} * @see #add(byte) */ @Override @ForceInline public final ByteVector add(Vector v) { return lanewise(ADD, v); } /** * Adds this vector to the broadcast of an input scalar. * * This is a lane-wise binary operation which applies * the primitive addition operation ({@code +}) to each lane. * * This method is also equivalent to the expression * {@link #lanewise(VectorOperators.Binary,byte) * lanewise}{@code (}{@link VectorOperators#ADD * ADD}{@code , e)}. 
* * @param e the input scalar * @return the result of adding each lane of this vector to the scalar * @see #add(Vector) * @see #broadcast(byte) * @see #add(byte,VectorMask) * @see VectorOperators#ADD * @see #lanewise(VectorOperators.Binary,Vector) * @see #lanewise(VectorOperators.Binary,byte) */ @ForceInline public final ByteVector add(byte e) { return lanewise(ADD, e); } /** * {@inheritDoc} * @see #add(byte,VectorMask) */ @Override @ForceInline public final ByteVector add(Vector v, VectorMask m) { return lanewise(ADD, v, m); } /** * Adds this vector to the broadcast of an input scalar, * selecting lane elements controlled by a mask. * * This is a masked lane-wise binary operation which applies * the primitive addition operation ({@code +}) to each lane. * * This method is also equivalent to the expression * {@link #lanewise(VectorOperators.Binary,byte,VectorMask) * lanewise}{@code (}{@link VectorOperators#ADD * ADD}{@code , s, m)}. * * @param e the input scalar * @param m the mask controlling lane selection * @return the result of adding each lane of this vector to the scalar * @see #add(Vector,VectorMask) * @see #broadcast(byte) * @see #add(byte) * @see VectorOperators#ADD * @see #lanewise(VectorOperators.Binary,Vector) * @see #lanewise(VectorOperators.Binary,byte) */ @ForceInline public final ByteVector add(byte e, VectorMask m) { return lanewise(ADD, e, m); } /** * {@inheritDoc} * @see #sub(byte) */ @Override @ForceInline public final ByteVector sub(Vector v) { return lanewise(SUB, v); } /** * Subtracts an input scalar from this vector. * * This is a masked lane-wise binary operation which applies * the primitive subtraction operation ({@code -}) to each lane. * * This method is also equivalent to the expression * {@link #lanewise(VectorOperators.Binary,byte) * lanewise}{@code (}{@link VectorOperators#SUB * SUB}{@code , e)}. 
* * @param e the input scalar * @return the result of subtracting the scalar from each lane of this vector * @see #sub(Vector) * @see #broadcast(byte) * @see #sub(byte,VectorMask) * @see VectorOperators#SUB * @see #lanewise(VectorOperators.Binary,Vector) * @see #lanewise(VectorOperators.Binary,byte) */ @ForceInline public final ByteVector sub(byte e) { return lanewise(SUB, e); } /** * {@inheritDoc} * @see #sub(byte,VectorMask) */ @Override @ForceInline public final ByteVector sub(Vector v, VectorMask m) { return lanewise(SUB, v, m); } /** * Subtracts an input scalar from this vector * under the control of a mask. * * This is a masked lane-wise binary operation which applies * the primitive subtraction operation ({@code -}) to each lane. * * This method is also equivalent to the expression * {@link #lanewise(VectorOperators.Binary,byte,VectorMask) * lanewise}{@code (}{@link VectorOperators#SUB * SUB}{@code , s, m)}. * * @param e the input scalar * @param m the mask controlling lane selection * @return the result of subtracting the scalar from each lane of this vector * @see #sub(Vector,VectorMask) * @see #broadcast(byte) * @see #sub(byte) * @see VectorOperators#SUB * @see #lanewise(VectorOperators.Binary,Vector) * @see #lanewise(VectorOperators.Binary,byte) */ @ForceInline public final ByteVector sub(byte e, VectorMask m) { return lanewise(SUB, e, m); } /** * {@inheritDoc} * @see #mul(byte) */ @Override @ForceInline public final ByteVector mul(Vector v) { return lanewise(MUL, v); } /** * Multiplies this vector by the broadcast of an input scalar. * * This is a lane-wise binary operation which applies * the primitive multiplication operation ({@code *}) to each lane. * * This method is also equivalent to the expression * {@link #lanewise(VectorOperators.Binary,byte) * lanewise}{@code (}{@link VectorOperators#MUL * MUL}{@code , e)}. 
* * @param e the input scalar * @return the result of multiplying this vector by the given scalar * @see #mul(Vector) * @see #broadcast(byte) * @see #mul(byte,VectorMask) * @see VectorOperators#MUL * @see #lanewise(VectorOperators.Binary,Vector) * @see #lanewise(VectorOperators.Binary,byte) */ @ForceInline public final ByteVector mul(byte e) { return lanewise(MUL, e); } /** * {@inheritDoc} * @see #mul(byte,VectorMask) */ @Override @ForceInline public final ByteVector mul(Vector v, VectorMask m) { return lanewise(MUL, v, m); } /** * Multiplies this vector by the broadcast of an input scalar, * selecting lane elements controlled by a mask. * * This is a masked lane-wise binary operation which applies * the primitive multiplication operation ({@code *}) to each lane. * * This method is also equivalent to the expression * {@link #lanewise(VectorOperators.Binary,byte,VectorMask) * lanewise}{@code (}{@link VectorOperators#MUL * MUL}{@code , s, m)}. * * @param e the input scalar * @param m the mask controlling lane selection * @return the result of muling each lane of this vector to the scalar * @see #mul(Vector,VectorMask) * @see #broadcast(byte) * @see #mul(byte) * @see VectorOperators#MUL * @see #lanewise(VectorOperators.Binary,Vector) * @see #lanewise(VectorOperators.Binary,byte) */ @ForceInline public final ByteVector mul(byte e, VectorMask m) { return lanewise(MUL, e, m); } /** * {@inheritDoc} * @apiNote If there is a zero divisor, {@code * ArithmeticException} will be thrown. */ @Override @ForceInline public final ByteVector div(Vector v) { return lanewise(DIV, v); } /** * Divides this vector by the broadcast of an input scalar. * * This is a lane-wise binary operation which applies * the primitive division operation ({@code /}) to each lane. * * This method is also equivalent to the expression * {@link #lanewise(VectorOperators.Binary,byte) * lanewise}{@code (}{@link VectorOperators#DIV * DIV}{@code , e)}. 
* * @apiNote If there is a zero divisor, {@code * ArithmeticException} will be thrown. * * @param e the input scalar * @return the result of dividing each lane of this vector by the scalar * @see #div(Vector) * @see #broadcast(byte) * @see #div(byte,VectorMask) * @see VectorOperators#DIV * @see #lanewise(VectorOperators.Binary,Vector) * @see #lanewise(VectorOperators.Binary,byte) */ @ForceInline public final ByteVector div(byte e) { return lanewise(DIV, e); } /** * {@inheritDoc} * @see #div(byte,VectorMask) * @apiNote If there is a zero divisor, {@code * ArithmeticException} will be thrown. */ @Override @ForceInline public final ByteVector div(Vector v, VectorMask m) { return lanewise(DIV, v, m); } /** * Divides this vector by the broadcast of an input scalar, * selecting lane elements controlled by a mask. * * This is a masked lane-wise binary operation which applies * the primitive division operation ({@code /}) to each lane. * * This method is also equivalent to the expression * {@link #lanewise(VectorOperators.Binary,byte,VectorMask) * lanewise}{@code (}{@link VectorOperators#DIV * DIV}{@code , s, m)}. * * @apiNote If there is a zero divisor, {@code * ArithmeticException} will be thrown. * * @param e the input scalar * @param m the mask controlling lane selection * @return the result of dividing each lane of this vector by the scalar * @see #div(Vector,VectorMask) * @see #broadcast(byte) * @see #div(byte) * @see VectorOperators#DIV * @see #lanewise(VectorOperators.Binary,Vector) * @see #lanewise(VectorOperators.Binary,byte) */ @ForceInline public final ByteVector div(byte e, VectorMask m) { return lanewise(DIV, e, m); } /// END OF FULL-SERVICE BINARY METHODS /// SECOND-TIER BINARY METHODS // // There are no masked versions. /** * {@inheritDoc} */ @Override @ForceInline public final ByteVector min(Vector v) { return lanewise(MIN, v); } // FIXME: "broadcast of an input scalar" is really wordy. Reduce? 
/** * Computes the smaller of this vector and the broadcast of an input scalar. * * This is a lane-wise binary operation which applies the * operation {@code Math.min()} to each pair of * corresponding lane values. * * This method is also equivalent to the expression * {@link #lanewise(VectorOperators.Binary,byte) * lanewise}{@code (}{@link VectorOperators#MIN * MIN}{@code , e)}. * * @param e the input scalar * @return the result of multiplying this vector by the given scalar * @see #min(Vector) * @see #broadcast(byte) * @see VectorOperators#MIN * @see #lanewise(VectorOperators.Binary,byte,VectorMask) */ @ForceInline public final ByteVector min(byte e) { return lanewise(MIN, e); } /** * {@inheritDoc} */ @Override @ForceInline public final ByteVector max(Vector v) { return lanewise(MAX, v); } /** * Computes the larger of this vector and the broadcast of an input scalar. * * This is a lane-wise binary operation which applies the * operation {@code Math.max()} to each pair of * corresponding lane values. * * This method is also equivalent to the expression * {@link #lanewise(VectorOperators.Binary,byte) * lanewise}{@code (}{@link VectorOperators#MAX * MAX}{@code , e)}. * * @param e the input scalar * @return the result of multiplying this vector by the given scalar * @see #max(Vector) * @see #broadcast(byte) * @see VectorOperators#MAX * @see #lanewise(VectorOperators.Binary,byte,VectorMask) */ @ForceInline public final ByteVector max(byte e) { return lanewise(MAX, e); } // common bitwise operators: and, or, not (with scalar versions) /** * Computes the bitwise logical conjunction ({@code &}) * of this vector and a second input vector. * * This is a lane-wise binary operation which applies * the primitive bitwise "and" operation ({@code &}) * to each pair of corresponding lane values. * * This method is also equivalent to the expression * {@link #lanewise(VectorOperators.Binary,Vector) * lanewise}{@code (}{@link VectorOperators#AND * AND}{@code , v)}. * *

* This is not a full-service named operation like * {@link #add(Vector) add}. A masked version of * this operation is not directly available * but may be obtained via the masked version of * {@code lanewise}. * * @param v a second input vector * @return the bitwise {@code &} of this vector and the second input vector * @see #and(byte) * @see #or(Vector) * @see #not() * @see VectorOperators#AND * @see #lanewise(VectorOperators.Binary,Vector,VectorMask) */ @ForceInline public final ByteVector and(Vector v) { return lanewise(AND, v); } /** * Computes the bitwise logical conjunction ({@code &}) * of this vector and a scalar. * * This is a lane-wise binary operation which applies * the primitive bitwise "and" operation ({@code &}) * to each pair of corresponding lane values. * * This method is also equivalent to the expression * {@link #lanewise(VectorOperators.Binary,Vector) * lanewise}{@code (}{@link VectorOperators#AND * AND}{@code , e)}. * * @param e an input scalar * @return the bitwise {@code &} of this vector and scalar * @see #and(Vector) * @see VectorOperators#AND * @see #lanewise(VectorOperators.Binary,Vector,VectorMask) */ @ForceInline public final ByteVector and(byte e) { return lanewise(AND, e); } /** * Computes the bitwise logical disjunction ({@code |}) * of this vector and a second input vector. * * This is a lane-wise binary operation which applies * the primitive bitwise "or" operation ({@code |}) * to each pair of corresponding lane values. * * This method is also equivalent to the expression * {@link #lanewise(VectorOperators.Binary,Vector) * lanewise}{@code (}{@link VectorOperators#OR * AND}{@code , v)}. * *

* This is not a full-service named operation like * {@link #add(Vector) add}. A masked version of * this operation is not directly available * but may be obtained via the masked version of * {@code lanewise}. * * @param v a second input vector * @return the bitwise {@code |} of this vector and the second input vector * @see #or(byte) * @see #and(Vector) * @see #not() * @see VectorOperators#OR * @see #lanewise(VectorOperators.Binary,Vector,VectorMask) */ @ForceInline public final ByteVector or(Vector v) { return lanewise(OR, v); } /** * Computes the bitwise logical disjunction ({@code |}) * of this vector and a scalar. * * This is a lane-wise binary operation which applies * the primitive bitwise "or" operation ({@code |}) * to each pair of corresponding lane values. * * This method is also equivalent to the expression * {@link #lanewise(VectorOperators.Binary,Vector) * lanewise}{@code (}{@link VectorOperators#OR * OR}{@code , e)}. * * @param e an input scalar * @return the bitwise {@code |} of this vector and scalar * @see #or(Vector) * @see VectorOperators#OR * @see #lanewise(VectorOperators.Binary,Vector,VectorMask) */ @ForceInline public final ByteVector or(byte e) { return lanewise(OR, e); } /// UNARY METHODS /** * {@inheritDoc} */ @Override @ForceInline public final ByteVector neg() { return lanewise(NEG); } /** * {@inheritDoc} */ @Override @ForceInline public final ByteVector abs() { return lanewise(ABS); } static int bitCount(byte a) { return Integer.bitCount((int)a & 0xFF); } static int numberOfTrailingZeros(byte a) { return a != 0 ? Integer.numberOfTrailingZeros(a) : 8; } static int numberOfLeadingZeros(byte a) { return a >= 0 ? 
Integer.numberOfLeadingZeros(a) - 24 : 0; } static byte reverse(byte a) { if (a == 0 || a == -1) return a; byte b = rotateLeft(a, 4); b = (byte) (((b & 0x55) << 1) | ((b & 0xAA) >>> 1)); b = (byte) (((b & 0x33) << 2) | ((b & 0xCC) >>> 2)); return b; } // not (~) /** * Computes the bitwise logical complement ({@code ~}) * of this vector. * * This is a lane-wise binary operation which applies * the primitive bitwise "not" operation ({@code ~}) * to each lane value. * * This method is also equivalent to the expression * {@link #lanewise(VectorOperators.Unary) * lanewise}{@code (}{@link VectorOperators#NOT * NOT}{@code )}. * *

* This is not a full-service named operation like * {@link #add(Vector) add}. A masked version of * this operation is not directly available * but may be obtained via the masked version of * {@code lanewise}. * * @return the bitwise complement {@code ~} of this vector * @see #and(Vector) * @see VectorOperators#NOT * @see #lanewise(VectorOperators.Unary,VectorMask) */ @ForceInline public final ByteVector not() { return lanewise(NOT); } /// COMPARISONS /** * {@inheritDoc} */ @Override @ForceInline public final VectorMask eq(Vector v) { return compare(EQ, v); } /** * Tests if this vector is equal to an input scalar. * * This is a lane-wise binary test operation which applies * the primitive equals operation ({@code ==}) to each lane. * The result is the same as {@code compare(VectorOperators.Comparison.EQ, e)}. * * @param e the input scalar * @return the result mask of testing if this vector * is equal to {@code e} * @see #compare(VectorOperators.Comparison,byte) */ @ForceInline public final VectorMask eq(byte e) { return compare(EQ, e); } /** * {@inheritDoc} */ @Override @ForceInline public final VectorMask lt(Vector v) { return compare(LT, v); } /** * Tests if this vector is less than an input scalar. * * This is a lane-wise binary test operation which applies * the primitive less than operation ({@code <}) to each lane. * The result is the same as {@code compare(VectorOperators.LT, e)}. 
* * @param e the input scalar * @return the mask result of testing if this vector * is less than the input scalar * @see #compare(VectorOperators.Comparison,byte) */ @ForceInline public final VectorMask lt(byte e) { return compare(LT, e); } /** * {@inheritDoc} */ @Override public abstract VectorMask test(VectorOperators.Test op); /*package-private*/ @ForceInline final > M testTemplate(Class maskType, Test op) { ByteSpecies vsp = vspecies(); if (opKind(op, VO_SPECIAL)) { VectorMask m; if (op == IS_DEFAULT) { m = compare(EQ, (byte) 0); } else if (op == IS_NEGATIVE) { m = compare(LT, (byte) 0); } else { throw new AssertionError(op); } return maskType.cast(m); } int opc = opCode(op); throw new AssertionError(op); } /** * {@inheritDoc} */ @Override public abstract VectorMask test(VectorOperators.Test op, VectorMask m); /*package-private*/ @ForceInline final > M testTemplate(Class maskType, Test op, M mask) { ByteSpecies vsp = vspecies(); mask.check(maskType, this); if (opKind(op, VO_SPECIAL)) { VectorMask m = mask; if (op == IS_DEFAULT) { m = compare(EQ, (byte) 0, m); } else if (op == IS_NEGATIVE) { m = compare(LT, (byte) 0, m); } else { throw new AssertionError(op); } return maskType.cast(m); } int opc = opCode(op); throw new AssertionError(op); } /** * {@inheritDoc} */ @Override public abstract VectorMask compare(VectorOperators.Comparison op, Vector v); /*package-private*/ @ForceInline final > M compareTemplate(Class maskType, Comparison op, Vector v) { ByteVector that = (ByteVector) v; that.check(this); int opc = opCode(op); return VectorSupport.compare( opc, getClass(), maskType, byte.class, length(), this, that, null, (cond, v0, v1, m1) -> { AbstractMask m = v0.bTest(cond, v1, (cond_, i, a, b) -> compareWithOp(cond, a, b)); @SuppressWarnings("unchecked") M m2 = (M) m; return m2; }); } /*package-private*/ @ForceInline final > M compareTemplate(Class maskType, Comparison op, Vector v, M m) { ByteVector that = (ByteVector) v; that.check(this); m.check(maskType, 
this); int opc = opCode(op); return VectorSupport.compare( opc, getClass(), maskType, byte.class, length(), this, that, m, (cond, v0, v1, m1) -> { AbstractMask cmpM = v0.bTest(cond, v1, (cond_, i, a, b) -> compareWithOp(cond, a, b)); @SuppressWarnings("unchecked") M m2 = (M) cmpM.and(m1); return m2; }); } @ForceInline private static boolean compareWithOp(int cond, byte a, byte b) { return switch (cond) { case BT_eq -> a == b; case BT_ne -> a != b; case BT_lt -> a < b; case BT_le -> a <= b; case BT_gt -> a > b; case BT_ge -> a >= b; case BT_ult -> Byte.compareUnsigned(a, b) < 0; case BT_ule -> Byte.compareUnsigned(a, b) <= 0; case BT_ugt -> Byte.compareUnsigned(a, b) > 0; case BT_uge -> Byte.compareUnsigned(a, b) >= 0; default -> throw new AssertionError(); }; } /** * Tests this vector by comparing it with an input scalar, * according to the given comparison operation. * * This is a lane-wise binary test operation which applies * the comparison operation to each lane. *

* The result is the same as * {@code compare(op, broadcast(species(), e))}. * That is, the scalar may be regarded as broadcast to * a vector of the same species, and then compared * against the original vector, using the selected * comparison operation. * * @param op the operation used to compare lane values * @param e the input scalar * @return the mask result of testing lane-wise if this vector * compares to the input, according to the selected * comparison operator * @see ByteVector#compare(VectorOperators.Comparison,Vector) * @see #eq(byte) * @see #lt(byte) */ public abstract VectorMask compare(Comparison op, byte e); /*package-private*/ @ForceInline final > M compareTemplate(Class maskType, Comparison op, byte e) { return compareTemplate(maskType, op, broadcast(e)); } /** * Tests this vector by comparing it with an input scalar, * according to the given comparison operation, * in lanes selected by a mask. * * This is a masked lane-wise binary test operation which applies * to each pair of corresponding lane values. * * The returned result is equal to the expression * {@code compare(op,s).and(m)}. 
* * @param op the operation used to compare lane values * @param e the input scalar * @param m the mask controlling lane selection * @return the mask result of testing lane-wise if this vector * compares to the input, according to the selected * comparison operator, * and only in the lanes selected by the mask * @see ByteVector#compare(VectorOperators.Comparison,Vector,VectorMask) */ @ForceInline public final VectorMask compare(VectorOperators.Comparison op, byte e, VectorMask m) { return compare(op, broadcast(e), m); } /** * {@inheritDoc} */ @Override public abstract VectorMask compare(Comparison op, long e); /*package-private*/ @ForceInline final > M compareTemplate(Class maskType, Comparison op, long e) { return compareTemplate(maskType, op, broadcast(e)); } /** * {@inheritDoc} */ @Override @ForceInline public final VectorMask compare(Comparison op, long e, VectorMask m) { return compare(op, broadcast(e), m); } /** * {@inheritDoc} */ @Override public abstract ByteVector blend(Vector v, VectorMask m); /*package-private*/ @ForceInline final > ByteVector blendTemplate(Class maskType, ByteVector v, M m) { v.check(this); return VectorSupport.blend( getClass(), maskType, byte.class, length(), this, v, m, (v0, v1, m_) -> v0.bOp(v1, m_, (i, a, b) -> b)); } /** * {@inheritDoc} */ @Override public abstract ByteVector addIndex(int scale); /*package-private*/ @ForceInline final ByteVector addIndexTemplate(int scale) { ByteSpecies vsp = vspecies(); // make sure VLENGTH*scale doesn't overflow: vsp.checkScale(scale); return VectorSupport.indexVector( getClass(), byte.class, length(), this, scale, vsp, (v, scale_, s) -> { // If the platform doesn't support an INDEX // instruction directly, load IOTA from memory // and multiply. ByteVector iota = s.iota(); byte sc = (byte) scale_; return v.add(sc == 1 ? iota : iota.mul(sc)); }); } /** * Replaces selected lanes of this vector with * a scalar value * under the control of a mask. 
* * This is a masked lane-wise binary operation which * selects each lane value from one or the other input. * * The returned result is equal to the expression * {@code blend(broadcast(e),m)}. * * @param e the input scalar, containing the replacement lane value * @param m the mask controlling lane selection of the scalar * @return the result of blending the lane elements of this vector with * the scalar value */ @ForceInline public final ByteVector blend(byte e, VectorMask m) { return blend(broadcast(e), m); } /** * Replaces selected lanes of this vector with * a scalar value * under the control of a mask. * * This is a masked lane-wise binary operation which * selects each lane value from one or the other input. * * The returned result is equal to the expression * {@code blend(broadcast(e),m)}. * * @param e the input scalar, containing the replacement lane value * @param m the mask controlling lane selection of the scalar * @return the result of blending the lane elements of this vector with * the scalar value */ @ForceInline public final ByteVector blend(long e, VectorMask m) { return blend(broadcast(e), m); } /** * {@inheritDoc} */ @Override public abstract ByteVector slice(int origin, Vector v1); /*package-private*/ final @ForceInline ByteVector sliceTemplate(int origin, Vector v1) { ByteVector that = (ByteVector) v1; that.check(this); Objects.checkIndex(origin, length() + 1); ByteVector iotaVector = (ByteVector) iotaShuffle().toBitsVector(); ByteVector filter = broadcast((byte)(length() - origin)); VectorMask blendMask = iotaVector.compare(VectorOperators.LT, filter); AbstractShuffle iota = iotaShuffle(origin, 1, true); return that.rearrange(iota).blend(this.rearrange(iota), blendMask); } /** * {@inheritDoc} */ @Override @ForceInline public final ByteVector slice(int origin, Vector w, VectorMask m) { return broadcast(0).blend(slice(origin, w), m); } /** * {@inheritDoc} */ @Override public abstract ByteVector slice(int origin); /*package-private*/ final 
@ForceInline ByteVector sliceTemplate(int origin) { Objects.checkIndex(origin, length() + 1); ByteVector iotaVector = (ByteVector) iotaShuffle().toBitsVector(); ByteVector filter = broadcast((byte)(length() - origin)); VectorMask blendMask = iotaVector.compare(VectorOperators.LT, filter); AbstractShuffle iota = iotaShuffle(origin, 1, true); return vspecies().zero().blend(this.rearrange(iota), blendMask); } /** * {@inheritDoc} */ @Override public abstract ByteVector unslice(int origin, Vector w, int part); /*package-private*/ final @ForceInline ByteVector unsliceTemplate(int origin, Vector w, int part) { ByteVector that = (ByteVector) w; that.check(this); Objects.checkIndex(origin, length() + 1); ByteVector iotaVector = (ByteVector) iotaShuffle().toBitsVector(); ByteVector filter = broadcast((byte)origin); VectorMask blendMask = iotaVector.compare((part == 0) ? VectorOperators.GE : VectorOperators.LT, filter); AbstractShuffle iota = iotaShuffle(-origin, 1, true); return that.blend(this.rearrange(iota), blendMask); } /*package-private*/ final @ForceInline > ByteVector unsliceTemplate(Class maskType, int origin, Vector w, int part, M m) { ByteVector that = (ByteVector) w; that.check(this); ByteVector slice = that.sliceTemplate(origin, that); slice = slice.blendTemplate(maskType, this, m); return slice.unsliceTemplate(origin, w, part); } /** * {@inheritDoc} */ @Override public abstract ByteVector unslice(int origin, Vector w, int part, VectorMask m); /** * {@inheritDoc} */ @Override public abstract ByteVector unslice(int origin); /*package-private*/ final @ForceInline ByteVector unsliceTemplate(int origin) { Objects.checkIndex(origin, length() + 1); ByteVector iotaVector = (ByteVector) iotaShuffle().toBitsVector(); ByteVector filter = broadcast((byte)origin); VectorMask blendMask = iotaVector.compare(VectorOperators.GE, filter); AbstractShuffle iota = iotaShuffle(-origin, 1, true); return vspecies().zero().blend(this.rearrange(iota), blendMask); } private 
ArrayIndexOutOfBoundsException wrongPartForSlice(int part) { String msg = String.format("bad part number %d for slice operation", part); return new ArrayIndexOutOfBoundsException(msg); } /** * {@inheritDoc} */ @Override public abstract ByteVector rearrange(VectorShuffle shuffle); /*package-private*/ @ForceInline final > ByteVector rearrangeTemplate(Class shuffletype, S shuffle) { Objects.requireNonNull(shuffle); return VectorSupport.rearrangeOp( getClass(), shuffletype, null, byte.class, length(), this, shuffle, null, (v1, s_, m_) -> v1.uOp((i, a) -> { int ei = Integer.remainderUnsigned(s_.laneSource(i), v1.length()); return v1.lane(ei); })); } /** * {@inheritDoc} */ @Override public abstract ByteVector rearrange(VectorShuffle s, VectorMask m); /*package-private*/ @ForceInline final , M extends VectorMask> ByteVector rearrangeTemplate(Class shuffletype, Class masktype, S shuffle, M m) { Objects.requireNonNull(shuffle); m.check(masktype, this); return VectorSupport.rearrangeOp( getClass(), shuffletype, masktype, byte.class, length(), this, shuffle, m, (v1, s_, m_) -> v1.uOp((i, a) -> { int ei = Integer.remainderUnsigned(s_.laneSource(i), v1.length()); return !m_.laneIsSet(i) ? 
0 : v1.lane(ei); })); } /** * {@inheritDoc} */ @Override public abstract ByteVector rearrange(VectorShuffle s, Vector v); /*package-private*/ @ForceInline final > ByteVector rearrangeTemplate(Class shuffletype, S shuffle, ByteVector v) { VectorMask valid = shuffle.laneIsValid(); ByteVector r0 = VectorSupport.rearrangeOp( getClass(), shuffletype, null, byte.class, length(), this, shuffle, null, (v0, s_, m_) -> v0.uOp((i, a) -> { int ei = Integer.remainderUnsigned(s_.laneSource(i), v0.length()); return v0.lane(ei); })); ByteVector r1 = VectorSupport.rearrangeOp( getClass(), shuffletype, null, byte.class, length(), v, shuffle, null, (v1, s_, m_) -> v1.uOp((i, a) -> { int ei = Integer.remainderUnsigned(s_.laneSource(i), v1.length()); return v1.lane(ei); })); return r1.blend(r0, valid); } @Override @ForceInline final VectorShuffle bitsToShuffle0(AbstractSpecies dsp) { assert(dsp.length() == vspecies().length()); byte[] a = toArray(); int[] sa = new int[a.length]; for (int i = 0; i < a.length; i++) { sa[i] = (int) a[i]; } return VectorShuffle.fromArray(dsp, sa, 0); } @ForceInline final VectorShuffle toShuffle(AbstractSpecies dsp, boolean wrap) { assert(dsp.elementSize() == vspecies().elementSize()); ByteVector idx = this; ByteVector wrapped = idx.lanewise(VectorOperators.AND, length() - 1); if (!wrap) { ByteVector wrappedEx = wrapped.lanewise(VectorOperators.SUB, length()); VectorMask inBound = wrapped.compare(VectorOperators.EQ, idx); wrapped = wrappedEx.blend(wrapped, inBound); } return wrapped.bitsToShuffle(dsp); } /** * {@inheritDoc} * @since 19 */ @Override public abstract ByteVector compress(VectorMask m); /*package-private*/ @ForceInline final > ByteVector compressTemplate(Class masktype, M m) { m.check(masktype, this); return (ByteVector) VectorSupport.compressExpandOp(VectorSupport.VECTOR_OP_COMPRESS, getClass(), masktype, byte.class, length(), this, m, (v1, m1) -> compressHelper(v1, m1)); } /** * {@inheritDoc} * @since 19 */ @Override public abstract ByteVector 
expand(VectorMask m); /*package-private*/ @ForceInline final > ByteVector expandTemplate(Class masktype, M m) { m.check(masktype, this); return (ByteVector) VectorSupport.compressExpandOp(VectorSupport.VECTOR_OP_EXPAND, getClass(), masktype, byte.class, length(), this, m, (v1, m1) -> expandHelper(v1, m1)); } /** * {@inheritDoc} */ @Override public abstract ByteVector selectFrom(Vector v); /*package-private*/ @ForceInline final ByteVector selectFromTemplate(ByteVector v) { return (ByteVector)VectorSupport.selectFromOp(getClass(), null, byte.class, length(), this, v, null, (v1, v2, _m) -> v2.rearrange(v1.toShuffle())); } /** * {@inheritDoc} */ @Override public abstract ByteVector selectFrom(Vector s, VectorMask m); /*package-private*/ @ForceInline final > ByteVector selectFromTemplate(ByteVector v, Class masktype, M m) { m.check(masktype, this); return (ByteVector)VectorSupport.selectFromOp(getClass(), masktype, byte.class, length(), this, v, m, (v1, v2, _m) -> v2.rearrange(v1.toShuffle(), _m)); } /** * {@inheritDoc} */ @Override public abstract ByteVector selectFrom(Vector v1, Vector v2); /*package-private*/ @ForceInline final ByteVector selectFromTemplate(ByteVector v1, ByteVector v2) { return VectorSupport.selectFromTwoVectorOp(getClass(), byte.class, length(), this, v1, v2, (vec1, vec2, vec3) -> selectFromTwoVectorHelper(vec1, vec2, vec3)); } /// Ternary operations /** * Blends together the bits of two vectors under * the control of a third, which supplies mask bits. * * This is a lane-wise ternary operation which performs * a bitwise blending operation {@code (a&~c)|(b&c)} * to each lane. * * This method is also equivalent to the expression * {@link #lanewise(VectorOperators.Ternary,Vector,Vector) * lanewise}{@code (}{@link VectorOperators#BITWISE_BLEND * BITWISE_BLEND}{@code , bits, mask)}. 
* * @param bits input bits to blend into the current vector * @param mask a bitwise mask to enable blending of the input bits * @return the bitwise blend of the given bits into the current vector, * under control of the bitwise mask * @see #bitwiseBlend(byte,byte) * @see #bitwiseBlend(byte,Vector) * @see #bitwiseBlend(Vector,byte) * @see VectorOperators#BITWISE_BLEND * @see #lanewise(VectorOperators.Ternary,Vector,Vector,VectorMask) */ @ForceInline public final ByteVector bitwiseBlend(Vector bits, Vector mask) { return lanewise(BITWISE_BLEND, bits, mask); } /** * Blends together the bits of a vector and a scalar under * the control of another scalar, which supplies mask bits. * * This is a lane-wise ternary operation which performs * a bitwise blending operation {@code (a&~c)|(b&c)} * to each lane. * * This method is also equivalent to the expression * {@link #lanewise(VectorOperators.Ternary,Vector,Vector) * lanewise}{@code (}{@link VectorOperators#BITWISE_BLEND * BITWISE_BLEND}{@code , bits, mask)}. * * @param bits input bits to blend into the current vector * @param mask a bitwise mask to enable blending of the input bits * @return the bitwise blend of the given bits into the current vector, * under control of the bitwise mask * @see #bitwiseBlend(Vector,Vector) * @see VectorOperators#BITWISE_BLEND * @see #lanewise(VectorOperators.Ternary,byte,byte,VectorMask) */ @ForceInline public final ByteVector bitwiseBlend(byte bits, byte mask) { return lanewise(BITWISE_BLEND, bits, mask); } /** * Blends together the bits of a vector and a scalar under * the control of another vector, which supplies mask bits. * * This is a lane-wise ternary operation which performs * a bitwise blending operation {@code (a&~c)|(b&c)} * to each lane. * * This method is also equivalent to the expression * {@link #lanewise(VectorOperators.Ternary,Vector,Vector) * lanewise}{@code (}{@link VectorOperators#BITWISE_BLEND * BITWISE_BLEND}{@code , bits, mask)}. 
* * @param bits input bits to blend into the current vector * @param mask a bitwise mask to enable blending of the input bits * @return the bitwise blend of the given bits into the current vector, * under control of the bitwise mask * @see #bitwiseBlend(Vector,Vector) * @see VectorOperators#BITWISE_BLEND * @see #lanewise(VectorOperators.Ternary,byte,Vector,VectorMask) */ @ForceInline public final ByteVector bitwiseBlend(byte bits, Vector mask) { return lanewise(BITWISE_BLEND, bits, mask); } /** * Blends together the bits of two vectors under * the control of a scalar, which supplies mask bits. * * This is a lane-wise ternary operation which performs * a bitwise blending operation {@code (a&~c)|(b&c)} * to each lane. * * This method is also equivalent to the expression * {@link #lanewise(VectorOperators.Ternary,Vector,Vector) * lanewise}{@code (}{@link VectorOperators#BITWISE_BLEND * BITWISE_BLEND}{@code , bits, mask)}. * * @param bits input bits to blend into the current vector * @param mask a bitwise mask to enable blending of the input bits * @return the bitwise blend of the given bits into the current vector, * under control of the bitwise mask * @see #bitwiseBlend(Vector,Vector) * @see VectorOperators#BITWISE_BLEND * @see #lanewise(VectorOperators.Ternary,Vector,byte,VectorMask) */ @ForceInline public final ByteVector bitwiseBlend(Vector bits, byte mask) { return lanewise(BITWISE_BLEND, bits, mask); } // Type specific horizontal reductions /** * Returns a value accumulated from all the lanes of this vector. * * This is an associative cross-lane reduction operation which * applies the specified operation to all the lane elements. *

* A few reduction operations do not support arbitrary reordering * of their operands, yet are included here because of their * usefulness. *

*
* In the case of {@code FIRST_NONZERO}, the reduction returns * the value from the lowest-numbered non-zero lane. *
* All other reduction operations are fully commutative and * associative. The implementation can choose any order of * processing, yet it will always produce the same result. *

* * @param op the operation used to combine lane values * @return the accumulated result * @throws UnsupportedOperationException if this vector does * not support the requested operation * @see #reduceLanes(VectorOperators.Associative,VectorMask) * @see #add(Vector) * @see #mul(Vector) * @see #min(Vector) * @see #max(Vector) * @see #and(Vector) * @see #or(Vector) * @see VectorOperators#XOR * @see VectorOperators#FIRST_NONZERO */ public abstract byte reduceLanes(VectorOperators.Associative op); /** * Returns a value accumulated from selected lanes of this vector, * controlled by a mask. * * This is an associative cross-lane reduction operation which * applies the specified operation to the selected lane elements. *
* If no elements are selected, an operation-specific identity * value is returned. *
*
* If the operation is * {@code ADD}, {@code XOR}, {@code OR}, * or {@code FIRST_NONZERO}, * then the identity value is zero, the default {@code byte} value. *
* If the operation is {@code MUL}, * then the identity value is one. *
* If the operation is {@code AND}, * then the identity value is minus one (all bits set). *
* If the operation is {@code MAX}, * then the identity value is {@code Byte.MIN_VALUE}. *
* If the operation is {@code MIN}, * then the identity value is {@code Byte.MAX_VALUE}. *
*
* A few reduction operations do not support arbitrary reordering * of their operands, yet are included here because of their * usefulness. *
*
* In the case of {@code FIRST_NONZERO}, the reduction returns * the value from the lowest-numbered non-zero lane. *
* All other reduction operations are fully commutative and * associative. The implementation can choose any order of * processing, yet it will always produce the same result. *
* * @param op the operation used to combine lane values * @param m the mask controlling lane selection * @return the reduced result accumulated from the selected lane values * @throws UnsupportedOperationException if this vector does * not support the requested operation * @see #reduceLanes(VectorOperators.Associative) */ public abstract byte reduceLanes(VectorOperators.Associative op, VectorMask m); /*package-private*/ @ForceInline final byte reduceLanesTemplate(VectorOperators.Associative op, Class> maskClass, VectorMask m) { m.check(maskClass, this); if (op == FIRST_NONZERO) { // FIXME: The JIT should handle this. ByteVector v = broadcast((byte) 0).blend(this, m); return v.reduceLanesTemplate(op); } int opc = opCode(op); return fromBits(VectorSupport.reductionCoerced( opc, getClass(), maskClass, byte.class, length(), this, m, REDUCE_IMPL.find(op, opc, ByteVector::reductionOperations))); } /*package-private*/ @ForceInline final byte reduceLanesTemplate(VectorOperators.Associative op) { if (op == FIRST_NONZERO) { // FIXME: The JIT should handle this. VectorMask thisNZ = this.viewAsIntegralLanes().compare(NE, (byte) 0); int ft = thisNZ.firstTrue(); return ft < length() ? 
this.lane(ft) : (byte) 0; } int opc = opCode(op); return fromBits(VectorSupport.reductionCoerced( opc, getClass(), null, byte.class, length(), this, null, REDUCE_IMPL.find(op, opc, ByteVector::reductionOperations))); } private static final ImplCache>> REDUCE_IMPL = new ImplCache<>(Associative.class, ByteVector.class); private static ReductionOperation> reductionOperations(int opc_) { switch (opc_) { case VECTOR_OP_ADD: return (v, m) -> toBits(v.rOp((byte)0, m, (i, a, b) -> (byte)(a + b))); case VECTOR_OP_MUL: return (v, m) -> toBits(v.rOp((byte)1, m, (i, a, b) -> (byte)(a * b))); case VECTOR_OP_MIN: return (v, m) -> toBits(v.rOp(MAX_OR_INF, m, (i, a, b) -> (byte) Math.min(a, b))); case VECTOR_OP_MAX: return (v, m) -> toBits(v.rOp(MIN_OR_INF, m, (i, a, b) -> (byte) Math.max(a, b))); case VECTOR_OP_UMIN: return (v, m) -> toBits(v.rOp(MAX_OR_INF, m, (i, a, b) -> (byte) VectorMath.minUnsigned(a, b))); case VECTOR_OP_UMAX: return (v, m) -> toBits(v.rOp(MIN_OR_INF, m, (i, a, b) -> (byte) VectorMath.maxUnsigned(a, b))); case VECTOR_OP_AND: return (v, m) -> toBits(v.rOp((byte)-1, m, (i, a, b) -> (byte)(a & b))); case VECTOR_OP_OR: return (v, m) -> toBits(v.rOp((byte)0, m, (i, a, b) -> (byte)(a | b))); case VECTOR_OP_XOR: return (v, m) -> toBits(v.rOp((byte)0, m, (i, a, b) -> (byte)(a ^ b))); default: return null; } } private static final byte MIN_OR_INF = Byte.MIN_VALUE; private static final byte MAX_OR_INF = Byte.MAX_VALUE; public @Override abstract long reduceLanesToLong(VectorOperators.Associative op); public @Override abstract long reduceLanesToLong(VectorOperators.Associative op, VectorMask m); // Type specific accessors /** * Gets the lane element at lane index {@code i} * * @param i the lane index * @return the lane element at lane index {@code i} * @throws IllegalArgumentException if the index is out of range * ({@code < 0 || >= length()}) */ public abstract byte lane(int i); /** * Replaces the lane element of this vector at lane index {@code i} with * value {@code 
e}. * * This is a cross-lane operation and behaves as if it returns the result * of blending this vector with an input vector that is the result of * broadcasting {@code e} and a mask that has only one lane set at lane * index {@code i}. * * @param i the lane index of the lane element to be replaced * @param e the value to be placed * @return the result of replacing the lane element of this vector at lane * index {@code i} with value {@code e}. * @throws IllegalArgumentException if the index is out of range * ({@code < 0 || >= length()}) */ public abstract ByteVector withLane(int i, byte e); // Memory load operations /** * Returns an array of type {@code byte[]} * containing all the lane values. * The array length is the same as the vector length. * The array elements are stored in lane order. *
* This method behaves as if it stores * this vector into an allocated array * (using {@link #intoArray(byte[], int) intoArray}) * and returns the array as follows: *
{@code * byte[] a = new byte[this.length()]; * this.intoArray(a, 0); * return a; * }
* * @return an array containing the lane values of this vector */ @ForceInline @Override public final byte[] toArray() { byte[] a = new byte[vspecies().laneCount()]; intoArray(a, 0); return a; } /** {@inheritDoc} * @implNote * When this method is used on vectors * of type {@code ByteVector}, * there will be no loss of precision or range, * and so no {@code UnsupportedOperationException} will * be thrown. */ @ForceInline @Override public final int[] toIntArray() { byte[] a = toArray(); int[] res = new int[a.length]; for (int i = 0; i < a.length; i++) { byte e = a[i]; res[i] = (int) ByteSpecies.toIntegralChecked(e, true); } return res; } /** {@inheritDoc} * @implNote * When this method is used on vectors * of type {@code ByteVector}, * there will be no loss of precision or range, * and so no {@code UnsupportedOperationException} will * be thrown. */ @ForceInline @Override public final long[] toLongArray() { byte[] a = toArray(); long[] res = new long[a.length]; for (int i = 0; i < a.length; i++) { byte e = a[i]; res[i] = ByteSpecies.toIntegralChecked(e, false); } return res; } /** {@inheritDoc} * @implNote * When this method is used on vectors * of type {@code ByteVector}, * there will be no loss of precision. */ @ForceInline @Override public final double[] toDoubleArray() { byte[] a = toArray(); double[] res = new double[a.length]; for (int i = 0; i < a.length; i++) { res[i] = (double) a[i]; } return res; } /** * Loads a vector from an array of type {@code byte[]} * starting at an offset. * For each vector lane, where {@code N} is the vector lane index, the * array element at index {@code offset + N} is placed into the * resulting vector at lane index {@code N}. 
* * @param species species of desired vector * @param a the array * @param offset the offset into the array * @return the vector loaded from an array * @throws IndexOutOfBoundsException * if {@code offset+N < 0} or {@code offset+N >= a.length} * for any lane {@code N} in the vector */ @ForceInline public static ByteVector fromArray(VectorSpecies species, byte[] a, int offset) { offset = checkFromIndexSize(offset, species.length(), a.length); ByteSpecies vsp = (ByteSpecies) species; return vsp.dummyVector().fromArray0(a, offset); } /** * Loads a vector from an array of type {@code byte[]} * starting at an offset and using a mask. * Lanes where the mask is unset are filled with the default * value of {@code byte} (zero). * For each vector lane, where {@code N} is the vector lane index, * if the mask lane at index {@code N} is set then the array element at * index {@code offset + N} is placed into the resulting vector at lane index * {@code N}, otherwise the default element value is placed into the * resulting vector at lane index {@code N}. 
* * @param species species of desired vector * @param a the array * @param offset the offset into the array * @param m the mask controlling lane selection * @return the vector loaded from an array * @throws IndexOutOfBoundsException * if {@code offset+N < 0} or {@code offset+N >= a.length} * for any lane {@code N} in the vector * where the mask is set */ @ForceInline public static ByteVector fromArray(VectorSpecies species, byte[] a, int offset, VectorMask m) { ByteSpecies vsp = (ByteSpecies) species; if (VectorIntrinsics.indexInRange(offset, vsp.length(), a.length)) { return vsp.dummyVector().fromArray0(a, offset, m, OFFSET_IN_RANGE); } ((AbstractMask)m) .checkIndexByLane(offset, a.length, vsp.iota(), 1); return vsp.dummyVector().fromArray0(a, offset, m, OFFSET_OUT_OF_RANGE); } /** * Gathers a new vector composed of elements from an array of type * {@code byte[]}, * using indexes obtained by adding a fixed {@code offset} to a * series of secondary offsets from an index map. * The index map is a contiguous sequence of {@code VLENGTH} * elements in a second array of {@code int}s, starting at a given * {@code mapOffset}. *
* For each vector lane, where {@code N} is the vector lane index, * the lane is loaded from the array * element {@code a[f(N)]}, where {@code f(N)} is the * index mapping expression * {@code offset + indexMap[mapOffset + N]]}. * * @param species species of desired vector * @param a the array * @param offset the offset into the array, may be negative if relative * indexes in the index map compensate to produce a value within the * array bounds * @param indexMap the index map * @param mapOffset the offset into the index map * @return the vector loaded from the indexed elements of the array * @throws IndexOutOfBoundsException * if {@code mapOffset+N < 0} * or if {@code mapOffset+N >= indexMap.length}, * or if {@code f(N)=offset+indexMap[mapOffset+N]} * is an invalid index into {@code a}, * for any lane {@code N} in the vector * @see ByteVector#toIntArray() */ @ForceInline public static ByteVector fromArray(VectorSpecies species, byte[] a, int offset, int[] indexMap, int mapOffset) { ByteSpecies vsp = (ByteSpecies) species; IntVector.IntSpecies isp = IntVector.species(vsp.indexShape()); Objects.requireNonNull(a); Objects.requireNonNull(indexMap); Class vectorType = vsp.vectorType(); // Constant folding should sweep out following conditonal logic. VectorSpecies lsp; if (isp.length() > IntVector.SPECIES_PREFERRED.length()) { lsp = IntVector.SPECIES_PREFERRED; } else { lsp = isp; } // Check indices are within array bounds. 
for (int i = 0; i < vsp.length(); i += lsp.length()) { IntVector vix = IntVector .fromArray(lsp, indexMap, mapOffset + i) .add(offset); VectorIntrinsics.checkIndex(vix, a.length); } return VectorSupport.loadWithMap( vectorType, null, byte.class, vsp.laneCount(), lsp.vectorType(), a, ARRAY_BASE, null, null, a, offset, indexMap, mapOffset, vsp, (c, idx, iMap, idy, s, vm) -> s.vOp(n -> c[idx + iMap[idy+n]])); } /** * Gathers a new vector composed of elements from an array of type * {@code byte[]}, * under the control of a mask, and * using indexes obtained by adding a fixed {@code offset} to a * series of secondary offsets from an index map. * The index map is a contiguous sequence of {@code VLENGTH} * elements in a second array of {@code int}s, starting at a given * {@code mapOffset}. *
* For each vector lane, where {@code N} is the vector lane index, * if the lane is set in the mask, * the lane is loaded from the array * element {@code a[f(N)]}, where {@code f(N)} is the * index mapping expression * {@code offset + indexMap[mapOffset + N]]}. * Unset lanes in the resulting vector are set to zero. * * @param species species of desired vector * @param a the array * @param offset the offset into the array, may be negative if relative * indexes in the index map compensate to produce a value within the * array bounds * @param indexMap the index map * @param mapOffset the offset into the index map * @param m the mask controlling lane selection * @return the vector loaded from the indexed elements of the array * @throws IndexOutOfBoundsException * if {@code mapOffset+N < 0} * or if {@code mapOffset+N >= indexMap.length}, * or if {@code f(N)=offset+indexMap[mapOffset+N]} * is an invalid index into {@code a}, * for any lane {@code N} in the vector * where the mask is set * @see ByteVector#toIntArray() */ @ForceInline public static ByteVector fromArray(VectorSpecies species, byte[] a, int offset, int[] indexMap, int mapOffset, VectorMask m) { if (m.allTrue()) { return fromArray(species, a, offset, indexMap, mapOffset); } else { ByteSpecies vsp = (ByteSpecies) species; return vsp.dummyVector().fromArray0(a, offset, indexMap, mapOffset, m); } } /** * Loads a vector from an array of type {@code boolean[]} * starting at an offset. * For each vector lane, where {@code N} is the vector lane index, the * array element at index {@code offset + N} * is first converted to a {@code byte} value and then * placed into the resulting vector at lane index {@code N}. *
* A {@code boolean} value is converted to a {@code byte} value by applying the * expression {@code (byte) (b ? 1 : 0)}, where {@code b} is the {@code boolean} value. * * @param species species of desired vector * @param a the array * @param offset the offset into the array * @return the vector loaded from an array * @throws IndexOutOfBoundsException * if {@code offset+N < 0} or {@code offset+N >= a.length} * for any lane {@code N} in the vector */ @ForceInline public static ByteVector fromBooleanArray(VectorSpecies species, boolean[] a, int offset) { offset = checkFromIndexSize(offset, species.length(), a.length); ByteSpecies vsp = (ByteSpecies) species; return vsp.dummyVector().fromBooleanArray0(a, offset); } /** * Loads a vector from an array of type {@code boolean[]} * starting at an offset and using a mask. * Lanes where the mask is unset are filled with the default * value of {@code byte} (zero). * For each vector lane, where {@code N} is the vector lane index, * if the mask lane at index {@code N} is set then the array element at * index {@code offset + N} * is first converted to a {@code byte} value and then * placed into the resulting vector at lane index * {@code N}, otherwise the default element value is placed into the * resulting vector at lane index {@code N}. *
* A {@code boolean} value is converted to a {@code byte} value by applying the * expression {@code (byte) (b ? 1 : 0)}, where {@code b} is the {@code boolean} value. * * @param species species of desired vector * @param a the array * @param offset the offset into the array * @param m the mask controlling lane selection * @return the vector loaded from an array * @throws IndexOutOfBoundsException * if {@code offset+N < 0} or {@code offset+N >= a.length} * for any lane {@code N} in the vector * where the mask is set */ @ForceInline public static ByteVector fromBooleanArray(VectorSpecies species, boolean[] a, int offset, VectorMask m) { ByteSpecies vsp = (ByteSpecies) species; if (VectorIntrinsics.indexInRange(offset, vsp.length(), a.length)) { ByteVector zero = vsp.zero(); return vsp.dummyVector().fromBooleanArray0(a, offset, m, OFFSET_IN_RANGE); } ((AbstractMask)m) .checkIndexByLane(offset, a.length, vsp.iota(), 1); return vsp.dummyVector().fromBooleanArray0(a, offset, m, OFFSET_OUT_OF_RANGE); } /** * Gathers a new vector composed of elements from an array of type * {@code boolean[]}, * using indexes obtained by adding a fixed {@code offset} to a * series of secondary offsets from an index map. * The index map is a contiguous sequence of {@code VLENGTH} * elements in a second array of {@code int}s, starting at a given * {@code mapOffset}. *
* For each vector lane, where {@code N} is the vector lane index, * the lane is loaded from the expression * {@code (byte) (a[f(N)] ? 1 : 0)}, where {@code f(N)} is the * index mapping expression * {@code offset + indexMap[mapOffset + N]]}. * * @param species species of desired vector * @param a the array * @param offset the offset into the array, may be negative if relative * indexes in the index map compensate to produce a value within the * array bounds * @param indexMap the index map * @param mapOffset the offset into the index map * @return the vector loaded from the indexed elements of the array * @throws IndexOutOfBoundsException * if {@code mapOffset+N < 0} * or if {@code mapOffset+N >= indexMap.length}, * or if {@code f(N)=offset+indexMap[mapOffset+N]} * is an invalid index into {@code a}, * for any lane {@code N} in the vector * @see ByteVector#toIntArray() */ @ForceInline public static ByteVector fromBooleanArray(VectorSpecies species, boolean[] a, int offset, int[] indexMap, int mapOffset) { // FIXME: optimize ByteSpecies vsp = (ByteSpecies) species; return vsp.vOp(n -> (byte) (a[offset + indexMap[mapOffset + n]] ? 1 : 0)); } /** * Gathers a new vector composed of elements from an array of type * {@code boolean[]}, * under the control of a mask, and * using indexes obtained by adding a fixed {@code offset} to a * series of secondary offsets from an index map. * The index map is a contiguous sequence of {@code VLENGTH} * elements in a second array of {@code int}s, starting at a given * {@code mapOffset}. *
* For each vector lane, where {@code N} is the vector lane index, * if the lane is set in the mask, * the lane is loaded from the expression * {@code (byte) (a[f(N)] ? 1 : 0)}, where {@code f(N)} is the * index mapping expression * {@code offset + indexMap[mapOffset + N]]}. * Unset lanes in the resulting vector are set to zero. * * @param species species of desired vector * @param a the array * @param offset the offset into the array, may be negative if relative * indexes in the index map compensate to produce a value within the * array bounds * @param indexMap the index map * @param mapOffset the offset into the index map * @param m the mask controlling lane selection * @return the vector loaded from the indexed elements of the array * @throws IndexOutOfBoundsException * if {@code mapOffset+N < 0} * or if {@code mapOffset+N >= indexMap.length}, * or if {@code f(N)=offset+indexMap[mapOffset+N]} * is an invalid index into {@code a}, * for any lane {@code N} in the vector * where the mask is set * @see ByteVector#toIntArray() */ @ForceInline public static ByteVector fromBooleanArray(VectorSpecies species, boolean[] a, int offset, int[] indexMap, int mapOffset, VectorMask m) { // FIXME: optimize ByteSpecies vsp = (ByteSpecies) species; return vsp.vOp(m, n -> (byte) (a[offset + indexMap[mapOffset + n]] ? 1 : 0)); } /** * Loads a vector from a {@linkplain MemorySegment memory segment} * starting at an offset into the memory segment. * Bytes are composed into primitive lane elements according * to the specified byte order. * The vector is arranged into lanes according to * memory ordering. *
* This method behaves as if it returns the result of calling * {@link #fromMemorySegment(VectorSpecies,MemorySegment,long,ByteOrder,VectorMask) * fromMemorySegment()} as follows: *
{@code * var m = species.maskAll(true); * return fromMemorySegment(species, ms, offset, bo, m); * }
* * @param species species of desired vector * @param ms the memory segment * @param offset the offset into the memory segment * @param bo the intended byte order * @return a vector loaded from the memory segment * @throws IndexOutOfBoundsException * if {@code offset+N*1 < 0} * or {@code offset+N*1 >= ms.byteSize()} * for any lane {@code N} in the vector * @throws IllegalStateException if the memory segment's session is not alive, * or if access occurs from a thread other than the thread owning the session. * @since 19 */ @ForceInline public static ByteVector fromMemorySegment(VectorSpecies species, MemorySegment ms, long offset, ByteOrder bo) { offset = checkFromIndexSize(offset, species.vectorByteSize(), ms.byteSize()); ByteSpecies vsp = (ByteSpecies) species; return vsp.dummyVector().fromMemorySegment0(ms, offset).maybeSwap(bo); } /** * Loads a vector from a {@linkplain MemorySegment memory segment} * starting at an offset into the memory segment * and using a mask. * Lanes where the mask is unset are filled with the default * value of {@code byte} (zero). * Bytes are composed into primitive lane elements according * to the specified byte order. * The vector is arranged into lanes according to * memory ordering. *
* <p>
     * The following pseudocode illustrates the behavior:
     * <pre>{@code
     * var slice = ms.asSlice(offset);
     * byte[] ar = new byte[species.length()];
     * for (int n = 0; n < ar.length; n++) {
     *     if (m.laneIsSet(n)) {
     *         ar[n] = slice.getAtIndex(ValueLayout.JAVA_BYTE.withByteAlignment(1), n);
     *     }
     * }
     * ByteVector r = ByteVector.fromArray(species, ar, 0);
     * }</pre>
     * @implNote
     * The byte order argument is ignored.
     *
     * @param species species of desired vector
     * @param ms the memory segment
     * @param offset the offset into the memory segment
     * @param bo the intended byte order
     * @param m the mask controlling lane selection
     * @return a vector loaded from the memory segment
     * @throws IndexOutOfBoundsException
     *         if {@code offset+N*1 < 0}
     *         or {@code offset+N*1 >= ms.byteSize()}
     *         for any lane {@code N} in the vector
     *         where the mask is set
     * @throws IllegalStateException if the memory segment's session is not alive,
     *         or if access occurs from a thread other than the thread owning the session.
     * @since 19
     */
    @ForceInline
    public static
    ByteVector fromMemorySegment(VectorSpecies species,
                                 MemorySegment ms, long offset,
                                 ByteOrder bo,
                                 VectorMask m) {
        ByteSpecies vsp = (ByteSpecies) species;
        // Fast path: the whole vector fits inside the segment, so no per-lane
        // check is needed and the load is told the offset is in range.
        if (VectorIntrinsics.indexInRange(offset, vsp.vectorByteSize(), ms.byteSize())) {
            return vsp.dummyVector().fromMemorySegment0(ms, offset, m, OFFSET_IN_RANGE).maybeSwap(bo);
        }

        // Slow path: the vector straddles the segment bounds. Check lane by lane
        // (lane size 1 byte); presumably this throws only for lanes set in m,
        // as the @throws clause above describes -- confirm in AbstractMask.
        ((AbstractMask)m)
            .checkIndexByLane(offset, ms.byteSize(), vsp.iota(), 1);
        return vsp.dummyVector().fromMemorySegment0(ms, offset, m, OFFSET_OUT_OF_RANGE).maybeSwap(bo);
    }

    // Memory store operations

    /**
     * Stores this vector into an array of type {@code byte[]}
     * starting at an offset.
     *
* <p>
     * For each vector lane, where {@code N} is the vector lane index,
     * the lane element at index {@code N} is stored into the array
     * element {@code a[offset+N]}.
     *
     * @param a the array, of type {@code byte[]}
     * @param offset the offset into the array
     * @throws IndexOutOfBoundsException
     *         if {@code offset+N < 0} or {@code offset+N >= a.length}
     *         for any lane {@code N} in the vector
     */
    @ForceInline
    public final
    void intoArray(byte[] a, int offset) {
        // Range-check all length() lanes starting at offset once, up front.
        offset = checkFromIndexSize(offset, length(), a.length);
        ByteSpecies vsp = vspecies();
        VectorSupport.store(
            vsp.vectorType(), vsp.elementType(), vsp.laneCount(),
            a, arrayAddress(a, offset), false,
            this,
            a, offset,
            // Plain-Java lane-by-lane store. Presumably the fallback used when
            // VectorSupport.store is not intrinsified -- confirm in VectorSupport.
            (arr, off, v)
            -> v.stOp(arr, (int) off,
                      (arr_, off_, i, e) -> arr_[off_ + i] = e));
    }

    /**
     * Stores this vector into an array of type {@code byte[]}
     * starting at offset and using a mask.
     *
* <p>
     * For each vector lane, where {@code N} is the vector lane index,
     * the lane element at index {@code N} is stored into the array
     * element {@code a[offset+N]}.
     * If the mask lane at {@code N} is unset then the corresponding
     * array element {@code a[offset+N]} is left unchanged.
     * <p>
     * Array range checking is done for lanes where the mask is set.
     * Lanes where the mask is unset are not stored and do not need
     * to correspond to legitimate elements of {@code a}.
     * That is, unset lanes may correspond to array indexes less than
     * zero or beyond the end of the array.
     *
     * @param a the array, of type {@code byte[]}
     * @param offset the offset into the array
     * @param m the mask controlling lane storage
     * @throws IndexOutOfBoundsException
     *         if {@code offset+N < 0} or {@code offset+N >= a.length}
     *         for any lane {@code N} in the vector
     *         where the mask is set
     */
    @ForceInline
    public final
    void intoArray(byte[] a, int offset,
                   VectorMask m) {
        if (m.allTrue()) {
            // Every lane is stored, so this is exactly the unmasked store
            // (including its whole-vector range check).
            intoArray(a, offset);
        } else {
            ByteSpecies vsp = vspecies();
            // Per-lane checking is only needed when the full vector does not
            // fit inside the array.
            if (!VectorIntrinsics.indexInRange(offset, vsp.length(), a.length)) {
                ((AbstractMask)m)
                    .checkIndexByLane(offset, a.length, vsp.iota(), 1);
            }
            intoArray0(a, offset, m);
        }
    }

    /**
     * Scatters this vector into an array of type {@code byte[]}
     * using indexes obtained by adding a fixed {@code offset} to a
     * series of secondary offsets from an index map.
     * The index map is a contiguous sequence of {@code VLENGTH}
     * elements in a second array of {@code int}s, starting at a given
     * {@code mapOffset}.
     *
* <p>
     * For each vector lane, where {@code N} is the vector lane index,
     * the lane element at index {@code N} is stored into the array
     * element {@code a[f(N)]}, where {@code f(N)} is the
     * index mapping expression
     * {@code offset + indexMap[mapOffset + N]}.
     *
     * @param a the array
     * @param offset an offset to combine with the index map offsets
     * @param indexMap the index map
     * @param mapOffset the offset into the index map
     * @throws IndexOutOfBoundsException
     *         if {@code mapOffset+N < 0}
     *         or if {@code mapOffset+N >= indexMap.length},
     *         or if {@code f(N)=offset+indexMap[mapOffset+N]}
     *         is an invalid index into {@code a},
     *         for any lane {@code N} in the vector
     * @see ByteVector#toIntArray()
     */
    @ForceInline
    public final
    void intoArray(byte[] a, int offset,
                   int[] indexMap, int mapOffset) {
        // No explicit range check here: an invalid index surfaces from the
        // ordinary array accesses on indexMap and arr inside the lambda
        // (stOp presumably invokes it once per lane with lane index i and
        // lane value e).
        stOp(a, offset,
             (arr, off, i, e) -> {
                 int j = indexMap[mapOffset + i];
                 arr[off + j] = e;
             });
    }

    /**
     * Scatters this vector into an array of type {@code byte[]},
     * under the control of a mask, and
     * using indexes obtained by adding a fixed {@code offset} to a
     * series of secondary offsets from an index map.
     * The index map is a contiguous sequence of {@code VLENGTH}
     * elements in a second array of {@code int}s, starting at a given
     * {@code mapOffset}.
     *
* <p>
     * For each vector lane, where {@code N} is the vector lane index,
     * if the mask lane at index {@code N} is set then
     * the lane element at index {@code N} is stored into the array
     * element {@code a[f(N)]}, where {@code f(N)} is the
     * index mapping expression
     * {@code offset + indexMap[mapOffset + N]}.
     *
     * @param a the array
     * @param offset an offset to combine with the index map offsets
     * @param indexMap the index map
     * @param mapOffset the offset into the index map
     * @param m the mask
     * @throws IndexOutOfBoundsException
     *         if {@code mapOffset+N < 0}
     *         or if {@code mapOffset+N >= indexMap.length},
     *         or if {@code f(N)=offset+indexMap[mapOffset+N]}
     *         is an invalid index into {@code a},
     *         for any lane {@code N} in the vector
     *         where the mask is set
     * @see ByteVector#toIntArray()
     */
    @ForceInline
    public final
    void intoArray(byte[] a, int offset,
                   int[] indexMap, int mapOffset,
                   VectorMask m) {
        // Same scatter as the unmasked overload, routed through the masked
        // stOp; presumably the lambda runs only for lanes set in m, so unset
        // lanes never index indexMap or arr -- confirm in stOp.
        stOp(a, offset, m,
             (arr, off, i, e) -> {
                 int j = indexMap[mapOffset + i];
                 arr[off + j] = e;
             });
    }

    /**
     * Stores this vector into an array of type {@code boolean[]}
     * starting at an offset.
     *
* <p>
     * For each vector lane, where {@code N} is the vector lane index,
     * the lane element at index {@code N}
     * is first converted to a {@code boolean} value and then
     * stored into the array element {@code a[offset+N]}.
     * <p>
     * A {@code byte} value is converted to a {@code boolean} value by applying the
     * expression {@code (b & 1) != 0} where {@code b} is the byte value.
     *
     * @param a the array
     * @param offset the offset into the array
     * @throws IndexOutOfBoundsException
     *         if {@code offset+N < 0} or {@code offset+N >= a.length}
     *         for any lane {@code N} in the vector
     */
    @ForceInline
    public final
    void intoBooleanArray(boolean[] a, int offset) {
        // Range-check all length() lanes starting at offset once, up front.
        offset = checkFromIndexSize(offset, length(), a.length);
        ByteSpecies vsp = vspecies();
        // Keep only the low bit of every lane, so each lane handed to the
        // store is 0 or 1 -- the same value (b & 1) != 0 would select.
        ByteVector normalized = this.and((byte) 1);
        VectorSupport.store(
            vsp.vectorType(), vsp.elementType(), vsp.laneCount(),
            a, booleanArrayAddress(a, offset), false,
            normalized,
            a, offset,
            // Plain-Java lane-by-lane store. Presumably the fallback used when
            // VectorSupport.store is not intrinsified -- confirm in VectorSupport.
            (arr, off, v)
            -> v.stOp(arr, (int) off,
                      (arr_, off_, i, e) -> arr_[off_ + i] = (e & 1) != 0));
    }

    /**
     * Stores this vector into an array of type {@code boolean[]}
     * starting at offset and using a mask.
     *
* <p>
     * For each vector lane, where {@code N} is the vector lane index,
     * the lane element at index {@code N}
     * is first converted to a {@code boolean} value and then
     * stored into the array element {@code a[offset+N]}.
     * If the mask lane at {@code N} is unset then the corresponding
     * array element {@code a[offset+N]} is left unchanged.
     * <p>
     * A {@code byte} value is converted to a {@code boolean} value by applying the
     * expression {@code (b & 1) != 0} where {@code b} is the byte value.
     * <p>
     * Array range checking is done for lanes where the mask is set.
     * Lanes where the mask is unset are not stored and do not need
     * to correspond to legitimate elements of {@code a}.
     * That is, unset lanes may correspond to array indexes less than
     * zero or beyond the end of the array.
     *
     * @param a the array
     * @param offset the offset into the array
     * @param m the mask controlling lane storage
     * @throws IndexOutOfBoundsException
     *         if {@code offset+N < 0} or {@code offset+N >= a.length}
     *         for any lane {@code N} in the vector
     *         where the mask is set
     */
    @ForceInline
    public final
    void intoBooleanArray(boolean[] a, int offset,
                          VectorMask m) {
        if (m.allTrue()) {
            // Every lane is stored, so this is exactly the unmasked store
            // (including its whole-vector range check).
            intoBooleanArray(a, offset);
        } else {
            ByteSpecies vsp = vspecies();
            // Per-lane checking is only needed when the full vector does not
            // fit inside the array.
            if (!VectorIntrinsics.indexInRange(offset, vsp.length(), a.length)) {
                ((AbstractMask)m)
                    .checkIndexByLane(offset, a.length, vsp.iota(), 1);
            }
            intoBooleanArray0(a, offset, m);
        }
    }

    /**
     * Scatters this vector into an array of type {@code boolean[]}
     * using indexes obtained by adding a fixed {@code offset} to a
     * series of secondary offsets from an index map.
     * The index map is a contiguous sequence of {@code VLENGTH}
     * elements in a second array of {@code int}s, starting at a given
     * {@code mapOffset}.
     *
* <p>
     * For each vector lane, where {@code N} is the vector lane index,
     * the lane element at index {@code N}
     * is first converted to a {@code boolean} value and then
     * stored into the array
     * element {@code a[f(N)]}, where {@code f(N)} is the
     * index mapping expression
     * {@code offset + indexMap[mapOffset + N]}.
     * <p>
     * A {@code byte} value is converted to a {@code boolean} value by applying the
     * expression {@code (b & 1) != 0} where {@code b} is the byte value.
     *
     * @param a the array
     * @param offset an offset to combine with the index map offsets
     * @param indexMap the index map
     * @param mapOffset the offset into the index map
     * @throws IndexOutOfBoundsException
     *         if {@code mapOffset+N < 0}
     *         or if {@code mapOffset+N >= indexMap.length},
     *         or if {@code f(N)=offset+indexMap[mapOffset+N]}
     *         is an invalid index into {@code a},
     *         for any lane {@code N} in the vector
     * @see ByteVector#toIntArray()
     */
    @ForceInline
    public final
    void intoBooleanArray(boolean[] a, int offset,
                          int[] indexMap, int mapOffset) {
        // FIXME: optimize
        // No explicit range check here: an invalid index surfaces from the
        // ordinary array accesses on indexMap and arr inside the lambda.
        stOp(a, offset,
             (arr, off, i, e) -> {
                 int j = indexMap[mapOffset + i];
                 arr[off + j] = (e & 1) != 0;
             });
    }

    /**
     * Scatters this vector into an array of type {@code boolean[]},
     * under the control of a mask, and
     * using indexes obtained by adding a fixed {@code offset} to a
     * series of secondary offsets from an index map.
     * The index map is a contiguous sequence of {@code VLENGTH}
     * elements in a second array of {@code int}s, starting at a given
     * {@code mapOffset}.
     *
* <p>
     * For each vector lane, where {@code N} is the vector lane index,
     * if the mask lane at index {@code N} is set then
     * the lane element at index {@code N}
     * is first converted to a {@code boolean} value and then
     * stored into the array
     * element {@code a[f(N)]}, where {@code f(N)} is the
     * index mapping expression
     * {@code offset + indexMap[mapOffset + N]}.
     * <p>
     * A {@code byte} value is converted to a {@code boolean} value by applying the
     * expression {@code (b & 1) != 0} where {@code b} is the byte value.
     *
     * @param a the array
     * @param offset an offset to combine with the index map offsets
     * @param indexMap the index map
     * @param mapOffset the offset into the index map
     * @param m the mask
     * @throws IndexOutOfBoundsException
     *         if {@code mapOffset+N < 0}
     *         or if {@code mapOffset+N >= indexMap.length},
     *         or if {@code f(N)=offset+indexMap[mapOffset+N]}
     *         is an invalid index into {@code a},
     *         for any lane {@code N} in the vector
     *         where the mask is set
     * @see ByteVector#toIntArray()
     */
    @ForceInline
    public final
    void intoBooleanArray(boolean[] a, int offset,
                          int[] indexMap, int mapOffset,
                          VectorMask m) {
        // FIXME: optimize
        // Same scatter as the unmasked overload, routed through the masked stOp.
        stOp(a, offset, m,
             (arr, off, i, e) -> {
                 int j = indexMap[mapOffset + i];
                 arr[off + j] = (e & 1) != 0;
             });
    }

    /**
     * {@inheritDoc}
     * @since 19
     */
    @Override
    @ForceInline
    public final
    void intoMemorySegment(MemorySegment ms, long offset,
                           ByteOrder bo) {
        // Reject read-only segments before any range check or store.
        if (ms.isReadOnly()) {
            throw new UnsupportedOperationException("Attempt to write a read-only segment");
        }

        // Range-check the whole vector footprint (byteSize() bytes from offset).
        offset = checkFromIndexSize(offset, byteSize(), ms.byteSize());
        maybeSwap(bo).intoMemorySegment0(ms, offset);
    }

    /**
     * {@inheritDoc}
     * @since 19
     */
    @Override
    @ForceInline
    public final
    void intoMemorySegment(MemorySegment ms, long offset,
                           ByteOrder bo,
                           VectorMask m) {
        if (m.allTrue()) {
            // Every lane is stored: delegate to the unmasked overload, which
            // performs the read-only and range checks itself.
            intoMemorySegment(ms, offset, bo);
        } else {
            if (ms.isReadOnly()) {
                throw new UnsupportedOperationException("Attempt to write a read-only segment");
            }
            ByteSpecies vsp = vspecies();
            // Per-lane checking (lane size 1 byte) is only needed when the
            // full vector does not fit inside the segment.
            if (!VectorIntrinsics.indexInRange(offset, vsp.vectorByteSize(), ms.byteSize())) {
                ((AbstractMask)m)
                    .checkIndexByLane(offset, ms.byteSize(), vsp.iota(), 1);
            }
            maybeSwap(bo).intoMemorySegment0(ms, offset, m);
        }
    }

    // ================================================

    // Low-level memory operations.
//
    // Note that all of these operations *must* inline into a context
    // where the exact species of the involved vector is a
    // compile-time constant.  Otherwise, the intrinsic generation
    // will fail and performance will suffer.
    //
    // In many cases this is achieved by re-deriving a version of the
    // method in each concrete subclass (per species).  The re-derived
    // method simply calls one of these generic methods, with exact
    // parameters for the controlling metadata, which is either a
    // typed vector or constant species instance.

    // Unchecked loading operations in native byte order.
    // Caller is responsible for applying index checks, masking, and
    // byte swapping.

    // NOTE(review): several templates below use a type name M and carry a
    // stray '>' before the return type, with no visible type-parameter
    // declaration -- the generic headers look truncated in this copy of the
    // file; confirm against the generator template.

    /*package-private*/
    abstract
    ByteVector fromArray0(byte[] a, int offset);

    /** Unmasked contiguous load of laneCount() bytes from a, starting at offset. */
    @ForceInline
    final
    ByteVector fromArray0Template(byte[] a, int offset) {
        ByteSpecies vsp = vspecies();
        return VectorSupport.load(
            vsp.vectorType(), vsp.elementType(), vsp.laneCount(),
            a, arrayAddress(a, offset), false,
            a, offset, vsp,
            // Plain-Java equivalent: read arr_[off_ + i] for each lane i.
            (arr, off, s) -> s.ldOp(arr, (int) off,
                                    (arr_, off_, i) -> arr_[off_ + i]));
    }

    /*package-private*/
    abstract
    ByteVector fromArray0(byte[] a, int offset, VectorMask m, int offsetInRange);

    /**
     * Masked contiguous load from a, starting at offset. offsetInRange is
     * forwarded unchanged to VectorSupport.loadMasked.
     */
    @ForceInline
    final
    >
    ByteVector fromArray0Template(Class maskClass, byte[] a, int offset, M m, int offsetInRange) {
        m.check(species());  // presumably rejects a mask of a different species
        ByteSpecies vsp = vspecies();
        return VectorSupport.loadMasked(
            vsp.vectorType(), maskClass, vsp.elementType(), vsp.laneCount(),
            a, arrayAddress(a, offset), false, m, offsetInRange,
            a, offset, vsp,
            (arr, off, s, vm) -> s.ldOp(arr, (int) off, vm,
                                        (arr_, off_, i) -> arr_[off_ + i]));
    }

    /*package-private*/
    abstract
    ByteVector fromArray0(byte[] a, int offset,
                          int[] indexMap, int mapOffset,
                          VectorMask m);

    /**
     * Masked gather: lane n is read from a[offset + indexMap[mapOffset + n]].
     * Both arrays are null-checked and every mapped index is range-checked
     * before the load is issued.
     */
    @ForceInline
    final
    >
    ByteVector fromArray0Template(Class maskClass, byte[] a, int offset,
                                  int[] indexMap, int mapOffset, M m) {
        ByteSpecies vsp = vspecies();
        IntVector.IntSpecies isp = IntVector.species(vsp.indexShape());
        Objects.requireNonNull(a);
        Objects.requireNonNull(indexMap);
        m.check(vsp);
        Class vectorType = vsp.vectorType();

        // Constant folding should sweep out following conditional logic.
        // Pick the int species used to walk the index map: isp, unless it has
        // more lanes than IntVector.SPECIES_PREFERRED.
        VectorSpecies lsp;
        if (isp.length() > IntVector.SPECIES_PREFERRED.length()) {
            lsp = IntVector.SPECIES_PREFERRED;
        } else {
            lsp = isp;
        }

        // Check indices are within array bounds.
        // FIXME: Check index under mask controlling.
        // As written, the loop never consults m: every mapped index is
        // checked, including those belonging to lanes that are unset in the mask.
        for (int i = 0; i < vsp.length(); i += lsp.length()) {
            IntVector vix = IntVector
                .fromArray(lsp, indexMap, mapOffset + i)
                .add(offset);
            VectorIntrinsics.checkIndex(vix, a.length);
        }

        return VectorSupport.loadWithMap(
            vectorType, maskClass, byte.class, vsp.laneCount(),
            lsp.vectorType(), a, ARRAY_BASE, null, m,
            a, offset, indexMap, mapOffset, vsp,
            // Plain-Java equivalent of the gather, applied under the mask.
            (c, idx, iMap, idy, s, vm) ->
            s.vOp(vm, n -> c[idx + iMap[idy+n]]));
    }

    /*package-private*/
    abstract
    ByteVector fromBooleanArray0(boolean[] a, int offset);

    /** Unmasked contiguous load from a boolean[]; true maps to 1 and false to 0. */
    @ForceInline
    final
    ByteVector fromBooleanArray0Template(boolean[] a, int offset) {
        ByteSpecies vsp = vspecies();
        return VectorSupport.load(
            vsp.vectorType(), vsp.elementType(), vsp.laneCount(),
            a, booleanArrayAddress(a, offset), false,
            a, offset, vsp,
            (arr, off, s) -> s.ldOp(arr, (int) off,
                                    (arr_, off_, i) -> (byte) (arr_[off_ + i] ? 1 : 0)));
    }

    /*package-private*/
    abstract
    ByteVector fromBooleanArray0(boolean[] a, int offset, VectorMask m, int offsetInRange);

    /** Masked contiguous load from a boolean[]; true maps to 1 and false to 0. */
    @ForceInline
    final
    >
    ByteVector fromBooleanArray0Template(Class maskClass, boolean[] a, int offset, M m, int offsetInRange) {
        m.check(species());
        ByteSpecies vsp = vspecies();
        return VectorSupport.loadMasked(
            vsp.vectorType(), maskClass, vsp.elementType(), vsp.laneCount(),
            a, booleanArrayAddress(a, offset), false, m, offsetInRange,
            a, offset, vsp,
            (arr, off, s, vm) -> s.ldOp(arr, (int) off, vm,
                                        (arr_, off_, i) -> (byte) (arr_[off_ + i] ? 1 : 0)));
    }

    abstract
    ByteVector fromMemorySegment0(MemorySegment bb, long offset);

    /** Unmasked load from a memory segment, starting at byte offset. */
    @ForceInline
    final
    ByteVector fromMemorySegment0Template(MemorySegment ms, long offset) {
        ByteSpecies vsp = vspecies();
        return ScopedMemoryAccess.loadFromMemorySegment(
                vsp.vectorType(), vsp.elementType(), vsp.laneCount(),
                (AbstractMemorySegmentImpl) ms, offset, vsp,
                (msp, off, s) -> {
                    return s.ldLongOp((MemorySegment) msp, off, ByteVector::memorySegmentGet);
                });
    }

    abstract
    ByteVector fromMemorySegment0(MemorySegment ms, long offset, VectorMask m, int offsetInRange);

    /**
     * Masked load from a memory segment, starting at byte offset.
     * offsetInRange is forwarded unchanged to ScopedMemoryAccess.
     */
    @ForceInline
    final
    >
    ByteVector fromMemorySegment0Template(Class maskClass, MemorySegment ms, long offset, M m, int offsetInRange) {
        ByteSpecies vsp = vspecies();
        m.check(vsp);
        return ScopedMemoryAccess.loadFromMemorySegmentMasked(
                vsp.vectorType(), maskClass, vsp.elementType(), vsp.laneCount(),
                (AbstractMemorySegmentImpl) ms, offset, m, vsp, offsetInRange,
                (msp, off, s, vm) -> {
                    return s.ldLongOp((MemorySegment) msp, off, vm, ByteVector::memorySegmentGet);
                });
    }

    // Unchecked storing operations in native byte order.
    // Caller is responsible for applying index checks, masking, and
    // byte swapping.
abstract
    void intoArray0(byte[] a, int offset);

    // NOTE(review): several templates below use a type name M and carry a
    // stray '>' before the return type, with no visible type-parameter
    // declaration -- the generic headers look truncated in this copy of the
    // file; confirm against the generator template.

    /** Unmasked contiguous store of this vector into a, starting at offset. */
    @ForceInline
    final
    void intoArray0Template(byte[] a, int offset) {
        ByteSpecies vsp = vspecies();
        VectorSupport.store(
            vsp.vectorType(), vsp.elementType(), vsp.laneCount(),
            a, arrayAddress(a, offset), false,
            this, a, offset,
            // Plain-Java equivalent: write lane i to arr_[off_ + i].
            (arr, off, v)
            -> v.stOp(arr, (int) off,
                      (arr_, off_, i, e) -> arr_[off_+i] = e));
    }

    abstract
    void intoArray0(byte[] a, int offset, VectorMask m);

    /** Masked contiguous store of this vector into a, starting at offset. */
    @ForceInline
    final
    >
    void intoArray0Template(Class maskClass, byte[] a, int offset, M m) {
        m.check(species());  // presumably rejects a mask of a different species
        ByteSpecies vsp = vspecies();
        VectorSupport.storeMasked(
            vsp.vectorType(), maskClass, vsp.elementType(), vsp.laneCount(),
            a, arrayAddress(a, offset), false,
            this, m, a, offset,
            (arr, off, v, vm)
            -> v.stOp(arr, (int) off, vm,
                      (arr_, off_, i, e) -> arr_[off_ + i] = e));
    }

    abstract
    void intoBooleanArray0(boolean[] a, int offset, VectorMask m);

    /** Masked contiguous store into a boolean[]; each lane is reduced to its low bit. */
    @ForceInline
    final
    >
    void intoBooleanArray0Template(Class maskClass, boolean[] a, int offset, M m) {
        m.check(species());
        ByteSpecies vsp = vspecies();
        // Keep only the low bit so every lane handed to the store is 0 or 1.
        ByteVector normalized = this.and((byte) 1);
        VectorSupport.storeMasked(
            vsp.vectorType(), maskClass, vsp.elementType(), vsp.laneCount(),
            a, booleanArrayAddress(a, offset), false,
            normalized, m, a, offset,
            (arr, off, v, vm)
            -> v.stOp(arr, (int) off, vm,
                      (arr_, off_, i, e) -> arr_[off_ + i] = (e & 1) != 0));
    }

    /** Unmasked store of this vector into a memory segment, starting at byte offset. */
    @ForceInline
    final
    void intoMemorySegment0(MemorySegment ms, long offset) {
        ByteSpecies vsp = vspecies();
        ScopedMemoryAccess.storeIntoMemorySegment(
                vsp.vectorType(), vsp.elementType(), vsp.laneCount(),
                this,
                (AbstractMemorySegmentImpl) ms, offset,
                (msp, off, v) -> {
                    v.stLongOp((MemorySegment) msp, off, ByteVector::memorySegmentSet);
                });
    }

    abstract
    void intoMemorySegment0(MemorySegment bb, long offset, VectorMask m);

    /** Masked store of this vector into a memory segment, starting at byte offset. */
    @ForceInline
    final
    >
    void intoMemorySegment0Template(Class maskClass, MemorySegment ms, long offset, M m) {
        ByteSpecies vsp = vspecies();
        m.check(vsp);
        ScopedMemoryAccess.storeIntoMemorySegmentMasked(
                vsp.vectorType(), maskClass, vsp.elementType(), vsp.laneCount(),
                this, m,
                (AbstractMemorySegmentImpl) ms, offset,
                (msp, off, v, vm) -> {
                    v.stLongOp((MemorySegment) msp, off, vm, ByteVector::memorySegmentSet);
                });
    }


    // End of low-level memory operations.

    // Throws AssertionError when a store of laneCount() lanes of size scale,
    // starting at offset, would fall outside [0, limit); otherwise does nothing.
    // NOTE(review): no caller is visible in this part of the file.
    @ForceInline
    private void conditionalStoreNYI(int offset,
                                     ByteSpecies vsp,
                                     VectorMask m,
                                     int scale,
                                     int limit) {
        if (offset < 0 || offset + vsp.laneCount() * scale > limit) {
            String msg =
                String.format("unimplemented: store @%d in [0..%d), %s in %s",
                              offset, limit, m, vsp);
            throw new AssertionError(msg);
        }
    }

    // Byte-order hook: returns this vector unchanged, whatever bo is.
    /*package-private*/
    @Override
    @ForceInline
    final
    ByteVector maybeSwap(ByteOrder bo) {
        return this;
    }

    // log2 of the byte[] index scale, so that (index << ARRAY_SHIFT) is a byte offset.
    static final int ARRAY_SHIFT =
        31 - Integer.numberOfLeadingZeros(Unsafe.ARRAY_BYTE_INDEX_SCALE);
    static final long ARRAY_BASE =
        Unsafe.ARRAY_BYTE_BASE_OFFSET;

    // Offset of element index within a byte[] (base offset plus scaled index).
    // The array argument itself is not read.
    @ForceInline
    static long arrayAddress(byte[] a, int index) {
        return ARRAY_BASE + (((long)index) << ARRAY_SHIFT);
    }

    // Same computation as above, using the boolean[] base offset and index scale.
    static final int ARRAY_BOOLEAN_SHIFT =
            31 - Integer.numberOfLeadingZeros(Unsafe.ARRAY_BOOLEAN_INDEX_SCALE);
    static final long ARRAY_BOOLEAN_BASE =
            Unsafe.ARRAY_BOOLEAN_BASE_OFFSET;

    @ForceInline
    static long booleanArrayAddress(boolean[] a, int index) {
        return ARRAY_BOOLEAN_BASE + (((long)index) << ARRAY_BOOLEAN_SHIFT);
    }

    // Byte offset of index within a byte[], without applying ARRAY_SHIFT.
    @ForceInline
    static long byteArrayAddress(byte[] a, int index) {
        return Unsafe.ARRAY_BYTE_BASE_OFFSET + index;
    }

    // ================================================

    /// Reinterpreting view methods:
    //   lanewise reinterpret: viewAsXVector()
    //   keep shape, redraw lanes: reinterpretAsEs()

    /**
     * {@inheritDoc}
     */
    @ForceInline
    @Override
    public final ByteVector reinterpretAsBytes() {
        // Already a vector of bytes: nothing to reinterpret.
        return this;
    }

    /**
     * {@inheritDoc}
     */
    @ForceInline
    @Override
    public final ByteVector viewAsIntegralLanes() {
        // byte is already an integral lane type.
        return this;
    }

    /**
     * {@inheritDoc}
     *
     * @implNote This method always throws
     * {@code UnsupportedOperationException}, because there is no floating
     * point type of the same size as {@code byte}.  The return type
     * of this method is arbitrarily designated as
     * {@code Vector}.
Future versions of this API may change the return * type if additional floating point types become available. */ @ForceInline @Override public final Vector viewAsFloatingLanes() { LaneType flt = LaneType.BYTE.asFloating(); // asFloating() will throw UnsupportedOperationException for the unsupported type byte throw new AssertionError("Cannot reach here"); } // ================================================ /// Object methods: toString, equals, hashCode // // Object methods are defined as if via Arrays.toString, etc., // is applied to the array of elements. Two equal vectors // are required to have equal species and equal lane values. /** * Returns a string representation of this vector, of the form * {@code "[0,1,2...]"}, reporting the lane values of this vector, * in lane order. * * The string is produced as if by a call to {@link * java.util.Arrays#toString(byte[]) Arrays.toString()}, * as appropriate to the {@code byte} array returned by * {@link #toArray this.toArray()}. * * @return a string of the form {@code "[0,1,2...]"} * reporting the lane values of this vector */ @Override @ForceInline public final String toString() { // now that toArray is strongly typed, we can define this return Arrays.toString(toArray()); } /** * {@inheritDoc} */ @Override @ForceInline public final boolean equals(Object obj) { if (obj instanceof Vector) { Vector that = (Vector) obj; if (this.species().equals(that.species())) { return this.eq(that.check(this.species())).allTrue(); } } return false; } /** * {@inheritDoc} */ @Override @ForceInline public final int hashCode() { // now that toArray is strongly typed, we can define this return Objects.hash(species(), Arrays.hashCode(toArray())); } // ================================================ // Species /** * Class representing {@link ByteVector}'s of the same {@link VectorShape VectorShape}. 
*/
    /*package-private*/
    static final class ByteSpecies extends AbstractSpecies {
        // NOTE(review): several signatures in this class use a type name M, or
        // carry a stray '>' (e.g. "Class> maskType"), with no visible
        // type-parameter declaration -- the generic headers look truncated in
        // this copy of the file; confirm against the generator template.
        private ByteSpecies(VectorShape shape,
                Class vectorType,
                Class> maskType,
                Class> shuffleType,
                Function vectorFactory) {
            super(shape, LaneType.of(byte.class),
                  vectorType, maskType, shuffleType,
                  vectorFactory);
            // Sanity check: lanes of this species are exactly Byte.SIZE bits wide.
            assert(this.elementSize() == Byte.SIZE);
        }

        // Specializing overrides:

        @Override
        @ForceInline
        public final Class elementType() {
            return byte.class;
        }

        @Override
        @ForceInline
        final Class genericElementType() {
            return Byte.class;
        }

        @SuppressWarnings("unchecked")
        @Override
        @ForceInline
        public final Class vectorType() {
            return (Class) vectorType;
        }

        @Override
        @ForceInline
        public final long checkValue(long e) {
            longToElementBits(e);  // only for exception
            return e;
        }

        /*package-private*/
        @Override
        @ForceInline
        final ByteVector broadcastBits(long bits) {
            return (ByteVector)
                VectorSupport.fromBitsCoerced(
                    vectorType, byte.class, laneCount,
                    bits, MODE_BROADCAST, this,
                    // Plain-Java equivalent: every lane receives the same bits.
                    (bits_, s_) -> s_.rvOp(i -> bits_));
        }

        /*package-private*/
        @ForceInline
        final ByteVector broadcast(byte e) {
            return broadcastBits(toBits(e));
        }

        @Override
        @ForceInline
        public final ByteVector broadcast(long e) {
            // longToElementBits throws if e does not fit in a byte.
            return broadcastBits(longToElementBits(e));
        }

        /*package-private*/
        final @Override
        @ForceInline
        long longToElementBits(long value) {
            // Do the conversion, and then test it for failure.
            byte e = (byte) value;
            if ((long) e != value) {
                throw badElementBits(value, e);
            }
            return toBits(e);
        }

        // Widens e to int or long (per convertToInt) and throws, via
        // badArrayBits, if narrowing the result back to byte does not give e.
        /*package-private*/
        @ForceInline
        static long toIntegralChecked(byte e, boolean convertToInt) {
            long value = convertToInt ? (int) e : (long) e;
            if ((byte) value != e) {
                throw badArrayBits(e, convertToInt, value);
            }
            return value;
        }

        /* this non-public one is for internal conversions */
        @Override
        @ForceInline
        final ByteVector fromIntValues(int[] values) {
            VectorIntrinsics.requireLength(values.length, laneCount);
            byte[] va = new byte[laneCount()];
            for (int i = 0; i < va.length; i++) {
                int lv = values[i];
                byte v = (byte) lv;
                va[i] = v;
                // Reject any int that does not survive the narrowing to byte.
                if ((int)v != lv) {
                    throw badElementBits(lv, v);
                }
            }
            return dummyVector().fromArray0(va, 0);
        }

        // Virtual constructors

        @ForceInline
        @Override final
        public ByteVector fromArray(Object a, int offset) {
            // User entry point
            // Defer only to the equivalent method on the vector class, using the same inputs
            return ByteVector
                .fromArray(this, (byte[]) a, offset);
        }

        @ForceInline
        @Override final
        public ByteVector fromMemorySegment(MemorySegment ms, long offset, ByteOrder bo) {
            // User entry point
            // Defer only to the equivalent method on the vector class, using the same inputs
            return ByteVector
                .fromMemorySegment(this, ms, offset, bo);
        }

        @ForceInline
        @Override final
        ByteVector dummyVector() {
            return (ByteVector) super.dummyVector();
        }

        // Builds a vector lane by lane from raw bits: f.apply(i) is narrowed
        // to byte and passed through fromBits.
        /*package-private*/
        final @Override
        @ForceInline
        ByteVector rvOp(RVOp f) {
            byte[] res = new byte[laneCount()];
            for (int i = 0; i < res.length; i++) {
                byte bits = (byte) f.apply(i);
                res[i] = fromBits(bits);
            }
            return dummyVector().vectorFactory(res);
        }

        // Builds a vector whose lane i holds f.apply(i).
        ByteVector vOp(FVOp f) {
            byte[] res = new byte[laneCount()];
            for (int i = 0; i < res.length; i++) {
                res[i] = f.apply(i);
            }
            return dummyVector().vectorFactory(res);
        }

        // Masked variant: f is applied only to lanes set in m; the remaining
        // lanes keep the array's default value of zero.
        ByteVector vOp(VectorMask m, FVOp f) {
            byte[] res = new byte[laneCount()];
            boolean[] mbits = ((AbstractMask)m).getBits();
            for (int i = 0; i < res.length; i++) {
                if (mbits[i]) {
                    res[i] = f.apply(i);
                }
            }
            return dummyVector().vectorFactory(res);
        }

        // The load/store helpers below simply forward to the same-named
        // operation on dummyVector().

        /*package-private*/
        @ForceInline
        ByteVector ldOp(M memory, int offset,
                                      FLdOp f) {
            return dummyVector().ldOp(memory, offset, f);
        }

        /*package-private*/
        @ForceInline
        ByteVector ldOp(M memory, int offset,
                                      VectorMask m,
                                      FLdOp f) {
            return dummyVector().ldOp(memory, offset, m, f);
        }

        /*package-private*/
        @ForceInline
        ByteVector ldLongOp(MemorySegment memory, long offset,
                                      FLdLongOp f) {
            return dummyVector().ldLongOp(memory, offset, f);
        }

        /*package-private*/
        @ForceInline
        ByteVector ldLongOp(MemorySegment memory, long offset,
                                      VectorMask m,
                                      FLdLongOp f) {
            return dummyVector().ldLongOp(memory, offset, m, f);
        }

        /*package-private*/
        @ForceInline
        void stOp(M memory, int offset, FStOp f) {
            dummyVector().stOp(memory, offset, f);
        }

        /*package-private*/
        @ForceInline
        void stOp(M memory, int offset,
                      AbstractMask m,
                      FStOp f) {
            dummyVector().stOp(memory, offset, m, f);
        }

        /*package-private*/
        @ForceInline
        void stLongOp(MemorySegment memory, long offset, FStLongOp f) {
            dummyVector().stLongOp(memory, offset, f);
        }

        /*package-private*/
        @ForceInline
        void stLongOp(MemorySegment memory, long offset,
                      AbstractMask m,
                      FStLongOp f) {
            dummyVector().stLongOp(memory, offset, m, f);
        }

        // N.B. Make sure these constant vectors and
        // masks load up correctly into registers.
        //
        // Also, see if we can avoid all that switching.
        // Could we cache both vectors and both masks in
        // this species object?

        // Zero and iota vector access
        // Dispatch: the Max-shaped species is recognized by its vector class
        // first; every other species is selected by its bit size. A bit size
        // outside the four listed cases falls through to AssertionError.
        @Override
        @ForceInline
        public final ByteVector zero() {
            if ((Class) vectorType() == ByteMaxVector.class)
                return ByteMaxVector.ZERO;
            switch (vectorBitSize()) {
                case 64: return Byte64Vector.ZERO;
                case 128: return Byte128Vector.ZERO;
                case 256: return Byte256Vector.ZERO;
                case 512: return Byte512Vector.ZERO;
            }
            throw new AssertionError();
        }

        @Override
        @ForceInline
        public final ByteVector iota() {
            if ((Class) vectorType() == ByteMaxVector.class)
                return ByteMaxVector.IOTA;
            switch (vectorBitSize()) {
                case 64: return Byte64Vector.IOTA;
                case 128: return Byte128Vector.IOTA;
                case 256: return Byte256Vector.IOTA;
                case 512: return Byte512Vector.IOTA;
            }
            throw new AssertionError();
        }

        // Mask access
        @Override
        @ForceInline
        public final VectorMask maskAll(boolean bit) {
            if ((Class) vectorType() == ByteMaxVector.class)
                return ByteMaxVector.ByteMaxMask.maskAll(bit);
            switch (vectorBitSize()) {
                case 64: return Byte64Vector.Byte64Mask.maskAll(bit);
                case 128: return Byte128Vector.Byte128Mask.maskAll(bit);
                case 256: return Byte256Vector.Byte256Mask.maskAll(bit);
                case 512: return Byte512Vector.Byte512Mask.maskAll(bit);
            }
            throw new AssertionError();
        }
    }

    /**
     * Finds a species for an element type of {@code byte} and shape.
     *
     * @param s the shape
     * @return a species for an element type of {@code byte} and shape
     * @throws IllegalArgumentException if no such species exists for the shape
     */
    static ByteSpecies species(VectorShape s) {
        Objects.requireNonNull(s);
        // Map the shape's switch key onto the matching species constant.
        switch (s.switchKey) {
            case VectorShape.SK_64_BIT: return (ByteSpecies) SPECIES_64;
            case VectorShape.SK_128_BIT: return (ByteSpecies) SPECIES_128;
            case VectorShape.SK_256_BIT: return (ByteSpecies) SPECIES_256;
            case VectorShape.SK_512_BIT: return (ByteSpecies) SPECIES_512;
            case VectorShape.SK_Max_BIT: return (ByteSpecies) SPECIES_MAX;
            default: throw new IllegalArgumentException("Bad shape: " + s);
        }
    }

    /** Species representing {@link ByteVector}s of {@link VectorShape#S_64_BIT VectorShape.S_64_BIT}.
*/
    // Each species constant below ties one VectorShape to its concrete vector
    // class, that class's nested mask and shuffle classes, and the vector
    // class's constructor reference.
    public static final VectorSpecies SPECIES_64
        = new ByteSpecies(VectorShape.S_64_BIT,
                            Byte64Vector.class,
                            Byte64Vector.Byte64Mask.class,
                            Byte64Vector.Byte64Shuffle.class,
                            Byte64Vector::new);

    /** Species representing {@link ByteVector}s of {@link VectorShape#S_128_BIT VectorShape.S_128_BIT}. */
    public static final VectorSpecies SPECIES_128
        = new ByteSpecies(VectorShape.S_128_BIT,
                            Byte128Vector.class,
                            Byte128Vector.Byte128Mask.class,
                            Byte128Vector.Byte128Shuffle.class,
                            Byte128Vector::new);

    /** Species representing {@link ByteVector}s of {@link VectorShape#S_256_BIT VectorShape.S_256_BIT}. */
    public static final VectorSpecies SPECIES_256
        = new ByteSpecies(VectorShape.S_256_BIT,
                            Byte256Vector.class,
                            Byte256Vector.Byte256Mask.class,
                            Byte256Vector.Byte256Shuffle.class,
                            Byte256Vector::new);

    /** Species representing {@link ByteVector}s of {@link VectorShape#S_512_BIT VectorShape.S_512_BIT}. */
    public static final VectorSpecies SPECIES_512
        = new ByteSpecies(VectorShape.S_512_BIT,
                            Byte512Vector.class,
                            Byte512Vector.Byte512Mask.class,
                            Byte512Vector.Byte512Shuffle.class,
                            Byte512Vector::new);

    /** Species representing {@link ByteVector}s of {@link VectorShape#S_Max_BIT VectorShape.S_Max_BIT}. */
    public static final VectorSpecies SPECIES_MAX
        = new ByteSpecies(VectorShape.S_Max_BIT,
                            ByteMaxVector.class,
                            ByteMaxVector.ByteMaxMask.class,
                            ByteMaxVector.ByteMaxShuffle.class,
                            ByteMaxVector::new);

    /**
     * Preferred species for {@link ByteVector}s.
     * A preferred species is a species of maximal bit-size for the platform.
     */
    public static final VectorSpecies SPECIES_PREFERRED
        = (ByteSpecies) VectorSpecies.ofPreferred(byte.class);
}