/*
 * Copyright (c) 1999, 2025, Oracle and/or its affiliates. All rights reserved.
 * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
 *
 * This code is free software; you can redistribute it and/or modify it
 * under the terms of the GNU General Public License version 2 only, as
 * published by the Free Software Foundation.  Oracle designates this
 * particular file as subject to the "Classpath" exception as provided
 * by Oracle in the LICENSE file that accompanied this code.
 *
 * This code is distributed in the hope that it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
 * version 2 for more details (a copy is included in the LICENSE file that
 * accompanied this code).
 *
 * You should have received a copy of the GNU General Public License version
 * 2 along with this work; if not, write to the Free Software Foundation,
 * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA.
 *
 * Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA
 * or visit www.oracle.com if you need additional information or have any
 * questions.
 */

package com.sun.tools.javac.util;

/** Utility class for static conversion methods between numbers
 *  and strings in various formats.
 *
 *  <p>Note regarding UTF-8.
 *  The JVMS defines its own version of the UTF-8 format so that it
 *  contains no zero bytes (modified UTF-8). This is not actually the same
 *  as Charset.forName("UTF-8").
 *
 *  <p>
 *  See also:
 *  <ul>
 *  <li><a href="http://docs.oracle.com/javase/specs/jvms/se7/html/jvms-4.html#jvms-4.4.7">
 *    JVMS 4.4.7 </a></li>
 *  <li><a href="http://docs.oracle.com/javase/7/docs/api/java/io/DataInput.html#modified-utf-8">
      java.io.DataInput: Modified UTF-8 </a></li>
    <li><a href="https://en.wikipedia.org/wiki/UTF-8#Modified_UTF-8">
      Modified UTF-8 (Wikipedia) </a></li>
 *  </ul>
 *
 *  The methods here support modified UTF-8.
 *
 *  <p><b>This is NOT part of any supported API.
 *  If you write code that depends on this, you do so at your own risk.
 *  This code and its internal interfaces are subject to change or
 *  deletion without notice.</b>
 */
public class Convert {

    /** Convert string to integer.
     */
    public static int string2int(String s, int radix)
        throws NumberFormatException {
        if (radix == 10) {
            return Integer.parseInt(s, radix);
        } else {
            char[] cs = s.toCharArray();
            int limit = Integer.MAX_VALUE / (radix/2);
            int n = 0;
            for (char c : cs) {
                int d = Character.digit(c, radix);
                if (n < 0 ||
                    n > limit ||
                    n * radix > Integer.MAX_VALUE - d)
                    throw new NumberFormatException();
                n = n * radix + d;
            }
            return n;
        }
    }

    /** Convert string to long integer.
     */
    public static long string2long(String s, int radix)
        throws NumberFormatException {
        if (radix == 10) {
            return Long.parseLong(s, radix);
        } else {
            char[] cs = s.toCharArray();
            long limit = Long.MAX_VALUE / (radix/2);
            long n = 0;
            for (char c : cs) {
                int d = Character.digit(c, radix);
                if (n < 0 ||
                    n > limit ||
                    n * radix > Long.MAX_VALUE - d)
                    throw new NumberFormatException();
                n = n * radix + d;
            }
            return n;
        }
    }

/* Conversion routines between names, strings, and byte arrays in Utf8 format
 */

    /** Validate the given Modified UTF-8 encoding using the given validation level.
     *  Reject invalid data by throwing an {@link InvalidUtfException}.
     *  Note: there is no point in calling this method with {@link Validation#NONE}.
     *  @param buf        Buffer containing data
     *  @param off        Data starting offset
     *  @param len        Data length
     *  @param validation Level of validation
     *  @throws InvalidUtfException if {@code validation} is not {@link Validation#NONE}
     *      and invalid Modified UTF-8 is encountered
     */
    public static void utfValidate(byte[] buf, int off, int len, Validation validation) throws InvalidUtfException {
        utf2chars(buf, off, null, 0, len, validation);
    }

    /** Decode characters encoded in Modified UTF-8 encoding using the given validation level.
     *  Reject any invalid data by throwing an {@link InvalidUtfException}.
     *  Parameters are as in System.arraycopy():
     *  @param src        The array holding the bytes to convert.
     *  @param soff       The start index from which bytes are converted.
     *  @param dst        The array holding the converted characters,
     *                    or null to just validate
     *  @param doff       The start index from which converted characters
     *                    are written.
     *  @param len        The maximum number of bytes to convert.
     *  @param validation Level of validation
     *  @throws InvalidUtfException if invalid Modified UTF-8 is encountered
     *  @return the index in {@code dst} just after the last copied char
     *  @throws InvalidUtfException if {@code validation} is not {@link Validation#NONE}
     *      and invalid Modified UTF-8 is encountered
     */
    public static int utf2chars(byte[] src, int soff, char[] dst, int doff, int len, Validation validation)
      throws InvalidUtfException {
        final int doff0 = doff;
        while (len-- > 0) {
            final int soff0 = soff;
            int value = src[soff++];
            if (value < 0) {
                if ((value & 0xe0) == 0xc0) {
                    int value2;
                    if (len-- > 0)
                        value2 = src[soff++];
                    else if (validation.allowAnything())
                        value2 = 0;
                    else
                        throw new InvalidUtfException(soff0);
                    if (!validation.allowAnything() && (value2 & 0xc0) != 0x80)
                        throw new InvalidUtfException(soff0);
                    value = ((value & 0x1f) << 6) | (value2 & 0x3f);
                    if (!validation.allowLongEncoding() && (value & ~0x7f) == 0 && value != 0)
                        throw new InvalidUtfException(soff0);   // could have been one byte
                } else if ((value & 0xf0) == 0xe0) {
                    int value2;
                    int value3;
                    if ((len -= 2) >= 0) {
                        value2 = src[soff++];
                        value3 = src[soff++];
                    } else if (validation.allowAnything()) {
                        value2 = 0;
                        value3 = 0;
                    } else
                        throw new InvalidUtfException(soff0);
                    if (!validation.allowAnything() && ((value2 & 0xc0) != 0x80 || (value3 & 0xc0) != 0x80))
                        throw new InvalidUtfException(soff0);
                    value = ((value & 0x0f) << 12) | ((value2 & 0x3f) << 6) | (value3 & 0x3f);
                    if (!validation.allowLongEncoding() && (value & ~0x7ff) == 0)
                        throw new InvalidUtfException(soff0);   // could have been two bytes
                } else if (validation.allowAnything())
                    value &= 0xff;
                else
                    throw new InvalidUtfException(soff0);
            } else if (!validation.allowSingleByteNul() && value == 0)
                throw new InvalidUtfException(soff0);           // 0x0000 must be encoded as two bytes
            if (dst != null)
                dst[doff] = (char)value;
            doff++;
        }
        return doff - doff0;
    }

    /** Decode characters encoded in Modified UTF-8 encoding.
     *  @param src        The array holding the bytes.
     *  @param sindex     The start index from which bytes are converted.
     *  @param len        The maximum number of bytes to convert.
     *  @param validation Level of validation
     *  @return           The decoded characters in an array.
     *  @throws InvalidUtfException if {@code validation} is not {@link Validation#NONE}
     *      and invalid Modified UTF-8 is encountered
     */
    public static char[] utf2chars(byte[] src, int sindex, int len, Validation validation)
      throws InvalidUtfException {
        char[] dst = new char[len];
        int len1 = utf2chars(src, sindex, dst, 0, len, validation);
        if (len1 == len)
            return dst;
        char[] result = new char[len1];
        System.arraycopy(dst, 0, result, 0, len1);
        return result;
    }

    /** Decode a {@link String} encoded in Modified UTF-8 encoding.
     *  @param src        The array holding the bytes.
     *  @param sindex     The start index from which bytes are converted.
     *  @param len        The maximum number of bytes to convert.
     *  @param validation Level of validation
     *  @throws InvalidUtfException if {@code validation} is not {@link Validation#NONE}
     *      and invalid Modified UTF-8 is encountered
     */
    public static String utf2string(byte[] src, int sindex, int len, Validation validation)
      throws InvalidUtfException {
        char dst[] = new char[len];
        int len1 = utf2chars(src, sindex, dst, 0, len, validation);
        return new String(dst, 0, len1);
    }

    /** Count the number of characters encoded in a Modified UTF-8 encoding.
     *  This method does not check for invalid data.
     *  @param buf data buffer
     *  @param off starting offset of UTF-8 data
     *  @param len number of bytes of UTF-8 data
     *  @return the number of encoded characters
     */
    public static int utfNumChars(byte[] buf, int off, int len) {
        int numChars = 0;
        while (len-- > 0) {
            if ((buf[off++] & 0xc0) != 0x80)
                numChars++;
        }
        return numChars;
    }

    /** Copy characters in source array to bytes in target array,
     *  converting them to Utf8 representation.
     *  The target array must be large enough to hold the result.
     *  returns first index in `dst' past the last copied byte.
     *  @param src        The array holding the characters to convert.
     *  @param sindex     The start index from which characters are converted.
     *  @param dst        The array holding the converted characters..
     *  @param dindex     The start index from which converted bytes
     *                    are written.
     *  @param len        The maximum number of characters to convert.
     */
    public static int chars2utf(char[] src, int sindex,
                                byte[] dst, int dindex,
                                int len) {
        int j = dindex;
        int limit = sindex + len;
        for (int i = sindex; i < limit; i++) {
            char ch = src[i];
            if (1 <= ch && ch <= 0x7F) {
                dst[j++] = (byte)ch;
            } else if (ch <= 0x7FF) {
                dst[j++] = (byte)(0xC0 | (ch >> 6));
                dst[j++] = (byte)(0x80 | (ch & 0x3F));
            } else {
                dst[j++] = (byte)(0xE0 | (ch >> 12));
                dst[j++] = (byte)(0x80 | ((ch >> 6) & 0x3F));
                dst[j++] = (byte)(0x80 | (ch & 0x3F));
            }
        }
        return j;
    }

    /** Return characters as an array of bytes in Utf8 representation.
     *  @param src        The array holding the characters.
     *  @param sindex     The start index from which characters are converted.
     *  @param len        The maximum number of characters to convert.
     */
    public static byte[] chars2utf(char[] src, int sindex, int len) {
        byte[] dst = new byte[len * 3];
        int len1 = chars2utf(src, sindex, dst, 0, len);
        byte[] result = new byte[len1];
        System.arraycopy(dst, 0, result, 0, len1);
        return result;
    }

    /** Return all characters in given array as an array of bytes
     *  in Utf8 representation.
     *  @param src        The array holding the characters.
     */
    public static byte[] chars2utf(char[] src) {
        return chars2utf(src, 0, src.length);
    }

    /** Return string as an array of bytes in in Utf8 representation.
     */
    public static byte[] string2utf(String s) {
        return chars2utf(s.toCharArray());
    }

    /**
     * Escapes each character in a string that has an escape sequence or
     * is non-printable ASCII.  Leaves non-ASCII characters alone.
     */
    public static String quote(String s) {
        StringBuilder buf = new StringBuilder();
        for (int i = 0; i < s.length(); i++) {
            buf.append(quote(s.charAt(i), false));
        }
        return buf.toString();
    }

    /**
     * Escapes a character if it has an escape sequence or is
     * non-printable ASCII.  Leaves non-ASCII characters alone.
     */
    public static String quote(char ch, boolean charContext) {
        /*
         * In a char context, single quote (') must be escaped and
         * double quote (") need not be escaped. In a non-char
         * context, in other words a string context, the reverse is
         * true.
         */
        switch (ch) {
        case '\b':  return "\\b";
        case '\f':  return "\\f";
        case '\n':  return "\\n";
        case '\r':  return "\\r";
        case '\t':  return "\\t";
        case '\'':  return (charContext ? "\\'" : "'");
        case '\"':  return (charContext ? "\""  : "\\\"");
        case '\\':  return "\\\\";
        default:
            return (isPrintableAscii(ch))
                ? String.valueOf(ch)
                : String.format("\\u%04x", (int) ch);
        }
    }

    /**
     * Is a character printable ASCII?
     */
    private static boolean isPrintableAscii(char ch) {
        return ch >= ' ' && ch <= '~';
    }

    /** Escape all unicode characters in string.
     */
    public static String escapeUnicode(String s) {
        int len = s.length();
        int i = 0;
        while (i < len) {
            char ch = s.charAt(i);
            if (ch > 255) {
                StringBuilder buf = new StringBuilder();
                buf.append(s.substring(0, i));
                while (i < len) {
                    ch = s.charAt(i);
                    if (ch > 255) {
                        buf.append("\\u");
                        buf.append(Character.forDigit((ch >> 12) % 16, 16));
                        buf.append(Character.forDigit((ch >>  8) % 16, 16));
                        buf.append(Character.forDigit((ch >>  4) % 16, 16));
                        buf.append(Character.forDigit((ch      ) % 16, 16));
                    } else {
                        buf.append(ch);
                    }
                    i++;
                }
                s = buf.toString();
            } else {
                i++;
            }
        }
        return s;
    }

/* Conversion routines for qualified name splitting
 */

    /** Return the last part of a qualified name.
     *  @param name the qualified name
     *  @return the last part of the qualified name
     */
    public static Name shortName(Name name) {
        int start = name.lastIndexOfAscii('.') + 1;
        return start > 0 ? name.subName(start) : name;
    }

    /** Return the last part of a qualified name from its string representation
     *  @param name the string representation of the qualified name
     *  @return the last part of the qualified name
     */
    public static String shortName(String name) {
        return name.substring(name.lastIndexOf('.') + 1);
    }

    /** Return the package name of a class name, excluding the trailing '.',
     *  "" if not existent.
     */
    public static Name packagePart(Name classname) {
        int end = Math.max(classname.lastIndexOfAscii('.'), 0);
        return classname.subName(0, end);
    }

    public static String packagePart(String classname) {
        int lastDot = classname.lastIndexOf('.');
        return (lastDot < 0 ? "" : classname.substring(0, lastDot));
    }

    public static List<Name> enclosingCandidates(Name name) {
        List<Name> names = List.nil();
        int index;
        while ((index = name.lastIndexOfAscii('$')) > 0) {
            name = name.subName(0, index);
            names = names.prepend(name);
        }
        return names;
    }

    public static List<Name> classCandidates(Name name) {
        List<Name> names = List.nil();
        String nameStr = name.toString();
        int index = -1;
        while ((index = nameStr.indexOf('.', index + 1)) > 0) {
            String pack = nameStr.substring(0, index + 1);
            String clz = nameStr.substring(index + 1).replace('.', '$');
            names = names.prepend(name.table.names.fromString(pack + clz));
        }
        return names.reverse();
    }

    /**
     * Modified UTF-8 decoding validation levels.
     */
    public enum Validation {

        /**
         * Do zero validation of UTF-8, i.e., always decode something without error.
         * When this is used, {@link InvalidUtfException} is never thrown.
         */
        NONE(true, true, true),

        /**
         * Do validation in accordance with the pre-JDK 1.4 Java class file format,
         * which allows (a) the NUL character {@code &#92;u0000} to be encoded as a single byte
         * and (b) longer-than-necessary encodings (e.g., three bytes instead of two).
         */
        PREJDK14(true, true, false),

        /**
         * Do strict validation. At this level, each character has only one valid encoding.
         */
        STRICT(false, false, false);

        private final boolean allowSingleByteNul;
        private final boolean allowLongEncoding;
        private final boolean allowAnything;

        private Validation(boolean allowSingleByteNul, boolean allowLongEncoding, boolean allowAnything) {
            this.allowSingleByteNul = allowSingleByteNul;
            this.allowLongEncoding = allowLongEncoding;
            this.allowAnything = allowAnything;
        }

        /**
         * Whether to allow the NUL character {@code &#92;u0000} to be encoded as a single byte.
         * Modified UTF-8 specifies that it be encoded in two bytes.
         */
        public boolean allowSingleByteNul() {
            return allowSingleByteNul;
        }

        /**
         * Whether to allow characters to be encoded using more bytes than required.
         */
        public boolean allowLongEncoding() {
            return allowLongEncoding;
        }

        /**
         * Whether to allow anything, including truncated characters and bogus flag bits.
         */
        public boolean allowAnything() {
            return allowAnything;
        }
    }
}
