/*
 * Copyright (c) 1999, 2013, Oracle and/or its affiliates. All rights reserved.
 * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
 *
 * This code is free software; you can redistribute it and/or modify it
 * under the terms of the GNU General Public License version 2 only, as
 * published by the Free Software Foundation. Oracle designates this
 * particular file as subject to the "Classpath" exception as provided
 * by Oracle in the LICENSE file that accompanied this code.
 *
 * This code is distributed in the hope that it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
 * version 2 for more details (a copy is included in the LICENSE file that
 * accompanied this code).
 *
 * You should have received a copy of the GNU General Public License version
 * 2 along with this work; if not, write to the Free Software Foundation,
 * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA.
 *
 * Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA
 * or visit www.oracle.com if you need additional information or have any
 * questions.
 */
|
|
|
|
package com.sun.tools.javac.util;
|
|
|
|
/** Utility class for static conversion methods between numbers
 *  and strings in various formats.
 *
 *  <p>Note regarding UTF-8.
 *  The JVMS defines its own version of the UTF-8 format so that it
 *  contains no zero bytes (modified UTF-8). This is not actually the same
 *  as Charset.forName("UTF-8").
 *
 *  <p>
 *  See also:
 *  <ul>
 *  <li><a href="https://docs.oracle.com/javase/specs/jvms/se7/html/jvms-4.html#jvms-4.4.7">
 *    JVMS 4.4.7 </a></li>
 *  <li><a href="https://docs.oracle.com/javase/7/docs/api/java/io/DataInput.html#modified-utf-8">
 *    java.io.DataInput: Modified UTF-8 </a></li>
 *  <li><a href="https://en.wikipedia.org/wiki/UTF-8#Modified_UTF-8">
 *    Modified UTF-8 (wikipedia) </a></li>
 *  </ul>
 *
 *  The methods here support modified UTF-8.
 *
 *  <p><b>This is NOT part of any supported API.
 *  If you write code that depends on this, you do so at your own risk.
 *  This code and its internal interfaces are subject to change or
 *  deletion without notice.</b>
 */
|
|
public class Convert {
|
|
|
|
/** Convert string to integer.
|
|
*/
|
|
public static int string2int(String s, int radix)
|
|
throws NumberFormatException {
|
|
if (radix == 10) {
|
|
return Integer.parseInt(s, radix);
|
|
} else {
|
|
char[] cs = s.toCharArray();
|
|
int limit = Integer.MAX_VALUE / (radix/2);
|
|
int n = 0;
|
|
for (int i = 0; i < cs.length; i++) {
|
|
int d = Character.digit(cs[i], radix);
|
|
if (n < 0 ||
|
|
n > limit ||
|
|
n * radix > Integer.MAX_VALUE - d)
|
|
throw new NumberFormatException();
|
|
n = n * radix + d;
|
|
}
|
|
return n;
|
|
}
|
|
}
|
|
|
|
/** Convert string to long integer.
|
|
*/
|
|
public static long string2long(String s, int radix)
|
|
throws NumberFormatException {
|
|
if (radix == 10) {
|
|
return Long.parseLong(s, radix);
|
|
} else {
|
|
char[] cs = s.toCharArray();
|
|
long limit = Long.MAX_VALUE / (radix/2);
|
|
long n = 0;
|
|
for (int i = 0; i < cs.length; i++) {
|
|
int d = Character.digit(cs[i], radix);
|
|
if (n < 0 ||
|
|
n > limit ||
|
|
n * radix > Long.MAX_VALUE - d)
|
|
throw new NumberFormatException();
|
|
n = n * radix + d;
|
|
}
|
|
return n;
|
|
}
|
|
}
|
|
|
|
/* Conversion routines between names, strings, and byte arrays in Utf8 format
 */
|
|
|
|
/** Convert `len' bytes from utf8 to characters.
|
|
* Parameters are as in System.arraycopy
|
|
* Return first index in `dst' past the last copied char.
|
|
* @param src The array holding the bytes to convert.
|
|
* @param sindex The start index from which bytes are converted.
|
|
* @param dst The array holding the converted characters..
|
|
* @param dindex The start index from which converted characters
|
|
* are written.
|
|
* @param len The maximum number of bytes to convert.
|
|
*/
|
|
public static int utf2chars(byte[] src, int sindex,
|
|
char[] dst, int dindex,
|
|
int len) {
|
|
int i = sindex;
|
|
int j = dindex;
|
|
int limit = sindex + len;
|
|
while (i < limit) {
|
|
int b = src[i++] & 0xFF;
|
|
if (b >= 0xE0) {
|
|
b = (b & 0x0F) << 12;
|
|
b = b | (src[i++] & 0x3F) << 6;
|
|
b = b | (src[i++] & 0x3F);
|
|
} else if (b >= 0xC0) {
|
|
b = (b & 0x1F) << 6;
|
|
b = b | (src[i++] & 0x3F);
|
|
}
|
|
dst[j++] = (char)b;
|
|
}
|
|
return j;
|
|
}
|
|
|
|
/** Return bytes in Utf8 representation as an array of characters.
|
|
* @param src The array holding the bytes.
|
|
* @param sindex The start index from which bytes are converted.
|
|
* @param len The maximum number of bytes to convert.
|
|
*/
|
|
public static char[] utf2chars(byte[] src, int sindex, int len) {
|
|
char[] dst = new char[len];
|
|
int len1 = utf2chars(src, sindex, dst, 0, len);
|
|
char[] result = new char[len1];
|
|
System.arraycopy(dst, 0, result, 0, len1);
|
|
return result;
|
|
}
|
|
|
|
/** Return all bytes of a given array in Utf8 representation
|
|
* as an array of characters.
|
|
* @param src The array holding the bytes.
|
|
*/
|
|
public static char[] utf2chars(byte[] src) {
|
|
return utf2chars(src, 0, src.length);
|
|
}
|
|
|
|
/** Return bytes in Utf8 representation as a string.
|
|
* @param src The array holding the bytes.
|
|
* @param sindex The start index from which bytes are converted.
|
|
* @param len The maximum number of bytes to convert.
|
|
*/
|
|
public static String utf2string(byte[] src, int sindex, int len) {
|
|
char dst[] = new char[len];
|
|
int len1 = utf2chars(src, sindex, dst, 0, len);
|
|
return new String(dst, 0, len1);
|
|
}
|
|
|
|
/** Return all bytes of a given array in Utf8 representation
|
|
* as a string.
|
|
* @param src The array holding the bytes.
|
|
*/
|
|
public static String utf2string(byte[] src) {
|
|
return utf2string(src, 0, src.length);
|
|
}
|
|
|
|
/** Copy characters in source array to bytes in target array,
|
|
* converting them to Utf8 representation.
|
|
* The target array must be large enough to hold the result.
|
|
* returns first index in `dst' past the last copied byte.
|
|
* @param src The array holding the characters to convert.
|
|
* @param sindex The start index from which characters are converted.
|
|
* @param dst The array holding the converted characters..
|
|
* @param dindex The start index from which converted bytes
|
|
* are written.
|
|
* @param len The maximum number of characters to convert.
|
|
*/
|
|
public static int chars2utf(char[] src, int sindex,
|
|
byte[] dst, int dindex,
|
|
int len) {
|
|
int j = dindex;
|
|
int limit = sindex + len;
|
|
for (int i = sindex; i < limit; i++) {
|
|
char ch = src[i];
|
|
if (1 <= ch && ch <= 0x7F) {
|
|
dst[j++] = (byte)ch;
|
|
} else if (ch <= 0x7FF) {
|
|
dst[j++] = (byte)(0xC0 | (ch >> 6));
|
|
dst[j++] = (byte)(0x80 | (ch & 0x3F));
|
|
} else {
|
|
dst[j++] = (byte)(0xE0 | (ch >> 12));
|
|
dst[j++] = (byte)(0x80 | ((ch >> 6) & 0x3F));
|
|
dst[j++] = (byte)(0x80 | (ch & 0x3F));
|
|
}
|
|
}
|
|
return j;
|
|
}
|
|
|
|
/** Return characters as an array of bytes in Utf8 representation.
|
|
* @param src The array holding the characters.
|
|
* @param sindex The start index from which characters are converted.
|
|
* @param len The maximum number of characters to convert.
|
|
*/
|
|
public static byte[] chars2utf(char[] src, int sindex, int len) {
|
|
byte[] dst = new byte[len * 3];
|
|
int len1 = chars2utf(src, sindex, dst, 0, len);
|
|
byte[] result = new byte[len1];
|
|
System.arraycopy(dst, 0, result, 0, len1);
|
|
return result;
|
|
}
|
|
|
|
/** Return all characters in given array as an array of bytes
|
|
* in Utf8 representation.
|
|
* @param src The array holding the characters.
|
|
*/
|
|
public static byte[] chars2utf(char[] src) {
|
|
return chars2utf(src, 0, src.length);
|
|
}
|
|
|
|
/** Return string as an array of bytes in in Utf8 representation.
|
|
*/
|
|
public static byte[] string2utf(String s) {
|
|
return chars2utf(s.toCharArray());
|
|
}
|
|
|
|
/**
|
|
* Escapes each character in a string that has an escape sequence or
|
|
* is non-printable ASCII. Leaves non-ASCII characters alone.
|
|
*/
|
|
public static String quote(String s) {
|
|
StringBuilder buf = new StringBuilder();
|
|
for (int i = 0; i < s.length(); i++) {
|
|
buf.append(quote(s.charAt(i)));
|
|
}
|
|
return buf.toString();
|
|
}
|
|
|
|
/**
|
|
* Escapes a character if it has an escape sequence or is
|
|
* non-printable ASCII. Leaves non-ASCII characters alone.
|
|
*/
|
|
public static String quote(char ch) {
|
|
switch (ch) {
|
|
case '\b': return "\\b";
|
|
case '\f': return "\\f";
|
|
case '\n': return "\\n";
|
|
case '\r': return "\\r";
|
|
case '\t': return "\\t";
|
|
case '\'': return "\\'";
|
|
case '\"': return "\\\"";
|
|
case '\\': return "\\\\";
|
|
default:
|
|
return (isPrintableAscii(ch))
|
|
? String.valueOf(ch)
|
|
: String.format("\\u%04x", (int) ch);
|
|
}
|
|
}
|
|
|
|
/**
|
|
* Is a character printable ASCII?
|
|
*/
|
|
private static boolean isPrintableAscii(char ch) {
|
|
return ch >= ' ' && ch <= '~';
|
|
}
|
|
|
|
/** Escape all unicode characters in string.
|
|
*/
|
|
public static String escapeUnicode(String s) {
|
|
int len = s.length();
|
|
int i = 0;
|
|
while (i < len) {
|
|
char ch = s.charAt(i);
|
|
if (ch > 255) {
|
|
StringBuilder buf = new StringBuilder();
|
|
buf.append(s.substring(0, i));
|
|
while (i < len) {
|
|
ch = s.charAt(i);
|
|
if (ch > 255) {
|
|
buf.append("\\u");
|
|
buf.append(Character.forDigit((ch >> 12) % 16, 16));
|
|
buf.append(Character.forDigit((ch >> 8) % 16, 16));
|
|
buf.append(Character.forDigit((ch >> 4) % 16, 16));
|
|
buf.append(Character.forDigit((ch ) % 16, 16));
|
|
} else {
|
|
buf.append(ch);
|
|
}
|
|
i++;
|
|
}
|
|
s = buf.toString();
|
|
} else {
|
|
i++;
|
|
}
|
|
}
|
|
return s;
|
|
}
|
|
|
|
/* Conversion routines for qualified name splitting
 */
|
|
/** Return the last part of a class name.
|
|
*/
|
|
public static Name shortName(Name classname) {
|
|
return classname.subName(
|
|
classname.lastIndexOf((byte)'.') + 1, classname.getByteLength());
|
|
}
|
|
|
|
public static String shortName(String classname) {
|
|
return classname.substring(classname.lastIndexOf('.') + 1);
|
|
}
|
|
|
|
/** Return the package name of a class name, excluding the trailing '.',
|
|
* "" if not existent.
|
|
*/
|
|
public static Name packagePart(Name classname) {
|
|
return classname.subName(0, classname.lastIndexOf((byte)'.'));
|
|
}
|
|
|
|
public static String packagePart(String classname) {
|
|
int lastDot = classname.lastIndexOf('.');
|
|
return (lastDot < 0 ? "" : classname.substring(0, lastDot));
|
|
}
|
|
|
|
public static List<Name> enclosingCandidates(Name name) {
|
|
List<Name> names = List.nil();
|
|
int index;
|
|
while ((index = name.lastIndexOf((byte)'$')) > 0) {
|
|
name = name.subName(0, index);
|
|
names = names.prepend(name);
|
|
}
|
|
return names;
|
|
}
|
|
}
|