blob: 9bf3ad3988c7bc2b711f595ea1d940f0ef96310d [file] [log] [blame]
/*
* Licensed to the Apache Software Foundation (ASF) under one
* or more contributor license agreements. See the NOTICE file
* distributed with this work for additional information
* regarding copyright ownership. The ASF licenses this file
* to you under the Apache License, Version 2.0 (the
* "License"); you may not use this file except in compliance
* with the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package org.apache.drill.common.util;
import io.netty.buffer.ByteBuf;
import org.apache.commons.text.StringEscapeUtils;
import org.apache.commons.lang3.StringUtils;
import java.util.Arrays;
import java.util.stream.Collectors;
public class DrillStringUtils {
/**
* Converts the long number into more human readable string.
*/
public static String readable(long bytes) {
int unit = 1024;
long absBytes = Math.abs(bytes);
if (absBytes < unit) {
return bytes + " B";
}
int exp = (int) (Math.log(absBytes) / Math.log(unit));
char pre = ("KMGTPE").charAt(exp-1);
return String.format("%s%.1f %ciB", (bytes == absBytes ? "" : "-"), absBytes / Math.pow(unit, exp), pre);
}
/**
* Unescapes any Java literals found in the {@code String}.
* For example, it will turn a sequence of {@code '\'} and
* {@code 'n'} into a newline character, unless the {@code '\'}
* is preceded by another {@code '\'}.
*
* @param input the {@code String} to unescape, may be null
* @return a new unescaped {@code String}, {@code null} if null string input
*/
public static String unescapeJava(String input) {
return StringEscapeUtils.unescapeJava(input);
}
/**
* Escapes the characters in a {@code String} according to Java string literal
* rules.
*
* Deals correctly with quotes and control-chars (tab, backslash, cr, ff,
* etc.) so, for example, a tab becomes the characters {@code '\\'} and
* {@code 't'}.
*
* Example:
* <pre>
* input string: He didn't say, "Stop!"
* output string: He didn't say, \"Stop!\"
* </pre>
*
* @param input String to escape values in, may be null
* @return String with escaped values, {@code null} if null string input
*/
public static String escapeJava(String input) {
return StringEscapeUtils.escapeJava(input);
}
public static String escapeNewLines(String input) {
if (input == null) {
return null;
}
StringBuilder result = new StringBuilder();
boolean sawNewline = false;
for (int i = 0; i < input.length(); i++) {
char curChar = input.charAt(i);
if (curChar == '\r' || curChar == '\n') {
if (sawNewline) {
continue;
}
sawNewline = true;
result.append("\\n");
} else {
sawNewline = false;
result.append(curChar);
}
}
return result.toString();
}
/**
* Copied form commons-lang 2.x code as common-lang 3.x has this API removed.
* (http://commons.apache.org/proper/commons-lang/article3_0.html#StringEscapeUtils.escapeSql)
* @param str
* @return
*/
public static String escapeSql(String str) {
return (str == null) ? null : StringUtils.replace(str, "'", "''");
}
/**
* Return a printable representation of a byte buffer, escaping the non-printable
* bytes as '\\xNN' where NN is the hexadecimal representation of such bytes.
*
* This function does not modify the {@code readerIndex} and {@code writerIndex}
* of the byte buffer.
*/
public static String toBinaryString(ByteBuf buf, int strStart, int strEnd) {
StringBuilder result = new StringBuilder();
for (int i = strStart; i < strEnd; ++i) {
appendByte(result, buf.getByte(i));
}
return result.toString();
}
/**
* Return a printable representation of a byte array, escaping the non-printable
* bytes as '\\xNN' where NN is the hexadecimal representation of such bytes.
*/
public static String toBinaryString(byte[] buf) {
return toBinaryString(buf, 0, buf.length);
}
/**
* Return a printable representation of a byte array, escaping the non-printable
* bytes as '\\xNN' where NN is the hexadecimal representation of such bytes.
*/
public static String toBinaryString(byte[] buf, int strStart, int strEnd) {
StringBuilder result = new StringBuilder();
for (int i = strStart; i < strEnd; ++i) {
appendByte(result, buf[i]);
}
return result.toString();
}
private static void appendByte(StringBuilder result, byte b) {
int ch = b & 0xFF;
if ( (ch >= '0' && ch <= '9')
|| (ch >= 'A' && ch <= 'Z')
|| (ch >= 'a' && ch <= 'z')
|| " `~!@#$%^&*()-_=+[]{}|;:'\",.<>/?".indexOf(ch) >= 0 ) {
result.append((char)ch);
} else {
result.append(String.format("\\x%02X", ch));
}
}
/**
* parsing a hex encoded binary string and write to an output buffer.
*
* This function does not modify the {@code readerIndex} and {@code writerIndex}
* of the byte buffer.
*
* @return Index in the byte buffer just after the last written byte.
*/
public static int parseBinaryString(ByteBuf str, int strStart, int strEnd, ByteBuf out) {
int dstEnd = 0;
for (int i = strStart; i < strEnd; i++) {
byte b = str.getByte(i);
if (b == '\\'
&& strEnd > i+3
&& (str.getByte(i+1) == 'x' || str.getByte(i+1) == 'X')) {
// ok, take next 2 hex digits.
byte hd1 = str.getByte(i+2);
byte hd2 = str.getByte(i+3);
if (isHexDigit(hd1) && isHexDigit(hd2)) { // [a-fA-F0-9]
// turn hex ASCII digit -> number
b = (byte) ((toBinaryFromHex(hd1) << 4) + toBinaryFromHex(hd2));
i += 3; // skip 3
}
}
out.setByte(dstEnd++, b);
}
return dstEnd;
}
/**
* Takes a ASCII digit in the range A-F0-9 and returns
* the corresponding integer/ordinal value.
* @param ch The hex digit.
* @return The converted hex value as a byte.
*/
private static byte toBinaryFromHex(byte ch) {
if ( ch >= 'A' && ch <= 'F' ) {
return (byte) ((byte)10 + (byte) (ch - 'A'));
} else if ( ch >= 'a' && ch <= 'f' ) {
return (byte) ((byte)10 + (byte) (ch - 'a'));
}
return (byte) (ch - '0');
}
private static boolean isHexDigit(byte c) {
return (c >= 'a' && c <= 'f') || (c >= 'A' && c <= 'F') || (c >= '0' && c <= '9');
}
/**
* Removes extra spaces and empty values in a CSV String
* @param csv The CSV string to be sanitized
* @return The sanitized CSV string
*/
public static String sanitizeCSV(String csv) {
String[] tokens = csv.split(",");
return Arrays.stream(tokens)
.map(String::trim)
.filter(StringUtils::isNotEmpty)
.collect(Collectors.joining(","));
}
/**
* Removes all leading slash characters from specified string.
*
* @param path string to remove all leading slash characters
* @return string with removed leading slash characters
*/
public static String removeLeadingSlash(String path) {
return StringUtils.stripStart(path, "/");
}
}