fe/src/main/java/org/apache/doris/http/WebUtils.java - doris - Git at Google

 // Licensed to the Apache Software Foundation (ASF) under one
 // or more contributor license agreements.  See the NOTICE file
 // distributed with this work for additional information
 // regarding copyright ownership.  The ASF licenses this file
 // to you under the Apache License, Version 2.0 (the
 // "License"); you may not use this file except in compliance
 // with the License.  You may obtain a copy of the License at
 //
 //   http://www.apache.org/licenses/LICENSE-2.0
 //
 // Unless required by applicable law or agreed to in writing,
 // software distributed under the License is distributed on an
 // "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
 // KIND, either express or implied.  See the License for the
 // specific language governing permissions and limitations
 // under the License.

 package org.apache.doris.http;

 import org.apache.doris.common.path.PathTrie;

 import com.google.common.base.Charsets;

 import java.nio.charset.Charset;
 import java.util.Map;

 public class WebUtils {
     public static final String HTTP_CORS_ALLOW_ORIGIN_SETTING = "http.cors.allow-origin";

     public static final PathTrie.Decoder REST_DECODER = new PathTrie.Decoder() {
         @Override
         public String decode(String value) {
             return WebUtils.decodeComponent(value);
         }
     };

     public static boolean isBrowser(String userAgent) {
         if (userAgent == null) {
             return false;
         }
         // chrome, safari, firefox, ie
         if (userAgent.startsWith("Mozilla")) {
             return true;
         }
         return false;
     }

     public static void decodeQueryString(String s, int fromIndex, Map<String, String> params) {
         if (fromIndex < 0) {
             return;
         }
         if (fromIndex >= s.length()) {
             return;
         }

         String name = null;
         int pos = fromIndex; // Beginning of the unprocessed region
         int i;       // End of the unprocessed region
         char c = 0;  // Current character
         for (i = fromIndex; i < s.length(); i++) {
             c = s.charAt(i);
             if (c == '=' && name == null) {
                 if (pos != i) {
                     name = decodeComponent(s.substring(pos, i));
                 }
                 pos = i + 1;
             } else if (c == '&') {
                 if (name == null && pos != i) {
                     // We haven't seen an `=' so far but moved forward.
                     // Must be a param of the form '&a&' so add it with
                     // an empty value.
                     addParam(params, decodeComponent(s.substring(pos, i)), "");
                 } else if (name != null) {
                     addParam(params, name, decodeComponent(s.substring(pos, i)));
                     name = null;
                 }
                 pos = i + 1;
             }
         }

         if (pos != i) {  // Are there characters we haven't dealt with?
             if (name == null) {     // Yes and we haven't seen any `='.
                 addParam(params, decodeComponent(s.substring(pos, i)), "");
             } else {                // Yes and this must be the last value.
                 addParam(params, name, decodeComponent(s.substring(pos, i)));
             }
         } else if (name != null) {  // Have we seen a name without value?
             addParam(params, name, "");
         }
     }

     private static void addParam(Map<String, String> params, String name, String value) {
         params.put(name, value);
     }

     /**
      * Decodes a bit of an URL encoded by a browser.
      * <p/>
      * This is equivalent to calling {@link #decodeComponent(String, Charset)}
      * with the UTF-8 charset (recommended to comply with RFC 3986, Section 2).
      *
      * @param s The string to decode (can be empty).
      * @return The decoded string, or {@code s} if there's nothing to decode.
      *         If the string to decode is {@code null}, returns an empty string.
      * @throws IllegalArgumentException if the string contains a malformed
      *                                  escape sequence.
      */
     public static String decodeComponent(final String s) {
         return decodeComponent(s, Charsets.UTF_8);
     }

     /**
      * Decodes a bit of an URL encoded by a browser.
      * <p/>
      * The string is expected to be encoded as per RFC 3986, Section 2.
      * This is the encoding used by JavaScript functions {@code encodeURI}
      * and {@code encodeURIComponent}, but not {@code escape}.  For example
      * in this encoding, &eacute; (in Unicode {@code U+00E9} or in UTF-8
      * {@code 0xC3 0xA9}) is encoded as {@code %C3%A9} or {@code %c3%a9}.
      * <p/>
      * This is essentially equivalent to calling
      * <code>{@link java.net.URLDecoder URLDecoder}.{@link
      * java.net.URLDecoder#decode(String, String)}</code>
      * except that it's over 2x faster and generates less garbage for the GC.
      * Actually this function doesn't allocate any memory if there's nothing
      * to decode, the argument itself is returned.
      *
      * @param s       The string to decode (can be empty).
      * @param charset The charset to use to decode the string (should really
      *                be {@link Charsets#UTF_8}.
      * @return The decoded string, or {@code s} if there's nothing to decode.
      *         If the string to decode is {@code null}, returns an empty string.
      * @throws IllegalArgumentException if the string contains a malformed
      *                                  escape sequence.
      */
     @SuppressWarnings("fallthrough")
     public static String decodeComponent(final String s, final Charset charset) {
         if (s == null) {
             return "";
         }
         final int size = s.length();
         boolean modified = false;
         for (int i = 0; i < size; i++) {
             final char c = s.charAt(i);
             switch (c) {
                 case '%':
                     i++;  // We can skip at least one char, e.g. `%%'.
                     // Fall through.
                 case '+':
                     modified = true;
                     break;
             }
         }
         if (!modified) {
             return s;
         }
         final byte[] buf = new byte[size];
         int pos = 0;  // position in `buf'.
         for (int i = 0; i < size; i++) {
             char c = s.charAt(i);
             switch (c) {
                 case '+':
                     buf[pos++] = ' ';  // "+" -> " "
                     break;
                 case '%':
                     if (i == size - 1) {
                         throw new IllegalArgumentException("unterminated escape"
                                 + " sequence at end of string: " + s);
                     }
                     c = s.charAt(++i);
                     if (c == '%') {
                         buf[pos++] = '%';  // "%%" -> "%"
                         break;
                     } else if (i == size - 1) {
                         throw new IllegalArgumentException("partial escape"
                                 + " sequence at end of string: " + s);
                     }
                     c = decodeHexNibble(c);
                     final char c2 = decodeHexNibble(s.charAt(++i));
                     if (c == Character.MAX_VALUE || c2 == Character.MAX_VALUE) {
                         throw new IllegalArgumentException(
                                 "invalid escape sequence `%" + s.charAt(i - 1)
                                         + s.charAt(i) + "' at index " + (i - 2)
                                         + " of: " + s);
                     }
                     c = (char) (c * 16 + c2);
                     // Fall through.
                 default:
                     buf[pos++] = (byte) c;
                     break;
             }
         }
         return new String(buf, 0, pos, charset);
     }

     /**
      * Helper to decode half of a hexadecimal number from a string.
      *
      * @param c The ASCII character of the hexadecimal number to decode.
      *          Must be in the range {@code [0-9a-fA-F]}.
      * @return The hexadecimal value represented in the ASCII character
      *         given, or {@link Character#MAX_VALUE} if the character is invalid.
      */
     private static char decodeHexNibble(final char c) {
         if ('0' <= c && c <= '9') {
             return (char) (c - '0');
         } else if ('a' <= c && c <= 'f') {
             return (char) (c - 'a' + 10);
         } else if ('A' <= c && c <= 'F') {
             return (char) (c - 'A' + 10);
         } else {
             return Character.MAX_VALUE;
         }
     }

     /**
      * Determine if CORS setting is a regex
      */
 //    public static Pattern getCorsSettingRegex(Settings settings) {
 //        String corsSetting = settings.get(HTTP_CORS_ALLOW_ORIGIN_SETTING, "*");
 //        int len = corsSetting.length();
 //        boolean isRegex = len > 2 &&  corsSetting.startsWith("/") && corsSetting.endsWith("/");
 //
 //        if (isRegex) {
 //            return Pattern.compile(corsSetting.substring(1, corsSetting.length()-1));
 //        }
 //
 //        return null;
 //    }
 }
	// Licensed to the Apache Software Foundation (ASF) under one
	// or more contributor license agreements. See the NOTICE file
	// distributed with this work for additional information
	// regarding copyright ownership. The ASF licenses this file
	// to you under the Apache License, Version 2.0 (the
	// "License"); you may not use this file except in compliance
	// with the License. You may obtain a copy of the License at
	//
	// http://www.apache.org/licenses/LICENSE-2.0
	//
	// Unless required by applicable law or agreed to in writing,
	// software distributed under the License is distributed on an
	// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
	// KIND, either express or implied. See the License for the
	// specific language governing permissions and limitations
	// under the License.

	package org.apache.doris.http;

	import org.apache.doris.common.path.PathTrie;

	import com.google.common.base.Charsets;

	import java.nio.charset.Charset;
	import java.util.Map;

	public class WebUtils {
	public static final String HTTP_CORS_ALLOW_ORIGIN_SETTING = "http.cors.allow-origin";

	public static final PathTrie.Decoder REST_DECODER = new PathTrie.Decoder() {
	@Override
	public String decode(String value) {
	return WebUtils.decodeComponent(value);
	}
	};

	public static boolean isBrowser(String userAgent) {
	if (userAgent == null) {
	return false;
	}
	// chrome, safari, firefox, ie
	if (userAgent.startsWith("Mozilla")) {
	return true;
	}
	return false;
	}

	public static void decodeQueryString(String s, int fromIndex, Map<String, String> params) {
	if (fromIndex < 0) {
	return;
	}
	if (fromIndex >= s.length()) {
	return;
	}

	String name = null;
	int pos = fromIndex; // Beginning of the unprocessed region
	int i; // End of the unprocessed region
	char c = 0; // Current character
	for (i = fromIndex; i < s.length(); i++) {
	c = s.charAt(i);
	if (c == '=' && name == null) {
	if (pos != i) {
	name = decodeComponent(s.substring(pos, i));
	}
	pos = i + 1;
	} else if (c == '&') {
	if (name == null && pos != i) {
	// We haven't seen an `=' so far but moved forward.
	// Must be a param of the form '&a&' so add it with
	// an empty value.
	addParam(params, decodeComponent(s.substring(pos, i)), "");
	} else if (name != null) {
	addParam(params, name, decodeComponent(s.substring(pos, i)));
	name = null;
	}
	pos = i + 1;
	}
	}

	if (pos != i) { // Are there characters we haven't dealt with?
	if (name == null) { // Yes and we haven't seen any `='.
	addParam(params, decodeComponent(s.substring(pos, i)), "");
	} else { // Yes and this must be the last value.
	addParam(params, name, decodeComponent(s.substring(pos, i)));
	}
	} else if (name != null) { // Have we seen a name without value?
	addParam(params, name, "");
	}
	}

	private static void addParam(Map<String, String> params, String name, String value) {
	params.put(name, value);
	}

	/**
	* Decodes a bit of an URL encoded by a browser.
	* <p/>
	* This is equivalent to calling {@link #decodeComponent(String, Charset)}
	* with the UTF-8 charset (recommended to comply with RFC 3986, Section 2).
	*
	* @param s The string to decode (can be empty).
	* @return The decoded string, or {@code s} if there's nothing to decode.
	* If the string to decode is {@code null}, returns an empty string.
	* @throws IllegalArgumentException if the string contains a malformed
	* escape sequence.
	*/
	public static String decodeComponent(final String s) {
	return decodeComponent(s, Charsets.UTF_8);
	}

	/**
	* Decodes a bit of an URL encoded by a browser.
	* <p/>
	* The string is expected to be encoded as per RFC 3986, Section 2.
	* This is the encoding used by JavaScript functions {@code encodeURI}
	* and {@code encodeURIComponent}, but not {@code escape}. For example
	* in this encoding, é (in Unicode {@code U+00E9} or in UTF-8
	* {@code 0xC3 0xA9}) is encoded as {@code %C3%A9} or {@code %c3%a9}.
	* <p/>
	* This is essentially equivalent to calling
	* <code>{@link java.net.URLDecoder URLDecoder}.{@link
	* java.net.URLDecoder#decode(String, String)}</code>
	* except that it's over 2x faster and generates less garbage for the GC.
	* Actually this function doesn't allocate any memory if there's nothing
	* to decode, the argument itself is returned.
	*
	* @param s The string to decode (can be empty).
	* @param charset The charset to use to decode the string (should really
	* be {@link Charsets#UTF_8}.
	* @return The decoded string, or {@code s} if there's nothing to decode.
	* If the string to decode is {@code null}, returns an empty string.
	* @throws IllegalArgumentException if the string contains a malformed
	* escape sequence.
	*/
	@SuppressWarnings("fallthrough")
	public static String decodeComponent(final String s, final Charset charset) {
	if (s == null) {
	return "";
	}
	final int size = s.length();
	boolean modified = false;
	for (int i = 0; i < size; i++) {
	final char c = s.charAt(i);
	switch (c) {
	case '%':
	i++; // We can skip at least one char, e.g. `%%'.
	// Fall through.
	case '+':
	modified = true;
	break;
	}
	}
	if (!modified) {
	return s;
	}
	final byte[] buf = new byte[size];
	int pos = 0; // position in `buf'.
	for (int i = 0; i < size; i++) {
	char c = s.charAt(i);
	switch (c) {
	case '+':
	buf[pos++] = ' '; // "+" -> " "
	break;
	case '%':
	if (i == size - 1) {
	throw new IllegalArgumentException("unterminated escape"
	+ " sequence at end of string: " + s);
	}
	c = s.charAt(++i);
	if (c == '%') {
	buf[pos++] = '%'; // "%%" -> "%"
	break;
	} else if (i == size - 1) {
	throw new IllegalArgumentException("partial escape"
	+ " sequence at end of string: " + s);
	}
	c = decodeHexNibble(c);
	final char c2 = decodeHexNibble(s.charAt(++i));
	if (c == Character.MAX_VALUE \|\| c2 == Character.MAX_VALUE) {
	throw new IllegalArgumentException(
	"invalid escape sequence `%" + s.charAt(i - 1)
	+ s.charAt(i) + "' at index " + (i - 2)
	+ " of: " + s);
	}
	c = (char) (c * 16 + c2);
	// Fall through.
	default:
	buf[pos++] = (byte) c;
	break;
	}
	}
	return new String(buf, 0, pos, charset);
	}

	/**
	* Helper to decode half of a hexadecimal number from a string.
	*
	* @param c The ASCII character of the hexadecimal number to decode.
	* Must be in the range {@code [0-9a-fA-F]}.
	* @return The hexadecimal value represented in the ASCII character
	* given, or {@link Character#MAX_VALUE} if the character is invalid.
	*/
	private static char decodeHexNibble(final char c) {
	if ('0' <= c && c <= '9') {
	return (char) (c - '0');
	} else if ('a' <= c && c <= 'f') {
	return (char) (c - 'a' + 10);
	} else if ('A' <= c && c <= 'F') {
	return (char) (c - 'A' + 10);
	} else {
	return Character.MAX_VALUE;
	}
	}

	/**
	* Determine if CORS setting is a regex
	*/
	// public static Pattern getCorsSettingRegex(Settings settings) {
	// String corsSetting = settings.get(HTTP_CORS_ALLOW_ORIGIN_SETTING, "*");
	// int len = corsSetting.length();
	// boolean isRegex = len > 2 && corsSetting.startsWith("/") && corsSetting.endsWith("/");
	//
	// if (isRegex) {
	// return Pattern.compile(corsSetting.substring(1, corsSetting.length()-1));
	// }
	//
	// return null;
	// }
	}