| #!/bin/sh |
| # Licensed to the Apache Software Foundation (ASF) under one or more |
| # contributor license agreements. See the NOTICE file distributed with |
| # this work for additional information regarding copyright ownership. |
| # The ASF licenses this file to You under the Apache License, Version 2.0 |
| # (the "License"); you may not use this file except in compliance with |
| # the License. You may obtain a copy of the License at |
| # |
| # http://www.apache.org/licenses/LICENSE-2.0 |
| # |
| # Unless required by applicable law or agreed to in writing, software |
| # distributed under the License is distributed on an "AS IS" BASIS, |
| # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. |
| # See the License for the specific language governing permissions and |
| # limitations under the License. |
| |
| #Test script to tell if the server is accepting UTF-8 |
| #The python writer currently escapes non-ascii chars, so it's good for testing |
| |
| SOLR_URL=http://localhost:8983/solr |
| |
| if [ ! -z $1 ]; then |
| SOLR_URL=$1 |
| fi |
| |
| curl "$SOLR_URL/select?q=hello¶ms=explicit&wt=python" 2> /dev/null | grep 'hello' > /dev/null 2>&1 |
| if [ $? = 0 ]; then |
| echo "Solr server is up." |
| else |
| echo "ERROR: Could not curl to Solr - is curl installed? Is Solr not running?" |
| exit 1 |
| fi |
| |
| curl "$SOLR_URL/select?q=h%C3%A9llo&echoParams=explicit&wt=python" 2> /dev/null | grep 'h\\u00e9llo' > /dev/null 2>&1 |
| if [ $? = 0 ]; then |
| echo "HTTP GET is accepting UTF-8" |
| else |
| echo "ERROR: HTTP GET is not accepting UTF-8" |
| fi |
| |
| curl $SOLR_URL/select --data-binary 'q=h%C3%A9llo&echoParams=explicit&wt=python' -H 'Content-type:application/x-www-form-urlencoded; charset=UTF-8' 2> /dev/null | grep 'h\\u00e9llo' > /dev/null 2>&1 |
| if [ $? = 0 ]; then |
| echo "HTTP POST is accepting UTF-8" |
| else |
| echo "ERROR: HTTP POST is not accepting UTF-8" |
| fi |
| |
| curl $SOLR_URL/select --data-binary 'q=h%C3%A9llo&echoParams=explicit&wt=python' 2> /dev/null | grep 'h\\u00e9llo' > /dev/null 2>&1 |
| if [ $? = 0 ]; then |
| echo "HTTP POST defaults to UTF-8" |
| else |
| echo "HTTP POST does not default to UTF-8" |
| fi |
| |
| |
| #A unicode character outside of the BMP (a circle with an x inside) |
| CHAR="𐌈" |
| CODEPOINT='0x10308' |
| #URL encoded UTF8 of the codepoint |
| UTF8_Q='%F0%90%8C%88' |
| #expected return of the python writer (currently uses UTF-16 surrogates) |
| EXPECTED='\\ud800\\udf08' |
| |
| curl "$SOLR_URL/select?q=$UTF8_Q&echoParams=explicit&wt=python" 2> /dev/null | grep $EXPECTED > /dev/null 2>&1 |
| if [ $? = 0 ]; then |
| echo "HTTP GET is accepting UTF-8 beyond the basic multilingual plane" |
| else |
| echo "ERROR: HTTP GET is not accepting UTF-8 beyond the basic multilingual plane" |
| fi |
| |
| curl $SOLR_URL/select --data-binary "q=$UTF8_Q&echoParams=explicit&wt=python" -H 'Content-type:application/x-www-form-urlencoded; charset=UTF-8' 2> /dev/null | grep $EXPECTED > /dev/null 2>&1 |
| if [ $? = 0 ]; then |
| echo "HTTP POST is accepting UTF-8 beyond the basic multilingual plane" |
| else |
| echo "ERROR: HTTP POST is not accepting UTF-8 beyond the basic multilingual plane" |
| fi |
| |
| curl "$SOLR_URL/select?q=$UTF8_Q&echoParams=explicit&wt=python" --data-binary '' 2> /dev/null | grep $EXPECTED > /dev/null 2>&1 |
| if [ $? = 0 ]; then |
| echo "HTTP POST + URL params is accepting UTF-8 beyond the basic multilingual plane" |
| else |
| echo "ERROR: HTTP POST + URL params is not accepting UTF-8 beyond the basic multilingual plane" |
| fi |
| |
| #curl "$SOLR_URL/select?q=$UTF8_Q&echoParams=explicit" 2> /dev/null | od -tx1 -w1000 | sed 's/ //g' | grep 'f4808198' > /dev/null 2>&1 |
| curl "$SOLR_URL/select?q=$UTF8_Q&echoParams=explicit" 2> /dev/null | grep "$CHAR" > /dev/null 2>&1 |
| if [ $? = 0 ]; then |
| echo "Response correctly returns UTF-8 beyond the basic multilingual plane" |
| else |
| echo "ERROR: Response can't return UTF-8 beyond the basic multilingual plane" |
| fi |
| |
| |