| /** |
| * Licensed to the Apache Software Foundation (ASF) under one or more |
| * contributor license agreements. See the NOTICE file distributed with |
| * this work for additional information regarding copyright ownership. |
| * The ASF licenses this file to You under the Apache License, Version 2.0 |
| * (the "License"); you may not use this file except in compliance with |
| * the License. You may obtain a copy of the License at |
| * |
| * http://www.apache.org/licenses/LICENSE-2.0 |
| * |
| * Unless required by applicable law or agreed to in writing, software |
| * distributed under the License is distributed on an "AS IS" BASIS, |
| * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. |
| * See the License for the specific language governing permissions and |
| * limitations under the License. |
| */ |
| |
| package org.apache.nutch.net.urlnormalizer.ajax; |
| |
| import org.apache.hadoop.conf.Configuration; |
| import org.apache.nutch.net.URLNormalizers; |
| import org.apache.nutch.util.NutchConfiguration; |
| |
| import junit.framework.TestCase; |
| |
| /** Unit tests for AjaxURLNormalizer. */ |
| public class TestAjaxURLNormalizer extends TestCase { |
| private AjaxURLNormalizer normalizer; |
| private Configuration conf; |
| |
| public TestAjaxURLNormalizer(String name) { |
| super(name); |
| normalizer = new AjaxURLNormalizer(); |
| conf = NutchConfiguration.create(); |
| normalizer.setConf(conf); |
| } |
| |
| public void testNormalizer() throws Exception { |
| // check if AJAX URL's are normalized to an _escaped_frament_ form |
| normalizeTest("http://example.org/#!k=v", "http://example.org/?_escaped_fragment_=k=v"); |
| |
| // Check with some escaped chars |
| normalizeTest("http://example.org/#!k=v&something=is wrong", "http://example.org/?_escaped_fragment_=k=v%26something=is%20wrong"); |
| |
| // Check with query string and multiple fragment params |
| normalizeTest("http://example.org/path.html?queryparam=queryvalue#!key1=value1&key2=value2", "http://example.org/path.html?queryparam=queryvalue&_escaped_fragment_=key1=value1%26key2=value2"); |
| } |
| |
| public void testNormalizerWhenIndexing() throws Exception { |
| // check if it works the other way around |
| normalizeTest("http://example.org/?_escaped_fragment_=key=value", "http://example.org/#!key=value", URLNormalizers.SCOPE_INDEXER); |
| normalizeTest("http://example.org/?key=value&_escaped_fragment_=key=value", "http://example.org/?key=value#!key=value", URLNormalizers.SCOPE_INDEXER); |
| normalizeTest("http://example.org/page.html?key=value&_escaped_fragment_=key=value%26something=is%20wrong", "http://example.org/page.html?key=value#!key=value&something=is wrong", URLNormalizers.SCOPE_INDEXER); |
| } |
| |
| private void normalizeTest(String weird, String normal) throws Exception { |
| assertEquals(normal, normalizer.normalize(weird, URLNormalizers.SCOPE_DEFAULT)); |
| } |
| |
| private void normalizeTest(String weird, String normal, String scope) throws Exception { |
| assertEquals(normal, normalizer.normalize(weird, scope)); |
| } |
| |
| public static void main(String[] args) throws Exception { |
| new TestAjaxURLNormalizer("test").testNormalizer(); |
| } |
| } |