blob: 104907cc596b32c6c6ab85afadab39a84f50703d [file] [log] [blame]
/*
* Licensed to the Apache Software Foundation (ASF) under one or more
* contributor license agreements. See the NOTICE file distributed with
* this work for additional information regarding copyright ownership.
* The ASF licenses this file to You under the Apache License, Version 2.0
* (the "License"); you may not use this file except in compliance with
* the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package org.apache.nutch.util;
import org.junit.Assert;
import org.junit.Test;
/** Unit tests for SuffixStringMatcher. */
public class TestSuffixStringMatcher {
private final static int NUM_TEST_ROUNDS = 20;
private final static int MAX_TEST_SUFFIXES = 100;
private final static int MAX_SUFFIX_LEN = 10;
private final static int NUM_TEST_INPUTS_PER_ROUND = 100;
private final static int MAX_INPUT_LEN = 20;
private final static char[] alphabet = new char[] { 'a', 'b', 'c', 'd',
// 'e', 'f', 'g', 'h', 'i', 'j',
// 'k', 'l', 'm', 'n', 'o', 'p', 'q', 'r', 's', 't',
// 'u', 'v', 'w', 'x', 'y', 'z', '1', '2', '3', '4',
// '5', '6', '7', '8', '9', '0'
};
private String makeRandString(int minLen, int maxLen) {
int len = minLen + (int) (Math.random() * (maxLen - minLen));
char[] chars = new char[len];
for (int pos = 0; pos < len; pos++) {
chars[pos] = alphabet[(int) (Math.random() * alphabet.length)];
}
return new String(chars);
}
@Test
public void testSuffixMatcher() {
int numMatches = 0;
int numInputsTested = 0;
for (int round = 0; round < NUM_TEST_ROUNDS; round++) {
// build list of suffixes
int numSuffixes = (int) (Math.random() * MAX_TEST_SUFFIXES);
String[] suffixes = new String[numSuffixes];
for (int i = 0; i < numSuffixes; i++) {
suffixes[i] = makeRandString(0, MAX_SUFFIX_LEN);
}
SuffixStringMatcher sufmatcher = new SuffixStringMatcher(suffixes);
// test random strings for suffix matches
for (int i = 0; i < NUM_TEST_INPUTS_PER_ROUND; i++) {
String input = makeRandString(0, MAX_INPUT_LEN);
boolean matches = false;
int longestMatch = -1;
int shortestMatch = -1;
for (int j = 0; j < suffixes.length; j++) {
if ((suffixes[j].length() > 0) && input.endsWith(suffixes[j])) {
matches = true;
int matchSize = suffixes[j].length();
if (matchSize > longestMatch)
longestMatch = matchSize;
if ((matchSize < shortestMatch) || (shortestMatch == -1))
shortestMatch = matchSize;
}
}
if (matches)
numMatches++;
numInputsTested++;
Assert.assertTrue("'" + input + "' should " + (matches ? "" : "not ")
+ "match!", matches == sufmatcher.matches(input));
if (matches) {
Assert.assertTrue(shortestMatch == sufmatcher.shortestMatch(input)
.length());
Assert.assertTrue(input.substring(input.length() - shortestMatch)
.equals(sufmatcher.shortestMatch(input)));
Assert.assertTrue(longestMatch == sufmatcher.longestMatch(input)
.length());
Assert.assertTrue(input.substring(input.length() - longestMatch)
.equals(sufmatcher.longestMatch(input)));
}
}
}
System.out.println("got " + numMatches + " matches out of "
+ numInputsTested + " tests");
}
}