blob: d549d88745daa9d19bc69c1257f0ae3f00482524 [file] [log] [blame]
/*
* Licensed to the Apache Software Foundation (ASF) under one
* or more contributor license agreements. See the NOTICE file
* distributed with this work for additional information
* regarding copyright ownership. The ASF licenses this file
* to you under the Apache License, Version 2.0 (the
* "License"); you may not use this file except in compliance
* with the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing,
* software distributed under the License is distributed on an
* "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
* KIND, either express or implied. See the License for the
* specific language governing permissions and limitations
* under the License.
*/
package htmltext
import (
"fmt"
"testing"
"github.com/stretchr/testify/assert"
)
func TestClearText(t *testing.T) {
var (
expected,
clearedText string
)
// test code clear text
expected = "hello{code...}"
clearedText = ClearText("<p>hello<pre>var a = \"good\"</pre></p>")
assert.Equal(t, expected, clearedText)
// test link clear text
expected = "hello [example.com]"
clearedText = ClearText("<p>hello <a href=\"http://example.com/\">example.com</a></p>")
assert.Equal(t, expected, clearedText)
clearedText = ClearText("<p>hello<a href=\"https://example.com/\">example.com</a></p>")
assert.Equal(t, expected, clearedText)
expected = "hello world"
clearedText = ClearText("<div> hello</div>\n<div>world</div>")
assert.Equal(t, expected, clearedText)
}
func TestFetchExcerpt(t *testing.T) {
var (
expected,
text string
)
// test english string
expected = "hello..."
text = FetchExcerpt("<p>hello world</p>", "...", 5)
assert.Equal(t, expected, text)
// test mixed string
expected = "hello你好..."
text = FetchExcerpt("<p>hello你好world</p>", "...", 7)
assert.Equal(t, expected, text)
// test mixed string with emoticon
expected = "hello你好😂..."
text = FetchExcerpt("<p>hello你好😂world</p>", "...", 8)
assert.Equal(t, expected, text)
expected = "hello你好"
text = FetchExcerpt("<p>hello你好</p>", "...", 8)
assert.Equal(t, expected, text)
}
func TestUrlTitle(t *testing.T) {
list := []string{
"hello你好😂...",
"这是一个,标题,title",
}
for _, title := range list {
formatTitle := UrlTitle(title)
fmt.Println(formatTitle)
}
}
func TestFindFirstMatchedWord(t *testing.T) {
var (
expectedWord,
actualWord string
expectedIndex,
actualIndex int
)
text := "Hello, I have 中文 and 😂 and I am supposed to work fine."
// test find nothing
expectedWord, expectedIndex = "", 0
actualWord, actualIndex = findFirstMatchedWord(text, []string{"youcantfindme"})
assert.Equal(t, expectedWord, actualWord)
assert.Equal(t, expectedIndex, actualIndex)
// test find one word
expectedWord, expectedIndex = "文", 17
actualWord, actualIndex = findFirstMatchedWord(text, []string{"文"})
assert.Equal(t, expectedWord, actualWord)
assert.Equal(t, expectedIndex, actualIndex)
// test find multiple matched words
expectedWord, expectedIndex = "Hello", 0
actualWord, actualIndex = findFirstMatchedWord(text, []string{"Hello", "文"})
assert.Equal(t, expectedWord, actualWord)
assert.Equal(t, expectedIndex, actualIndex)
}
func TestGetRuneRange(t *testing.T) {
var (
expectedBegin,
expectedEnd,
actualBegin,
actualEnd int
)
runeText := []rune("Hello, I have 中文 and 😂.")
runeLen := len(runeText)
// test get range of negative offset and negative limit
expectedBegin, expectedEnd = 0, 0
actualBegin, actualEnd = getRuneRange(runeText, -1, -1)
assert.Equal(t, expectedBegin, actualBegin)
assert.Equal(t, expectedEnd, actualEnd)
// test get range of exceeding offset and exceeding limit
expectedBegin, expectedEnd = runeLen, runeLen
actualBegin, actualEnd = getRuneRange(runeText, runeLen+1, runeLen+1)
assert.Equal(t, expectedBegin, actualBegin)
assert.Equal(t, expectedEnd, actualEnd)
// test get range of normal offset and exceeding limit
expectedBegin, expectedEnd = 3, runeLen
actualBegin, actualEnd = getRuneRange(runeText, 3, runeLen)
assert.Equal(t, expectedBegin, actualBegin)
assert.Equal(t, expectedEnd, actualEnd)
// test get range of normal offset and normal limit
expectedBegin, expectedEnd = 3, 10
actualBegin, actualEnd = getRuneRange(runeText, 3, 7)
assert.Equal(t, expectedBegin, actualBegin)
assert.Equal(t, expectedEnd, actualEnd)
}
func TestFetchRangedExcerpt(t *testing.T) {
var (
expected,
actual string
)
// test english string
expected = "hello..."
actual = FetchRangedExcerpt("<p>hello world</p>", "...", 0, 5)
assert.Equal(t, expected, actual)
// test string with offset
expected = "...llo你好..."
actual = FetchRangedExcerpt("<p>hello你好world</p>", "...", 2, 5)
assert.Equal(t, expected, actual)
// test mixed string with emoticon with offset
expected = "...你好😂..."
actual = FetchRangedExcerpt("<p>hello你好😂world</p>", "...", 5, 3)
assert.Equal(t, expected, actual)
// test mixed string with offset and exceeding limit
expected = "...你好😂world"
actual = FetchRangedExcerpt("<p>hello你好😂world</p>", "...", 5, 100)
assert.Equal(t, expected, actual)
}
func TestFetchMatchedExcerpt(t *testing.T) {
var (
expected,
actual string
)
html := "<p>Hello, I have 中文 and 😂 and I am supposed to work fine</p>"
// test find nothing
// it should return from the begin with double trimLength text
expected = "Hello, I h..."
actual = FetchMatchedExcerpt(html, []string{"youcantfindme"}, "...", 5)
assert.Equal(t, expected, actual)
// test find the word at the end
// it should return the word beginning with double trimLenth plus len(word)
expected = "... work fine"
actual = FetchMatchedExcerpt(html, []string{"youcant", "fine"}, "...", 3)
assert.Equal(t, expected, actual)
// test find multiple words
// it should return the first matched word with trimmedText
expected = "... have 中文 and 😂..."
actual = FetchMatchedExcerpt(html, []string{"中文", "😂"}, "...", 6)
assert.Equal(t, expected, actual)
}