Rainbond/util/fuzzy/fuzzy_test.go
2020-09-06 11:11:11 +08:00

211 lines
5.6 KiB
Go

package fuzzy
import (
"fmt"
"sort"
"strings"
"testing"
)
const deBelloGallico = `All Gaul is divided into three parts, one of which the Belgae inhabit,
the Aquitani another, those who in their own language are called Celts, in our Gauls, the third.
All these differ from each other in language, customs and laws. The river Garonne separates the
Gauls from the Aquitani; the Marne and the Seine separate them from the Belgae. Of all these,
the Belgae are the bravest, because they are furthest from the civilization and refinement of
[our] Province, and merchants least frequently resort to them, and import those things which tend
to effeminate the mind; and they are the nearest to the Germans, who dwell beyond the Rhine,
with whom they are continually waging war; for which reason the Helvetii also surpass the rest
of the Gauls in valor, as they contend with the Germans in almost daily battles, when they either
repel them from their own territories, or themselves wage war on their frontiers. One part of
these, which it has been said that the Gauls occupy, takes its beginning at the river Rhone;
it is bounded by the river Garonne, the ocean, and the territories of the Belgae; it borders,
too, on the side of the Sequani and the Helvetii, upon the river Rhine, and stretches toward the
north. The Belgae rises from the extreme frontier of Gaul, extend to the lower part of the river
Rhine; and look toward the north and the rising sun. Aquitania extends from the river Garonne to
the Pyrenaean mountains and to that part of the ocean which is near Spain: it looks between the
setting of the sun, and the north star.`
var fuzzyTests = []struct {
source string
target string
wanted bool
rank int
}{
{"zazz", deBelloGallico + " zazz", true, 1544},
{"zazz", "zazz " + deBelloGallico, true, 1544},
{"twl", "cartwheel", true, 6},
{"cart", "cartwheel", true, 5},
{"cw", "cartwheel", true, 7},
{"ee", "cartwheel", true, 7},
{"art", "cartwheel", true, 6},
{"eeel", "cartwheel", false, -1},
{"dog", "cartwheel", false, -1},
{"ёлка", "ёлочка", true, 2},
{"ветер", "ёлочка", false, -1},
{"中国", "中华人民共和国", true, 5},
{"日本", "中华人民共和国", false, -1},
}
func TestFuzzyMatch(t *testing.T) {
for _, val := range fuzzyTests {
match := Match(val.source, val.target)
if match != val.wanted {
t.Errorf("%s in %s expected match to be %t, got %t",
val.source, val.target, val.wanted, match)
}
}
}
func TestFuzzyMatchFold(t *testing.T) {
for _, val := range fuzzyTests {
match := MatchFold(val.source, strings.ToUpper(val.target))
if match != val.wanted {
t.Errorf("%s in %s expected match to be %t, got %t",
val.source, strings.ToUpper(val.target), val.wanted, match)
}
}
}
func TestFuzzyFind(t *testing.T) {
target := []string{"cartwheel", "foobar", "wheel", "baz"}
wanted := []string{"cartwheel", "wheel"}
matches := Find("whl", target)
if len(matches) != len(wanted) {
t.Errorf("expected %s, got %s", wanted, matches)
}
for i := range wanted {
if wanted[i] != matches[i] {
t.Errorf("expected %s, got %s", wanted, matches)
}
}
}
func TestRankMatch(t *testing.T) {
for _, val := range fuzzyTests {
rank := RankMatch(val.source, val.target)
if rank != val.rank {
t.Errorf("expected ranking %d, got %d for %s in %s",
val.rank, rank, val.source, val.target)
}
}
}
func TestRankFind(t *testing.T) {
target := []string{"cartwheel", "foobar", "wheel", "baz"}
wanted := []Rank{
{"whl", "cartwheel", 6},
{"whl", "wheel", 2},
}
ranks := RankFind("whl", target)
if len(ranks) != len(wanted) {
t.Errorf("expected %+v, got %+v", wanted, ranks)
}
for i := range wanted {
if wanted[i] != ranks[i] {
t.Errorf("expected %+v, got %+v", wanted, ranks)
}
}
}
func TestSortingRanks(t *testing.T) {
rs := Ranks{{"a", "b", 1}, {"a", "cc", 2}, {"a", "a", 0}}
wanted := Ranks{rs[2], rs[0], rs[1]}
sort.Sort(rs)
for i := range wanted {
if wanted[i] != rs[i] {
t.Errorf("expected %+v, got %+v", wanted, rs)
}
}
}
func BenchmarkMatch(b *testing.B) {
ft := fuzzyTests[2]
for i := 0; i < b.N; i++ {
Match(ft.source, ft.target)
}
}
func BenchmarkMatchBigLate(b *testing.B) {
ft := fuzzyTests[0]
for i := 0; i < b.N; i++ {
Match(ft.source, ft.target)
}
}
func BenchmarkMatchBigEarly(b *testing.B) {
ft := fuzzyTests[1]
for i := 0; i < b.N; i++ {
Match(ft.source, ft.target)
}
}
func BenchmarkMatchFold(b *testing.B) {
ft := fuzzyTests[2]
for i := 0; i < b.N; i++ {
MatchFold(ft.source, ft.target)
}
}
func BenchmarkMatchFoldBigLate(b *testing.B) {
ft := fuzzyTests[0]
for i := 0; i < b.N; i++ {
MatchFold(ft.source, ft.target)
}
}
func BenchmarkMatchFoldBigEarly(b *testing.B) {
ft := fuzzyTests[1]
for i := 0; i < b.N; i++ {
MatchFold(ft.source, ft.target)
}
}
func BenchmarkRankMatch(b *testing.B) {
ft := fuzzyTests[2]
for i := 0; i < b.N; i++ {
RankMatch(ft.source, ft.target)
}
}
func BenchmarkRankMatchBigLate(b *testing.B) {
ft := fuzzyTests[0]
for i := 0; i < b.N; i++ {
RankMatch(ft.source, ft.target)
}
}
func BenchmarkRankMatchBigEarly(b *testing.B) {
ft := fuzzyTests[1]
for i := 0; i < b.N; i++ {
RankMatch(ft.source, ft.target)
}
}
func ExampleMatch() {
fmt.Print(Match("twl", "cartwheel"))
// Output: true
}
func ExampleFind() {
fmt.Print(Find("whl", []string{"cartwheel", "foobar", "wheel", "baz"}))
// Output: [cartwheel wheel]
}
func ExampleRankMatch() {
fmt.Print(RankMatch("twl", "cartwheel"))
// Output: 6
}
func ExampleRankFind() {
fmt.Printf("%+v", RankFind("whl", []string{"cartwheel", "foobar", "wheel", "baz"}))
// Output: [{Source:whl Target:cartwheel Distance:6} {Source:whl Target:wheel Distance:2}]
}