fzf/src/algo/algo.go

200 lines
4.6 KiB
Go
Raw Normal View History

2015-01-12 03:56:17 +00:00
package algo
2015-01-01 19:49:30 +00:00
2015-04-14 12:45:37 +00:00
import (
2015-06-08 14:16:31 +00:00
"strings"
2015-04-14 12:45:37 +00:00
"unicode"
"github.com/junegunn/fzf/src/util"
2015-04-14 12:45:37 +00:00
)
2015-01-01 19:49:30 +00:00
/*
* String matching algorithms here do not use strings.ToLower to avoid
* performance penalty. And they assume pattern runes are given in lowercase
* letters when caseSensitive is false.
*
* In short: They try to do as little work as possible.
*/
func runeAt(runes []rune, index int, max int, forward bool) rune {
if forward {
return runes[index]
}
return runes[max-index-1]
}
2015-01-11 18:01:24 +00:00
// FuzzyMatch performs fuzzy-match
func FuzzyMatch(caseSensitive bool, forward bool, runes []rune, pattern []rune) (int, int) {
if len(pattern) == 0 {
return 0, 0
}
2015-01-01 19:49:30 +00:00
// 0. (FIXME) How to find the shortest match?
// a_____b__c__abc
// ^^^^^^^^^^ ^^^
// 1. forward scan (abc)
// *-----*-----*>
// a_____b___abc__
// 2. reverse scan (cba)
// a_____b___abc__
// <***
pidx := 0
sidx := -1
eidx := -1
lenRunes := len(runes)
lenPattern := len(pattern)
for index := range runes {
char := runeAt(runes, index, lenRunes, forward)
2015-01-01 19:49:30 +00:00
// This is considerably faster than blindly applying strings.ToLower to the
// whole string
2015-04-14 12:45:37 +00:00
if !caseSensitive {
// Partially inlining `unicode.ToLower`. Ugly, but makes a noticeable
// difference in CPU cost. (Measured on Go 1.4.1. Also note that the Go
// compiler as of now does not inline non-leaf functions.)
if char >= 'A' && char <= 'Z' {
char += 32
} else if char > unicode.MaxASCII {
char = unicode.To(unicode.LowerCase, char)
}
2015-01-01 19:49:30 +00:00
}
pchar := runeAt(pattern, pidx, lenPattern, forward)
if char == pchar {
2015-01-01 19:49:30 +00:00
if sidx < 0 {
sidx = index
}
if pidx++; pidx == lenPattern {
2015-01-01 19:49:30 +00:00
eidx = index + 1
break
}
}
}
if sidx >= 0 && eidx >= 0 {
2015-01-11 18:01:24 +00:00
pidx--
2015-01-01 19:49:30 +00:00
for index := eidx - 1; index >= sidx; index-- {
char := runeAt(runes, index, lenRunes, forward)
if !caseSensitive {
if char >= 'A' && char <= 'Z' {
char += 32
} else if char > unicode.MaxASCII {
char = unicode.To(unicode.LowerCase, char)
}
}
pchar := runeAt(pattern, pidx, lenPattern, forward)
if char == pchar {
2015-01-11 18:01:24 +00:00
if pidx--; pidx < 0 {
2015-01-01 19:49:30 +00:00
sidx = index
break
}
}
}
if forward {
return sidx, eidx
}
return lenRunes - eidx, lenRunes - sidx
2015-01-01 19:49:30 +00:00
}
return -1, -1
}
2015-01-11 18:01:24 +00:00
// ExactMatchNaive is a basic string searching algorithm that handles case
// sensitivity. Although naive, it still performs better than the combination
// of strings.ToLower + strings.Index for typical fzf use cases where input
// strings and patterns are not very long.
//
// We might try to implement better algorithms in the future:
// http://en.wikipedia.org/wiki/String_searching_algorithm
func ExactMatchNaive(caseSensitive bool, forward bool, runes []rune, pattern []rune) (int, int) {
if len(pattern) == 0 {
return 0, 0
}
lenRunes := len(runes)
lenPattern := len(pattern)
if lenRunes < lenPattern {
2015-01-01 19:49:30 +00:00
return -1, -1
}
pidx := 0
for index := 0; index < lenRunes; index++ {
char := runeAt(runes, index, lenRunes, forward)
2015-04-14 12:45:37 +00:00
if !caseSensitive {
if char >= 'A' && char <= 'Z' {
char += 32
} else if char > unicode.MaxASCII {
char = unicode.To(unicode.LowerCase, char)
}
2015-01-01 19:49:30 +00:00
}
pchar := runeAt(pattern, pidx, lenPattern, forward)
if pchar == char {
2015-01-11 18:01:24 +00:00
pidx++
if pidx == lenPattern {
if forward {
return index - lenPattern + 1, index + 1
}
return lenRunes - (index + 1), lenRunes - (index - lenPattern + 1)
2015-01-01 19:49:30 +00:00
}
} else {
index -= pidx
pidx = 0
}
}
return -1, -1
}
2015-01-11 18:01:24 +00:00
// PrefixMatch performs prefix-match
func PrefixMatch(caseSensitive bool, forward bool, runes []rune, pattern []rune) (int, int) {
if len(runes) < len(pattern) {
2015-01-01 19:49:30 +00:00
return -1, -1
}
for index, r := range pattern {
char := runes[index]
2015-04-14 12:45:37 +00:00
if !caseSensitive {
char = unicode.ToLower(char)
2015-01-01 19:49:30 +00:00
}
if char != r {
return -1, -1
}
}
return 0, len(pattern)
}
2015-01-11 18:01:24 +00:00
// SuffixMatch performs suffix-match
func SuffixMatch(caseSensitive bool, forward bool, input []rune, pattern []rune) (int, int) {
runes := util.TrimRight(input)
2015-01-01 19:49:30 +00:00
trimmedLen := len(runes)
diff := trimmedLen - len(pattern)
if diff < 0 {
return -1, -1
}
for index, r := range pattern {
char := runes[index+diff]
2015-04-14 12:45:37 +00:00
if !caseSensitive {
char = unicode.ToLower(char)
2015-01-01 19:49:30 +00:00
}
if char != r {
return -1, -1
}
}
return trimmedLen - len(pattern), trimmedLen
}
2015-06-08 14:16:31 +00:00
2015-08-02 14:54:53 +00:00
// EqualMatch performs equal-match
func EqualMatch(caseSensitive bool, forward bool, runes []rune, pattern []rune) (int, int) {
if len(runes) != len(pattern) {
2015-06-08 14:16:31 +00:00
return -1, -1
}
runesStr := string(runes)
2015-06-08 14:16:31 +00:00
if !caseSensitive {
runesStr = strings.ToLower(runesStr)
}
if runesStr == string(pattern) {
return 0, len(pattern)
}
return -1, -1
}