mihomo/component/trie/domain.go

130 lines
2.5 KiB
Go
Raw Normal View History

2019-07-14 19:29:58 +08:00
package trie
import (
"errors"
"strings"
)
const (
wildcard = "*"
dotWildcard = ""
complexWildcard = "+"
domainStep = "."
2019-07-14 19:29:58 +08:00
)
2021-10-10 23:44:09 +08:00
// ErrInvalidDomain means insert domain is invalid
var ErrInvalidDomain = errors.New("invalid domain")
2019-07-14 19:29:58 +08:00
// DomainTrie contains the main logic for adding and searching nodes for domain segments.
2019-07-14 19:29:58 +08:00
// support wildcard domain (e.g *.google.com)
2022-04-06 04:25:53 +08:00
type DomainTrie[T comparable] struct {
root *Node[T]
2019-07-14 19:29:58 +08:00
}
func ValidAndSplitDomain(domain string) ([]string, bool) {
if domain != "" && domain[len(domain)-1] == '.' {
return nil, false
}
parts := strings.Split(domain, domainStep)
if len(parts) == 1 {
2020-06-07 17:25:51 +08:00
if parts[0] == "" {
return nil, false
}
return parts, true
}
for _, part := range parts[1:] {
if part == "" {
return nil, false
}
}
return parts, true
}
2019-07-14 19:29:58 +08:00
// Insert adds a node to the trie.
// Support
// 1. www.example.com
// 2. *.example.com
// 3. subdomain.*.example.com
// 4. .example.com
// 5. +.example.com
2022-04-06 04:25:53 +08:00
func (t *DomainTrie[T]) Insert(domain string, data T) error {
parts, valid := ValidAndSplitDomain(domain)
if !valid {
2019-07-14 19:29:58 +08:00
return ErrInvalidDomain
}
if parts[0] == complexWildcard {
t.insert(parts[1:], data)
parts[0] = dotWildcard
t.insert(parts, data)
} else {
t.insert(parts, data)
}
return nil
}
2022-04-06 04:25:53 +08:00
func (t *DomainTrie[T]) insert(parts []string, data T) {
2019-07-14 19:29:58 +08:00
node := t.root
// reverse storage domain part to save space
for i := len(parts) - 1; i >= 0; i-- {
part := parts[i]
if !node.hasChild(part) {
2022-04-06 04:25:53 +08:00
node.addChild(part, newNode(getZero[T]()))
2019-07-14 19:29:58 +08:00
}
node = node.getChild(part)
}
node.Data = data
}
// Search is the most important part of the Trie.
// Priority as:
// 1. static part
// 2. wildcard domain
// 2. dot wildcard domain
2022-04-06 04:25:53 +08:00
func (t *DomainTrie[T]) Search(domain string) *Node[T] {
parts, valid := ValidAndSplitDomain(domain)
if !valid || parts[0] == "" {
2019-07-14 19:29:58 +08:00
return nil
}
n := t.search(t.root, parts)
2019-07-14 19:29:58 +08:00
2022-04-06 04:25:53 +08:00
if n == nil || n.Data == getZero[T]() {
return nil
}
2019-07-14 19:29:58 +08:00
return n
}
2020-04-24 23:49:19 +08:00
2022-04-06 04:25:53 +08:00
func (t *DomainTrie[T]) search(node *Node[T], parts []string) *Node[T] {
if len(parts) == 0 {
return node
}
if c := node.getChild(parts[len(parts)-1]); c != nil {
2022-04-06 04:25:53 +08:00
if n := t.search(c, parts[:len(parts)-1]); n != nil && n.Data != getZero[T]() {
return n
2019-07-14 19:29:58 +08:00
}
}
2019-07-14 19:29:58 +08:00
if c := node.getChild(wildcard); c != nil {
2022-04-06 04:25:53 +08:00
if n := t.search(c, parts[:len(parts)-1]); n != nil && n.Data != getZero[T]() {
return n
}
2019-07-14 19:29:58 +08:00
}
2021-03-24 01:00:21 +08:00
return node.getChild(dotWildcard)
2019-07-14 19:29:58 +08:00
}
// New returns a new, empty Trie.
2022-04-06 04:25:53 +08:00
func New[T comparable]() *DomainTrie[T] {
return &DomainTrie[T]{root: newNode[T](getZero[T]())}
2019-07-14 19:29:58 +08:00
}