You cannot select more than 25 topics
			Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
		
		
		
		
		
			
		
			
				
					
					
						
							64 lines
						
					
					
						
							2.2 KiB
						
					
					
				
			
		
		
	
	
							64 lines
						
					
					
						
							2.2 KiB
						
					
					
				| //  Copyright (c) 2018 Couchbase, Inc.
 | |
| //
 | |
| // Licensed under the Apache License, Version 2.0 (the "License");
 | |
| // you may not use this file except in compliance with the License.
 | |
| // You may obtain a copy of the License at
 | |
| //
 | |
| // 		http://www.apache.org/licenses/LICENSE-2.0
 | |
| //
 | |
| // Unless required by applicable law or agreed to in writing, software
 | |
| // distributed under the License is distributed on an "AS IS" BASIS,
 | |
| // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 | |
| // See the License for the specific language governing permissions and
 | |
| // limitations under the License.
 | |
| 
 | |
| package levenshtein2
 | |
| 
 | |
| import "fmt"
 | |
| 
 | |
// StateLimit caps the number of states a DFA is allowed to contain.
const StateLimit = 10000

// ErrTooManyStates is the error returned when building a Levenshtein
// automaton would require more than StateLimit states.
var ErrTooManyStates = fmt.Errorf("dfa contains more than %d states", StateLimit)
 | |
| 
 | |
| // LevenshteinAutomatonBuilder wraps a precomputed
 | |
| // datastructure that allows to produce small (but not minimal) DFA.
 | |
| type LevenshteinAutomatonBuilder struct {
 | |
| 	pDfa *ParametricDFA
 | |
| }
 | |
| 
 | |
| // NewLevenshteinAutomatonBuilder creates a
 | |
| // reusable, threadsafe Levenshtein automaton builder.
 | |
| // `maxDistance` - maximum distance considered by the automaton.
 | |
| // `transposition` - assign a distance of 1 for transposition
 | |
| //
 | |
| // Building this automaton builder is computationally intensive.
 | |
| // While it takes only a few milliseconds for `d=2`, it grows
 | |
| // exponentially with `d`. It is only reasonable to `d <= 5`.
 | |
| func NewLevenshteinAutomatonBuilder(maxDistance uint8,
 | |
| 	transposition bool) (*LevenshteinAutomatonBuilder, error) {
 | |
| 	lnfa := newLevenshtein(maxDistance, transposition)
 | |
| 
 | |
| 	pdfa, err := fromNfa(lnfa)
 | |
| 	if err != nil {
 | |
| 		return nil, err
 | |
| 	}
 | |
| 
 | |
| 	return &LevenshteinAutomatonBuilder{pDfa: pdfa}, nil
 | |
| }
 | |
| 
 | |
| // BuildDfa builds the levenshtein automaton for serving
 | |
| // queries with a given edit distance.
 | |
| func (lab *LevenshteinAutomatonBuilder) BuildDfa(query string,
 | |
| 	fuzziness uint8) (*DFA, error) {
 | |
| 	return lab.pDfa.buildDfa(query, fuzziness, false)
 | |
| }
 | |
| 
 | |
| // MaxDistance returns the MaxEdit distance supported by the
 | |
| // LevenshteinAutomatonBuilder builder.
 | |
| func (lab *LevenshteinAutomatonBuilder) MaxDistance() uint8 {
 | |
| 	return lab.pDfa.maxDistance
 | |
| }
 | |
| 
 |