mirror of
https://github.com/ruby/ruby.git
synced 2022-11-09 12:17:21 -05:00
171803d5d3
At the moment, there are some problems with regard to bundler + did_you_mean because of did_you_mean being a bundled gem. Since the vendored version of thor inside bundler and ruby itself explicitly requires did_you_mean, it can become difficult to load it when using Bundler.setup. See this issue: https://github.com/yuki24/did_you_mean/issues/117#issuecomment-482733159 for more details.
46 lines
1.2 KiB
Ruby
46 lines
1.2 KiB
Ruby
# frozen-string-literal: true
|
|
|
|
require_relative "levenshtein"
|
|
require_relative "jaro_winkler"
|
|
|
|
module DidYouMean
  # Suggests dictionary entries that closely resemble a given input.
  #
  # Candidates are shortlisted by their JaroWinkler.distance score against the
  # input and then narrowed down using Levenshtein.distance. All comparisons
  # are performed on normalized (downcased, "@"-stripped) text, while the
  # returned values are the original dictionary entries.
  class SpellChecker
    # dictionary:: collection of candidate words. Each entry must respond to
    #              +to_s+ (e.g. Strings or Symbols) and the collection must
    #              respond to +select+ returning an Array.
    def initialize(dictionary:)
      @dictionary = dictionary
    end

    # Returns the dictionary entries that look like plausible corrections of
    # +input+, best JaroWinkler score first. Returns an empty Array when
    # nothing is close enough.
    #
    # input:: the possibly misspelled String or Symbol.
    def correct(input)
      # Keep the raw input around: it is needed to tell whether a dictionary
      # entry is literally the same word as the input (see reject! below).
      normalized_input = normalize(input)
      threshold = normalized_input.length > 3 ? 0.834 : 0.77

      words = @dictionary.select { |word| JaroWinkler.distance(normalize(word), normalized_input) >= threshold }

      # Never suggest the input itself. Compare the un-normalized forms so that
      # entries differing only by case or a leading "@" are still suggested,
      # and so that an entry such as :@foo is not offered for the input "@foo".
      words.reject! { |word| input.to_s == word.to_s }
      words.sort_by! { |word| JaroWinkler.distance(word.to_s, normalized_input) }
      words.reverse!

      # Correct mistypes: accept an edit distance of up to a quarter of the
      # input length (rounded up).
      threshold = (normalized_input.length * 0.25).ceil
      corrections = words.select { |c| Levenshtein.distance(normalize(c), normalized_input) <= threshold }

      # Correct misspells: if nothing passed the strict check, fall back to the
      # single best-ranked word whose edit distance is smaller than the shorter
      # of the two strings.
      if corrections.empty?
        corrections = words.select do |word|
          word = normalize(word)
          length = normalized_input.length < word.length ? normalized_input.length : word.length

          Levenshtein.distance(word, normalized_input) < length
        end.first(1)
      end

      corrections
    end

    private

    # Returns a new downcased String with every "@" removed.
    def normalize(str_or_symbol) #:nodoc:
      str = str_or_symbol.to_s.downcase
      # tr! with an empty replacement deletes the listed characters; downcase
      # returned a fresh String, so mutating it here is safe.
      str.tr!("@", "")
      str
    end
  end
end
|