Patch notes (free text ahead of the first "diff --git" header; patch tools skip it).

What this patch does:
  * Ebooks NLP `self.stopwords` stops reading File.join(DATA_PATH, 'stopwords.txt')
    and instead reads 'stopwords.txt' via a relative path, memoizing an empty
    array when that file is absent.
  * The stopwords comment drops the word "English".
  * The `set :word_pattern` line is changed (see the review note below).
  * data/stopwords.txt is renamed to skeleton/stopwords.txt with no content change.

Review notes:
  * The added line uses File.exist? rather than File.exists?. The plural form is
    deprecated and is no longer available in Ruby 3.2+; File.exist? behaves the
    same on older Rubies. Because the added line differs from the one originally
    recorded, the "index b65e162..f971f0c" hashes no longer describe the
    resulting blob.
  * NOTE(review): the removed and added `set :word_pattern` lines are identical
    as received and look truncated (text between a '<' and a '>' appears to have
    been lost in extraction). They are kept as found; restore both regexes from
    the repository before applying.
  * NOTE(review): the patch arrived with its line breaks and indentation
    collapsed. Line breaks were restored from the hunk line counts; the leading
    whitespace of hunk lines is assumed conventional two-space nesting and must
    be checked against the target file (or applied with whitespace ignored).

diff --git a/lib/twitter_ebooks/nlp.rb b/lib/twitter_ebooks/nlp.rb
index b65e162..f971f0c 100644
--- a/lib/twitter_ebooks/nlp.rb
+++ b/lib/twitter_ebooks/nlp.rb
@@ -14,10 +14,10 @@ module Ebooks
     # to be using it all of the time
 
     # Lazily loads an array of stopwords
-    # Stopwords are common English words that should often be ignored
+    # Stopwords are common words that should often be ignored
     # @return [Array]
     def self.stopwords
-      @stopwords ||= File.read(File.join(DATA_PATH, 'stopwords.txt')).split
+      @stopwords ||= File.exist?('stopwords.txt') ? File.read('stopwords.txt').split : []
     end
 
     # Lazily loads an array of known English nouns
@@ -99,7 +99,7 @@ module Ebooks
         #set :vowels, 1 # => default: 0 = not considered
         #set :consonants, 5 # => default: 0 = not considered
         #set :ignore_case, true # => default: false
-        set :word_pattern, /(? default: /\w+/
+        set :word_pattern, /(? default: /\w+/
         #set :stemming, true # => default: false
       end
 
diff --git a/data/stopwords.txt b/skeleton/stopwords.txt
similarity index 100%
rename from data/stopwords.txt
rename to skeleton/stopwords.txt