From 8f90ef69c4dd38d0e5d298af9f6d7f50b8376bc2 Mon Sep 17 00:00:00 2001 From: Romain Deveaud Date: Mon, 3 Jan 2011 16:43:37 +0100 Subject: [PATCH] calls to the count_words method of Document are no longer allowed --- lib/mirimiri/document.rb | 9 ++++----- 1 file changed, 4 insertions(+), 5 deletions(-) diff --git a/lib/mirimiri/document.rb b/lib/mirimiri/document.rb index ac7e4c9..bc16dd2 100644 --- a/lib/mirimiri/document.rb +++ b/lib/mirimiri/document.rb @@ -80,11 +80,9 @@ module Mirimiri # entropy("dillinger escape plan") #=> 0.265862076325102 def entropy(s) en = 0.0 - # TODO: count_words as an attribute? - counts = self.count_words s.split.each do |w| - p_wi = counts[w].to_f/@words.count.to_f + p_wi = @count_words[w].to_f/@words.count.to_f en += p_wi*Math.log2(p_wi) end @@ -96,16 +94,17 @@ module Mirimiri # # tf("guitar") #=> 0.000380372765310004 def tf(s) - self.count_words[s].to_f/@words.size.to_f + @count_words[s].to_f/@words.size.to_f end def initialize(content="") @doc_content = content @words = format_words + @count_words = count_words end - protected :format_words + protected :format_words, :count_words end # A WebDocument is a Document with a +url+. -- 1.8.2.3