diff --git a/doc/classes/RIR.html b/doc/classes/RIR.html
index e909f57..77d50d4 100644
--- a/doc/classes/RIR.html
+++ b/doc/classes/RIR.html
@@ -53,9 +53,9 @@
             <td>
 
 
-                <a href="../files/lib/rir/corpus_rb.html">
+                <a href="../files/lib/rir/ttagger_rb.html">
 
-                lib/rir/corpus.rb
+                lib/rir/ttagger.rb
 
                 </a>
 
@@ -73,9 +73,9 @@
         <br />
 
 
-                <a href="../files/lib/rir/string_rb.html">
+                <a href="../files/lib/rir/document_rb.html">
 
-                lib/rir/string.rb
+                lib/rir/document.rb
 
                 </a>
 
@@ -142,27 +142,7 @@ with this program. If not, see <<a
 href="http://www.gnu.org/licenses/">www.gnu.org/licenses/</a>>.
 </p>
 <hr size="1"></hr><p>
-This file is a part of an Information Retrieval oriented Ruby library
-</p>
-<p>
-Copyright (C) 2010-2011 Romain Deveaud <romain.deveaud@gmail.com>
-</p>
-<p>
-This program is free software: you can redistribute it and/or modify it
-under the terms of the GNU General Public License as published by the Free
-Software Foundation, either version 3 of the License, or (at your option)
-any later version.
-</p>
-<p>
-This program is distributed in the hope that it will be useful, but WITHOUT
-ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
-FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for
-more details.
-</p>
-<p>
-You should have received a copy of the GNU General Public License along
-with this program. If not, see <<a
-href="http://www.gnu.org/licenses/">www.gnu.org/licenses/</a>>.
+General module for many purposes related to Information Retrieval.
 </p>
 
     </div>
@@ -180,34 +160,14 @@ href="http://www.gnu.org/licenses/">www.gnu.org/licenses/</a>>.
       <h3 class="section-bar">Classes and Modules</h3>
 
       Module <a href="RIR/Indri.html" class="link">RIR::Indri</a><br />
-Class <a href="RIR/Corpus.html" class="link">RIR::Corpus</a><br />
+Module <a href="RIR/TreeTagger.html" class="link">RIR::TreeTagger</a><br />
+Class <a href="RIR/Document.html" class="link">RIR::Document</a><br />
 Class <a href="RIR/Query.html" class="link">RIR::Query</a><br />
+Class <a href="RIR/WebDocument.html" class="link">RIR::WebDocument</a><br />
+Class <a href="RIR/WikipediaPage.html" class="link">RIR::WikipediaPage</a><br />
 
     </div>
 
-    <div id="constants-list">
-      <h3 class="section-bar">Constants</h3>
-
-      <div class="name-list">
-        <table summary="Constants">
-
-        <tr class="top-aligned-row context-row">
-          <td class="context-item-name">Stoplist</td>
-          <td>=</td>
-          <td class="context-item-value">[   &quot;a&quot;, &quot;anything&quot;, &quot;anyway&quot;, &quot;anywhere&quot;, &quot;apart&quot;, &quot;are&quot;, &quot;around&quot;, &quot;as&quot;, &quot;at&quot;, &quot;av&quot;,   &quot;be&quot;, &quot;became&quot;, &quot;because&quot;, &quot;become&quot;, &quot;becomes&quot;, &quot;becoming&quot;, &quot;been&quot;, &quot;before&quot;, &quot;beforehand&quot;,   &quot;behind&quot;, &quot;being&quot;, &quot;below&quot;, &quot;beside&quot;, &quot;besides&quot;, &quot;between&quot;, &quot;beyond&quot;, &quot;both&quot;, &quot;but&quot;, &quot;by&quot;,   &quot;can&quot;, &quot;cannot&quot;, &quot;canst&quot;, &quot;certain&quot;, &quot;cf&quot;, &quot;choose&quot;, &quot;contrariwise&quot;, &quot;cos&quot;, &quot;could&quot;, &quot;cu&quot;,   &quot;day&quot;, &quot;do&quot;, &quot;does&quot;, &quot;doesn't&quot;, &quot;doing&quot;, &quot;dost&quot;, &quot;doth&quot;, &quot;double&quot;, &quot;down&quot;, &quot;dual&quot;, &quot;during&quot;,   &quot;each&quot;, &quot;either&quot;, &quot;else&quot;, &quot;elsewhere&quot;, &quot;enough&quot;, &quot;et&quot;, &quot;etc&quot;, &quot;even&quot;, &quot;ever&quot;, &quot;every&quot;,   &quot;everybody&quot;, &quot;everyone&quot;, &quot;everything&quot;, &quot;everywhere&quot;, &quot;except&quot;, &quot;excepted&quot;, &quot;excepting&quot;,   &quot;exception&quot;, &quot;exclude&quot;, &quot;excluding&quot;, &quot;exclusive&quot;, &quot;far&quot;, &quot;farther&quot;, &quot;farthest&quot;, &quot;few&quot;, &quot;ff&quot;,   &quot;first&quot;, &quot;for&quot;, &quot;formerly&quot;, &quot;forth&quot;, &quot;forward&quot;, &quot;from&quot;, &quot;front&quot;, &quot;further&quot;, &quot;furthermore&quot;,   &quot;furthest&quot;, &quot;get&quot;, &quot;go&quot;, &quot;had&quot;, &quot;halves&quot;, &quot;hardly&quot;, &quot;has&quot;, &quot;hast&quot;, &quot;hath&quot;, &quot;have&quot;, &quot;he&quot;,   &quot;hence&quot;, &quot;henceforth&quot;, &quot;her&quot;, 
&quot;here&quot;, &quot;hereabouts&quot;, &quot;hereafter&quot;, &quot;hereby&quot;, &quot;herein&quot;, &quot;hereto&quot;,   &quot;hereupon&quot;, &quot;hers&quot;, &quot;herself&quot;, &quot;him&quot;, &quot;himself&quot;, &quot;hindmost&quot;, &quot;his&quot;, &quot;hither&quot;, &quot;hitherto&quot;,   &quot;how&quot;, &quot;however&quot;, &quot;howsoever&quot;, &quot;i&quot;, &quot;ie&quot;, &quot;if&quot;, &quot;in&quot;, &quot;inasmuch&quot;, &quot;inc&quot;, &quot;include&quot;,   &quot;included&quot;, &quot;including&quot;, &quot;indeed&quot;, &quot;indoors&quot;, &quot;inside&quot;, &quot;insomuch&quot;, &quot;instead&quot;, &quot;into&quot;,   &quot;inward&quot;, &quot;inwards&quot;, &quot;is&quot;, &quot;it&quot;, &quot;its&quot;, &quot;itself&quot;, &quot;just&quot;, &quot;kind&quot;, &quot;kg&quot;, &quot;km&quot;, &quot;last&quot;,   &quot;latter&quot;, &quot;latterly&quot;, &quot;less&quot;, &quot;lest&quot;, &quot;let&quot;, &quot;like&quot;, &quot;little&quot;, &quot;ltd&quot;, &quot;many&quot;, &quot;may&quot;, &quot;maybe&quot;,   &quot;me&quot;, &quot;meantime&quot;, &quot;meanwhile&quot;, &quot;might&quot;, &quot;moreover&quot;, &quot;most&quot;, &quot;mostly&quot;, &quot;more&quot;, &quot;mr&quot;, &quot;mrs&quot;,   &quot;ms&quot;, &quot;much&quot;, &quot;must&quot;, &quot;my&quot;, &quot;myself&quot;, &quot;namely&quot;, &quot;need&quot;, &quot;neither&quot;, &quot;never&quot;, &quot;nevertheless&quot;,   &quot;next&quot;, &quot;no&quot;, &quot;nobody&quot;, &quot;none&quot;, &quot;nonetheless&quot;, &quot;noone&quot;, &quot;nope&quot;, &quot;nor&quot;, &quot;not&quot;, &quot;nothing&quot;,   &quot;notwithstanding&quot;, &quot;now&quot;, &quot;nowadays&quot;, &quot;nowhere&quot;, &quot;of&quot;, &quot;off&quot;, &quot;often&quot;, &quot;ok&quot;, &quot;on&quot;, &quot;once&quot;,   &quot;one&quot;, &quot;only&quot;, &quot;onto&quot;, &quot;or&quot;, &quot;other&quot;, &quot;others&quot;, &quot;otherwise&quot;, &quot;ought&quot;, 
&quot;our&quot;, &quot;ours&quot;,   &quot;ourselves&quot;, &quot;out&quot;, &quot;outside&quot;, &quot;over&quot;, &quot;own&quot;, &quot;per&quot;, &quot;perhaps&quot;, &quot;plenty&quot;, &quot;provide&quot;, &quot;quite&quot;,   &quot;rather&quot;, &quot;really&quot;, &quot;round&quot;, &quot;said&quot;, &quot;sake&quot;, &quot;same&quot;, &quot;sang&quot;, &quot;save&quot;, &quot;saw&quot;, &quot;see&quot;, &quot;seeing&quot;,   &quot;seem&quot;, &quot;seemed&quot;, &quot;seeming&quot;, &quot;seems&quot;, &quot;seen&quot;, &quot;seldom&quot;, &quot;selves&quot;, &quot;sent&quot;, &quot;several&quot;, &quot;shalt&quot;,   &quot;she&quot;, &quot;should&quot;, &quot;shown&quot;, &quot;sideways&quot;, &quot;since&quot;, &quot;slept&quot;, &quot;slew&quot;, &quot;slung&quot;, &quot;slunk&quot;, &quot;smote&quot;,   &quot;so&quot;, &quot;some&quot;, &quot;somebody&quot;, &quot;somehow&quot;, &quot;someone&quot;, &quot;something&quot;, &quot;sometime&quot;, &quot;sometimes&quot;,   &quot;somewhat&quot;, &quot;somewhere&quot;, &quot;spake&quot;, &quot;spat&quot;, &quot;spoke&quot;, &quot;spoken&quot;, &quot;sprang&quot;, &quot;sprung&quot;, &quot;stave&quot;,   &quot;staves&quot;, &quot;still&quot;, &quot;such&quot;, &quot;supposing&quot;, &quot;than&quot;, &quot;that&quot;, &quot;the&quot;, &quot;thee&quot;, &quot;their&quot;, &quot;them&quot;,   &quot;themselves&quot;, &quot;then&quot;, &quot;thence&quot;, &quot;thenceforth&quot;, &quot;there&quot;, &quot;thereabout&quot;, &quot;thereabouts&quot;,   &quot;thereafter&quot;, &quot;thereby&quot;, &quot;therefore&quot;, &quot;therein&quot;, &quot;thereof&quot;, &quot;thereon&quot;, &quot;thereto&quot;, &quot;thereupon&quot;,   &quot;these&quot;, &quot;they&quot;, &quot;this&quot;, &quot;those&quot;, &quot;thou&quot;, &quot;though&quot;, &quot;thrice&quot;, &quot;through&quot;, &quot;throughout&quot;, &quot;thru&quot;,   &quot;thus&quot;, &quot;thy&quot;, &quot;thyself&quot;, &quot;till&quot;, &quot;to&quot;, 
&quot;together&quot;, &quot;too&quot;, &quot;toward&quot;, &quot;towards&quot;, &quot;ugh&quot;,   &quot;unable&quot;, &quot;under&quot;, &quot;underneath&quot;, &quot;unless&quot;, &quot;unlike&quot;, &quot;until&quot;, &quot;up&quot;, &quot;upon&quot;, &quot;upward&quot;,   &quot;upwards&quot;, &quot;us&quot;, &quot;use&quot;, &quot;used&quot;, &quot;using&quot;, &quot;very&quot;, &quot;via&quot;, &quot;vs&quot;, &quot;want&quot;, &quot;was&quot;, &quot;we&quot;, &quot;week&quot;,   &quot;well&quot;, &quot;were&quot;, &quot;what&quot;, &quot;whatever&quot;, &quot;whatsoever&quot;, &quot;when&quot;, &quot;whence&quot;, &quot;whenever&quot;, &quot;whensoever&quot;,   &quot;where&quot;, &quot;whereabouts&quot;, &quot;whereafter&quot;, &quot;whereas&quot;, &quot;whereat&quot;, &quot;whereby&quot;, &quot;wherefore&quot;,   &quot;wherefrom&quot;, &quot;wherein&quot;, &quot;whereinto&quot;, &quot;whereof&quot;, &quot;whereon&quot;, &quot;wheresoever&quot;, &quot;whereto&quot;,   &quot;whereunto&quot;, &quot;whereupon&quot;, &quot;wherever&quot;, &quot;wherewith&quot;, &quot;whether&quot;, &quot;whew&quot;, &quot;which&quot;, &quot;whichever&quot;,   &quot;whichsoever&quot;, &quot;while&quot;, &quot;whilst&quot;, &quot;whither&quot;, &quot;who&quot;, &quot;whoa&quot;, &quot;whoever&quot;, &quot;whole&quot;, &quot;whom&quot;,   &quot;whomever&quot;, &quot;whomsoever&quot;, &quot;whose&quot;, &quot;whosoever&quot;, &quot;why&quot;, &quot;will&quot;, &quot;wilt&quot;, &quot;with&quot;, &quot;within&quot;,   &quot;without&quot;, &quot;worse&quot;, &quot;worst&quot;, &quot;would&quot;, &quot;wow&quot;, &quot;ye&quot;, &quot;yet&quot;, &quot;year&quot;, &quot;yippee&quot;, &quot;you&quot;, &quot;your&quot;,   &quot;yours&quot;, &quot;yourself&quot;, &quot;yourselves&quot;    ]</td>
-
-          <td>&nbsp;</td>
-          <td class="context-item-desc">
-These are the default stopwords provided by Lemur.
-
-</td>
-
-        </tr>
-
-        </table>
-      </div>
-    </div>
-
 
 
 
diff --git a/doc/classes/RIR/Document.html b/doc/classes/RIR/Document.html
index 8643cb5..00f66b4 100644
--- a/doc/classes/RIR/Document.html
+++ b/doc/classes/RIR/Document.html
@@ -99,15 +99,17 @@ from a string.
 
       <div class="name-list">
 
-        <a href="#M000021">count_words</a>&nbsp;&nbsp;
+        <a href="#M000010">count_words</a>&nbsp;&nbsp;
 
-        <a href="#M000022">entropy</a>&nbsp;&nbsp;
+        <a href="#M000011">entropy</a>&nbsp;&nbsp;
 
-        <a href="#M000019">format_words</a>&nbsp;&nbsp;
+        <a href="#M000008">format_words</a>&nbsp;&nbsp;
 
-        <a href="#M000023">new</a>&nbsp;&nbsp;
+        <a href="#M000013">new</a>&nbsp;&nbsp;
 
-        <a href="#M000020">ngrams</a>&nbsp;&nbsp;
+        <a href="#M000009">ngrams</a>&nbsp;&nbsp;
+
+        <a href="#M000012">tf</a>&nbsp;&nbsp;
 
       </div>
     </div>
@@ -154,13 +156,13 @@ from a string.
       <h3 class="section-bar">Public Class methods</h3>
 
 
-      <div id="method-M000023" class="method-detail">
-        <a name="M000023"></a>
+      <div id="method-M000013" class="method-detail">
+        <a name="M000013"></a>
 
         <div class="method-heading">
 
-          <a href="Document.src/M000023.html" target="Code" class="method-signature"
-            onclick="popupCode('Document.src/M000023.html');return false;">
+          <a href="Document.src/M000013.html" target="Code" class="method-signature"
+            onclick="popupCode('Document.src/M000013.html');return false;">
 
           <span class="method-name">new</span><span class="method-args">(content)</span>
 
@@ -177,13 +179,13 @@ from a string.
       <h3 class="section-bar">Public Instance methods</h3>
 
 
-      <div id="method-M000021" class="method-detail">
-        <a name="M000021"></a>
+      <div id="method-M000010" class="method-detail">
+        <a name="M000010"></a>
 
         <div class="method-heading">
 
-          <a href="Document.src/M000021.html" target="Code" class="method-signature"
-            onclick="popupCode('Document.src/M000021.html');return false;">
+          <a href="Document.src/M000010.html" target="Code" class="method-signature"
+            onclick="popupCode('Document.src/M000010.html');return false;">
 
           <span class="method-name">count_words</span><span class="method-args">()</span>
 
@@ -205,13 +207,13 @@ current <a href="Document.html">Document</a>.
       </div>
 
 
-      <div id="method-M000022" class="method-detail">
-        <a name="M000022"></a>
+      <div id="method-M000011" class="method-detail">
+        <a name="M000011"></a>
 
         <div class="method-heading">
 
-          <a href="Document.src/M000022.html" target="Code" class="method-signature"
-            onclick="popupCode('Document.src/M000022.html');return false;">
+          <a href="Document.src/M000011.html" target="Code" class="method-signature"
+            onclick="popupCode('Document.src/M000011.html');return false;">
 
           <span class="method-name">entropy</span><span class="method-args">(s)</span>
 
@@ -229,20 +231,21 @@ If the string parameter is composed of many words (i.e. tokens separated by
 whitespace(s)), it is considered as an ngram.
 </p>
 <pre>
-  entropy(&quot;guitar&quot;) #=&gt; 0.00389919463243839
+  entropy(&quot;guitar&quot;) #=&gt; 0.00432114812727959
+  entropy(&quot;dillinger escape plan&quot;) #=&gt; 0.265862076325102
 </pre>
 
         </div>
       </div>
 
 
-      <div id="method-M000020" class="method-detail">
-        <a name="M000020"></a>
+      <div id="method-M000009" class="method-detail">
+        <a name="M000009"></a>
 
         <div class="method-heading">
 
-          <a href="Document.src/M000020.html" target="Code" class="method-signature"
-            onclick="popupCode('Document.src/M000020.html');return false;">
+          <a href="Document.src/M000009.html" target="Code" class="method-signature"
+            onclick="popupCode('Document.src/M000009.html');return false;">
 
           <span class="method-name">ngrams</span><span class="method-args">(n)</span>
 
@@ -264,16 +267,43 @@ Returns an Array containing the <tt>n</tt>-grams (words) from the current
       </div>
 
 
+      <div id="method-M000012" class="method-detail">
+        <a name="M000012"></a>
+
+        <div class="method-heading">
+
+          <a href="Document.src/M000012.html" target="Code" class="method-signature"
+            onclick="popupCode('Document.src/M000012.html');return false;">
+
+          <span class="method-name">tf</span><span class="method-args">(s)</span>
+
+          </a>
+
+        </div>
+
+        <div class="method-description">
+
+          <p>
+Computes the term frequency of a given <b>word</b> <tt>s</tt>.
+</p>
+<pre>
+  tf(&quot;guitar&quot;) #=&gt; 0.000380372765310004
+</pre>
+
+        </div>
+      </div>
+
+
       <h3 class="section-bar">Protected Instance methods</h3>
 
 
-      <div id="method-M000019" class="method-detail">
-        <a name="M000019"></a>
+      <div id="method-M000008" class="method-detail">
+        <a name="M000008"></a>
 
         <div class="method-heading">
 
-          <a href="Document.src/M000019.html" target="Code" class="method-signature"
-            onclick="popupCode('Document.src/M000019.html');return false;">
+          <a href="Document.src/M000008.html" target="Code" class="method-signature"
+            onclick="popupCode('Document.src/M000008.html');return false;">
 
           <span class="method-name">format_words</span><span class="method-args">()</span>
 
diff --git a/doc/classes/RIR/Document.src/M000008.html b/doc/classes/RIR/Document.src/M000008.html
new file mode 100644
index 0000000..72c51f5
--- /dev/null
+++ b/doc/classes/RIR/Document.src/M000008.html
@@ -0,0 +1,23 @@
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Strict//EN"
+"http://www.w3.org/TR/xhtml1/DTD/xhtml1-strict.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+<head>
+  <title>format_words (RIR::Document)</title>
+  <meta http-equiv="Content-Type" content="text/html; charset=utf-8" />
+  <link rel="stylesheet" href="../../.././rdoc-style.css" type="text/css" media="screen" />
+</head>
+<body class="standalone-code">
+  <pre><span class="ruby-comment cmt"># File lib/rir/document.rb, line 31</span>
+    <span class="ruby-keyword kw">def</span> <span class="ruby-identifier">format_words</span>
+      <span class="ruby-identifier">wo</span> = []
+
+      <span class="ruby-ivar">@doc_content</span>.<span class="ruby-identifier">split</span>.<span class="ruby-identifier">each</span> <span class="ruby-keyword kw">do</span> <span class="ruby-operator">|</span><span class="ruby-identifier">w</span><span class="ruby-operator">|</span>
+        <span class="ruby-identifier">w</span>.<span class="ruby-identifier">split</span>(<span class="ruby-regexp re">/\W/</span>).<span class="ruby-identifier">each</span> <span class="ruby-keyword kw">do</span> <span class="ruby-operator">|</span><span class="ruby-identifier">sw</span><span class="ruby-operator">|</span> 
+          <span class="ruby-identifier">wo</span>.<span class="ruby-identifier">push</span>(<span class="ruby-identifier">sw</span>.<span class="ruby-identifier">downcase</span>) <span class="ruby-keyword kw">if</span> <span class="ruby-identifier">sw</span> <span class="ruby-operator">=~</span> <span class="ruby-regexp re">/[a-zA-Z]/</span> 
+        <span class="ruby-keyword kw">end</span>
+      <span class="ruby-keyword kw">end</span>
+      
+      <span class="ruby-identifier">wo</span>
+    <span class="ruby-keyword kw">end</span></pre>
+</body>
+</html>
diff --git a/doc/classes/RIR/Document.src/M000009.html b/doc/classes/RIR/Document.src/M000009.html
new file mode 100644
index 0000000..6257629
--- /dev/null
+++ b/doc/classes/RIR/Document.src/M000009.html
@@ -0,0 +1,26 @@
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Strict//EN"
+"http://www.w3.org/TR/xhtml1/DTD/xhtml1-strict.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+<head>
+  <title>ngrams (RIR::Document)</title>
+  <meta http-equiv="Content-Type" content="text/html; charset=utf-8" />
+  <link rel="stylesheet" href="../../.././rdoc-style.css" type="text/css" media="screen" />
+</head>
+<body class="standalone-code">
+  <pre><span class="ruby-comment cmt"># File lib/rir/document.rb, line 46</span>
+    <span class="ruby-keyword kw">def</span> <span class="ruby-identifier">ngrams</span>(<span class="ruby-identifier">n</span>)
+      <span class="ruby-identifier">window</span>       = []
+      <span class="ruby-identifier">ngrams_array</span> = []
+
+      <span class="ruby-ivar">@words</span>.<span class="ruby-identifier">each</span> <span class="ruby-keyword kw">do</span> <span class="ruby-operator">|</span><span class="ruby-identifier">w</span><span class="ruby-operator">|</span>
+        <span class="ruby-identifier">window</span>.<span class="ruby-identifier">push</span>(<span class="ruby-identifier">w</span>)
+        <span class="ruby-keyword kw">if</span> <span class="ruby-identifier">window</span>.<span class="ruby-identifier">size</span> <span class="ruby-operator">==</span> <span class="ruby-identifier">n</span>
+          <span class="ruby-identifier">ngrams_array</span>.<span class="ruby-identifier">push</span> <span class="ruby-identifier">window</span>.<span class="ruby-identifier">join</span>(<span class="ruby-value str">&quot; &quot;</span>)
+          <span class="ruby-identifier">window</span>.<span class="ruby-identifier">delete_at</span>(<span class="ruby-value">0</span>)
+        <span class="ruby-keyword kw">end</span>
+      <span class="ruby-keyword kw">end</span>
+
+      <span class="ruby-identifier">ngrams_array</span>.<span class="ruby-identifier">uniq</span>
+    <span class="ruby-keyword kw">end</span></pre>
+</body>
+</html>
diff --git a/doc/classes/RIR/Document.src/M000010.html b/doc/classes/RIR/Document.src/M000010.html
index 5056008..e8ddeec 100644
--- a/doc/classes/RIR/Document.src/M000010.html
+++ b/doc/classes/RIR/Document.src/M000010.html
@@ -2,22 +2,17 @@
 "http://www.w3.org/TR/xhtml1/DTD/xhtml1-strict.dtd">
 <html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
 <head>
-  <title>format_words (RIR::Document)</title>
+  <title>count_words (RIR::Document)</title>
   <meta http-equiv="Content-Type" content="text/html; charset=utf-8" />
   <link rel="stylesheet" href="../../.././rdoc-style.css" type="text/css" media="screen" />
 </head>
 <body class="standalone-code">
-  <pre><span class="ruby-comment cmt"># File lib/rir/document.rb, line 31</span>
-    <span class="ruby-keyword kw">def</span> <span class="ruby-identifier">format_words</span>
-      <span class="ruby-identifier">wo</span> = []
+  <pre><span class="ruby-comment cmt"># File lib/rir/document.rb, line 64</span>
+    <span class="ruby-keyword kw">def</span> <span class="ruby-identifier">count_words</span>
+      <span class="ruby-identifier">counts</span> = <span class="ruby-constant">Hash</span>.<span class="ruby-identifier">new</span> { <span class="ruby-operator">|</span><span class="ruby-identifier">h</span>,<span class="ruby-identifier">k</span><span class="ruby-operator">|</span> <span class="ruby-identifier">h</span>[<span class="ruby-identifier">k</span>] = <span class="ruby-value">0</span> }
+      <span class="ruby-ivar">@words</span>.<span class="ruby-identifier">each</span> { <span class="ruby-operator">|</span><span class="ruby-identifier">w</span><span class="ruby-operator">|</span> <span class="ruby-identifier">counts</span>[<span class="ruby-identifier">w</span>] <span class="ruby-operator">+=</span> <span class="ruby-value">1</span> }
 
-      <span class="ruby-ivar">@doc_content</span>.<span class="ruby-identifier">split</span>.<span class="ruby-identifier">each</span> <span class="ruby-keyword kw">do</span> <span class="ruby-operator">|</span><span class="ruby-identifier">w</span><span class="ruby-operator">|</span>
-        <span class="ruby-identifier">w</span>.<span class="ruby-identifier">split</span>(<span class="ruby-regexp re">/\W/</span>).<span class="ruby-identifier">each</span> <span class="ruby-keyword kw">do</span> <span class="ruby-operator">|</span><span class="ruby-identifier">sw</span><span class="ruby-operator">|</span> 
-          <span class="ruby-identifier">wo</span>.<span class="ruby-identifier">push</span>(<span class="ruby-identifier">sw</span>) <span class="ruby-keyword kw">if</span> <span class="ruby-identifier">sw</span> <span class="ruby-operator">=~</span> <span class="ruby-regexp re">/[a-zA-Z]/</span> 
-        <span class="ruby-keyword kw">end</span>
-      <span class="ruby-keyword kw">end</span>
-      
-      <span class="ruby-identifier">wo</span>
+      <span class="ruby-identifier">counts</span>
     <span class="ruby-keyword kw">end</span></pre>
 </body>
 </html>
diff --git a/doc/classes/RIR/Document.src/M000011.html b/doc/classes/RIR/Document.src/M000011.html
index 6257629..50f6db7 100644
--- a/doc/classes/RIR/Document.src/M000011.html
+++ b/doc/classes/RIR/Document.src/M000011.html
@@ -2,25 +2,23 @@
 "http://www.w3.org/TR/xhtml1/DTD/xhtml1-strict.dtd">
 <html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
 <head>
-  <title>ngrams (RIR::Document)</title>
+  <title>entropy (RIR::Document)</title>
   <meta http-equiv="Content-Type" content="text/html; charset=utf-8" />
   <link rel="stylesheet" href="../../.././rdoc-style.css" type="text/css" media="screen" />
 </head>
 <body class="standalone-code">
-  <pre><span class="ruby-comment cmt"># File lib/rir/document.rb, line 46</span>
-    <span class="ruby-keyword kw">def</span> <span class="ruby-identifier">ngrams</span>(<span class="ruby-identifier">n</span>)
-      <span class="ruby-identifier">window</span>       = []
-      <span class="ruby-identifier">ngrams_array</span> = []
+  <pre><span class="ruby-comment cmt"># File lib/rir/document.rb, line 78</span>
+    <span class="ruby-keyword kw">def</span> <span class="ruby-identifier">entropy</span>(<span class="ruby-identifier">s</span>)
+      <span class="ruby-identifier">en</span> = <span class="ruby-value">0</span><span class="ruby-value">.0</span>
+      <span class="ruby-identifier">counts</span> = <span class="ruby-keyword kw">self</span>.<span class="ruby-identifier">count_words</span>
 
-      <span class="ruby-ivar">@words</span>.<span class="ruby-identifier">each</span> <span class="ruby-keyword kw">do</span> <span class="ruby-operator">|</span><span class="ruby-identifier">w</span><span class="ruby-operator">|</span>
-        <span class="ruby-identifier">window</span>.<span class="ruby-identifier">push</span>(<span class="ruby-identifier">w</span>)
-        <span class="ruby-keyword kw">if</span> <span class="ruby-identifier">window</span>.<span class="ruby-identifier">size</span> <span class="ruby-operator">==</span> <span class="ruby-identifier">n</span>
-          <span class="ruby-identifier">ngrams_array</span>.<span class="ruby-identifier">push</span> <span class="ruby-identifier">window</span>.<span class="ruby-identifier">join</span>(<span class="ruby-value str">&quot; &quot;</span>)
-          <span class="ruby-identifier">window</span>.<span class="ruby-identifier">delete_at</span>(<span class="ruby-value">0</span>)
-        <span class="ruby-keyword kw">end</span>
+      <span class="ruby-identifier">s</span>.<span class="ruby-identifier">split</span>.<span class="ruby-identifier">each</span> <span class="ruby-keyword kw">do</span> <span class="ruby-operator">|</span><span class="ruby-identifier">w</span><span class="ruby-operator">|</span>
+        <span class="ruby-identifier">p_wi</span> = <span class="ruby-identifier">counts</span>[<span class="ruby-identifier">w</span>].<span class="ruby-identifier">to_f</span><span class="ruby-operator">/</span><span class="ruby-ivar">@words</span>.<span class="ruby-identifier">count</span>.<span class="ruby-identifier">to_f</span>
+        <span class="ruby-identifier">en</span> <span class="ruby-operator">+=</span> <span class="ruby-identifier">p_wi</span><span class="ruby-operator">*</span><span class="ruby-constant">Math</span>.<span class="ruby-identifier">log2</span>(<span class="ruby-identifier">p_wi</span>)
       <span class="ruby-keyword kw">end</span>
 
-      <span class="ruby-identifier">ngrams_array</span>.<span class="ruby-identifier">uniq</span>
+      <span class="ruby-identifier">en</span> <span class="ruby-operator">*=</span> <span class="ruby-value">-1</span>
+      <span class="ruby-identifier">en</span>
     <span class="ruby-keyword kw">end</span></pre>
 </body>
 </html>
diff --git a/doc/classes/RIR/Document.src/M000012.html b/doc/classes/RIR/Document.src/M000012.html
index 978234a..eb4436b 100644
--- a/doc/classes/RIR/Document.src/M000012.html
+++ b/doc/classes/RIR/Document.src/M000012.html
@@ -2,17 +2,14 @@
 "http://www.w3.org/TR/xhtml1/DTD/xhtml1-strict.dtd">
 <html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
 <head>
-  <title>count_words (RIR::Document)</title>
+  <title>tf (RIR::Document)</title>
   <meta http-equiv="Content-Type" content="text/html; charset=utf-8" />
   <link rel="stylesheet" href="../../.././rdoc-style.css" type="text/css" media="screen" />
 </head>
 <body class="standalone-code">
-  <pre><span class="ruby-comment cmt"># File lib/rir/document.rb, line 64</span>
-    <span class="ruby-keyword kw">def</span> <span class="ruby-identifier">count_words</span>
-      <span class="ruby-identifier">counts</span> = <span class="ruby-constant">Hash</span>.<span class="ruby-identifier">new</span> { <span class="ruby-operator">|</span><span class="ruby-identifier">h</span>,<span class="ruby-identifier">k</span><span class="ruby-operator">|</span> <span class="ruby-identifier">h</span>[<span class="ruby-identifier">k</span>] = <span class="ruby-value">0</span> }
-      <span class="ruby-ivar">@words</span>.<span class="ruby-identifier">each</span> { <span class="ruby-operator">|</span><span class="ruby-identifier">w</span><span class="ruby-operator">|</span> <span class="ruby-identifier">counts</span>[<span class="ruby-identifier">w</span>.<span class="ruby-identifier">downcase</span>] <span class="ruby-operator">+=</span> <span class="ruby-value">1</span> }
-
-      <span class="ruby-identifier">counts</span>
+  <pre><span class="ruby-comment cmt"># File lib/rir/document.rb, line 94</span>
+    <span class="ruby-keyword kw">def</span> <span class="ruby-identifier">tf</span>(<span class="ruby-identifier">s</span>)
+      <span class="ruby-keyword kw">self</span>.<span class="ruby-identifier">count_words</span>[<span class="ruby-identifier">s</span>].<span class="ruby-identifier">to_f</span><span class="ruby-operator">/</span><span class="ruby-ivar">@words</span>.<span class="ruby-identifier">size</span>.<span class="ruby-identifier">to_f</span>
     <span class="ruby-keyword kw">end</span></pre>
 </body>
 </html>
diff --git a/doc/classes/RIR/Document.src/M000013.html b/doc/classes/RIR/Document.src/M000013.html
index 5694971..1ef96d5 100644
--- a/doc/classes/RIR/Document.src/M000013.html
+++ b/doc/classes/RIR/Document.src/M000013.html
@@ -2,23 +2,15 @@
 "http://www.w3.org/TR/xhtml1/DTD/xhtml1-strict.dtd">
 <html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
 <head>
-  <title>entropy (RIR::Document)</title>
+  <title>new (RIR::Document)</title>
   <meta http-equiv="Content-Type" content="text/html; charset=utf-8" />
   <link rel="stylesheet" href="../../.././rdoc-style.css" type="text/css" media="screen" />
 </head>
 <body class="standalone-code">
-  <pre><span class="ruby-comment cmt"># File lib/rir/document.rb, line 77</span>
-    <span class="ruby-keyword kw">def</span> <span class="ruby-identifier">entropy</span>(<span class="ruby-identifier">s</span>)
-      <span class="ruby-identifier">en</span> = <span class="ruby-value">0</span><span class="ruby-value">.0</span>
-      <span class="ruby-identifier">counts</span> = <span class="ruby-keyword kw">self</span>.<span class="ruby-identifier">count_words</span>
-
-      <span class="ruby-identifier">s</span>.<span class="ruby-identifier">split</span>.<span class="ruby-identifier">each</span> <span class="ruby-keyword kw">do</span> <span class="ruby-operator">|</span><span class="ruby-identifier">w</span><span class="ruby-operator">|</span>
-        <span class="ruby-identifier">p_wi</span> = <span class="ruby-identifier">counts</span>[<span class="ruby-identifier">w</span>].<span class="ruby-identifier">to_f</span><span class="ruby-operator">/</span><span class="ruby-ivar">@words</span>.<span class="ruby-identifier">count</span>.<span class="ruby-identifier">to_f</span>
-        <span class="ruby-identifier">en</span> <span class="ruby-operator">+=</span> <span class="ruby-identifier">p_wi</span><span class="ruby-operator">*</span><span class="ruby-constant">Math</span>.<span class="ruby-identifier">log2</span>(<span class="ruby-identifier">p_wi</span>)
-      <span class="ruby-keyword kw">end</span>
-
-      <span class="ruby-identifier">en</span> <span class="ruby-operator">*=</span> <span class="ruby-value">-1</span>
-      <span class="ruby-identifier">en</span>
+  <pre><span class="ruby-comment cmt"># File lib/rir/document.rb, line 99</span>
+    <span class="ruby-keyword kw">def</span> <span class="ruby-identifier">initialize</span>(<span class="ruby-identifier">content</span>)
+      <span class="ruby-ivar">@doc_content</span> = <span class="ruby-identifier">content</span>
+      <span class="ruby-ivar">@words</span> = <span class="ruby-identifier">format_words</span>
     <span class="ruby-keyword kw">end</span></pre>
 </body>
 </html>
diff --git a/doc/classes/RIR/Indri/IndriQuery.html b/doc/classes/RIR/Indri/IndriQuery.html
index 5bd769e..922525d 100644
--- a/doc/classes/RIR/Indri/IndriQuery.html
+++ b/doc/classes/RIR/Indri/IndriQuery.html
@@ -95,9 +95,9 @@
 
       <div class="name-list">
 
-        <a href="#M000014">new</a>&nbsp;&nbsp;
+        <a href="#M000006">new</a>&nbsp;&nbsp;
 
-        <a href="#M000015">to_s</a>&nbsp;&nbsp;
+        <a href="#M000007">to_s</a>&nbsp;&nbsp;
 
       </div>
     </div>
@@ -160,13 +160,13 @@
       <h3 class="section-bar">Public Class methods</h3>
 
 
-      <div id="method-M000014" class="method-detail">
-        <a name="M000014"></a>
+      <div id="method-M000006" class="method-detail">
+        <a name="M000006"></a>
 
         <div class="method-heading">
 
-          <a href="IndriQuery.src/M000014.html" target="Code" class="method-signature"
-            onclick="popupCode('IndriQuery.src/M000014.html');return false;">
+          <a href="IndriQuery.src/M000006.html" target="Code" class="method-signature"
+            onclick="popupCode('IndriQuery.src/M000006.html');return false;">
 
           <span class="method-name">new</span><span class="method-args">(id,query,params)</span>
 
@@ -183,13 +183,13 @@
       <h3 class="section-bar">Public Instance methods</h3>
 
 
-      <div id="method-M000015" class="method-detail">
-        <a name="M000015"></a>
+      <div id="method-M000007" class="method-detail">
+        <a name="M000007"></a>
 
         <div class="method-heading">
 
-          <a href="IndriQuery.src/M000015.html" target="Code" class="method-signature"
-            onclick="popupCode('IndriQuery.src/M000015.html');return false;">
+          <a href="IndriQuery.src/M000007.html" target="Code" class="method-signature"
+            onclick="popupCode('IndriQuery.src/M000007.html');return false;">
 
           <span class="method-name">to_s</span><span class="method-args">()</span>
 
diff --git a/doc/classes/RIR/Indri/IndriQuery.src/M000006.html b/doc/classes/RIR/Indri/IndriQuery.src/M000006.html
new file mode 100644
index 0000000..c72d135
--- /dev/null
+++ b/doc/classes/RIR/Indri/IndriQuery.src/M000006.html
@@ -0,0 +1,22 @@
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Strict//EN"
+"http://www.w3.org/TR/xhtml1/DTD/xhtml1-strict.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+<head>
+  <title>new (RIR::Indri::IndriQuery)</title>
+  <meta http-equiv="Content-Type" content="text/html; charset=utf-8" />
+  <link rel="stylesheet" href="../../../.././rdoc-style.css" type="text/css" media="screen" />
+</head>
+<body class="standalone-code">
+  <pre><span class="ruby-comment cmt"># File lib/rir/query.rb, line 62</span>
+      <span class="ruby-keyword kw">def</span> <span class="ruby-identifier">initialize</span>(<span class="ruby-identifier">id</span>,<span class="ruby-identifier">query</span>,<span class="ruby-identifier">params</span>)
+        <span class="ruby-ivar">@params</span> = <span class="ruby-identifier">params</span>
+        <span class="ruby-comment cmt"># Here we set the default retrieval model as Language Modeling</span>
+        <span class="ruby-comment cmt"># with a Dirichlet smoothing at 2500.</span>
+        <span class="ruby-comment cmt"># TODO: maybe a Rule class...</span>
+        <span class="ruby-ivar">@params</span>.<span class="ruby-identifier">rule</span>  = <span class="ruby-value str">'method:dirichlet,mu:2500'</span> <span class="ruby-keyword kw">if</span> <span class="ruby-ivar">@params</span>.<span class="ruby-identifier">rule</span>.<span class="ruby-identifier">nil?</span>
+
+        <span class="ruby-ivar">@id</span>     = <span class="ruby-identifier">id</span>
+        <span class="ruby-ivar">@query</span>  = <span class="ruby-identifier">query</span>
+      <span class="ruby-keyword kw">end</span></pre>
+</body>
+</html>
diff --git a/doc/classes/RIR/Indri/IndriQuery.src/M000007.html b/doc/classes/RIR/Indri/IndriQuery.src/M000007.html
new file mode 100644
index 0000000..e237f9a
--- /dev/null
+++ b/doc/classes/RIR/Indri/IndriQuery.src/M000007.html
@@ -0,0 +1,22 @@
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Strict//EN"
+"http://www.w3.org/TR/xhtml1/DTD/xhtml1-strict.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+<head>
+  <title>to_s (RIR::Indri::IndriQuery)</title>
+  <meta http-equiv="Content-Type" content="text/html; charset=utf-8" />
+  <link rel="stylesheet" href="../../../.././rdoc-style.css" type="text/css" media="screen" />
+</head>
+<body class="standalone-code">
+  <pre><span class="ruby-comment cmt"># File lib/rir/query.rb, line 73</span>
+      <span class="ruby-keyword kw">def</span> <span class="ruby-identifier">to_s</span>
+        <span class="ruby-identifier">h</span> = <span class="ruby-ivar">@params</span>.<span class="ruby-identifier">to_s</span>
+        <span class="ruby-identifier">h</span> <span class="ruby-operator">+=</span> <span class="ruby-value str">&quot;&lt;query&gt;\n&quot;</span>
+        <span class="ruby-identifier">h</span> <span class="ruby-operator">+=</span> <span class="ruby-node">&quot;&lt;number&gt;#{@id}&lt;/number&gt;\n&quot;</span>
+        <span class="ruby-identifier">h</span> <span class="ruby-operator">+=</span> <span class="ruby-node">&quot;&lt;text&gt;#{@query}&lt;/text&gt;\n&quot;</span>
+        <span class="ruby-identifier">h</span> <span class="ruby-operator">+=</span> <span class="ruby-value str">&quot;&lt;/query&gt;\n&quot;</span>
+        <span class="ruby-identifier">h</span> <span class="ruby-operator">+=</span> <span class="ruby-value str">&quot;&lt;/parameters&gt;&quot;</span>
+
+        <span class="ruby-identifier">h</span>
+      <span class="ruby-keyword kw">end</span></pre>
+</body>
+</html>
diff --git a/doc/classes/RIR/Indri/Parameters.html b/doc/classes/RIR/Indri/Parameters.html
index 686469e..28e11cb 100644
--- a/doc/classes/RIR/Indri/Parameters.html
+++ b/doc/classes/RIR/Indri/Parameters.html
@@ -91,9 +91,9 @@
 
       <div class="name-list">
 
-        <a href="#M000012">new</a>&nbsp;&nbsp;
+        <a href="#M000004">new</a>&nbsp;&nbsp;
 
-        <a href="#M000013">to_s</a>&nbsp;&nbsp;
+        <a href="#M000005">to_s</a>&nbsp;&nbsp;
 
       </div>
     </div>
@@ -121,7 +121,7 @@
         </tr>
 
         <tr class="top-aligned-row context-row">
-          <td class="context-item-name">corpus</td>
+          <td class="context-item-name">count</td>
 
           <td class="context-item-value">&nbsp;[RW]&nbsp;</td>
 
@@ -129,7 +129,7 @@
         </tr>
 
         <tr class="top-aligned-row context-row">
-          <td class="context-item-name">count</td>
+          <td class="context-item-name">index_path</td>
 
           <td class="context-item-value">&nbsp;[RW]&nbsp;</td>
 
@@ -196,13 +196,13 @@
       <h3 class="section-bar">Public Class methods</h3>
 
 
-      <div id="method-M000012" class="method-detail">
-        <a name="M000012"></a>
+      <div id="method-M000004" class="method-detail">
+        <a name="M000004"></a>
 
         <div class="method-heading">
 
-          <a href="Parameters.src/M000012.html" target="Code" class="method-signature"
-            onclick="popupCode('Parameters.src/M000012.html');return false;">
+          <a href="Parameters.src/M000004.html" target="Code" class="method-signature"
+            onclick="popupCode('Parameters.src/M000004.html');return false;">
 
           <span class="method-name">new</span><span class="method-args">(corpus,mem=&quot;1g&quot;,count=&quot;1000&quot;,offset=&quot;1&quot;,run_id=&quot;default&quot;,print_query=false,print_docs=false)</span>
 
@@ -219,13 +219,13 @@
       <h3 class="section-bar">Public Instance methods</h3>
 
 
-      <div id="method-M000013" class="method-detail">
-        <a name="M000013"></a>
+      <div id="method-M000005" class="method-detail">
+        <a name="M000005"></a>
 
         <div class="method-heading">
 
-          <a href="Parameters.src/M000013.html" target="Code" class="method-signature"
-            onclick="popupCode('Parameters.src/M000013.html');return false;">
+          <a href="Parameters.src/M000005.html" target="Code" class="method-signature"
+            onclick="popupCode('Parameters.src/M000005.html');return false;">
 
           <span class="method-name">to_s</span><span class="method-args">()</span>
 
diff --git a/doc/classes/RIR/Indri/Parameters.src/M000004.html b/doc/classes/RIR/Indri/Parameters.src/M000004.html
new file mode 100644
index 0000000..a5d26e0
--- /dev/null
+++ b/doc/classes/RIR/Indri/Parameters.src/M000004.html
@@ -0,0 +1,21 @@
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Strict//EN"
+"http://www.w3.org/TR/xhtml1/DTD/xhtml1-strict.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+<head>
+  <title>new (RIR::Indri::Parameters)</title>
+  <meta http-equiv="Content-Type" content="text/html; charset=utf-8" />
+  <link rel="stylesheet" href="../../../.././rdoc-style.css" type="text/css" media="screen" />
+</head>
+<body class="standalone-code">
+  <pre><span class="ruby-comment cmt"># File lib/rir/query.rb, line 30</span>
+      <span class="ruby-keyword kw">def</span> <span class="ruby-identifier">initialize</span>(<span class="ruby-identifier">corpus</span>,<span class="ruby-identifier">mem</span>=<span class="ruby-value str">&quot;1g&quot;</span>,<span class="ruby-identifier">count</span>=<span class="ruby-value str">&quot;1000&quot;</span>,<span class="ruby-identifier">offset</span>=<span class="ruby-value str">&quot;1&quot;</span>,<span class="ruby-identifier">run_id</span>=<span class="ruby-value str">&quot;default&quot;</span>,<span class="ruby-identifier">print_query</span>=<span class="ruby-keyword kw">false</span>,<span class="ruby-identifier">print_docs</span>=<span class="ruby-keyword kw">false</span>)
+        <span class="ruby-ivar">@index_path</span>  = <span class="ruby-identifier">corpus</span>
+        <span class="ruby-ivar">@memory</span>      = <span class="ruby-identifier">mem</span>
+        <span class="ruby-ivar">@count</span>       = <span class="ruby-identifier">count</span>
+        <span class="ruby-ivar">@offset</span>      = <span class="ruby-identifier">offset</span>
+        <span class="ruby-ivar">@run_id</span>      = <span class="ruby-identifier">run_id</span>
+        <span class="ruby-ivar">@print_query</span> = <span class="ruby-identifier">print_query</span> <span class="ruby-value">? </span><span class="ruby-value str">&quot;true&quot;</span> <span class="ruby-operator">:</span> <span class="ruby-value str">&quot;false&quot;</span>
+        <span class="ruby-ivar">@print_docs</span>  = <span class="ruby-identifier">print_docs</span>  <span class="ruby-value">? </span><span class="ruby-value str">&quot;true&quot;</span> <span class="ruby-operator">:</span> <span class="ruby-value str">&quot;false&quot;</span>
+      <span class="ruby-keyword kw">end</span></pre>
+</body>
+</html>
diff --git a/doc/classes/RIR/Indri/Parameters.src/M000005.html b/doc/classes/RIR/Indri/Parameters.src/M000005.html
new file mode 100644
index 0000000..3a235ca
--- /dev/null
+++ b/doc/classes/RIR/Indri/Parameters.src/M000005.html
@@ -0,0 +1,29 @@
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Strict//EN"
+"http://www.w3.org/TR/xhtml1/DTD/xhtml1-strict.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+<head>
+  <title>to_s (RIR::Indri::Parameters)</title>
+  <meta http-equiv="Content-Type" content="text/html; charset=utf-8" />
+  <link rel="stylesheet" href="../../../.././rdoc-style.css" type="text/css" media="screen" />
+</head>
+<body class="standalone-code">
+  <pre><span class="ruby-comment cmt"># File lib/rir/query.rb, line 40</span>
+      <span class="ruby-keyword kw">def</span> <span class="ruby-identifier">to_s</span>
+        <span class="ruby-identifier">h</span> = <span class="ruby-value str">&quot;&lt;parameters&gt;\n&quot;</span>
+        <span class="ruby-identifier">h</span> <span class="ruby-operator">+=</span> <span class="ruby-node">&quot;&lt;memory&gt;#{@memory}&lt;/memory&gt;\n&quot;</span>
+        <span class="ruby-identifier">h</span> <span class="ruby-operator">+=</span> <span class="ruby-node">&quot;&lt;index&gt;#{@index_path}&lt;/index&gt;\n&quot;</span>
+        <span class="ruby-identifier">h</span> <span class="ruby-operator">+=</span> <span class="ruby-node">&quot;&lt;count&gt;#{@count}&lt;/count&gt;\n&quot;</span>
+        <span class="ruby-keyword kw">unless</span> <span class="ruby-ivar">@baseline</span>.<span class="ruby-identifier">nil?</span>
+          <span class="ruby-identifier">h</span> <span class="ruby-operator">+=</span> <span class="ruby-node">&quot;&lt;baseline&gt;#{@baseline}&lt;/baseline&gt;\n&quot;</span> 
+        <span class="ruby-keyword kw">else</span>
+          <span class="ruby-identifier">h</span> <span class="ruby-operator">+=</span> <span class="ruby-node">&quot;&lt;rule&gt;#{@rule}&lt;/rule&gt;\n&quot;</span>
+        <span class="ruby-keyword kw">end</span>
+        <span class="ruby-identifier">h</span> <span class="ruby-operator">+=</span> <span class="ruby-node">&quot;&lt;queryOffset&gt;#{@offset}&lt;/queryOffset&gt;\n&quot;</span>
+        <span class="ruby-identifier">h</span> <span class="ruby-operator">+=</span> <span class="ruby-node">&quot;&lt;runID&gt;#{@run_id}&lt;/runID&gt;\n&quot;</span>
+        <span class="ruby-identifier">h</span> <span class="ruby-operator">+=</span> <span class="ruby-node">&quot;&lt;printQuery&gt;#{@print_query}&lt;/printQuery&gt;\n&quot;</span>
+        <span class="ruby-identifier">h</span> <span class="ruby-operator">+=</span> <span class="ruby-node">&quot;&lt;printDocuments&gt;#{@print_docs}&lt;/printDocuments&gt;\n&quot;</span>
+
+        <span class="ruby-identifier">h</span>
+      <span class="ruby-keyword kw">end</span></pre>
+</body>
+</html>
diff --git a/doc/classes/RIR/TreeTagger.html b/doc/classes/RIR/TreeTagger.html
new file mode 100644
index 0000000..a46f3bd
--- /dev/null
+++ b/doc/classes/RIR/TreeTagger.html
@@ -0,0 +1,123 @@
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Strict//EN"
+"http://www.w3.org/TR/xhtml1/DTD/xhtml1-strict.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+<head>
+  <title>Module: RIR::TreeTagger [RDoc Documentation]</title>
+  <meta http-equiv="Content-Type" content="text/html; charset=utf-8" />
+  <meta http-equiv="Content-Script-Type" content="text/javascript" />
+  <link rel="stylesheet" href="../.././rdoc-style.css" type="text/css" media="screen" />
+  <script type="text/javascript">
+  // <![CDATA[
+
+  function popupCode( url ) {
+    window.open(url, "Code", "resizable=yes,scrollbars=yes,toolbar=no,status=no,height=150,width=400")
+  }
+
+  function toggleCode( id ) {
+    if ( document.getElementById )
+      elem = document.getElementById( id );
+    else if ( document.all )
+      elem = eval( "document.all." + id );
+    else
+      return false;
+
+    elemStyle = elem.style;
+
+    if ( elemStyle.display != "block" ) {
+      elemStyle.display = "block"
+    } else {
+      elemStyle.display = "none"
+    }
+
+    return true;
+  }
+
+  // Make codeblocks hidden by default
+  document.writeln( "<style type=\"text/css\">div.method-source-code { display: none }<\/style>" )
+
+  // ]]>
+  </script>
+
+</head>
+<body>
+
+
+    <div id="classHeader">
+        <table class="header-table">
+        <tr class="top-aligned-row">
+          <td><strong>Module</strong></td>
+          <td class="class-name-in-header">RIR::TreeTagger</td>
+        </tr>
+        <tr class="top-aligned-row">
+            <td><strong>In:</strong></td>
+            <td>
+
+
+                <a href="../../files/lib/rir/ttagger_rb.html">
+
+                lib/rir/ttagger.rb
+
+                </a>
+
+
+        <br />
+
+            </td>
+        </tr>
+
+
+        </table>
+    </div>
+  <!-- banner header -->
+
+  <div id="bodyContent">
+
+  <div id="contextContent">
+
+    <div id="description">
+      <p>
+TreeTagger-related stuff module.
+</p>
+<p>
+See <a
+href="http://www.ims.uni-stuttgart.de/projekte/corplex/TreeTagger/DecisionTreeTagger.html">www.ims.uni-stuttgart.de/projekte/corplex/TreeTagger/DecisionTreeTagger.html</a>
+</p>
+
+    </div>
+
+   </div>
+
+
+  </div>
+
+    <!-- if includes -->
+
+    <div id="section">
+
+    <div id="class-list">
+      <h3 class="section-bar">Classes and Modules</h3>
+
+      Class <a href="TreeTagger/Chunk.html" class="link">RIR::TreeTagger::Chunk</a><br />
+Class <a href="TreeTagger/TaggerChunker.html" class="link">RIR::TreeTagger::TaggerChunker</a><br />
+Class <a href="TreeTagger/TaggerChunkerEnglish.html" class="link">RIR::TreeTagger::TaggerChunkerEnglish</a><br />
+Class <a href="TreeTagger/TaggerChunkerFrench.html" class="link">RIR::TreeTagger::TaggerChunkerFrench</a><br />
+Class <a href="TreeTagger/TaggerChunkerGerman.html" class="link">RIR::TreeTagger::TaggerChunkerGerman</a><br />
+
+    </div>
+
+
+
+
+    <!-- if method_list -->
+
+
+
+
+  </div>
+
+<div id="validator-badges">
+  <p><small><a href="http://validator.w3.org/check/referer">[Validate]</a></small></p>
+</div>
+
+</body>
+</html>
diff --git a/doc/classes/RIR/TreeTagger/Chunk.html b/doc/classes/RIR/TreeTagger/Chunk.html
new file mode 100644
index 0000000..95f4e8c
--- /dev/null
+++ b/doc/classes/RIR/TreeTagger/Chunk.html
@@ -0,0 +1,187 @@
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Strict//EN"
+"http://www.w3.org/TR/xhtml1/DTD/xhtml1-strict.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+<head>
+  <title>Class: RIR::TreeTagger::Chunk [RDoc Documentation]</title>
+  <meta http-equiv="Content-Type" content="text/html; charset=utf-8" />
+  <meta http-equiv="Content-Script-Type" content="text/javascript" />
+  <link rel="stylesheet" href="../../.././rdoc-style.css" type="text/css" media="screen" />
+  <script type="text/javascript">
+  // <![CDATA[
+
+  function popupCode( url ) {
+    window.open(url, "Code", "resizable=yes,scrollbars=yes,toolbar=no,status=no,height=150,width=400")
+  }
+
+  function toggleCode( id ) {
+    if ( document.getElementById )
+      elem = document.getElementById( id );
+    else if ( document.all )
+      elem = eval( "document.all." + id );
+    else
+      return false;
+
+    elemStyle = elem.style;
+
+    if ( elemStyle.display != "block" ) {
+      elemStyle.display = "block"
+    } else {
+      elemStyle.display = "none"
+    }
+
+    return true;
+  }
+
+  // Make codeblocks hidden by default
+  document.writeln( "<style type=\"text/css\">div.method-source-code { display: none }<\/style>" )
+
+  // ]]>
+  </script>
+
+</head>
+<body>
+
+
+    <div id="classHeader">
+        <table class="header-table">
+        <tr class="top-aligned-row">
+          <td><strong>Class</strong></td>
+          <td class="class-name-in-header">RIR::TreeTagger::Chunk</td>
+        </tr>
+        <tr class="top-aligned-row">
+            <td><strong>In:</strong></td>
+            <td>
+
+
+                <a href="../../../files/lib/rir/ttagger_rb.html">
+
+                lib/rir/ttagger.rb
+
+                </a>
+
+
+        <br />
+
+            </td>
+        </tr>
+
+
+        <tr class="top-aligned-row">
+            <td><strong>Parent:</strong></td>
+            <td>
+
+                Object
+
+            </td>
+        </tr>
+
+        </table>
+    </div>
+  <!-- banner header -->
+
+  <div id="bodyContent">
+
+  <div id="contextContent">
+
+    <div id="description">
+      <p>
+Represents a <a href="Chunk.html">Chunk</a> extracted when parsing a <a
+href="TaggerChunker.html">TaggerChunker</a> file.
+</p>
+
+    </div>
+
+   </div>
+
+
+    <div id="method-list">
+      <h3 class="section-bar">Methods</h3>
+
+      <div class="name-list">
+
+        <a href="#M000003">new</a>&nbsp;&nbsp;
+
+      </div>
+    </div>
+
+  </div>
+
+    <!-- if includes -->
+
+    <div id="section">
+
+
+
+    <div id="attribute-list">
+      <h3 class="section-bar">Attributes</h3>
+
+      <div class="name-list">
+        <table>
+
+        <tr class="top-aligned-row context-row">
+          <td class="context-item-name">tag</td>
+
+          <td class="context-item-value">&nbsp;[R]&nbsp;</td>
+
+          <td class="context-item-desc"></td>
+        </tr>
+
+        <tr class="top-aligned-row context-row">
+          <td class="context-item-name">words</td>
+
+          <td class="context-item-value">&nbsp;[R]&nbsp;</td>
+
+          <td class="context-item-desc"></td>
+        </tr>
+
+        </table>
+      </div>
+    </div>
+
+
+    <!-- if method_list -->
+
+    <div id="methods">
+
+      <h3 class="section-bar">Public Class methods</h3>
+
+
+      <div id="method-M000003" class="method-detail">
+        <a name="M000003"></a>
+
+        <div class="method-heading">
+
+          <a href="Chunk.src/M000003.html" target="Code" class="method-signature"
+            onclick="popupCode('Chunk.src/M000003.html');return false;">
+
+          <span class="method-name">new</span><span class="method-args">(str,tag)</span>
+
+          </a>
+
+        </div>
+
+        <div class="method-description">
+
+          <p>
+<tt>str</tt> are whitespace-separated terms. <tt>tag</tt> see : <a
+href="ftp://ftp.ims.uni-stuttgart.de/pub/corpora/chunker-tagset-english.txt">ftp.ims.uni-stuttgart.de/pub/corpora/chunker-tagset-english.txt</a>
+</p>
+
+        </div>
+      </div>
+
+
+
+    </div>
+
+
+
+
+  </div>
+
+<div id="validator-badges">
+  <p><small><a href="http://validator.w3.org/check/referer">[Validate]</a></small></p>
+</div>
+
+</body>
+</html>
diff --git a/doc/classes/RIR/TreeTagger/Chunk.src/M000003.html b/doc/classes/RIR/TreeTagger/Chunk.src/M000003.html
new file mode 100644
index 0000000..239dc5a
--- /dev/null
+++ b/doc/classes/RIR/TreeTagger/Chunk.src/M000003.html
@@ -0,0 +1,16 @@
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Strict//EN"
+"http://www.w3.org/TR/xhtml1/DTD/xhtml1-strict.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+<head>
+  <title>new (RIR::TreeTagger::Chunk)</title>
+  <meta http-equiv="Content-Type" content="text/html; charset=utf-8" />
+  <link rel="stylesheet" href="../../../.././rdoc-style.css" type="text/css" media="screen" />
+</head>
+<body class="standalone-code">
+  <pre><span class="ruby-comment cmt"># File lib/rir/ttagger.rb, line 86</span>
+      <span class="ruby-keyword kw">def</span> <span class="ruby-identifier">initialize</span> <span class="ruby-identifier">str</span>,<span class="ruby-identifier">tag</span>
+        <span class="ruby-ivar">@words</span> = <span class="ruby-identifier">str</span>.<span class="ruby-identifier">split</span>
+        <span class="ruby-ivar">@tag</span>   = <span class="ruby-identifier">tag</span>[<span class="ruby-value">1</span><span class="ruby-operator">..</span><span class="ruby-value">-2</span>]
+      <span class="ruby-keyword kw">end</span></pre>
+</body>
+</html>
diff --git a/doc/classes/RIR/TreeTagger/TaggerChunker.html b/doc/classes/RIR/TreeTagger/TaggerChunker.html
new file mode 100644
index 0000000..57ae1ae
--- /dev/null
+++ b/doc/classes/RIR/TreeTagger/TaggerChunker.html
@@ -0,0 +1,216 @@
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Strict//EN"
+"http://www.w3.org/TR/xhtml1/DTD/xhtml1-strict.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+<head>
+  <title>Class: RIR::TreeTagger::TaggerChunker [RDoc Documentation]</title>
+  <meta http-equiv="Content-Type" content="text/html; charset=utf-8" />
+  <meta http-equiv="Content-Script-Type" content="text/javascript" />
+  <link rel="stylesheet" href="../../.././rdoc-style.css" type="text/css" media="screen" />
+  <script type="text/javascript">
+  // <![CDATA[
+
+  function popupCode( url ) {
+    window.open(url, "Code", "resizable=yes,scrollbars=yes,toolbar=no,status=no,height=150,width=400")
+  }
+
+  function toggleCode( id ) {
+    if ( document.getElementById )
+      elem = document.getElementById( id );
+    else if ( document.all )
+      elem = eval( "document.all." + id );
+    else
+      return false;
+
+    elemStyle = elem.style;
+
+    if ( elemStyle.display != "block" ) {
+      elemStyle.display = "block"
+    } else {
+      elemStyle.display = "none"
+    }
+
+    return true;
+  }
+
+  // Make codeblocks hidden by default
+  document.writeln( "<style type=\"text/css\">div.method-source-code { display: none }<\/style>" )
+
+  // ]]>
+  </script>
+
+</head>
+<body>
+
+
+    <div id="classHeader">
+        <table class="header-table">
+        <tr class="top-aligned-row">
+          <td><strong>Class</strong></td>
+          <td class="class-name-in-header">RIR::TreeTagger::TaggerChunker</td>
+        </tr>
+        <tr class="top-aligned-row">
+            <td><strong>In:</strong></td>
+            <td>
+
+
+                <a href="../../../files/lib/rir/ttagger_rb.html">
+
+                lib/rir/ttagger.rb
+
+                </a>
+
+
+        <br />
+
+            </td>
+        </tr>
+
+
+        <tr class="top-aligned-row">
+            <td><strong>Parent:</strong></td>
+            <td>
+
+                Object
+
+            </td>
+        </tr>
+
+        </table>
+    </div>
+  <!-- banner header -->
+
+  <div id="bodyContent">
+
+  <div id="contextContent">
+
+    <div id="description">
+      <p>
+This class handles generic parsing of tagger-chunker outputs.
+</p>
+
+    </div>
+
+   </div>
+
+
+    <div id="method-list">
+      <h3 class="section-bar">Methods</h3>
+
+      <div class="name-list">
+
+        <a href="#M000002">new</a>&nbsp;&nbsp;
+
+        <a href="#M000001">parse</a>&nbsp;&nbsp;
+
+      </div>
+    </div>
+
+  </div>
+
+    <!-- if includes -->
+
+    <div id="section">
+
+
+
+    <div id="attribute-list">
+      <h3 class="section-bar">Attributes</h3>
+
+      <div class="name-list">
+        <table>
+
+        <tr class="top-aligned-row context-row">
+          <td class="context-item-name">chunks</td>
+
+          <td class="context-item-value">&nbsp;[R]&nbsp;</td>
+
+          <td class="context-item-desc"></td>
+        </tr>
+
+        <tr class="top-aligned-row context-row">
+          <td class="context-item-name">file</td>
+
+          <td class="context-item-value">&nbsp;[R]&nbsp;</td>
+
+          <td class="context-item-desc"></td>
+        </tr>
+
+        </table>
+      </div>
+    </div>
+
+
+    <!-- if method_list -->
+
+    <div id="methods">
+
+      <h3 class="section-bar">Public Class methods</h3>
+
+
+      <div id="method-M000002" class="method-detail">
+        <a name="M000002"></a>
+
+        <div class="method-heading">
+
+          <a href="TaggerChunker.src/M000002.html" target="Code" class="method-signature"
+            onclick="popupCode('TaggerChunker.src/M000002.html');return false;">
+
+          <span class="method-name">new</span><span class="method-args">(chunk_file)</span>
+
+          </a>
+
+        </div>
+
+        <div class="method-description">
+
+          <p>
+Initializes parsing. <tt>chunk_file</tt> is the output of
+<tt>tagger-chunker-</tt> and must be a valid path to the file.
+</p>
+<pre>
+  TaggerChunker.new(&quot;ttout/2010020&quot;) #=&gt; #&lt;RIR::TreeTagger::TaggerChunker:0x92fd088 @chunks=[#&lt;RIR::TreeTagger::Chunk:0x8ec5a10 @words=[&quot;robert&quot;, &quot;schumann&quot;], @tag=&quot;NC&quot;&gt;, ...] ...&gt;
+</pre>
+
+        </div>
+      </div>
+
+
+      <div id="method-M000001" class="method-detail">
+        <a name="M000001"></a>
+
+        <div class="method-heading">
+
+          <a href="TaggerChunker.src/M000001.html" target="Code" class="method-signature"
+            onclick="popupCode('TaggerChunker.src/M000001.html');return false;">
+
+          <span class="method-name">parse</span><span class="method-args">(chunk_lines)</span>
+
+          </a>
+
+        </div>
+
+        <div class="method-description">
+
+          <p>
+Parses a tagger-chunker output and returns an Array of <a
+href="Chunk.html">Chunk</a>.
+</p>
+
+        </div>
+      </div>
+
+
+
+    </div>
+
+
+
+
+  </div>
+
+<div id="validator-badges">
+  <p><small><a href="http://validator.w3.org/check/referer">[Validate]</a></small></p>
+</div>
+
+</body>
+</html>
diff --git a/doc/classes/RIR/TreeTagger/TaggerChunker.src/M000001.html b/doc/classes/RIR/TreeTagger/TaggerChunker.src/M000001.html
new file mode 100644
index 0000000..3bdb228
--- /dev/null
+++ b/doc/classes/RIR/TreeTagger/TaggerChunker.src/M000001.html
@@ -0,0 +1,39 @@
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Strict//EN"
+"http://www.w3.org/TR/xhtml1/DTD/xhtml1-strict.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+<head>
+  <title>parse (RIR::TreeTagger::TaggerChunker)</title>
+  <meta http-equiv="Content-Type" content="text/html; charset=utf-8" />
+  <link rel="stylesheet" href="../../../.././rdoc-style.css" type="text/css" media="screen" />
+</head>
+<body class="standalone-code">
+  <pre><span class="ruby-comment cmt"># File lib/rir/ttagger.rb, line 33</span>
+      <span class="ruby-keyword kw">def</span> <span class="ruby-keyword kw">self</span>.<span class="ruby-identifier">parse</span> <span class="ruby-identifier">chunk_lines</span>
+        <span class="ruby-identifier">open</span> = <span class="ruby-keyword kw">false</span>
+        <span class="ruby-identifier">tag</span>  = <span class="ruby-keyword kw">nil</span>
+
+        <span class="ruby-identifier">chunks</span> = []
+        <span class="ruby-identifier">words</span>  = []
+
+        <span class="ruby-identifier">chunk_lines</span>.<span class="ruby-identifier">each</span> <span class="ruby-keyword kw">do</span> <span class="ruby-operator">|</span><span class="ruby-identifier">l</span><span class="ruby-operator">|</span>
+          <span class="ruby-identifier">l</span>.<span class="ruby-identifier">chomp!</span>
+          <span class="ruby-keyword kw">if</span> <span class="ruby-identifier">l</span> <span class="ruby-operator">=~</span> <span class="ruby-regexp re">/^&lt;\w+&gt;$/</span>
+            <span class="ruby-identifier">open</span> = <span class="ruby-keyword kw">true</span>
+            <span class="ruby-identifier">tag</span>  = <span class="ruby-identifier">l</span>
+          <span class="ruby-keyword kw">elsif</span> <span class="ruby-identifier">l</span> <span class="ruby-operator">=~</span> <span class="ruby-regexp re">/^&lt;\/\w+&gt;$/</span>
+            <span class="ruby-keyword kw">if</span> <span class="ruby-operator">!</span><span class="ruby-identifier">words</span>.<span class="ruby-identifier">empty?</span> <span class="ruby-operator">&amp;&amp;</span> <span class="ruby-identifier">open</span> <span class="ruby-operator">&amp;&amp;</span> <span class="ruby-identifier">l</span> <span class="ruby-operator">==</span> <span class="ruby-identifier">tag</span>.<span class="ruby-identifier">sub</span>(<span class="ruby-regexp re">/&lt;/</span>, <span class="ruby-value str">'&lt;/'</span>)
+              <span class="ruby-identifier">open</span> = <span class="ruby-keyword kw">false</span>
+              <span class="ruby-identifier">chunks</span>.<span class="ruby-identifier">push</span> <span class="ruby-constant">Chunk</span>.<span class="ruby-identifier">new</span>(<span class="ruby-identifier">words</span>.<span class="ruby-identifier">join</span>(<span class="ruby-value str">&quot; &quot;</span>), <span class="ruby-identifier">tag</span>) 
+              <span class="ruby-identifier">words</span>.<span class="ruby-identifier">clear</span>
+            <span class="ruby-keyword kw">else</span>
+              <span class="ruby-keyword kw">next</span>
+            <span class="ruby-keyword kw">end</span>
+          <span class="ruby-keyword kw">else</span>
+            <span class="ruby-identifier">words</span>.<span class="ruby-identifier">push</span>(<span class="ruby-identifier">l</span>.<span class="ruby-identifier">split</span>.<span class="ruby-identifier">first</span>)
+          <span class="ruby-keyword kw">end</span>
+        <span class="ruby-keyword kw">end</span>
+
+        <span class="ruby-identifier">chunks</span>
+      <span class="ruby-keyword kw">end</span></pre>
+</body>
+</html>
diff --git a/doc/classes/RIR/TreeTagger/TaggerChunker.src/M000002.html b/doc/classes/RIR/TreeTagger/TaggerChunker.src/M000002.html
new file mode 100644
index 0000000..c33487c
--- /dev/null
+++ b/doc/classes/RIR/TreeTagger/TaggerChunker.src/M000002.html
@@ -0,0 +1,15 @@
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Strict//EN"
+"http://www.w3.org/TR/xhtml1/DTD/xhtml1-strict.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+<head>
+  <title>new (RIR::TreeTagger::TaggerChunker)</title>
+  <meta http-equiv="Content-Type" content="text/html; charset=utf-8" />
+  <link rel="stylesheet" href="../../../.././rdoc-style.css" type="text/css" media="screen" />
+</head>
+<body class="standalone-code">
+  <pre><span class="ruby-comment cmt"># File lib/rir/ttagger.rb, line 65</span>
+      <span class="ruby-keyword kw">def</span> <span class="ruby-identifier">initialize</span> <span class="ruby-identifier">chunk_file</span>
+        <span class="ruby-ivar">@chunks</span> = <span class="ruby-constant">TaggerChunker</span>.<span class="ruby-identifier">parse</span> <span class="ruby-constant">File</span>.<span class="ruby-identifier">open</span>(<span class="ruby-identifier">chunk_file</span>).<span class="ruby-identifier">readlines</span>
+      <span class="ruby-keyword kw">end</span></pre>
+</body>
+</html>
diff --git a/doc/classes/RIR/TreeTagger/TaggerChunkerEnglish.html b/doc/classes/RIR/TreeTagger/TaggerChunkerEnglish.html
new file mode 100644
index 0000000..f5a878f
--- /dev/null
+++ b/doc/classes/RIR/TreeTagger/TaggerChunkerEnglish.html
@@ -0,0 +1,114 @@
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Strict//EN"
+"http://www.w3.org/TR/xhtml1/DTD/xhtml1-strict.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+<head>
+  <title>Class: RIR::TreeTagger::TaggerChunkerEnglish [RDoc Documentation]</title>
+  <meta http-equiv="Content-Type" content="text/html; charset=utf-8" />
+  <meta http-equiv="Content-Script-Type" content="text/javascript" />
+  <link rel="stylesheet" href="../../.././rdoc-style.css" type="text/css" media="screen" />
+  <script type="text/javascript">
+  // <![CDATA[
+
+  function popupCode( url ) {
+    window.open(url, "Code", "resizable=yes,scrollbars=yes,toolbar=no,status=no,height=150,width=400")
+  }
+
+  function toggleCode( id ) {
+    if ( document.getElementById )
+      elem = document.getElementById( id );
+    else if ( document.all )
+      elem = eval( "document.all." + id );
+    else
+      return false;
+
+    elemStyle = elem.style;
+
+    if ( elemStyle.display != "block" ) {
+      elemStyle.display = "block"
+    } else {
+      elemStyle.display = "none"
+    }
+
+    return true;
+  }
+
+  // Make codeblocks hidden by default
+  document.writeln( "<style type=\"text/css\">div.method-source-code { display: none }<\/style>" )
+
+  // ]]>
+  </script>
+
+</head>
+<body>
+
+
+    <div id="classHeader">
+        <table class="header-table">
+        <tr class="top-aligned-row">
+          <td><strong>Class</strong></td>
+          <td class="class-name-in-header">RIR::TreeTagger::TaggerChunkerEnglish</td>
+        </tr>
+        <tr class="top-aligned-row">
+            <td><strong>In:</strong></td>
+            <td>
+
+
+                <a href="../../../files/lib/rir/ttagger_rb.html">
+
+                lib/rir/ttagger.rb
+
+                </a>
+
+
+        <br />
+
+            </td>
+        </tr>
+
+
+        <tr class="top-aligned-row">
+            <td><strong>Parent:</strong></td>
+            <td>
+
+                <a href="TaggerChunker.html">
+
+                RIR::TreeTagger::TaggerChunker
+
+               </a>
+
+            </td>
+        </tr>
+
+        </table>
+    </div>
+  <!-- banner header -->
+
+  <div id="bodyContent">
+
+  <div id="contextContent">
+
+   </div>
+
+
+  </div>
+
+    <!-- if includes -->
+
+    <div id="section">
+
+
+
+
+    <!-- if method_list -->
+
+
+
+
+  </div>
+
+<div id="validator-badges">
+  <p><small><a href="http://validator.w3.org/check/referer">[Validate]</a></small></p>
+</div>
+
+</body>
+</html>
diff --git a/doc/classes/RIR/TreeTagger/TaggerChunkerFrench.html b/doc/classes/RIR/TreeTagger/TaggerChunkerFrench.html
new file mode 100644
index 0000000..203b487
--- /dev/null
+++ b/doc/classes/RIR/TreeTagger/TaggerChunkerFrench.html
@@ -0,0 +1,114 @@
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Strict//EN"
+"http://www.w3.org/TR/xhtml1/DTD/xhtml1-strict.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+<head>
+  <title>Class: RIR::TreeTagger::TaggerChunkerFrench [RDoc Documentation]</title>
+  <meta http-equiv="Content-Type" content="text/html; charset=utf-8" />
+  <meta http-equiv="Content-Script-Type" content="text/javascript" />
+  <link rel="stylesheet" href="../../.././rdoc-style.css" type="text/css" media="screen" />
+  <script type="text/javascript">
+  // <![CDATA[
+
+  function popupCode( url ) {
+    window.open(url, "Code", "resizable=yes,scrollbars=yes,toolbar=no,status=no,height=150,width=400")
+  }
+
+  function toggleCode( id ) {
+    if ( document.getElementById )
+      elem = document.getElementById( id );
+    else if ( document.all )
+      elem = eval( "document.all." + id );
+    else
+      return false;
+
+    elemStyle = elem.style;
+
+    if ( elemStyle.display != "block" ) {
+      elemStyle.display = "block"
+    } else {
+      elemStyle.display = "none"
+    }
+
+    return true;
+  }
+
+  // Make codeblocks hidden by default
+  document.writeln( "<style type=\"text/css\">div.method-source-code { display: none }<\/style>" )
+
+  // ]]>
+  </script>
+
+</head>
+<body>
+
+
+    <div id="classHeader">
+        <table class="header-table">
+        <tr class="top-aligned-row">
+          <td><strong>Class</strong></td>
+          <td class="class-name-in-header">RIR::TreeTagger::TaggerChunkerFrench</td>
+        </tr>
+        <tr class="top-aligned-row">
+            <td><strong>In:</strong></td>
+            <td>
+
+
+                <a href="../../../files/lib/rir/ttagger_rb.html">
+
+                lib/rir/ttagger.rb
+
+                </a>
+
+
+        <br />
+
+            </td>
+        </tr>
+
+
+        <tr class="top-aligned-row">
+            <td><strong>Parent:</strong></td>
+            <td>
+
+                <a href="TaggerChunker.html">
+
+                RIR::TreeTagger::TaggerChunker
+
+               </a>
+
+            </td>
+        </tr>
+
+        </table>
+    </div>
+  <!-- banner header -->
+
+  <div id="bodyContent">
+
+  <div id="contextContent">
+
+   </div>
+
+
+  </div>
+
+    <!-- if includes -->
+
+    <div id="section">
+
+
+
+
+    <!-- if method_list -->
+
+
+
+
+  </div>
+
+<div id="validator-badges">
+  <p><small><a href="http://validator.w3.org/check/referer">[Validate]</a></small></p>
+</div>
+
+</body>
+</html>
diff --git a/doc/classes/RIR/TreeTagger/TaggerChunkerGerman.html b/doc/classes/RIR/TreeTagger/TaggerChunkerGerman.html
new file mode 100644
index 0000000..fd7e410
--- /dev/null
+++ b/doc/classes/RIR/TreeTagger/TaggerChunkerGerman.html
@@ -0,0 +1,114 @@
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Strict//EN"
+"http://www.w3.org/TR/xhtml1/DTD/xhtml1-strict.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+<head>
+  <title>Class: RIR::TreeTagger::TaggerChunkerGerman [RDoc Documentation]</title>
+  <meta http-equiv="Content-Type" content="text/html; charset=utf-8" />
+  <meta http-equiv="Content-Script-Type" content="text/javascript" />
+  <link rel="stylesheet" href="../../.././rdoc-style.css" type="text/css" media="screen" />
+  <script type="text/javascript">
+  // <![CDATA[
+
+  function popupCode( url ) {
+    window.open(url, "Code", "resizable=yes,scrollbars=yes,toolbar=no,status=no,height=150,width=400")
+  }
+
+  function toggleCode( id ) {
+    if ( document.getElementById )
+      elem = document.getElementById( id );
+    else if ( document.all )
+      elem = eval( "document.all." + id );
+    else
+      return false;
+
+    elemStyle = elem.style;
+
+    if ( elemStyle.display != "block" ) {
+      elemStyle.display = "block"
+    } else {
+      elemStyle.display = "none"
+    }
+
+    return true;
+  }
+
+  // Make codeblocks hidden by default
+  document.writeln( "<style type=\"text/css\">div.method-source-code { display: none }<\/style>" )
+
+  // ]]>
+  </script>
+
+</head>
+<body>
+
+
+    <div id="classHeader">
+        <table class="header-table">
+        <tr class="top-aligned-row">
+          <td><strong>Class</strong></td>
+          <td class="class-name-in-header">RIR::TreeTagger::TaggerChunkerGerman</td>
+        </tr>
+        <tr class="top-aligned-row">
+            <td><strong>In:</strong></td>
+            <td>
+
+
+                <a href="../../../files/lib/rir/ttagger_rb.html">
+
+                lib/rir/ttagger.rb
+
+                </a>
+
+
+        <br />
+
+            </td>
+        </tr>
+
+
+        <tr class="top-aligned-row">
+            <td><strong>Parent:</strong></td>
+            <td>
+
+                <a href="TaggerChunker.html">
+
+                RIR::TreeTagger::TaggerChunker
+
+               </a>
+
+            </td>
+        </tr>
+
+        </table>
+    </div>
+  <!-- banner header -->
+
+  <div id="bodyContent">
+
+  <div id="contextContent">
+
+   </div>
+
+
+  </div>
+
+    <!-- if includes -->
+
+    <div id="section">
+
+
+
+
+    <!-- if method_list -->
+
+
+
+
+  </div>
+
+<div id="validator-badges">
+  <p><small><a href="http://validator.w3.org/check/referer">[Validate]</a></small></p>
+</div>
+
+</body>
+</html>
diff --git a/doc/classes/RIR/WebDocument.html b/doc/classes/RIR/WebDocument.html
index 75a2a8d..f2e6c6a 100644
--- a/doc/classes/RIR/WebDocument.html
+++ b/doc/classes/RIR/WebDocument.html
@@ -103,9 +103,9 @@ href="Document.html">Document</a> with a <tt>url</tt>.
 
       <div class="name-list">
 
-        <a href="#M000024">get_content</a>&nbsp;&nbsp;
+        <a href="#M000014">get_content</a>&nbsp;&nbsp;
 
-        <a href="#M000025">new</a>&nbsp;&nbsp;
+        <a href="#M000015">new</a>&nbsp;&nbsp;
 
       </div>
     </div>
@@ -144,13 +144,13 @@ href="Document.html">Document</a> with a <tt>url</tt>.
       <h3 class="section-bar">Public Class methods</h3>
 
 
-      <div id="method-M000024" class="method-detail">
-        <a name="M000024"></a>
+      <div id="method-M000014" class="method-detail">
+        <a name="M000014"></a>
 
         <div class="method-heading">
 
-          <a href="WebDocument.src/M000024.html" target="Code" class="method-signature"
-            onclick="popupCode('WebDocument.src/M000024.html');return false;">
+          <a href="WebDocument.src/M000014.html" target="Code" class="method-signature"
+            onclick="popupCode('WebDocument.src/M000014.html');return false;">
 
           <span class="method-name">get_content</span><span class="method-args">(url)</span>
 
@@ -168,13 +168,13 @@ Returns the HTML text from the page of a given <tt>url</tt>.
       </div>
 
 
-      <div id="method-M000025" class="method-detail">
-        <a name="M000025"></a>
+      <div id="method-M000015" class="method-detail">
+        <a name="M000015"></a>
 
         <div class="method-heading">
 
-          <a href="WebDocument.src/M000025.html" target="Code" class="method-signature"
-            onclick="popupCode('WebDocument.src/M000025.html');return false;">
+          <a href="WebDocument.src/M000015.html" target="Code" class="method-signature"
+            onclick="popupCode('WebDocument.src/M000015.html');return false;">
 
           <span class="method-name">new</span><span class="method-args">(url)</span>
 
diff --git a/doc/classes/RIR/WebDocument.src/M000014.html b/doc/classes/RIR/WebDocument.src/M000014.html
new file mode 100644
index 0000000..e3931e7
--- /dev/null
+++ b/doc/classes/RIR/WebDocument.src/M000014.html
@@ -0,0 +1,16 @@
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Strict//EN"
+"http://www.w3.org/TR/xhtml1/DTD/xhtml1-strict.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+<head>
+  <title>get_content (RIR::WebDocument)</title>
+  <meta http-equiv="Content-Type" content="text/html; charset=utf-8" />
+  <link rel="stylesheet" href="../../.././rdoc-style.css" type="text/css" media="screen" />
+</head>
+<body class="standalone-code">
+  <pre><span class="ruby-comment cmt"># File lib/rir/document.rb, line 112</span>
+    <span class="ruby-keyword kw">def</span> <span class="ruby-keyword kw">self</span>.<span class="ruby-identifier">get_content</span>(<span class="ruby-identifier">url</span>)
+      <span class="ruby-identifier">require</span> <span class="ruby-value str">'net/http'</span>
+      <span class="ruby-constant">Net</span><span class="ruby-operator">::</span><span class="ruby-constant">HTTP</span>.<span class="ruby-identifier">get</span>(<span class="ruby-constant">URI</span>.<span class="ruby-identifier">parse</span>(<span class="ruby-identifier">url</span>))
+    <span class="ruby-keyword kw">end</span></pre>
+</body>
+</html>
diff --git a/doc/classes/RIR/WebDocument.src/M000015.html b/doc/classes/RIR/WebDocument.src/M000015.html
index 54776b5..dd6da25 100644
--- a/doc/classes/RIR/WebDocument.src/M000015.html
+++ b/doc/classes/RIR/WebDocument.src/M000015.html
@@ -2,15 +2,15 @@
 "http://www.w3.org/TR/xhtml1/DTD/xhtml1-strict.dtd">
 <html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
 <head>
-  <title>get_content (RIR::WebDocument)</title>
+  <title>new (RIR::WebDocument)</title>
   <meta http-equiv="Content-Type" content="text/html; charset=utf-8" />
   <link rel="stylesheet" href="../../.././rdoc-style.css" type="text/css" media="screen" />
 </head>
 <body class="standalone-code">
-  <pre><span class="ruby-comment cmt"># File lib/rir/document.rb, line 105</span>
-    <span class="ruby-keyword kw">def</span> <span class="ruby-keyword kw">self</span>.<span class="ruby-identifier">get_content</span>(<span class="ruby-identifier">url</span>)
-      <span class="ruby-identifier">require</span> <span class="ruby-value str">'net/http'</span>
-      <span class="ruby-constant">Net</span><span class="ruby-operator">::</span><span class="ruby-constant">HTTP</span>.<span class="ruby-identifier">get</span>(<span class="ruby-constant">URI</span>.<span class="ruby-identifier">parse</span>(<span class="ruby-identifier">url</span>))
+  <pre><span class="ruby-comment cmt"># File lib/rir/document.rb, line 119</span>
+    <span class="ruby-keyword kw">def</span> <span class="ruby-identifier">initialize</span>(<span class="ruby-identifier">url</span>)
+      <span class="ruby-ivar">@url</span> = <span class="ruby-identifier">url</span>
+      <span class="ruby-keyword kw">super</span> <span class="ruby-constant">WebDocument</span>.<span class="ruby-identifier">get_content</span>(<span class="ruby-identifier">url</span>).<span class="ruby-identifier">strip_javascripts</span>.<span class="ruby-identifier">strip_stylesheets</span>.<span class="ruby-identifier">strip_xml_tags</span>
     <span class="ruby-keyword kw">end</span></pre>
 </body>
 </html>
diff --git a/doc/classes/RIR/WikipediaPage.html b/doc/classes/RIR/WikipediaPage.html
index 4464b3e..02b496f 100644
--- a/doc/classes/RIR/WikipediaPage.html
+++ b/doc/classes/RIR/WikipediaPage.html
@@ -103,11 +103,11 @@ href="WebDocument.html">WebDocument</a>.
 
       <div class="name-list">
 
-        <a href="#M000027">get_url</a>&nbsp;&nbsp;
+        <a href="#M000017">get_url</a>&nbsp;&nbsp;
 
-        <a href="#M000028">search_homepage</a>&nbsp;&nbsp;
+        <a href="#M000018">search_homepage</a>&nbsp;&nbsp;
 
-        <a href="#M000026">search_wikipedia_titles</a>&nbsp;&nbsp;
+        <a href="#M000016">search_wikipedia_titles</a>&nbsp;&nbsp;
 
       </div>
     </div>
@@ -128,13 +128,13 @@ href="WebDocument.html">WebDocument</a>.
       <h3 class="section-bar">Public Class methods</h3>
 
 
-      <div id="method-M000027" class="method-detail">
-        <a name="M000027"></a>
+      <div id="method-M000017" class="method-detail">
+        <a name="M000017"></a>
 
         <div class="method-heading">
 
-          <a href="WikipediaPage.src/M000027.html" target="Code" class="method-signature"
-            onclick="popupCode('WikipediaPage.src/M000027.html');return false;">
+          <a href="WikipediaPage.src/M000017.html" target="Code" class="method-signature"
+            onclick="popupCode('WikipediaPage.src/M000017.html');return false;">
 
           <span class="method-name">get_url</span><span class="method-args">(name)</span>
 
@@ -148,13 +148,13 @@ href="WebDocument.html">WebDocument</a>.
       </div>
 
 
-      <div id="method-M000028" class="method-detail">
-        <a name="M000028"></a>
+      <div id="method-M000018" class="method-detail">
+        <a name="M000018"></a>
 
         <div class="method-heading">
 
-          <a href="WikipediaPage.src/M000028.html" target="Code" class="method-signature"
-            onclick="popupCode('WikipediaPage.src/M000028.html');return false;">
+          <a href="WikipediaPage.src/M000018.html" target="Code" class="method-signature"
+            onclick="popupCode('WikipediaPage.src/M000018.html');return false;">
 
           <span class="method-name">search_homepage</span><span class="method-args">(name)</span>
 
@@ -168,13 +168,13 @@ href="WebDocument.html">WebDocument</a>.
       </div>
 
 
-      <div id="method-M000026" class="method-detail">
-        <a name="M000026"></a>
+      <div id="method-M000016" class="method-detail">
+        <a name="M000016"></a>
 
         <div class="method-heading">
 
-          <a href="WikipediaPage.src/M000026.html" target="Code" class="method-signature"
-            onclick="popupCode('WikipediaPage.src/M000026.html');return false;">
+          <a href="WikipediaPage.src/M000016.html" target="Code" class="method-signature"
+            onclick="popupCode('WikipediaPage.src/M000016.html');return false;">
 
           <span class="method-name">search_wikipedia_titles</span><span class="method-args">(name)</span>
 
diff --git a/doc/classes/RIR/WikipediaPage.src/M000016.html b/doc/classes/RIR/WikipediaPage.src/M000016.html
new file mode 100644
index 0000000..eb3518e
--- /dev/null
+++ b/doc/classes/RIR/WikipediaPage.src/M000016.html
@@ -0,0 +1,19 @@
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Strict//EN"
+"http://www.w3.org/TR/xhtml1/DTD/xhtml1-strict.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+<head>
+  <title>search_wikipedia_titles (RIR::WikipediaPage)</title>
+  <meta http-equiv="Content-Type" content="text/html; charset=utf-8" />
+  <link rel="stylesheet" href="../../.././rdoc-style.css" type="text/css" media="screen" />
+</head>
+<body class="standalone-code">
+  <pre><span class="ruby-comment cmt"># File lib/rir/document.rb, line 132</span>
+    <span class="ruby-keyword kw">def</span> <span class="ruby-keyword kw">self</span>.<span class="ruby-identifier">search_wikipedia_titles</span>(<span class="ruby-identifier">name</span>)
+      <span class="ruby-identifier">raise</span> <span class="ruby-constant">ArgumentError</span>, <span class="ruby-value str">&quot;Bad encoding&quot;</span>, <span class="ruby-identifier">name</span> <span class="ruby-keyword kw">unless</span> <span class="ruby-identifier">name</span>.<span class="ruby-identifier">isutf8</span>
+
+      <span class="ruby-identifier">res</span> = <span class="ruby-constant">REXML</span><span class="ruby-operator">::</span><span class="ruby-constant">Document</span>.<span class="ruby-identifier">new</span>(<span class="ruby-constant">Net</span><span class="ruby-operator">::</span><span class="ruby-constant">HTTP</span>.<span class="ruby-identifier">get</span>( <span class="ruby-constant">URI</span>.<span class="ruby-identifier">parse</span> <span class="ruby-node">&quot;http://en.wikipedia.org/w/api.php?action=query&amp;list=search&amp;srsearch=#{URI.escape name}&amp;format=xml&quot;</span> ).<span class="ruby-identifier">toutf8</span>).<span class="ruby-identifier">elements</span>[<span class="ruby-value str">'api/query/search'</span>]
+
+      <span class="ruby-identifier">res</span>.<span class="ruby-identifier">collect</span> { <span class="ruby-operator">|</span><span class="ruby-identifier">e</span><span class="ruby-operator">|</span> <span class="ruby-identifier">e</span>.<span class="ruby-identifier">attributes</span>[<span class="ruby-value str">'title'</span>] } <span class="ruby-keyword kw">unless</span> <span class="ruby-identifier">res</span>.<span class="ruby-identifier">nil?</span>
+    <span class="ruby-keyword kw">end</span></pre>
+</body>
+</html>
diff --git a/doc/classes/RIR/WikipediaPage.src/M000017.html b/doc/classes/RIR/WikipediaPage.src/M000017.html
new file mode 100644
index 0000000..0b6b98b
--- /dev/null
+++ b/doc/classes/RIR/WikipediaPage.src/M000017.html
@@ -0,0 +1,19 @@
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Strict//EN"
+"http://www.w3.org/TR/xhtml1/DTD/xhtml1-strict.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+<head>
+  <title>get_url (RIR::WikipediaPage)</title>
+  <meta http-equiv="Content-Type" content="text/html; charset=utf-8" />
+  <link rel="stylesheet" href="../../.././rdoc-style.css" type="text/css" media="screen" />
+</head>
+<body class="standalone-code">
+  <pre><span class="ruby-comment cmt"># File lib/rir/document.rb, line 140</span>
+    <span class="ruby-keyword kw">def</span> <span class="ruby-keyword kw">self</span>.<span class="ruby-identifier">get_url</span>(<span class="ruby-identifier">name</span>)
+      <span class="ruby-identifier">raise</span> <span class="ruby-constant">ArgumentError</span>, <span class="ruby-value str">&quot;Bad encoding&quot;</span>, <span class="ruby-identifier">name</span> <span class="ruby-keyword kw">unless</span> <span class="ruby-identifier">name</span>.<span class="ruby-identifier">isutf8</span>
+
+      <span class="ruby-identifier">atts</span> = <span class="ruby-constant">REXML</span><span class="ruby-operator">::</span><span class="ruby-constant">Document</span>.<span class="ruby-identifier">new</span>(<span class="ruby-constant">Net</span><span class="ruby-operator">::</span><span class="ruby-constant">HTTP</span>.<span class="ruby-identifier">get</span>( <span class="ruby-constant">URI</span>.<span class="ruby-identifier">parse</span> <span class="ruby-node">&quot;http://en.wikipedia.org/w/api.php?action=query&amp;titles=#{URI.escape name}&amp;inprop=url&amp;prop=info&amp;format=xml&quot;</span> ).<span class="ruby-identifier">toutf8</span>).<span class="ruby-identifier">elements</span>[<span class="ruby-value str">'api/query/pages/page'</span>].<span class="ruby-identifier">attributes</span>
+
+      <span class="ruby-identifier">atts</span>[<span class="ruby-value str">'fullurl'</span>] <span class="ruby-keyword kw">if</span> <span class="ruby-identifier">atts</span>[<span class="ruby-value str">'missing'</span>].<span class="ruby-identifier">nil?</span>
+    <span class="ruby-keyword kw">end</span></pre>
+</body>
+</html>
diff --git a/doc/classes/RIR/WikipediaPage.src/M000018.html b/doc/classes/RIR/WikipediaPage.src/M000018.html
new file mode 100644
index 0000000..d93d8db
--- /dev/null
+++ b/doc/classes/RIR/WikipediaPage.src/M000018.html
@@ -0,0 +1,17 @@
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Strict//EN"
+"http://www.w3.org/TR/xhtml1/DTD/xhtml1-strict.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+<head>
+  <title>search_homepage (RIR::WikipediaPage)</title>
+  <meta http-equiv="Content-Type" content="text/html; charset=utf-8" />
+  <link rel="stylesheet" href="../../.././rdoc-style.css" type="text/css" media="screen" />
+</head>
+<body class="standalone-code">
+  <pre><span class="ruby-comment cmt"># File lib/rir/document.rb, line 148</span>
+    <span class="ruby-keyword kw">def</span> <span class="ruby-keyword kw">self</span>.<span class="ruby-identifier">search_homepage</span>(<span class="ruby-identifier">name</span>)
+      <span class="ruby-identifier">title</span> = <span class="ruby-constant">WikipediaPage</span>.<span class="ruby-identifier">search_wikipedia_titles</span> <span class="ruby-identifier">name</span>
+
+      <span class="ruby-constant">WikipediaPage</span>.<span class="ruby-identifier">new</span>(<span class="ruby-constant">WikipediaPage</span>.<span class="ruby-identifier">get_url</span> <span class="ruby-identifier">title</span>[<span class="ruby-value">0</span>]) <span class="ruby-keyword kw">unless</span> <span class="ruby-identifier">title</span>.<span class="ruby-identifier">nil?</span> <span class="ruby-operator">||</span> <span class="ruby-identifier">title</span>.<span class="ruby-identifier">empty?</span>
+    <span class="ruby-keyword kw">end</span></pre>
+</body>
+</html>
diff --git a/doc/created.rid b/doc/created.rid
index 5d2582c..5367b38 100644
--- a/doc/created.rid
+++ b/doc/created.rid
@@ -1 +1 @@
-Tue, 23 Nov 2010 18:20:46 +0100
+Thu, 25 Nov 2010 17:01:52 +0100
diff --git a/doc/files/lib/rir/document_rb.html b/doc/files/lib/rir/document_rb.html
index 767c904..d5a6ac5 100644
--- a/doc/files/lib/rir/document_rb.html
+++ b/doc/files/lib/rir/document_rb.html
@@ -53,7 +53,7 @@
     </tr>
     <tr class="top-aligned-row">
       <td><strong>Last Update:</strong></td>
-      <td>2010-11-23 18:14:13 +0100</td>
+      <td>2010-11-25 16:04:20 +0100</td>
     </tr>
     </table>
   </div>
diff --git a/doc/files/lib/rir/query_rb.html b/doc/files/lib/rir/query_rb.html
index 2868c72..a2db500 100644
--- a/doc/files/lib/rir/query_rb.html
+++ b/doc/files/lib/rir/query_rb.html
@@ -53,7 +53,7 @@
     </tr>
     <tr class="top-aligned-row">
       <td><strong>Last Update:</strong></td>
-      <td>2010-11-23 18:20:30 +0100</td>
+      <td>2010-11-25 13:25:18 +0100</td>
     </tr>
     </table>
   </div>
diff --git a/doc/files/lib/rir/ttagger_rb.html b/doc/files/lib/rir/ttagger_rb.html
new file mode 100644
index 0000000..67b5fa6
--- /dev/null
+++ b/doc/files/lib/rir/ttagger_rb.html
@@ -0,0 +1,143 @@
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Strict//EN"
+"http://www.w3.org/TR/xhtml1/DTD/xhtml1-strict.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
+<head>
+  <title>File: ttagger.rb [RDoc Documentation]</title>
+  <meta http-equiv="Content-Type" content="text/html; charset=utf-8" />
+  <meta http-equiv="Content-Script-Type" content="text/javascript" />
+  <link rel="stylesheet" href="../../.././rdoc-style.css" type="text/css" media="screen" />
+  <script type="text/javascript">
+  // <![CDATA[
+
+  function popupCode( url ) {
+    window.open(url, "Code", "resizable=yes,scrollbars=yes,toolbar=no,status=no,height=150,width=400")
+  }
+
+  function toggleCode( id ) {
+    if ( document.getElementById )
+      elem = document.getElementById( id );
+    else if ( document.all )
+      elem = eval( "document.all." + id );
+    else
+      return false;
+
+    elemStyle = elem.style;
+
+    if ( elemStyle.display != "block" ) {
+      elemStyle.display = "block"
+    } else {
+      elemStyle.display = "none"
+    }
+
+    return true;
+  }
+
+  // Make codeblocks hidden by default
+  document.writeln( "<style type=\"text/css\">div.method-source-code { display: none }<\/style>" )
+
+  // ]]>
+  </script>
+
+</head>
+<body>
+
+
+  <div id="fileHeader">
+    <h1>ttagger.rb</h1>
+    <table class="header-table">
+    <tr class="top-aligned-row">
+      <td><strong>Path:</strong></td>
+      <td>lib/rir/ttagger.rb
+
+      </td>
+    </tr>
+    <tr class="top-aligned-row">
+      <td><strong>Last Update:</strong></td>
+      <td>2010-11-25 17:01:46 +0100</td>
+    </tr>
+    </table>
+  </div>
+  <!-- banner header -->
+
+  <div id="bodyContent">
+
+  <div id="contextContent">
+
+    <div id="description">
+      <p>
+This file is a part of an Information Retrieval oriented Ruby library
+</p>
+<p>
+Copyright (C) 2010-2011 Romain Deveaud &lt;romain.deveaud@gmail.com&gt;
+</p>
+<p>
+This program is free software: you can redistribute it and/or modify it
+under the terms of the GNU General Public License as published by the Free
+Software Foundation, either version 3 of the License, or (at your option)
+any later version.
+</p>
+<p>
+This program is distributed in the hope that it will be useful, but WITHOUT
+ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
+FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for
+more details.
+</p>
+<p>
+You should have received a copy of the GNU General Public License along
+with this program. If not, see &lt;<a
+href="http://www.gnu.org/licenses/">www.gnu.org/licenses/</a>&gt;.
+</p>
+<hr size="1"></hr><p>
+This file is a part of an Information Retrieval oriented Ruby library
+</p>
+<p>
+Copyright (C) 2010-2011 Romain Deveaud &lt;romain.deveaud@gmail.com&gt;
+</p>
+<p>
+This program is free software: you can redistribute it and/or modify it
+under the terms of the GNU General Public License as published by the Free
+Software Foundation, either version 3 of the License, or (at your option)
+any later version.
+</p>
+<p>
+This program is distributed in the hope that it will be useful, but WITHOUT
+ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
+FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for
+more details.
+</p>
+<p>
+You should have received a copy of the GNU General Public License along
+with this program. If not, see &lt;<a
+href="http://www.gnu.org/licenses/">www.gnu.org/licenses/</a>&gt;.
+</p>
+<hr size="1"></hr><p>
+General module for many purposes related to Information Retrieval.
+</p>
+
+    </div>
+
+   </div>
+
+
+  </div>
+
+    <!-- if includes -->
+
+    <div id="section">
+
+
+
+
+    <!-- if method_list -->
+
+
+
+
+  </div>
+
+<div id="validator-badges">
+  <p><small><a href="http://validator.w3.org/check/referer">[Validate]</a></small></p>
+</div>
+
+</body>
+</html>
diff --git a/doc/files/lib/rir_rb.html b/doc/files/lib/rir_rb.html
index d43a4b6..6486ffa 100644
--- a/doc/files/lib/rir_rb.html
+++ b/doc/files/lib/rir_rb.html
@@ -53,7 +53,7 @@
     </tr>
     <tr class="top-aligned-row">
       <td><strong>Last Update:</strong></td>
-      <td>2010-11-19 11:27:16 +0100</td>
+      <td>2010-11-25 15:44:52 +0100</td>
     </tr>
     </table>
   </div>
@@ -78,6 +78,8 @@
 
         rir/regexp&nbsp;&nbsp;
 
+        rir/ttagger&nbsp;&nbsp;
+
       </div>
     </div>
 
diff --git a/doc/fr_class_index.html b/doc/fr_class_index.html
index 9a24111..36ac9d8 100644
--- a/doc/fr_class_index.html
+++ b/doc/fr_class_index.html
@@ -19,7 +19,7 @@
 
     <a href="classes/RIR.html">RIR</a><br />
 
-    <a href="classes/RIR/Corpus.html">RIR::Corpus</a><br />
+    <a href="classes/RIR/Document.html">RIR::Document</a><br />
 
     <a href="classes/RIR/Indri.html">RIR::Indri</a><br />
 
@@ -29,7 +29,21 @@
 
     <a href="classes/RIR/Query.html">RIR::Query</a><br />
 
-    <a href="classes/String.html">String</a><br />
+    <a href="classes/RIR/TreeTagger.html">RIR::TreeTagger</a><br />
+
+    <a href="classes/RIR/TreeTagger/Chunk.html">RIR::TreeTagger::Chunk</a><br />
+
+    <a href="classes/RIR/TreeTagger/TaggerChunker.html">RIR::TreeTagger::TaggerChunker</a><br />
+
+    <a href="classes/RIR/TreeTagger/TaggerChunkerEnglish.html">RIR::TreeTagger::TaggerChunkerEnglish</a><br />
+
+    <a href="classes/RIR/TreeTagger/TaggerChunkerFrench.html">RIR::TreeTagger::TaggerChunkerFrench</a><br />
+
+    <a href="classes/RIR/TreeTagger/TaggerChunkerGerman.html">RIR::TreeTagger::TaggerChunkerGerman</a><br />
+
+    <a href="classes/RIR/WebDocument.html">RIR::WebDocument</a><br />
+
+    <a href="classes/RIR/WikipediaPage.html">RIR::WikipediaPage</a><br />
 
   </div>
 </div>
diff --git a/doc/fr_file_index.html b/doc/fr_file_index.html
index 8871047..6d7fbed 100644
--- a/doc/fr_file_index.html
+++ b/doc/fr_file_index.html
@@ -17,11 +17,13 @@
   <h1 class="section-bar">Files</h1>
   <div id="index-entries">
 
-    <a href="files/lib/rir/corpus_rb.html">lib/rir/corpus.rb</a><br />
+    <a href="files/lib/rir_rb.html">lib/rir.rb</a><br />
+
+    <a href="files/lib/rir/document_rb.html">lib/rir/document.rb</a><br />
 
     <a href="files/lib/rir/query_rb.html">lib/rir/query.rb</a><br />
 
-    <a href="files/lib/rir/string_rb.html">lib/rir/string.rb</a><br />
+    <a href="files/lib/rir/ttagger_rb.html">lib/rir/ttagger.rb</a><br />
 
   </div>
 </div>
diff --git a/doc/fr_method_index.html b/doc/fr_method_index.html
index c909673..368ae37 100644
--- a/doc/fr_method_index.html
+++ b/doc/fr_method_index.html
@@ -17,39 +17,41 @@
   <h1 class="section-bar">Methods</h1>
   <div id="index-entries">
 
-    <a href="classes/String.html#M000011">extract_xmltags_values (String)</a><br />
+    <a href="classes/RIR/Document.html#M000010">count_words (RIR::Document)</a><br />
 
-    <a href="classes/RIR/Corpus.html#M000017">files (RIR::Corpus)</a><br />
+    <a href="classes/RIR/Document.html#M000011">entropy (RIR::Document)</a><br />
 
-    <a href="classes/String.html#M000001">is_stopword? (String)</a><br />
+    <a href="classes/RIR/Document.html#M000008">format_words (RIR::Document)</a><br />
 
-    <a href="classes/RIR/Corpus.html#M000016">new (RIR::Corpus)</a><br />
+    <a href="classes/RIR/WebDocument.html#M000014">get_content (RIR::WebDocument)</a><br />
 
-    <a href="classes/RIR/Indri/Parameters.html#M000012">new (RIR::Indri::Parameters)</a><br />
+    <a href="classes/RIR/WikipediaPage.html#M000017">get_url (RIR::WikipediaPage)</a><br />
 
-    <a href="classes/RIR/Indri/IndriQuery.html#M000014">new (RIR::Indri::IndriQuery)</a><br />
+    <a href="classes/RIR/WebDocument.html#M000015">new (RIR::WebDocument)</a><br />
 
-    <a href="classes/String.html#M000002">remove_special_characters (String)</a><br />
+    <a href="classes/RIR/Indri/IndriQuery.html#M000006">new (RIR::Indri::IndriQuery)</a><br />
 
-    <a href="classes/String.html#M000006">strip_javascripts (String)</a><br />
+    <a href="classes/RIR/Indri/Parameters.html#M000004">new (RIR::Indri::Parameters)</a><br />
 
-    <a href="classes/String.html#M000005">strip_javascripts! (String)</a><br />
+    <a href="classes/RIR/Document.html#M000013">new (RIR::Document)</a><br />
 
-    <a href="classes/String.html#M000010">strip_punctuation (String)</a><br />
+    <a href="classes/RIR/TreeTagger/TaggerChunker.html#M000002">new (RIR::TreeTagger::TaggerChunker)</a><br />
 
-    <a href="classes/String.html#M000009">strip_punctuation! (String)</a><br />
+    <a href="classes/RIR/TreeTagger/Chunk.html#M000003">new (RIR::TreeTagger::Chunk)</a><br />
 
-    <a href="classes/String.html#M000008">strip_stylesheets (String)</a><br />
+    <a href="classes/RIR/Document.html#M000009">ngrams (RIR::Document)</a><br />
 
-    <a href="classes/String.html#M000007">strip_stylesheets! (String)</a><br />
+    <a href="classes/RIR/TreeTagger/TaggerChunker.html#M000001">parse (RIR::TreeTagger::TaggerChunker)</a><br />
 
-    <a href="classes/String.html#M000004">strip_xml_tags (String)</a><br />
+    <a href="classes/RIR/WikipediaPage.html#M000018">search_homepage (RIR::WikipediaPage)</a><br />
 
-    <a href="classes/String.html#M000003">strip_xml_tags! (String)</a><br />
+    <a href="classes/RIR/WikipediaPage.html#M000016">search_wikipedia_titles (RIR::WikipediaPage)</a><br />
 
-    <a href="classes/RIR/Indri/Parameters.html#M000013">to_s (RIR::Indri::Parameters)</a><br />
+    <a href="classes/RIR/Document.html#M000012">tf (RIR::Document)</a><br />
 
-    <a href="classes/RIR/Indri/IndriQuery.html#M000015">to_s (RIR::Indri::IndriQuery)</a><br />
+    <a href="classes/RIR/Indri/Parameters.html#M000005">to_s (RIR::Indri::Parameters)</a><br />
+
+    <a href="classes/RIR/Indri/IndriQuery.html#M000007">to_s (RIR::Indri::IndriQuery)</a><br />
 
   </div>
 </div>
diff --git a/doc/index.html b/doc/index.html
index dcf5a4f..4b44566 100644
--- a/doc/index.html
+++ b/doc/index.html
@@ -16,6 +16,6 @@
         <frame src="fr_class_index.html"  name="Classes" />
         <frame src="fr_method_index.html" name="Methods" />
     </frameset>
-    <frame src="files/lib/rir/corpus_rb.html" name="docwin" />
+    <frame src="files/lib/rir_rb.html" name="docwin" />
 </frameset>
 </html>
diff --git a/lib/rir.rb b/lib/rir.rb
index 0b27852..e21e097 100644
--- a/lib/rir.rb
+++ b/lib/rir.rb
@@ -5,3 +5,4 @@ require 'rir/string'
 require 'rir/query'
 require 'rir/corpus'
 require 'rir/regexp'
+require 'rir/ttagger'
diff --git a/lib/rir/document.rb b/lib/rir/document.rb
index 5bda4e1..e5f69aa 100644
--- a/lib/rir/document.rb
+++ b/lib/rir/document.rb
@@ -73,7 +73,8 @@ module RIR
     # If the string parameter is composed of many words (i.e. tokens separated
     # by whitespace(s)), it is considered as an ngram.    
     #
-    #   entropy("guitar") #=> 0.00389919463243839
+    #   entropy("guitar") #=> 0.00432114812727959
+    #   entropy("dillinger escape plan") #=> 0.265862076325102
     def entropy(s)
       en = 0.0
       counts = self.count_words
@@ -87,6 +88,12 @@ module RIR
       en
     end
 
+    # Computes the term frequency of a given *word* +s+ (0.0 for a document without words).
+    #
+    #   tf("guitar") #=> 0.000380372765310004
+    def tf(s)
+      @words.empty? ? 0.0 : self.count_words[s].to_f / @words.size
+    end
 
 
     def initialize(content)
@@ -123,13 +130,17 @@ module RIR
 
 
     def self.search_wikipedia_titles(name)
-      res = REXML::Document.new(Net::HTTP.get(URI.parse("http://en.wikipedia.org/w/api.php?action=query&list=search&srsearch=#{URI.escape name}&format=xml")).toutf8).elements['api/query/search']
+      # Reject names that are not UTF-8; the offending name is quoted in the message.
+      raise ArgumentError, "Bad encoding: #{name.inspect}" unless name.isutf8
+      res = REXML::Document.new(Net::HTTP.get( URI.parse "http://en.wikipedia.org/w/api.php?action=query&list=search&srsearch=#{URI.escape name}&format=xml" ).toutf8).elements['api/query/search']
 
       res.collect { |e| e.attributes['title'] } unless res.nil?
     end
 
     def self.get_url(name)
-      atts = REXML::Document.new(Net::HTTP.get(URI.parse("http://en.wikipedia.org/w/api.php?action=query&titles=#{URI.escape name}&inprop=url&prop=info&format=xml")).toutf8).elements['api/query/pages/page'].attributes
+      # Reject names that are not UTF-8; the offending name is quoted in the message.
+      raise ArgumentError, "Bad encoding: #{name.inspect}" unless name.isutf8
+      atts = REXML::Document.new(Net::HTTP.get( URI.parse "http://en.wikipedia.org/w/api.php?action=query&titles=#{URI.escape name}&inprop=url&prop=info&format=xml" ).toutf8).elements['api/query/pages/page'].attributes
 
       atts['fullurl'] if atts['missing'].nil?
     end
@@ -137,11 +148,7 @@ module RIR
     def self.search_homepage(name)
       title = WikipediaPage.search_wikipedia_titles name
 
-      begin
-        WikipediaPage.new(WikipediaPage.get_url title[0]) unless title.nil? || title.empty?
-      rescue
-        puts title[0]
-      end
+      WikipediaPage.new(WikipediaPage.get_url title[0]) unless title.nil? || title.empty?
     end
 
 #    def initialize(name)
diff --git a/lib/rir/query.rb b/lib/rir/query.rb
index d18e297..dbff657 100644
--- a/lib/rir/query.rb
+++ b/lib/rir/query.rb
@@ -25,10 +25,10 @@ module RIR
   module Indri
 
     class Parameters
-      attr_accessor :corpus, :memory, :count, :offset, :run_id, :print_query, :print_docs, :rule, :baseline
+      attr_accessor :index_path, :memory, :count, :offset, :run_id, :print_query, :print_docs, :rule, :baseline
 
       def initialize(corpus,mem="1g",count="1000",offset="1",run_id="default",print_query=false,print_docs=false)
-        @corpus      = corpus
+        @index_path  = corpus
         @memory      = mem
         @count       = count
         @offset      = offset
@@ -40,7 +40,7 @@ module RIR
       def to_s
         h = "<parameters>\n"
         h += "<memory>#{@memory}</memory>\n"
-        h += "<index>#{@corpus}</index>\n"
+        h += "<index>#{@index_path}</index>\n"
         h += "<count>#{@count}</count>\n"
         unless @baseline.nil?
           h += "<baseline>#{@baseline}</baseline>\n" 
diff --git a/lib/rir/ttagger.rb b/lib/rir/ttagger.rb
new file mode 100644
index 0000000..e1f2bd6
--- /dev/null
+++ b/lib/rir/ttagger.rb
@@ -0,0 +1,93 @@
+#!/usr/bin/env ruby
+
+# This file is a part of an Information Retrieval oriented Ruby library
+#
+# Copyright (C) 2010-2011 Romain Deveaud <romain.deveaud@gmail.com>
+#
+# This program is free software: you can redistribute it and/or modify
+# it under the terms of the GNU General Public License as published by
+# the Free Software Foundation, either version 3 of the License, or
+# (at your option) any later version.
+#
+# This program is distributed in the hope that it will be useful,
+# but WITHOUT ANY WARRANTY; without even the implied warranty of
+# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+# GNU General Public License for more details.
+#
+# You should have received a copy of the GNU General Public License
+# along with this program.  If not, see <http://www.gnu.org/licenses/>.
+
+module RIR
+
+  # TreeTagger-related stuff module.
+  #
+  # See http://www.ims.uni-stuttgart.de/projekte/corplex/TreeTagger/DecisionTreeTagger.html
+  module TreeTagger
+    
+    # This class handles generic parsing of tagger-chunker outputs.
+    class TaggerChunker
+      attr_reader :chunks, :file
+
+      # Parses a tagger-chunker output, given as its lines (which are left
+      # unmodified), and returns an Array of Chunk. Blank lines are ignored.
+      # NOTE(review): tokens read outside a chunk stay in the buffer and end up
+      # in the next chunk that gets closed -- confirm this is intended.
+      def self.parse chunk_lines
+        inside = false
+        tag    = nil
+        chunks = []
+        words  = []
+
+        chunk_lines.each do |l|
+          line = l.chomp # not chomp!: the caller's Strings may be frozen or reused
+          if line =~ /^<\w+>$/
+            inside = true
+            tag    = line
+          elsif line =~ /^<\/\w+>$/
+            # A chunk ends only on the closing tag matching the last opening tag, and only if it has words.
+            next unless !words.empty? && inside && line == tag.sub('<', '</')
+            inside = false
+            chunks.push Chunk.new(words.join(" "), tag)
+            words.clear
+          else
+            token = line.split.first # nil when the line is blank
+            words.push(token) unless token.nil?
+          end
+        end
+
+        chunks
+      end
+
+      # Initializes parsing. +chunk_file+ is the output of +tagger-chunker-+ and must
+      # be a valid path to the file; that path is then available through +file+.
+      #
+      #   TaggerChunker.new("ttout/2010020") #=> #<RIR::TreeTagger::TaggerChunker:0x92fd088 @chunks=[#<RIR::TreeTagger::Chunk:0x8ec5a10 @words=["robert", "schumann"], @tag="NC">, ...] ...>
+      def initialize chunk_file
+        @file   = chunk_file
+        @chunks = self.class.parse File.readlines(chunk_file) # readlines closes the file
+      end
+    end
+
+    # Placeholder subclass, presumably for English tagger-chunker output; adds nothing yet.
+    class TaggerChunkerEnglish < TaggerChunker; end
+
+    # Placeholder subclass, presumably for French tagger-chunker output; adds nothing yet.
+    class TaggerChunkerFrench < TaggerChunker; end
+
+    # Placeholder subclass, presumably for German tagger-chunker output; adds nothing yet.
+    class TaggerChunkerGerman < TaggerChunker; end
+
+    # Represents a Chunk extracted when parsing a TaggerChunker file.
+    class Chunk
+      attr_reader :words, :tag
+
+      # +str+ are whitespace-separated terms; they are stored split, in +words+.
+      # +tag+ is stored without its first and last character (the "<" and ">" of a tag line); see : ftp://ftp.ims.uni-stuttgart.de/pub/corpora/chunker-tagset-english.txt
+      def initialize str,tag
+        @words = str.split
+        @tag   = tag[1..-2]
+      end
+    end
+
+  end
+end
diff --git a/main.rb b/main.rb
index 87408f7..78d5b8d 100644
--- a/main.rb
+++ b/main.rb
@@ -3,4 +3,5 @@ $LOAD_PATH.unshift File.expand_path(File.join(File.dirname(__FILE__), "lib"))
 require 'rir'
 
 w = RIR::WikipediaPage.new("http://en.wikipedia.org/wiki/The_Dillinger_Escape_Plan")
-p w.entropy("guitar")
+p w.entropy("dillinger escape plan")
+p w.tf("guitar")