Commit a79a228434f1eebcb042bcc576a3a0d6476789e4
1 parent
87316a38a5
Exists in
master
new TreeTagger module. tagger-chunker parsing & doc.
Showing 44 changed files with 1597 additions and 208 deletions Side-by-side Diff
- doc/classes/RIR.html
- doc/classes/RIR/Document.html
- doc/classes/RIR/Document.src/M000008.html
- doc/classes/RIR/Document.src/M000009.html
- doc/classes/RIR/Document.src/M000010.html
- doc/classes/RIR/Document.src/M000011.html
- doc/classes/RIR/Document.src/M000012.html
- doc/classes/RIR/Document.src/M000013.html
- doc/classes/RIR/Indri/IndriQuery.html
- doc/classes/RIR/Indri/IndriQuery.src/M000006.html
- doc/classes/RIR/Indri/IndriQuery.src/M000007.html
- doc/classes/RIR/Indri/Parameters.html
- doc/classes/RIR/Indri/Parameters.src/M000004.html
- doc/classes/RIR/Indri/Parameters.src/M000005.html
- doc/classes/RIR/TreeTagger.html
- doc/classes/RIR/TreeTagger/Chunk.html
- doc/classes/RIR/TreeTagger/Chunk.src/M000003.html
- doc/classes/RIR/TreeTagger/TaggerChunker.html
- doc/classes/RIR/TreeTagger/TaggerChunker.src/M000001.html
- doc/classes/RIR/TreeTagger/TaggerChunker.src/M000002.html
- doc/classes/RIR/TreeTagger/TaggerChunkerEnglish.html
- doc/classes/RIR/TreeTagger/TaggerChunkerFrench.html
- doc/classes/RIR/TreeTagger/TaggerChunkerGerman.html
- doc/classes/RIR/WebDocument.html
- doc/classes/RIR/WebDocument.src/M000014.html
- doc/classes/RIR/WebDocument.src/M000015.html
- doc/classes/RIR/WikipediaPage.html
- doc/classes/RIR/WikipediaPage.src/M000016.html
- doc/classes/RIR/WikipediaPage.src/M000017.html
- doc/classes/RIR/WikipediaPage.src/M000018.html
- doc/created.rid
- doc/files/lib/rir/document_rb.html
- doc/files/lib/rir/query_rb.html
- doc/files/lib/rir/ttagger_rb.html
- doc/files/lib/rir_rb.html
- doc/fr_class_index.html
- doc/fr_file_index.html
- doc/fr_method_index.html
- doc/index.html
- lib/rir.rb
- lib/rir/document.rb
- lib/rir/query.rb
- lib/rir/ttagger.rb
- main.rb
doc/classes/RIR.html
... | ... | @@ -53,9 +53,9 @@ |
53 | 53 | <td> |
54 | 54 | |
55 | 55 | |
56 | - <a href="../files/lib/rir/corpus_rb.html"> | |
56 | + <a href="../files/lib/rir/ttagger_rb.html"> | |
57 | 57 | |
58 | - lib/rir/corpus.rb | |
58 | + lib/rir/ttagger.rb | |
59 | 59 | |
60 | 60 | </a> |
61 | 61 | |
62 | 62 | |
... | ... | @@ -73,9 +73,9 @@ |
73 | 73 | <br /> |
74 | 74 | |
75 | 75 | |
76 | - <a href="../files/lib/rir/string_rb.html"> | |
76 | + <a href="../files/lib/rir/document_rb.html"> | |
77 | 77 | |
78 | - lib/rir/string.rb | |
78 | + lib/rir/document.rb | |
79 | 79 | |
80 | 80 | </a> |
81 | 81 | |
82 | 82 | |
... | ... | @@ -142,28 +142,8 @@ |
142 | 142 | href="http://www.gnu.org/licenses/">www.gnu.org/licenses/</a>&gt;. |
143 | 143 | </p> |
144 | 144 | <hr size="1"></hr><p> |
145 | -This file is a part of an Information Retrieval oriented Ruby library | |
145 | +General module for many purposes related to Information Retrieval. | |
146 | 146 | </p> |
147 | -<p> | |
148 | -Copyright (C) 2010-2011 Romain Deveaud &lt;romain.deveaud@gmail.com&gt; | |
149 | -</p> | |
150 | -<p> | |
151 | -This program is free software: you can redistribute it and/or modify it | |
152 | -under the terms of the GNU General Public License as published by the Free | |
153 | -Software Foundation, either version 3 of the License, or (at your option) | |
154 | -any later version. | |
155 | -</p> | |
156 | -<p> | |
157 | -This program is distributed in the hope that it will be useful, but WITHOUT | |
158 | -ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or | |
159 | -FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for | |
160 | -more details. | |
161 | -</p> | |
162 | -<p> | |
163 | -You should have received a copy of the GNU General Public License along | |
164 | -with this program. If not, see &lt;<a | |
165 | -href="http://www.gnu.org/licenses/">www.gnu.org/licenses/</a>&gt;. | |
166 | -</p> | |
167 | 147 | |
168 | 148 | </div> |
169 | 149 | |
170 | 150 | |
171 | 151 | |
... | ... | @@ -180,32 +160,12 @@ |
180 | 160 | <h3 class="section-bar">Classes and Modules</h3> |
181 | 161 | |
182 | 162 | Module <a href="RIR/Indri.html" class="link">RIR::Indri</a><br /> |
183 | -Class <a href="RIR/Corpus.html" class="link">RIR::Corpus</a><br /> | |
163 | +Module <a href="RIR/TreeTagger.html" class="link">RIR::TreeTagger</a><br /> | |
164 | +Class <a href="RIR/Document.html" class="link">RIR::Document</a><br /> | |
184 | 165 | Class <a href="RIR/Query.html" class="link">RIR::Query</a><br /> |
166 | +Class <a href="RIR/WebDocument.html" class="link">RIR::WebDocument</a><br /> | |
167 | +Class <a href="RIR/WikipediaPage.html" class="link">RIR::WikipediaPage</a><br /> | |
185 | 168 | |
186 | - </div> | |
187 | - | |
188 | - <div id="constants-list"> | |
189 | - <h3 class="section-bar">Constants</h3> | |
190 | - | |
191 | - <div class="name-list"> | |
192 | - <table summary="Constants"> | |
193 | - | |
194 | - <tr class="top-aligned-row context-row"> | |
195 | - <td class="context-item-name">Stoplist</td> | |
196 | - <td>=</td> | |
197 | - <td class="context-item-value">[ "a", "anything", "anyway", "anywhere", "apart", "are", "around", "as", "at", "av", "be", "became", "because", "become", "becomes", "becoming", "been", "before", "beforehand", "behind", "being", "below", "beside", "besides", "between", "beyond", "both", "but", "by", "can", "cannot", "canst", "certain", "cf", "choose", "contrariwise", "cos", "could", "cu", "day", "do", "does", "doesn't", "doing", "dost", "doth", "double", "down", "dual", "during", "each", "either", "else", "elsewhere", "enough", "et", "etc", "even", "ever", "every", "everybody", "everyone", "everything", "everywhere", "except", "excepted", "excepting", "exception", "exclude", "excluding", "exclusive", "far", "farther", "farthest", "few", "ff", "first", "for", "formerly", "forth", "forward", "from", "front", "further", "furthermore", "furthest", "get", "go", "had", "halves", "hardly", "has", "hast", "hath", "have", "he", "hence", "henceforth", "her", "here", "hereabouts", "hereafter", "hereby", "herein", "hereto", "hereupon", "hers", "herself", "him", "himself", "hindmost", "his", "hither", "hitherto", "how", "however", "howsoever", "i", "ie", "if", "in", "inasmuch", "inc", "include", "included", "including", "indeed", "indoors", "inside", "insomuch", "instead", "into", "inward", "inwards", "is", "it", "its", "itself", "just", "kind", "kg", "km", "last", "latter", "latterly", "less", "lest", "let", "like", "little", "ltd", "many", "may", "maybe", "me", "meantime", "meanwhile", "might", "moreover", "most", "mostly", "more", "mr", "mrs", "ms", "much", "must", "my", "myself", "namely", "need", "neither", "never", "nevertheless", "next", "no", "nobody", "none", "nonetheless", "noone", "nope", "nor", "not", "nothing", "notwithstanding", "now", "nowadays", "nowhere", "of", "off", "often", "ok", "on", "once", "one", "only", "onto", "or", "other", "others", "otherwise", "ought", "our", "ours", "ourselves", "out", "outside", "over", "own", "per", "perhaps", "plenty", 
"provide", "quite", "rather", "really", "round", "said", "sake", "same", "sang", "save", "saw", "see", "seeing", "seem", "seemed", "seeming", "seems", "seen", "seldom", "selves", "sent", "several", "shalt", "she", "should", "shown", "sideways", "since", "slept", "slew", "slung", "slunk", "smote", "so", "some", "somebody", "somehow", "someone", "something", "sometime", "sometimes", "somewhat", "somewhere", "spake", "spat", "spoke", "spoken", "sprang", "sprung", "stave", "staves", "still", "such", "supposing", "than", "that", "the", "thee", "their", "them", "themselves", "then", "thence", "thenceforth", "there", "thereabout", "thereabouts", "thereafter", "thereby", "therefore", "therein", "thereof", "thereon", "thereto", "thereupon", "these", "they", "this", "those", "thou", "though", "thrice", "through", "throughout", "thru", "thus", "thy", "thyself", "till", "to", "together", "too", "toward", "towards", "ugh", "unable", "under", "underneath", "unless", "unlike", "until", "up", "upon", "upward", "upwards", "us", "use", "used", "using", "very", "via", "vs", "want", "was", "we", "week", "well", "were", "what", "whatever", "whatsoever", "when", "whence", "whenever", "whensoever", "where", "whereabouts", "whereafter", "whereas", "whereat", "whereby", "wherefore", "wherefrom", "wherein", "whereinto", "whereof", "whereon", "wheresoever", "whereto", "whereunto", "whereupon", "wherever", "wherewith", "whether", "whew", "which", "whichever", "whichsoever", "while", "whilst", "whither", "who", "whoa", "whoever", "whole", "whom", "whomever", "whomsoever", "whose", "whosoever", "why", "will", "wilt", "with", "within", "without", "worse", "worst", "would", "wow", "ye", "yet", "year", "yippee", "you", "your", "yours", "yourself", "yourselves" ]</td> | |
198 | - | |
199 | - <td> </td> | |
200 | - <td class="context-item-desc"> | |
201 | -These are the default stopwords provided by Lemur. | |
202 | - | |
203 | -</td> | |
204 | - | |
205 | - </tr> | |
206 | - | |
207 | - </table> | |
208 | - </div> | |
209 | 169 | </div> |
210 | 170 | |
211 | 171 |
doc/classes/RIR/Document.html
... | ... | @@ -99,16 +99,18 @@ |
99 | 99 | |
100 | 100 | <div class="name-list"> |
101 | 101 | |
102 | - <a href="#M000021">count_words</a> | |
102 | + <a href="#M000010">count_words</a> | |
103 | 103 | |
104 | - <a href="#M000022">entropy</a> | |
104 | + <a href="#M000011">entropy</a> | |
105 | 105 | |
106 | - <a href="#M000019">format_words</a> | |
106 | + <a href="#M000008">format_words</a> | |
107 | 107 | |
108 | - <a href="#M000023">new</a> | |
108 | + <a href="#M000013">new</a> | |
109 | 109 | |
110 | - <a href="#M000020">ngrams</a> | |
110 | + <a href="#M000009">ngrams</a> | |
111 | 111 | |
112 | + <a href="#M000012">tf</a> | |
113 | + | |
112 | 114 | </div> |
113 | 115 | </div> |
114 | 116 | |
115 | 117 | |
... | ... | @@ -154,13 +156,13 @@ |
154 | 156 | <h3 class="section-bar">Public Class methods</h3> |
155 | 157 | |
156 | 158 | |
157 | - <div id="method-M000023" class="method-detail"> | |
158 | - <a name="M000023"></a> | |
159 | + <div id="method-M000013" class="method-detail"> | |
160 | + <a name="M000013"></a> | |
159 | 161 | |
160 | 162 | <div class="method-heading"> |
161 | 163 | |
162 | - <a href="Document.src/M000023.html" target="Code" class="method-signature" | |
163 | - onclick="popupCode('Document.src/M000023.html');return false;"> | |
164 | + <a href="Document.src/M000013.html" target="Code" class="method-signature" | |
165 | + onclick="popupCode('Document.src/M000013.html');return false;"> | |
164 | 166 | |
165 | 167 | <span class="method-name">new</span><span class="method-args">(content)</span> |
166 | 168 | |
167 | 169 | |
... | ... | @@ -177,13 +179,13 @@ |
177 | 179 | <h3 class="section-bar">Public Instance methods</h3> |
178 | 180 | |
179 | 181 | |
180 | - <div id="method-M000021" class="method-detail"> | |
181 | - <a name="M000021"></a> | |
182 | + <div id="method-M000010" class="method-detail"> | |
183 | + <a name="M000010"></a> | |
182 | 184 | |
183 | 185 | <div class="method-heading"> |
184 | 186 | |
185 | - <a href="Document.src/M000021.html" target="Code" class="method-signature" | |
186 | - onclick="popupCode('Document.src/M000021.html');return false;"> | |
187 | + <a href="Document.src/M000010.html" target="Code" class="method-signature" | |
188 | + onclick="popupCode('Document.src/M000010.html');return false;"> | |
187 | 189 | |
188 | 190 | <span class="method-name">count_words</span><span class="method-args">()</span> |
189 | 191 | |
190 | 192 | |
... | ... | @@ -205,13 +207,13 @@ |
205 | 207 | </div> |
206 | 208 | |
207 | 209 | |
208 | - <div id="method-M000022" class="method-detail"> | |
209 | - <a name="M000022"></a> | |
210 | + <div id="method-M000011" class="method-detail"> | |
211 | + <a name="M000011"></a> | |
210 | 212 | |
211 | 213 | <div class="method-heading"> |
212 | 214 | |
213 | - <a href="Document.src/M000022.html" target="Code" class="method-signature" | |
214 | - onclick="popupCode('Document.src/M000022.html');return false;"> | |
215 | + <a href="Document.src/M000011.html" target="Code" class="method-signature" | |
216 | + onclick="popupCode('Document.src/M000011.html');return false;"> | |
215 | 217 | |
216 | 218 | <span class="method-name">entropy</span><span class="method-args">(s)</span> |
217 | 219 | |
218 | 220 | |
219 | 221 | |
... | ... | @@ -229,20 +231,21 @@ |
229 | 231 | whitespace(s)), it is considered as an ngram. |
230 | 232 | </p> |
231 | 233 | <pre> |
232 | - entropy("guitar") #=> 0.00389919463243839 | |
234 | + entropy("guitar") #=> 0.00432114812727959 | |
235 | + entropy("dillinger escape plan") #=> 0.265862076325102 | |
233 | 236 | </pre> |
234 | 237 | |
235 | 238 | </div> |
236 | 239 | </div> |
237 | 240 | |
238 | 241 | |
239 | - <div id="method-M000020" class="method-detail"> | |
240 | - <a name="M000020"></a> | |
242 | + <div id="method-M000009" class="method-detail"> | |
243 | + <a name="M000009"></a> | |
241 | 244 | |
242 | 245 | <div class="method-heading"> |
243 | 246 | |
244 | - <a href="Document.src/M000020.html" target="Code" class="method-signature" | |
245 | - onclick="popupCode('Document.src/M000020.html');return false;"> | |
247 | + <a href="Document.src/M000009.html" target="Code" class="method-signature" | |
248 | + onclick="popupCode('Document.src/M000009.html');return false;"> | |
246 | 249 | |
247 | 250 | <span class="method-name">ngrams</span><span class="method-args">(n)</span> |
248 | 251 | |
249 | 252 | |
250 | 253 | |
... | ... | @@ -264,16 +267,43 @@ |
264 | 267 | </div> |
265 | 268 | |
266 | 269 | |
270 | + <div id="method-M000012" class="method-detail"> | |
271 | + <a name="M000012"></a> | |
272 | + | |
273 | + <div class="method-heading"> | |
274 | + | |
275 | + <a href="Document.src/M000012.html" target="Code" class="method-signature" | |
276 | + onclick="popupCode('Document.src/M000012.html');return false;"> | |
277 | + | |
278 | + <span class="method-name">tf</span><span class="method-args">(s)</span> | |
279 | + | |
280 | + </a> | |
281 | + | |
282 | + </div> | |
283 | + | |
284 | + <div class="method-description"> | |
285 | + | |
286 | + <p> | |
287 | +Computes the term frequency of a given <b>word</b> <tt>s</tt>. | |
288 | +</p> | |
289 | +<pre> | |
290 | + tf("guitar") #=> 0.000380372765310004 | |
291 | +</pre> | |
292 | + | |
293 | + </div> | |
294 | + </div> | |
295 | + | |
296 | + | |
267 | 297 | <h3 class="section-bar">Protected Instance methods</h3> |
268 | 298 | |
269 | 299 | |
270 | - <div id="method-M000019" class="method-detail"> | |
271 | - <a name="M000019"></a> | |
300 | + <div id="method-M000008" class="method-detail"> | |
301 | + <a name="M000008"></a> | |
272 | 302 | |
273 | 303 | <div class="method-heading"> |
274 | 304 | |
275 | - <a href="Document.src/M000019.html" target="Code" class="method-signature" | |
276 | - onclick="popupCode('Document.src/M000019.html');return false;"> | |
305 | + <a href="Document.src/M000008.html" target="Code" class="method-signature" | |
306 | + onclick="popupCode('Document.src/M000008.html');return false;"> | |
277 | 307 | |
278 | 308 | <span class="method-name">format_words</span><span class="method-args">()</span> |
279 | 309 |
doc/classes/RIR/Document.src/M000008.html
1 | +<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Strict//EN" | |
2 | +"http://www.w3.org/TR/xhtml1/DTD/xhtml1-strict.dtd"> | |
3 | +<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en"> | |
4 | +<head> | |
5 | + <title>format_words (RIR::Document)</title> | |
6 | + <meta http-equiv="Content-Type" content="text/html; charset=utf-8" /> | |
7 | + <link rel="stylesheet" href="../../.././rdoc-style.css" type="text/css" media="screen" /> | |
8 | +</head> | |
9 | +<body class="standalone-code"> | |
10 | + <pre><span class="ruby-comment cmt"># File lib/rir/document.rb, line 31</span> | |
11 | + <span class="ruby-keyword kw">def</span> <span class="ruby-identifier">format_words</span> | |
12 | + <span class="ruby-identifier">wo</span> = [] | |
13 | + | |
14 | + <span class="ruby-ivar">@doc_content</span>.<span class="ruby-identifier">split</span>.<span class="ruby-identifier">each</span> <span class="ruby-keyword kw">do</span> <span class="ruby-operator">|</span><span class="ruby-identifier">w</span><span class="ruby-operator">|</span> | |
15 | + <span class="ruby-identifier">w</span>.<span class="ruby-identifier">split</span>(<span class="ruby-regexp re">/\W/</span>).<span class="ruby-identifier">each</span> <span class="ruby-keyword kw">do</span> <span class="ruby-operator">|</span><span class="ruby-identifier">sw</span><span class="ruby-operator">|</span> | |
16 | + <span class="ruby-identifier">wo</span>.<span class="ruby-identifier">push</span>(<span class="ruby-identifier">sw</span>.<span class="ruby-identifier">downcase</span>) <span class="ruby-keyword kw">if</span> <span class="ruby-identifier">sw</span> <span class="ruby-operator">=~</span> <span class="ruby-regexp re">/[a-zA-Z]/</span> | |
17 | + <span class="ruby-keyword kw">end</span> | |
18 | + <span class="ruby-keyword kw">end</span> | |
19 | + | |
20 | + <span class="ruby-identifier">wo</span> | |
21 | + <span class="ruby-keyword kw">end</span></pre> | |
22 | +</body> | |
23 | +</html> |
doc/classes/RIR/Document.src/M000009.html
1 | +<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Strict//EN" | |
2 | +"http://www.w3.org/TR/xhtml1/DTD/xhtml1-strict.dtd"> | |
3 | +<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en"> | |
4 | +<head> | |
5 | + <title>ngrams (RIR::Document)</title> | |
6 | + <meta http-equiv="Content-Type" content="text/html; charset=utf-8" /> | |
7 | + <link rel="stylesheet" href="../../.././rdoc-style.css" type="text/css" media="screen" /> | |
8 | +</head> | |
9 | +<body class="standalone-code"> | |
10 | + <pre><span class="ruby-comment cmt"># File lib/rir/document.rb, line 46</span> | |
11 | + <span class="ruby-keyword kw">def</span> <span class="ruby-identifier">ngrams</span>(<span class="ruby-identifier">n</span>) | |
12 | + <span class="ruby-identifier">window</span> = [] | |
13 | + <span class="ruby-identifier">ngrams_array</span> = [] | |
14 | + | |
15 | + <span class="ruby-ivar">@words</span>.<span class="ruby-identifier">each</span> <span class="ruby-keyword kw">do</span> <span class="ruby-operator">|</span><span class="ruby-identifier">w</span><span class="ruby-operator">|</span> | |
16 | + <span class="ruby-identifier">window</span>.<span class="ruby-identifier">push</span>(<span class="ruby-identifier">w</span>) | |
17 | + <span class="ruby-keyword kw">if</span> <span class="ruby-identifier">window</span>.<span class="ruby-identifier">size</span> <span class="ruby-operator">==</span> <span class="ruby-identifier">n</span> | |
18 | + <span class="ruby-identifier">ngrams_array</span>.<span class="ruby-identifier">push</span> <span class="ruby-identifier">window</span>.<span class="ruby-identifier">join</span>(<span class="ruby-value str">" "</span>) | |
19 | + <span class="ruby-identifier">window</span>.<span class="ruby-identifier">delete_at</span>(<span class="ruby-value">0</span>) | |
20 | + <span class="ruby-keyword kw">end</span> | |
21 | + <span class="ruby-keyword kw">end</span> | |
22 | + | |
23 | + <span class="ruby-identifier">ngrams_array</span>.<span class="ruby-identifier">uniq</span> | |
24 | + <span class="ruby-keyword kw">end</span></pre> | |
25 | +</body> | |
26 | +</html> |
doc/classes/RIR/Document.src/M000010.html
... | ... | @@ -2,22 +2,17 @@ |
2 | 2 | "http://www.w3.org/TR/xhtml1/DTD/xhtml1-strict.dtd"> |
3 | 3 | <html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en"> |
4 | 4 | <head> |
5 | - <title>format_words (RIR::Document)</title> | |
5 | + <title>count_words (RIR::Document)</title> | |
6 | 6 | <meta http-equiv="Content-Type" content="text/html; charset=utf-8" /> |
7 | 7 | <link rel="stylesheet" href="../../.././rdoc-style.css" type="text/css" media="screen" /> |
8 | 8 | </head> |
9 | 9 | <body class="standalone-code"> |
10 | - <pre><span class="ruby-comment cmt"># File lib/rir/document.rb, line 31</span> | |
11 | - <span class="ruby-keyword kw">def</span> <span class="ruby-identifier">format_words</span> | |
12 | - <span class="ruby-identifier">wo</span> = [] | |
10 | + <pre><span class="ruby-comment cmt"># File lib/rir/document.rb, line 64</span> | |
11 | + <span class="ruby-keyword kw">def</span> <span class="ruby-identifier">count_words</span> | |
12 | + <span class="ruby-identifier">counts</span> = <span class="ruby-constant">Hash</span>.<span class="ruby-identifier">new</span> { <span class="ruby-operator">|</span><span class="ruby-identifier">h</span>,<span class="ruby-identifier">k</span><span class="ruby-operator">|</span> <span class="ruby-identifier">h</span>[<span class="ruby-identifier">k</span>] = <span class="ruby-value">0</span> } | |
13 | + <span class="ruby-ivar">@words</span>.<span class="ruby-identifier">each</span> { <span class="ruby-operator">|</span><span class="ruby-identifier">w</span><span class="ruby-operator">|</span> <span class="ruby-identifier">counts</span>[<span class="ruby-identifier">w</span>] <span class="ruby-operator">+=</span> <span class="ruby-value">1</span> } | |
13 | 14 | |
14 | - <span class="ruby-ivar">@doc_content</span>.<span class="ruby-identifier">split</span>.<span class="ruby-identifier">each</span> <span class="ruby-keyword kw">do</span> <span class="ruby-operator">|</span><span class="ruby-identifier">w</span><span class="ruby-operator">|</span> | |
15 | - <span class="ruby-identifier">w</span>.<span class="ruby-identifier">split</span>(<span class="ruby-regexp re">/\W/</span>).<span class="ruby-identifier">each</span> <span class="ruby-keyword kw">do</span> <span class="ruby-operator">|</span><span class="ruby-identifier">sw</span><span class="ruby-operator">|</span> | |
16 | - <span class="ruby-identifier">wo</span>.<span class="ruby-identifier">push</span>(<span class="ruby-identifier">sw</span>) <span class="ruby-keyword kw">if</span> <span class="ruby-identifier">sw</span> <span class="ruby-operator">=~</span> <span class="ruby-regexp re">/[a-zA-Z]/</span> | |
17 | - <span class="ruby-keyword kw">end</span> | |
18 | - <span class="ruby-keyword kw">end</span> | |
19 | - | |
20 | - <span class="ruby-identifier">wo</span> | |
15 | + <span class="ruby-identifier">counts</span> | |
21 | 16 | <span class="ruby-keyword kw">end</span></pre> |
22 | 17 | </body> |
23 | 18 | </html> |
doc/classes/RIR/Document.src/M000011.html
... | ... | @@ -2,25 +2,23 @@ |
2 | 2 | "http://www.w3.org/TR/xhtml1/DTD/xhtml1-strict.dtd"> |
3 | 3 | <html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en"> |
4 | 4 | <head> |
5 | - <title>ngrams (RIR::Document)</title> | |
5 | + <title>entropy (RIR::Document)</title> | |
6 | 6 | <meta http-equiv="Content-Type" content="text/html; charset=utf-8" /> |
7 | 7 | <link rel="stylesheet" href="../../.././rdoc-style.css" type="text/css" media="screen" /> |
8 | 8 | </head> |
9 | 9 | <body class="standalone-code"> |
10 | - <pre><span class="ruby-comment cmt"># File lib/rir/document.rb, line 46</span> | |
11 | - <span class="ruby-keyword kw">def</span> <span class="ruby-identifier">ngrams</span>(<span class="ruby-identifier">n</span>) | |
12 | - <span class="ruby-identifier">window</span> = [] | |
13 | - <span class="ruby-identifier">ngrams_array</span> = [] | |
10 | + <pre><span class="ruby-comment cmt"># File lib/rir/document.rb, line 78</span> | |
11 | + <span class="ruby-keyword kw">def</span> <span class="ruby-identifier">entropy</span>(<span class="ruby-identifier">s</span>) | |
12 | + <span class="ruby-identifier">en</span> = <span class="ruby-value">0</span><span class="ruby-value">.0</span> | |
13 | + <span class="ruby-identifier">counts</span> = <span class="ruby-keyword kw">self</span>.<span class="ruby-identifier">count_words</span> | |
14 | 14 | |
15 | - <span class="ruby-ivar">@words</span>.<span class="ruby-identifier">each</span> <span class="ruby-keyword kw">do</span> <span class="ruby-operator">|</span><span class="ruby-identifier">w</span><span class="ruby-operator">|</span> | |
16 | - <span class="ruby-identifier">window</span>.<span class="ruby-identifier">push</span>(<span class="ruby-identifier">w</span>) | |
17 | - <span class="ruby-keyword kw">if</span> <span class="ruby-identifier">window</span>.<span class="ruby-identifier">size</span> <span class="ruby-operator">==</span> <span class="ruby-identifier">n</span> | |
18 | - <span class="ruby-identifier">ngrams_array</span>.<span class="ruby-identifier">push</span> <span class="ruby-identifier">window</span>.<span class="ruby-identifier">join</span>(<span class="ruby-value str">" "</span>) | |
19 | - <span class="ruby-identifier">window</span>.<span class="ruby-identifier">delete_at</span>(<span class="ruby-value">0</span>) | |
20 | - <span class="ruby-keyword kw">end</span> | |
15 | + <span class="ruby-identifier">s</span>.<span class="ruby-identifier">split</span>.<span class="ruby-identifier">each</span> <span class="ruby-keyword kw">do</span> <span class="ruby-operator">|</span><span class="ruby-identifier">w</span><span class="ruby-operator">|</span> | |
16 | + <span class="ruby-identifier">p_wi</span> = <span class="ruby-identifier">counts</span>[<span class="ruby-identifier">w</span>].<span class="ruby-identifier">to_f</span><span class="ruby-operator">/</span><span class="ruby-ivar">@words</span>.<span class="ruby-identifier">count</span>.<span class="ruby-identifier">to_f</span> | |
17 | + <span class="ruby-identifier">en</span> <span class="ruby-operator">+=</span> <span class="ruby-identifier">p_wi</span><span class="ruby-operator">*</span><span class="ruby-constant">Math</span>.<span class="ruby-identifier">log2</span>(<span class="ruby-identifier">p_wi</span>) | |
21 | 18 | <span class="ruby-keyword kw">end</span> |
22 | 19 | |
23 | - <span class="ruby-identifier">ngrams_array</span>.<span class="ruby-identifier">uniq</span> | |
20 | + <span class="ruby-identifier">en</span> <span class="ruby-operator">*=</span> <span class="ruby-value">-1</span> | |
21 | + <span class="ruby-identifier">en</span> | |
24 | 22 | <span class="ruby-keyword kw">end</span></pre> |
25 | 23 | </body> |
26 | 24 | </html> |
doc/classes/RIR/Document.src/M000012.html
... | ... | @@ -2,17 +2,14 @@ |
2 | 2 | "http://www.w3.org/TR/xhtml1/DTD/xhtml1-strict.dtd"> |
3 | 3 | <html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en"> |
4 | 4 | <head> |
5 | - <title>count_words (RIR::Document)</title> | |
5 | + <title>tf (RIR::Document)</title> | |
6 | 6 | <meta http-equiv="Content-Type" content="text/html; charset=utf-8" /> |
7 | 7 | <link rel="stylesheet" href="../../.././rdoc-style.css" type="text/css" media="screen" /> |
8 | 8 | </head> |
9 | 9 | <body class="standalone-code"> |
10 | - <pre><span class="ruby-comment cmt"># File lib/rir/document.rb, line 64</span> | |
11 | - <span class="ruby-keyword kw">def</span> <span class="ruby-identifier">count_words</span> | |
12 | - <span class="ruby-identifier">counts</span> = <span class="ruby-constant">Hash</span>.<span class="ruby-identifier">new</span> { <span class="ruby-operator">|</span><span class="ruby-identifier">h</span>,<span class="ruby-identifier">k</span><span class="ruby-operator">|</span> <span class="ruby-identifier">h</span>[<span class="ruby-identifier">k</span>] = <span class="ruby-value">0</span> } | |
13 | - <span class="ruby-ivar">@words</span>.<span class="ruby-identifier">each</span> { <span class="ruby-operator">|</span><span class="ruby-identifier">w</span><span class="ruby-operator">|</span> <span class="ruby-identifier">counts</span>[<span class="ruby-identifier">w</span>.<span class="ruby-identifier">downcase</span>] <span class="ruby-operator">+=</span> <span class="ruby-value">1</span> } | |
14 | - | |
15 | - <span class="ruby-identifier">counts</span> | |
10 | + <pre><span class="ruby-comment cmt"># File lib/rir/document.rb, line 94</span> | |
11 | + <span class="ruby-keyword kw">def</span> <span class="ruby-identifier">tf</span>(<span class="ruby-identifier">s</span>) | |
12 | + <span class="ruby-keyword kw">self</span>.<span class="ruby-identifier">count_words</span>[<span class="ruby-identifier">s</span>].<span class="ruby-identifier">to_f</span><span class="ruby-operator">/</span><span class="ruby-ivar">@words</span>.<span class="ruby-identifier">size</span>.<span class="ruby-identifier">to_f</span> | |
16 | 13 | <span class="ruby-keyword kw">end</span></pre> |
17 | 14 | </body> |
18 | 15 | </html> |
doc/classes/RIR/Document.src/M000013.html
... | ... | @@ -2,23 +2,15 @@ |
2 | 2 | "http://www.w3.org/TR/xhtml1/DTD/xhtml1-strict.dtd"> |
3 | 3 | <html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en"> |
4 | 4 | <head> |
5 | - <title>entropy (RIR::Document)</title> | |
5 | + <title>new (RIR::Document)</title> | |
6 | 6 | <meta http-equiv="Content-Type" content="text/html; charset=utf-8" /> |
7 | 7 | <link rel="stylesheet" href="../../.././rdoc-style.css" type="text/css" media="screen" /> |
8 | 8 | </head> |
9 | 9 | <body class="standalone-code"> |
10 | - <pre><span class="ruby-comment cmt"># File lib/rir/document.rb, line 77</span> | |
11 | - <span class="ruby-keyword kw">def</span> <span class="ruby-identifier">entropy</span>(<span class="ruby-identifier">s</span>) | |
12 | - <span class="ruby-identifier">en</span> = <span class="ruby-value">0</span><span class="ruby-value">.0</span> | |
13 | - <span class="ruby-identifier">counts</span> = <span class="ruby-keyword kw">self</span>.<span class="ruby-identifier">count_words</span> | |
14 | - | |
15 | - <span class="ruby-identifier">s</span>.<span class="ruby-identifier">split</span>.<span class="ruby-identifier">each</span> <span class="ruby-keyword kw">do</span> <span class="ruby-operator">|</span><span class="ruby-identifier">w</span><span class="ruby-operator">|</span> | |
16 | - <span class="ruby-identifier">p_wi</span> = <span class="ruby-identifier">counts</span>[<span class="ruby-identifier">w</span>].<span class="ruby-identifier">to_f</span><span class="ruby-operator">/</span><span class="ruby-ivar">@words</span>.<span class="ruby-identifier">count</span>.<span class="ruby-identifier">to_f</span> | |
17 | - <span class="ruby-identifier">en</span> <span class="ruby-operator">+=</span> <span class="ruby-identifier">p_wi</span><span class="ruby-operator">*</span><span class="ruby-constant">Math</span>.<span class="ruby-identifier">log2</span>(<span class="ruby-identifier">p_wi</span>) | |
18 | - <span class="ruby-keyword kw">end</span> | |
19 | - | |
20 | - <span class="ruby-identifier">en</span> <span class="ruby-operator">*=</span> <span class="ruby-value">-1</span> | |
21 | - <span class="ruby-identifier">en</span> | |
10 | + <pre><span class="ruby-comment cmt"># File lib/rir/document.rb, line 99</span> | |
11 | + <span class="ruby-keyword kw">def</span> <span class="ruby-identifier">initialize</span>(<span class="ruby-identifier">content</span>) | |
12 | + <span class="ruby-ivar">@doc_content</span> = <span class="ruby-identifier">content</span> | |
13 | + <span class="ruby-ivar">@words</span> = <span class="ruby-identifier">format_words</span> | |
22 | 14 | <span class="ruby-keyword kw">end</span></pre> |
23 | 15 | </body> |
24 | 16 | </html> |
doc/classes/RIR/Indri/IndriQuery.html
... | ... | @@ -95,9 +95,9 @@ |
95 | 95 | |
96 | 96 | <div class="name-list"> |
97 | 97 | |
98 | - <a href="#M000014">new</a> | |
98 | + <a href="#M000006">new</a> | |
99 | 99 | |
100 | - <a href="#M000015">to_s</a> | |
100 | + <a href="#M000007">to_s</a> | |
101 | 101 | |
102 | 102 | </div> |
103 | 103 | </div> |
104 | 104 | |
... | ... | @@ -160,13 +160,13 @@ |
160 | 160 | <h3 class="section-bar">Public Class methods</h3> |
161 | 161 | |
162 | 162 | |
163 | - <div id="method-M000014" class="method-detail"> | |
164 | - <a name="M000014"></a> | |
163 | + <div id="method-M000006" class="method-detail"> | |
164 | + <a name="M000006"></a> | |
165 | 165 | |
166 | 166 | <div class="method-heading"> |
167 | 167 | |
168 | - <a href="IndriQuery.src/M000014.html" target="Code" class="method-signature" | |
169 | - onclick="popupCode('IndriQuery.src/M000014.html');return false;"> | |
168 | + <a href="IndriQuery.src/M000006.html" target="Code" class="method-signature" | |
169 | + onclick="popupCode('IndriQuery.src/M000006.html');return false;"> | |
170 | 170 | |
171 | 171 | <span class="method-name">new</span><span class="method-args">(id,query,params)</span> |
172 | 172 | |
173 | 173 | |
... | ... | @@ -183,13 +183,13 @@ |
183 | 183 | <h3 class="section-bar">Public Instance methods</h3> |
184 | 184 | |
185 | 185 | |
186 | - <div id="method-M000015" class="method-detail"> | |
187 | - <a name="M000015"></a> | |
186 | + <div id="method-M000007" class="method-detail"> | |
187 | + <a name="M000007"></a> | |
188 | 188 | |
189 | 189 | <div class="method-heading"> |
190 | 190 | |
191 | - <a href="IndriQuery.src/M000015.html" target="Code" class="method-signature" | |
192 | - onclick="popupCode('IndriQuery.src/M000015.html');return false;"> | |
191 | + <a href="IndriQuery.src/M000007.html" target="Code" class="method-signature" | |
192 | + onclick="popupCode('IndriQuery.src/M000007.html');return false;"> | |
193 | 193 | |
194 | 194 | <span class="method-name">to_s</span><span class="method-args">()</span> |
195 | 195 |
doc/classes/RIR/Indri/IndriQuery.src/M000006.html
1 | +<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Strict//EN" | |
2 | +"http://www.w3.org/TR/xhtml1/DTD/xhtml1-strict.dtd"> | |
3 | +<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en"> | |
4 | +<head> | |
5 | + <title>new (RIR::Indri::IndriQuery)</title> | |
6 | + <meta http-equiv="Content-Type" content="text/html; charset=utf-8" /> | |
7 | + <link rel="stylesheet" href="../../../.././rdoc-style.css" type="text/css" media="screen" /> | |
8 | +</head> | |
9 | +<body class="standalone-code"> | |
10 | + <pre><span class="ruby-comment cmt"># File lib/rir/query.rb, line 62</span> | |
11 | + <span class="ruby-keyword kw">def</span> <span class="ruby-identifier">initialize</span>(<span class="ruby-identifier">id</span>,<span class="ruby-identifier">query</span>,<span class="ruby-identifier">params</span>) | |
12 | + <span class="ruby-ivar">@params</span> = <span class="ruby-identifier">params</span> | |
13 | + <span class="ruby-comment cmt"># Here we set the default retrieval model as Language Modeling</span> | |
14 | + <span class="ruby-comment cmt"># with a Dirichlet smoothing at 2500.</span> | |
15 | + <span class="ruby-comment cmt"># TODO: maybe a Rule class...</span> | |
16 | + <span class="ruby-ivar">@params</span>.<span class="ruby-identifier">rule</span> = <span class="ruby-value str">'method:dirichlet,mu:2500'</span> <span class="ruby-keyword kw">if</span> <span class="ruby-ivar">@params</span>.<span class="ruby-identifier">rule</span>.<span class="ruby-identifier">nil?</span> | |
17 | + | |
18 | + <span class="ruby-ivar">@id</span> = <span class="ruby-identifier">id</span> | |
19 | + <span class="ruby-ivar">@query</span> = <span class="ruby-identifier">query</span> | |
20 | + <span class="ruby-keyword kw">end</span></pre> | |
21 | +</body> | |
22 | +</html> |
doc/classes/RIR/Indri/IndriQuery.src/M000007.html
1 | +<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Strict//EN" | |
2 | +"http://www.w3.org/TR/xhtml1/DTD/xhtml1-strict.dtd"> | |
3 | +<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en"> | |
4 | +<head> | |
5 | + <title>to_s (RIR::Indri::IndriQuery)</title> | |
6 | + <meta http-equiv="Content-Type" content="text/html; charset=utf-8" /> | |
7 | + <link rel="stylesheet" href="../../../.././rdoc-style.css" type="text/css" media="screen" /> | |
8 | +</head> | |
9 | +<body class="standalone-code"> | |
10 | + <pre><span class="ruby-comment cmt"># File lib/rir/query.rb, line 73</span> | |
11 | + <span class="ruby-keyword kw">def</span> <span class="ruby-identifier">to_s</span> | |
12 | + <span class="ruby-identifier">h</span> = <span class="ruby-ivar">@params</span>.<span class="ruby-identifier">to_s</span> | |
13 | + <span class="ruby-identifier">h</span> <span class="ruby-operator">+=</span> <span class="ruby-value str">"<query>\n"</span> | |
14 | + <span class="ruby-identifier">h</span> <span class="ruby-operator">+=</span> <span class="ruby-node">"<number>#{@id}</number>\n"</span> | |
15 | + <span class="ruby-identifier">h</span> <span class="ruby-operator">+=</span> <span class="ruby-node">"<text>#{@query}</text>\n"</span> | |
16 | + <span class="ruby-identifier">h</span> <span class="ruby-operator">+=</span> <span class="ruby-value str">"</query>\n"</span> | |
17 | + <span class="ruby-identifier">h</span> <span class="ruby-operator">+=</span> <span class="ruby-value str">"</parameters>"</span> | |
18 | + | |
19 | + <span class="ruby-identifier">h</span> | |
20 | + <span class="ruby-keyword kw">end</span></pre> | |
21 | +</body> | |
22 | +</html> |
doc/classes/RIR/Indri/Parameters.html
... | ... | @@ -91,9 +91,9 @@ |
91 | 91 | |
92 | 92 | <div class="name-list"> |
93 | 93 | |
94 | - <a href="#M000012">new</a> | |
94 | + <a href="#M000004">new</a> | |
95 | 95 | |
96 | - <a href="#M000013">to_s</a> | |
96 | + <a href="#M000005">to_s</a> | |
97 | 97 | |
98 | 98 | </div> |
99 | 99 | </div> |
... | ... | @@ -121,7 +121,7 @@ |
121 | 121 | </tr> |
122 | 122 | |
123 | 123 | <tr class="top-aligned-row context-row"> |
124 | - <td class="context-item-name">corpus</td> | |
124 | + <td class="context-item-name">count</td> | |
125 | 125 | |
126 | 126 | <td class="context-item-value"> [RW] </td> |
127 | 127 | |
... | ... | @@ -129,7 +129,7 @@ |
129 | 129 | </tr> |
130 | 130 | |
131 | 131 | <tr class="top-aligned-row context-row"> |
132 | - <td class="context-item-name">count</td> | |
132 | + <td class="context-item-name">index_path</td> | |
133 | 133 | |
134 | 134 | <td class="context-item-value"> [RW] </td> |
135 | 135 | |
136 | 136 | |
... | ... | @@ -196,13 +196,13 @@ |
196 | 196 | <h3 class="section-bar">Public Class methods</h3> |
197 | 197 | |
198 | 198 | |
199 | - <div id="method-M000012" class="method-detail"> | |
200 | - <a name="M000012"></a> | |
199 | + <div id="method-M000004" class="method-detail"> | |
200 | + <a name="M000004"></a> | |
201 | 201 | |
202 | 202 | <div class="method-heading"> |
203 | 203 | |
204 | - <a href="Parameters.src/M000012.html" target="Code" class="method-signature" | |
205 | - onclick="popupCode('Parameters.src/M000012.html');return false;"> | |
204 | + <a href="Parameters.src/M000004.html" target="Code" class="method-signature" | |
205 | + onclick="popupCode('Parameters.src/M000004.html');return false;"> | |
206 | 206 | |
207 | 207 | <span class="method-name">new</span><span class="method-args">(corpus,mem="1g",count="1000",offset="1",run_id="default",print_query=false,print_docs=false)</span> |
208 | 208 | |
209 | 209 | |
... | ... | @@ -219,13 +219,13 @@ |
219 | 219 | <h3 class="section-bar">Public Instance methods</h3> |
220 | 220 | |
221 | 221 | |
222 | - <div id="method-M000013" class="method-detail"> | |
223 | - <a name="M000013"></a> | |
222 | + <div id="method-M000005" class="method-detail"> | |
223 | + <a name="M000005"></a> | |
224 | 224 | |
225 | 225 | <div class="method-heading"> |
226 | 226 | |
227 | - <a href="Parameters.src/M000013.html" target="Code" class="method-signature" | |
228 | - onclick="popupCode('Parameters.src/M000013.html');return false;"> | |
227 | + <a href="Parameters.src/M000005.html" target="Code" class="method-signature" | |
228 | + onclick="popupCode('Parameters.src/M000005.html');return false;"> | |
229 | 229 | |
230 | 230 | <span class="method-name">to_s</span><span class="method-args">()</span> |
231 | 231 |
doc/classes/RIR/Indri/Parameters.src/M000004.html
1 | +<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Strict//EN" | |
2 | +"http://www.w3.org/TR/xhtml1/DTD/xhtml1-strict.dtd"> | |
3 | +<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en"> | |
4 | +<head> | |
5 | + <title>new (RIR::Indri::Parameters)</title> | |
6 | + <meta http-equiv="Content-Type" content="text/html; charset=utf-8" /> | |
7 | + <link rel="stylesheet" href="../../../.././rdoc-style.css" type="text/css" media="screen" /> | |
8 | +</head> | |
9 | +<body class="standalone-code"> | |
10 | + <pre><span class="ruby-comment cmt"># File lib/rir/query.rb, line 30</span> | |
11 | + <span class="ruby-keyword kw">def</span> <span class="ruby-identifier">initialize</span>(<span class="ruby-identifier">corpus</span>,<span class="ruby-identifier">mem</span>=<span class="ruby-value str">"1g"</span>,<span class="ruby-identifier">count</span>=<span class="ruby-value str">"1000"</span>,<span class="ruby-identifier">offset</span>=<span class="ruby-value str">"1"</span>,<span class="ruby-identifier">run_id</span>=<span class="ruby-value str">"default"</span>,<span class="ruby-identifier">print_query</span>=<span class="ruby-keyword kw">false</span>,<span class="ruby-identifier">print_docs</span>=<span class="ruby-keyword kw">false</span>) | |
12 | + <span class="ruby-ivar">@index_path</span> = <span class="ruby-identifier">corpus</span> | |
13 | + <span class="ruby-ivar">@memory</span> = <span class="ruby-identifier">mem</span> | |
14 | + <span class="ruby-ivar">@count</span> = <span class="ruby-identifier">count</span> | |
15 | + <span class="ruby-ivar">@offset</span> = <span class="ruby-identifier">offset</span> | |
16 | + <span class="ruby-ivar">@run_id</span> = <span class="ruby-identifier">run_id</span> | |
17 | + <span class="ruby-ivar">@print_query</span> = <span class="ruby-identifier">print_query</span> <span class="ruby-value">? </span><span class="ruby-value str">"true"</span> <span class="ruby-operator">:</span> <span class="ruby-value str">"false"</span> | |
18 | + <span class="ruby-ivar">@print_docs</span> = <span class="ruby-identifier">print_docs</span> <span class="ruby-value">? </span><span class="ruby-value str">"true"</span> <span class="ruby-operator">:</span> <span class="ruby-value str">"false"</span> | |
19 | + <span class="ruby-keyword kw">end</span></pre> | |
20 | +</body> | |
21 | +</html> |
doc/classes/RIR/Indri/Parameters.src/M000005.html
1 | +<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Strict//EN" | |
2 | +"http://www.w3.org/TR/xhtml1/DTD/xhtml1-strict.dtd"> | |
3 | +<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en"> | |
4 | +<head> | |
5 | + <title>to_s (RIR::Indri::Parameters)</title> | |
6 | + <meta http-equiv="Content-Type" content="text/html; charset=utf-8" /> | |
7 | + <link rel="stylesheet" href="../../../.././rdoc-style.css" type="text/css" media="screen" /> | |
8 | +</head> | |
9 | +<body class="standalone-code"> | |
10 | + <pre><span class="ruby-comment cmt"># File lib/rir/query.rb, line 40</span> | |
11 | + <span class="ruby-keyword kw">def</span> <span class="ruby-identifier">to_s</span> | |
12 | + <span class="ruby-identifier">h</span> = <span class="ruby-value str">"<parameters>\n"</span> | |
13 | + <span class="ruby-identifier">h</span> <span class="ruby-operator">+=</span> <span class="ruby-node">"<memory>#{@memory}</memory>\n"</span> | |
14 | + <span class="ruby-identifier">h</span> <span class="ruby-operator">+=</span> <span class="ruby-node">"<index>#{@index_path}</index>\n"</span> | |
15 | + <span class="ruby-identifier">h</span> <span class="ruby-operator">+=</span> <span class="ruby-node">"<count>#{@count}</count>\n"</span> | |
16 | + <span class="ruby-keyword kw">unless</span> <span class="ruby-ivar">@baseline</span>.<span class="ruby-identifier">nil?</span> | |
17 | + <span class="ruby-identifier">h</span> <span class="ruby-operator">+=</span> <span class="ruby-node">"<baseline>#{@baseline}</baseline>\n"</span> | |
18 | + <span class="ruby-keyword kw">else</span> | |
19 | + <span class="ruby-identifier">h</span> <span class="ruby-operator">+=</span> <span class="ruby-node">"<rule>#{@rule}</rule>\n"</span> | |
20 | + <span class="ruby-keyword kw">end</span> | |
21 | + <span class="ruby-identifier">h</span> <span class="ruby-operator">+=</span> <span class="ruby-node">"<queryOffset>#{@offset}</queryOffset>\n"</span> | |
22 | + <span class="ruby-identifier">h</span> <span class="ruby-operator">+=</span> <span class="ruby-node">"<runID>#{@run_id}</runID>\n"</span> | |
23 | + <span class="ruby-identifier">h</span> <span class="ruby-operator">+=</span> <span class="ruby-node">"<printQuery>#{@print_query}</printQuery>\n"</span> | |
24 | + <span class="ruby-identifier">h</span> <span class="ruby-operator">+=</span> <span class="ruby-node">"<printDocuments>#{@print_docs}</printDocuments>\n"</span> | |
25 | + | |
26 | + <span class="ruby-identifier">h</span> | |
27 | + <span class="ruby-keyword kw">end</span></pre> | |
28 | +</body> | |
29 | +</html> |
doc/classes/RIR/TreeTagger.html
1 | +<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Strict//EN" | |
2 | +"http://www.w3.org/TR/xhtml1/DTD/xhtml1-strict.dtd"> | |
3 | +<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en"> | |
4 | +<head> | |
5 | + <title>Module: RIR::TreeTagger [RDoc Documentation]</title> | |
6 | + <meta http-equiv="Content-Type" content="text/html; charset=utf-8" /> | |
7 | + <meta http-equiv="Content-Script-Type" content="text/javascript" /> | |
8 | + <link rel="stylesheet" href="../.././rdoc-style.css" type="text/css" media="screen" /> | |
9 | + <script type="text/javascript"> | |
10 | + // <![CDATA[ | |
11 | + | |
12 | + function popupCode( url ) { | |
13 | + window.open(url, "Code", "resizable=yes,scrollbars=yes,toolbar=no,status=no,height=150,width=400") | |
14 | + } | |
15 | + | |
16 | + function toggleCode( id ) { | |
17 | + if ( document.getElementById ) | |
18 | + elem = document.getElementById( id ); | |
19 | + else if ( document.all ) | |
20 | + elem = eval( "document.all." + id ); | |
21 | + else | |
22 | + return false; | |
23 | + | |
24 | + elemStyle = elem.style; | |
25 | + | |
26 | + if ( elemStyle.display != "block" ) { | |
27 | + elemStyle.display = "block" | |
28 | + } else { | |
29 | + elemStyle.display = "none" | |
30 | + } | |
31 | + | |
32 | + return true; | |
33 | + } | |
34 | + | |
35 | + // Make codeblocks hidden by default | |
36 | + document.writeln( "<style type=\"text/css\">div.method-source-code { display: none }<\/style>" ) | |
37 | + | |
38 | + // ]]> | |
39 | + </script> | |
40 | + | |
41 | +</head> | |
42 | +<body> | |
43 | + | |
44 | + | |
45 | + <div id="classHeader"> | |
46 | + <table class="header-table"> | |
47 | + <tr class="top-aligned-row"> | |
48 | + <td><strong>Module</strong></td> | |
49 | + <td class="class-name-in-header">RIR::TreeTagger</td> | |
50 | + </tr> | |
51 | + <tr class="top-aligned-row"> | |
52 | + <td><strong>In:</strong></td> | |
53 | + <td> | |
54 | + | |
55 | + | |
56 | + <a href="../../files/lib/rir/ttagger_rb.html"> | |
57 | + | |
58 | + lib/rir/ttagger.rb | |
59 | + | |
60 | + </a> | |
61 | + | |
62 | + | |
63 | + <br /> | |
64 | + | |
65 | + </td> | |
66 | + </tr> | |
67 | + | |
68 | + | |
69 | + </table> | |
70 | + </div> | |
71 | + <!-- banner header --> | |
72 | + | |
73 | + <div id="bodyContent"> | |
74 | + | |
75 | + <div id="contextContent"> | |
76 | + | |
77 | + <div id="description"> | |
78 | + <p> | |
79 | +Module containing the TreeTagger-related classes. | |
80 | +</p> | |
81 | +<p> | |
82 | +See <a | |
83 | +href="http://www.ims.uni-stuttgart.de/projekte/corplex/TreeTagger/DecisionTreeTagger.html">www.ims.uni-stuttgart.de/projekte/corplex/TreeTagger/DecisionTreeTagger.html</a> | |
84 | +</p> | |
85 | + | |
86 | + </div> | |
87 | + | |
88 | + </div> | |
89 | + | |
90 | + | |
91 | + </div> | |
92 | + | |
93 | + <!-- if includes --> | |
94 | + | |
95 | + <div id="section"> | |
96 | + | |
97 | + <div id="class-list"> | |
98 | + <h3 class="section-bar">Classes and Modules</h3> | |
99 | + | |
100 | + Class <a href="TreeTagger/Chunk.html" class="link">RIR::TreeTagger::Chunk</a><br /> | |
101 | +Class <a href="TreeTagger/TaggerChunker.html" class="link">RIR::TreeTagger::TaggerChunker</a><br /> | |
102 | +Class <a href="TreeTagger/TaggerChunkerEnglish.html" class="link">RIR::TreeTagger::TaggerChunkerEnglish</a><br /> | |
103 | +Class <a href="TreeTagger/TaggerChunkerFrench.html" class="link">RIR::TreeTagger::TaggerChunkerFrench</a><br /> | |
104 | +Class <a href="TreeTagger/TaggerChunkerGerman.html" class="link">RIR::TreeTagger::TaggerChunkerGerman</a><br /> | |
105 | + | |
106 | + </div> | |
107 | + | |
108 | + | |
109 | + | |
110 | + | |
111 | + <!-- if method_list --> | |
112 | + | |
113 | + | |
114 | + | |
115 | + | |
116 | + </div> | |
117 | + | |
118 | +<div id="validator-badges"> | |
119 | + <p><small><a href="http://validator.w3.org/check/referer">[Validate]</a></small></p> | |
120 | +</div> | |
121 | + | |
122 | +</body> | |
123 | +</html> |
doc/classes/RIR/TreeTagger/Chunk.html
1 | +<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Strict//EN" | |
2 | +"http://www.w3.org/TR/xhtml1/DTD/xhtml1-strict.dtd"> | |
3 | +<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en"> | |
4 | +<head> | |
5 | + <title>Class: RIR::TreeTagger::Chunk [RDoc Documentation]</title> | |
6 | + <meta http-equiv="Content-Type" content="text/html; charset=utf-8" /> | |
7 | + <meta http-equiv="Content-Script-Type" content="text/javascript" /> | |
8 | + <link rel="stylesheet" href="../../.././rdoc-style.css" type="text/css" media="screen" /> | |
9 | + <script type="text/javascript"> | |
10 | + // <![CDATA[ | |
11 | + | |
12 | + function popupCode( url ) { | |
13 | + window.open(url, "Code", "resizable=yes,scrollbars=yes,toolbar=no,status=no,height=150,width=400") | |
14 | + } | |
15 | + | |
16 | + function toggleCode( id ) { | |
17 | + if ( document.getElementById ) | |
18 | + elem = document.getElementById( id ); | |
19 | + else if ( document.all ) | |
20 | + elem = eval( "document.all." + id ); | |
21 | + else | |
22 | + return false; | |
23 | + | |
24 | + elemStyle = elem.style; | |
25 | + | |
26 | + if ( elemStyle.display != "block" ) { | |
27 | + elemStyle.display = "block" | |
28 | + } else { | |
29 | + elemStyle.display = "none" | |
30 | + } | |
31 | + | |
32 | + return true; | |
33 | + } | |
34 | + | |
35 | + // Make codeblocks hidden by default | |
36 | + document.writeln( "<style type=\"text/css\">div.method-source-code { display: none }<\/style>" ) | |
37 | + | |
38 | + // ]]> | |
39 | + </script> | |
40 | + | |
41 | +</head> | |
42 | +<body> | |
43 | + | |
44 | + | |
45 | + <div id="classHeader"> | |
46 | + <table class="header-table"> | |
47 | + <tr class="top-aligned-row"> | |
48 | + <td><strong>Class</strong></td> | |
49 | + <td class="class-name-in-header">RIR::TreeTagger::Chunk</td> | |
50 | + </tr> | |
51 | + <tr class="top-aligned-row"> | |
52 | + <td><strong>In:</strong></td> | |
53 | + <td> | |
54 | + | |
55 | + | |
56 | + <a href="../../../files/lib/rir/ttagger_rb.html"> | |
57 | + | |
58 | + lib/rir/ttagger.rb | |
59 | + | |
60 | + </a> | |
61 | + | |
62 | + | |
63 | + <br /> | |
64 | + | |
65 | + </td> | |
66 | + </tr> | |
67 | + | |
68 | + | |
69 | + <tr class="top-aligned-row"> | |
70 | + <td><strong>Parent:</strong></td> | |
71 | + <td> | |
72 | + | |
73 | + Object | |
74 | + | |
75 | + </td> | |
76 | + </tr> | |
77 | + | |
78 | + </table> | |
79 | + </div> | |
80 | + <!-- banner header --> | |
81 | + | |
82 | + <div id="bodyContent"> | |
83 | + | |
84 | + <div id="contextContent"> | |
85 | + | |
86 | + <div id="description"> | |
87 | + <p> | |
88 | +Represents a <a href="Chunk.html">Chunk</a> extracted when parsing a <a | |
89 | +href="TaggerChunker.html">TaggerChunker</a> file. | |
90 | +</p> | |
91 | + | |
92 | + </div> | |
93 | + | |
94 | + </div> | |
95 | + | |
96 | + | |
97 | + <div id="method-list"> | |
98 | + <h3 class="section-bar">Methods</h3> | |
99 | + | |
100 | + <div class="name-list"> | |
101 | + | |
102 | + <a href="#M000003">new</a> | |
103 | + | |
104 | + </div> | |
105 | + </div> | |
106 | + | |
107 | + </div> | |
108 | + | |
109 | + <!-- if includes --> | |
110 | + | |
111 | + <div id="section"> | |
112 | + | |
113 | + | |
114 | + | |
115 | + <div id="attribute-list"> | |
116 | + <h3 class="section-bar">Attributes</h3> | |
117 | + | |
118 | + <div class="name-list"> | |
119 | + <table> | |
120 | + | |
121 | + <tr class="top-aligned-row context-row"> | |
122 | + <td class="context-item-name">tag</td> | |
123 | + | |
124 | + <td class="context-item-value"> [R] </td> | |
125 | + | |
126 | + <td class="context-item-desc"></td> | |
127 | + </tr> | |
128 | + | |
129 | + <tr class="top-aligned-row context-row"> | |
130 | + <td class="context-item-name">words</td> | |
131 | + | |
132 | + <td class="context-item-value"> [R] </td> | |
133 | + | |
134 | + <td class="context-item-desc"></td> | |
135 | + </tr> | |
136 | + | |
137 | + </table> | |
138 | + </div> | |
139 | + </div> | |
140 | + | |
141 | + | |
142 | + <!-- if method_list --> | |
143 | + | |
144 | + <div id="methods"> | |
145 | + | |
146 | + <h3 class="section-bar">Public Class methods</h3> | |
147 | + | |
148 | + | |
149 | + <div id="method-M000003" class="method-detail"> | |
150 | + <a name="M000003"></a> | |
151 | + | |
152 | + <div class="method-heading"> | |
153 | + | |
154 | + <a href="Chunk.src/M000003.html" target="Code" class="method-signature" | |
155 | + onclick="popupCode('Chunk.src/M000003.html');return false;"> | |
156 | + | |
157 | + <span class="method-name">new</span><span class="method-args">(str,tag)</span> | |
158 | + | |
159 | + </a> | |
160 | + | |
161 | + </div> | |
162 | + | |
163 | + <div class="method-description"> | |
164 | + | |
165 | + <p> | |
166 | +<tt>str</tt> is a string of whitespace-separated terms. For <tt>tag</tt>, see <a | |
167 | +href="ftp://ftp.ims.uni-stuttgart.de/pub/corpora/chunker-tagset-english.txt">ftp.ims.uni-stuttgart.de/pub/corpora/chunker-tagset-english.txt</a> | |
168 | +</p> | |
169 | + | |
170 | + </div> | |
171 | + </div> | |
172 | + | |
173 | + | |
174 | + | |
175 | + </div> | |
176 | + | |
177 | + | |
178 | + | |
179 | + | |
180 | + </div> | |
181 | + | |
182 | +<div id="validator-badges"> | |
183 | + <p><small><a href="http://validator.w3.org/check/referer">[Validate]</a></small></p> | |
184 | +</div> | |
185 | + | |
186 | +</body> | |
187 | +</html> |
doc/classes/RIR/TreeTagger/Chunk.src/M000003.html
1 | +<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Strict//EN" | |
2 | +"http://www.w3.org/TR/xhtml1/DTD/xhtml1-strict.dtd"> | |
3 | +<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en"> | |
4 | +<head> | |
5 | + <title>new (RIR::TreeTagger::Chunk)</title> | |
6 | + <meta http-equiv="Content-Type" content="text/html; charset=utf-8" /> | |
7 | + <link rel="stylesheet" href="../../../.././rdoc-style.css" type="text/css" media="screen" /> | |
8 | +</head> | |
9 | +<body class="standalone-code"> | |
10 | + <pre><span class="ruby-comment cmt"># File lib/rir/ttagger.rb, line 86</span> | |
11 | + <span class="ruby-keyword kw">def</span> <span class="ruby-identifier">initialize</span> <span class="ruby-identifier">str</span>,<span class="ruby-identifier">tag</span> | |
12 | + <span class="ruby-ivar">@words</span> = <span class="ruby-identifier">str</span>.<span class="ruby-identifier">split</span> | |
13 | + <span class="ruby-ivar">@tag</span> = <span class="ruby-identifier">tag</span>[<span class="ruby-value">1</span><span class="ruby-operator">..</span><span class="ruby-value">-2</span>] | |
14 | + <span class="ruby-keyword kw">end</span></pre> | |
15 | +</body> | |
16 | +</html> |
doc/classes/RIR/TreeTagger/TaggerChunker.html
1 | +<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Strict//EN" | |
2 | +"http://www.w3.org/TR/xhtml1/DTD/xhtml1-strict.dtd"> | |
3 | +<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en"> | |
4 | +<head> | |
5 | + <title>Class: RIR::TreeTagger::TaggerChunker [RDoc Documentation]</title> | |
6 | + <meta http-equiv="Content-Type" content="text/html; charset=utf-8" /> | |
7 | + <meta http-equiv="Content-Script-Type" content="text/javascript" /> | |
8 | + <link rel="stylesheet" href="../../.././rdoc-style.css" type="text/css" media="screen" /> | |
9 | + <script type="text/javascript"> | |
10 | + // <![CDATA[ | |
11 | + | |
12 | + function popupCode( url ) { | |
13 | + window.open(url, "Code", "resizable=yes,scrollbars=yes,toolbar=no,status=no,height=150,width=400") | |
14 | + } | |
15 | + | |
16 | + function toggleCode( id ) { | |
17 | + if ( document.getElementById ) | |
18 | + elem = document.getElementById( id ); | |
19 | + else if ( document.all ) | |
20 | + elem = eval( "document.all." + id ); | |
21 | + else | |
22 | + return false; | |
23 | + | |
24 | + elemStyle = elem.style; | |
25 | + | |
26 | + if ( elemStyle.display != "block" ) { | |
27 | + elemStyle.display = "block" | |
28 | + } else { | |
29 | + elemStyle.display = "none" | |
30 | + } | |
31 | + | |
32 | + return true; | |
33 | + } | |
34 | + | |
35 | + // Make codeblocks hidden by default | |
36 | + document.writeln( "<style type=\"text/css\">div.method-source-code { display: none }<\/style>" ) | |
37 | + | |
38 | + // ]]> | |
39 | + </script> | |
40 | + | |
41 | +</head> | |
42 | +<body> | |
43 | + | |
44 | + | |
45 | + <div id="classHeader"> | |
46 | + <table class="header-table"> | |
47 | + <tr class="top-aligned-row"> | |
48 | + <td><strong>Class</strong></td> | |
49 | + <td class="class-name-in-header">RIR::TreeTagger::TaggerChunker</td> | |
50 | + </tr> | |
51 | + <tr class="top-aligned-row"> | |
52 | + <td><strong>In:</strong></td> | |
53 | + <td> | |
54 | + | |
55 | + | |
56 | + <a href="../../../files/lib/rir/ttagger_rb.html"> | |
57 | + | |
58 | + lib/rir/ttagger.rb | |
59 | + | |
60 | + </a> | |
61 | + | |
62 | + | |
63 | + <br /> | |
64 | + | |
65 | + </td> | |
66 | + </tr> | |
67 | + | |
68 | + | |