Blame view
lib/mirimiri/query.rb
3.31 KB
cd7432252
|
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 |
#!/usr/bin/env ruby #-- # This file is a part of the mirimiri library # # Copyright (C) 2010-2011 Romain Deveaud <romain.deveaud@gmail.com> # # This program is free software: you can redistribute it and/or modify # it under the terms of the GNU General Public License as published by # the Free Software Foundation, either version 3 of the License, or # (at your option) any later version. # # This program is distributed in the hope that it will be useful, # but WITHOUT ANY WARRANTY; without even the implied warranty of # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the # GNU General Public License for more details. # # You should have received a copy of the GNU General Public License # along with this program. If not, see <http://www.gnu.org/licenses/>. #++ class Query end module Indri class Parameters attr_accessor :index_path, :memory, :count, :offset, :run_id, :print_query, :print_docs, :rule, :baseline |
aa386f553
|
29 |
def initialize(corpus,count="1000",mem="1g",threads="1",offset="1",run_id="default",print_query=false,print_docs=false) |
cd7432252
|
30 31 32 |
@index_path = corpus @memory = mem @count = count |
aa386f553
|
33 |
@threads = threads |
cd7432252
|
34 35 36 37 38 39 40 |
@offset = offset @run_id = run_id @print_query = print_query ? "true" : "false" @print_docs = print_docs ? "true" : "false" end def to_s |
845768f8a
|
41 42 |
h = "<memory>#{@memory}</memory> " |
cd7432252
|
43 44 45 46 |
h += "<index>#{@index_path}</index> " h += "<count>#{@count}</count> " |
aa386f553
|
47 48 |
h += "<threads>#{@threads}</threads> " |
cd7432252
|
49 50 51 52 53 54 55 |
unless @baseline.nil? h += "<baseline>#{@baseline}</baseline> " else h += "<rule>#{@rule}</rule> " end |
845768f8a
|
56 57 |
h += "<trecFormat>true</trecFormat> " |
cd7432252
|
58 59 60 61 62 63 64 65 66 67 68 69 |
h += "<queryOffset>#{@offset}</queryOffset> " h += "<runID>#{@run_id}</runID> " h += "<printQuery>#{@print_query}</printQuery> " h += "<printDocuments>#{@print_docs}</printDocuments> " h end end |
cd7432252
|
70 |
|
aa386f553
|
71 |
class IndriQueryOld < Query |
845768f8a
|
72 |
attr_accessor :id, :query, :rule |
cd7432252
|
73 |
|
845768f8a
|
74 |
def initialize(id,query) |
cd7432252
|
75 76 77 78 79 |
@id = id @query = query end def to_s |
845768f8a
|
80 81 |
h = "<query> " |
cd7432252
|
82 83 84 85 86 87 |
h += "<number>#{@id}</number> " h += "<text>#{@query}</text> " h += "</query> " |
845768f8a
|
88 89 90 |
h end |
ca96fb31f
|
91 92 93 94 |
def exec params `IndriRunQuery -query='#{@query}' -index=#{params.index_path} -count=#{params.count} -rule=method:dirichlet,mu:2500 -trecFormat` end |
845768f8a
|
95 |
end |
aa386f553
|
96 97 98 99 100 101 102 103 104 105 106 107 108 |
class IndriQuery < Query attr_accessor :query, :count, :sm_method, :sm_param, :sm_value, :args def initialize atts={},args=nil raise ArgumentError, 'Argument 1 must be a Hash' unless args.is_a? Hash atts.each do |k,v| instance_variable_set("@#{k}", v) unless v.nil? end raise ArgumentError, 'Argument 2 must be a String' unless args.is_a? String @args = args end end |
845768f8a
|
109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 |
class IndriQueries attr_accessor :params, :queries def initialize(params,*queries) @queries = queries @params = params # Here we set the default retrieval model as Language Modeling # with a Dirichlet smoothing at 2500. # TODO: maybe a Rule class... @params.rule = 'method:dirichlet,mu:2500' if @params.rule.nil? end def to_s h = "<parameters> " h += @params.to_s h += @queries.collect { |q| q.to_s }.join "" |
cd7432252
|
127 128 129 130 131 132 133 |
h += "</parameters>" h end end end |