Displaying 1 result from an estimated 1 match for "seenterm".
Did you mean:
seenterms
2007 Mar 09
5
memory leak in index build?
...:field1=>name,
:field2=>name,
:field3=>name,
}
}
# Release the handle held in `i`.
# NOTE(review): `i` is assigned before this excerpt begins — presumably the
# index/writer used to build the index; confirm against the full script.
i.close

# Reopen the index located at `dir` through a Ferret IndexReader.
i = Ferret::Index::IndexReader.new dir

# Report every document whose :data field holds more than one million term
# positions in total. The accumulator must be added to on each step; the
# earlier form returned only the last term's position count from the block,
# so the threshold was compared against a single term rather than the sum.
i.max_doc.times do |n|
  position_total = i.term_vector(n, :data).terms.inject(0) do |sum, tvt|
    sum + tvt.positions.size
  end
  puts "heinous term count for #{i[n][:name]}" if position_total > 1_000_000
end

# Walk the terms of the :data field, calling term_docs_for once per distinct
# term. The result of term_docs_for is intentionally discarded here; only the
# call itself is exercised. `seenterms` guards against handling a term twice.
#
# A surrounding `begin ... rescue Exception; raise; end` was dropped: it only
# re-raised whatever it caught, so errors propagate exactly as before.
seenterms = Set[]
i.terms(:data).each do |term, _df|
  next if seenterms.include? term

  i.term_docs_for(:data, term)
  seenterms << term
end