From bcacf025a0d2cbba181ad3e55fba30926286f9c8 Mon Sep 17 00:00:00 2001 From: Giuseppe Bilotta Date: Tue, 6 Feb 2007 16:46:54 +0000 Subject: Move code to get first par from a series of urls from search plugin to Utils, and use it in dict plugin too --- lib/rbot/core/utils/utils.rb | 35 +++++++++++++++++++++++++++++++++++ 1 file changed, 35 insertions(+) (limited to 'lib/rbot') diff --git a/lib/rbot/core/utils/utils.rb b/lib/rbot/core/utils/utils.rb index 11312e19..f5a6c1db 100644 --- a/lib/rbot/core/utils/utils.rb +++ b/lib/rbot/core/utils/utils.rb @@ -445,5 +445,40 @@ module ::Irc end return txt end + + # Get the first pars of the first _count_ _urls_. + # The pages are downloaded using an HttpUtil service passed as _opts_ :http_util, + # and echoed as replies to the IRC message passed as _opts_ :message. + # + def Utils.get_first_pars(urls, count, opts={}) + idx = 0 + msg = opts[:message] + while count > 0 and urls.length > 0 + url = urls.shift + idx += 1 + + # FIXME what happens if some big file is returned? We should share + # code with the url plugin to only retrieve partial file content! + xml = opts[:http_util].get_cached(url) + if xml.nil? + debug "Unable to retrieve #{url}" + next + end + debug "Retrieved #{url}" + debug "\t#{xml}" + par = Utils.ircify_first_html_par(xml) + if par.empty? + debug "No first par found\n#{xml}" + # FIXME only do this if the 'url' plugin is loaded + # TODO even better, put the code here + # par = @bot.plugins['url'].get_title_from_html(xml) + next if par.empty? + end + msg.reply "[#{idx}] #{par}", :overlong => :truncate if msg + count -=1 + end + end + + end end -- cgit v1.2.3