require 'httpclient'
require 'nokogiri'

module Impressionist
  # Builds a list of user-agent strings from a remote XML catalogue of
  # user agents.
  module Bots
    # URL of the XML document that is downloaded and parsed by .consume.
    LIST_URL = "http://www.user-agents.org/allagents.xml".freeze

    # <Type> values that cause an entry to be included in the result.
    # NOTE(review): presumably "R" marks robots/crawlers and "S" marks
    # spam/bad bots in the feed's legend -- confirm against the data source.
    BOT_TYPES = %w[R S].freeze
    private_constant :BOT_TYPES

    # Downloads LIST_URL, parses the body as XML and collects the <String>
    # text of every <user-agent> element whose <Type> text is exactly one of
    # BOT_TYPES.
    #
    # Performs a network request on every call. Errors raised by HTTPClient
    # or Nokogiri are not rescued here and propagate to the caller.
    #
    # @return [Array<String>] the selected user-agent strings, in document
    #   order; empty when no element matches
    def self.consume
      response = HTTPClient.new.get_content(LIST_URL)
      doc = Nokogiri::XML(response)

      doc.xpath('//user-agent').each_with_object([]) do |agent, list|
        next unless BOT_TYPES.include?(agent.xpath("Type").text)

        # Hack for badly formatted data: some entries apparently still carry a
        # literal "&lt;" after XML parsing (TODO confirm against the feed), so
        # turn it back into "<". Only this one entity is handled, as before.
        list << agent.xpath("String").text.gsub("&lt;", "<")
      end
    end
  end
end