# My HTTP utilities
require 'html/htmltokenizer'
require 'net/http'
require 'cgi'
# Extends the core String class with a suffix predicate.
class String
  # Returns true when this string ends with +substr+, false otherwise.
  #
  # Delegates to the built-in String#end_with?, so an empty +substr+ counts
  # as a suffix of every string (the earlier reverse-and-slice version
  # wrongly returned false for that case).
  def ends_with?(substr)
    end_with?(substr)
  end
end
# Collects the href targets of the <a> and <area> tags in an HTML document.
#
# html_string - the HTML source handed to HTMLTokenizer.
#
# Returns an Array of href values in the order the tokenizer produces them,
# with HTML entities decoded via CGI.unescapeHTML (e.g. "&amp;" becomes "&").
# Tags without an href attribute are skipped; duplicates are kept.
def get_all_links(html_string)
  tokenizer = HTMLTokenizer.new(html_string)
  links = []

  # The loop ends as soon as getTag returns nil/false (presumably once no
  # further matching tag exists in the document).
  while (tag = tokenizer.getTag('a', 'area'))
    href = tag.attr_hash['href']
    next if href.nil?

    links << CGI.unescapeHTML(href)
  end

  links
end
# Fetches +url+ with an HTTP GET request that carries the given Cookie header.
#
# url    - absolute http:// or https:// URL as a String.
# cookie - String sent verbatim as the value of the "Cookie" request header.
#
# Returns the body of the response. The status code is not inspected and
# redirects are not followed.
def get_page_with_cookie(url, cookie)
  uri = URI.parse(url)

  # Send only the path and query string in the request line, not the full URL.
  req = Net::HTTP::Get.new(uri.request_uri)
  req['Cookie'] = cookie

  http = Net::HTTP.new(uri.host, uri.port)
  # Without this, an https URL would be contacted in plain HTTP on the TLS port.
  http.use_ssl = true if uri.scheme == 'https'

  res = http.start { |conn| conn.request(req) }
  res.body
end
# Posted by laza at July 2, 2006 01:24 AM | TrackBack