metasploit-framework/data/msfcrawler/link.rb


##
# This file is part of the Metasploit Framework and may be subject to
# redistribution and commercial restrictions. Please see the Metasploit
# Framework web site for more information on licensing and terms of use.
# http://metasploit.com/framework/
##

# $Revision: 9212 $

require 'rubygems'
require 'pathname'
require 'hpricot'
require 'uri'

# Crawler parser that collects the href targets of <link> elements found in
# HTML responses and submits each of them as a new GET request.
#
# NOTE(review): urltohash and insertnewpath are not defined in this file;
# presumably they are provided by BaseParser -- confirm against that class.
class CrawlerLink < BaseParser

  # Scans an HTML response for <link> elements and queues every usable href.
  #
  # request - the request that produced +result+; only request['uri'] is read
  #           here and it is handed to urltohash together with each href.
  # result  - the response; it is indexed by header name ('Content-Type')
  #           and asked for its #body.
  #
  # Called for its side effect (insertnewpath). Returns nil early when the
  # response carries no Content-Type header or the header does not contain
  # "text/html".
  def parse(request,result)
    content_type = result['Content-Type']

    # A response may omit Content-Type altogether; treat that as "not HTML"
    # instead of calling include? on nil and raising NoMethodError.
    return unless content_type && content_type.include?("text/html")

    doc = Hpricot(result.body.to_s)
    doc.search('link').each do |link|
      hr = link.attributes['href']

      # Nothing to follow when the element has no href.
      next unless hr

      # Skip fragment-only references and javascript: pseudo-URLs. URI scheme
      # names are case-insensitive, so "JavaScript:" must be filtered too.
      next if hr.match(/^(\#|javascript\:)/i)

      begin
        hreq = urltohash('GET',hr,request['uri'],nil)

        insertnewpath(hreq)
      rescue URI::InvalidURIError
        # Best effort: an href that cannot be parsed as a URI is skipped so
        # that the remaining links on the page are still processed.
      end
    end
  end
end
Add parsers git-svn-id: file:///home/svn/framework3/trunk@9441 4d416f70-5f16-0410-b530-b9f4589650da 2010-06-06 03:48:25 +00:00
			`##`
			`# This file is part of the Metasploit Framework and may be subject to`
			`# redistribution and commercial restrictions. Please see the Metasploit`
			`# Framework web site for more information on licensing and terms of use.`
			`# http://metasploit.com/framework/`
			`##`

			`# $Revision: 9212 $`

			`require 'rubygems'`
			`require 'pathname'`
			`require 'hpricot'`
			`require 'uri'`

			`class CrawlerLink < BaseParser`

Retab all the things (except external/) 2013-09-30 18:47:53 +00:00			`def parse(request,result)`
Add parsers git-svn-id: file:///home/svn/framework3/trunk@9441 4d416f70-5f16-0410-b530-b9f4589650da 2010-06-06 03:48:25 +00:00
Retab all the things (except external/) 2013-09-30 18:47:53 +00:00			`if !result['Content-Type'].include? "text/html"`
			`return`
			`end`
Add parsers git-svn-id: file:///home/svn/framework3/trunk@9441 4d416f70-5f16-0410-b530-b9f4589650da 2010-06-06 03:48:25 +00:00
Retab all the things (except external/) 2013-09-30 18:47:53 +00:00			`doc = Hpricot(result.body.to_s)`
			`doc.search('link').each do \|link\|`
Add parsers git-svn-id: file:///home/svn/framework3/trunk@9441 4d416f70-5f16-0410-b530-b9f4589650da 2010-06-06 03:48:25 +00:00
Retab all the things (except external/) 2013-09-30 18:47:53 +00:00			`hr = link.attributes['href']`
Add parsers git-svn-id: file:///home/svn/framework3/trunk@9441 4d416f70-5f16-0410-b530-b9f4589650da 2010-06-06 03:48:25 +00:00
Retab all the things (except external/) 2013-09-30 18:47:53 +00:00			`if hr and !hr.match(/^(\#\|javascript\:)/)`
			`begin`
			`hreq = urltohash('GET',hr,request['uri'],nil)`
Add parsers git-svn-id: file:///home/svn/framework3/trunk@9441 4d416f70-5f16-0410-b530-b9f4589650da 2010-06-06 03:48:25 +00:00
Retab all the things (except external/) 2013-09-30 18:47:53 +00:00			`insertnewpath(hreq)`
Add parsers git-svn-id: file:///home/svn/framework3/trunk@9441 4d416f70-5f16-0410-b530-b9f4589650da 2010-06-06 03:48:25 +00:00
Retab all the things (except external/) 2013-09-30 18:47:53 +00:00			`rescue URI::InvalidURIError`
			`#puts "Parse error"`
			`#puts "Error: #{link[0]}"`
			`end`
			`end`
			`end`
			`end`
Add parsers git-svn-id: file:///home/svn/framework3/trunk@9441 4d416f70-5f16-0410-b530-b9f4589650da 2010-06-06 03:48:25 +00:00			`end`