Class: Main

Inherits:
Object
  • Object
show all
Defined in:
lib/driller/main.rb

Instance Attribute Summary collapse

Instance Method Summary collapse

Constructor Details

#initialize(webpage, depth, proxy_host, proxy_port) ⇒ Main

Returns a new instance of Main.



13
14
15
16
17
18
19
20
21
22
# File 'lib/driller/main.rb', line 13

# Stores the crawl settings for a later call to #execute.
#
# @param webpage [String] start URL; #execute also uses it as the link prefix filter
# @param depth [#to_i] crawl depth limit (#execute converts it with to_i)
# @param proxy_host [String, nil] proxy host; #execute skips proxy setup when nil
# @param proxy_port [Object] proxy port, only applied together with proxy_host
def initialize(webpage, depth, proxy_host, proxy_port)
    @webpage, @depth         = webpage, depth
    @proxy_port, @proxy_host = proxy_port, proxy_host

    # Page counter that #execute increments and reports on.
    @pageCount = 0
end

Instance Attribute Details

#extremely_slow ⇒ Object

Returns the value of attribute extremely_slow.



11
12
13
# File 'lib/driller/main.rb', line 11

# Reader for the @extremely_slow instance variable.
#
# NOTE(review): neither #initialize nor #execute assigns @extremely_slow, so
# this returns nil unless it is set somewhere else — confirm where (or
# whether) it is populated.
#
# @return [Object] current value of @extremely_slow (nil when never assigned)
def extremely_slow
  @extremely_slow
end

#invalid ⇒ Object

Returns the value of attribute invalid.



11
12
13
# File 'lib/driller/main.rb', line 11

# Reader for the @invalid instance variable.
#
# NOTE(review): neither #initialize nor #execute assigns @invalid, so this
# returns nil unless it is set somewhere else — confirm where (or whether)
# it is populated.
#
# @return [Object] current value of @invalid (nil when never assigned)
def invalid
  @invalid
end

#slow ⇒ Object

Returns the value of attribute slow.



11
12
13
# File 'lib/driller/main.rb', line 11

# Reader for the @slow instance variable.
#
# NOTE(review): neither #initialize nor #execute assigns @slow, so this
# returns nil unless it is set somewhere else — confirm where (or whether)
# it is populated.
#
# @return [Object] current value of @slow (nil when never assigned)
def slow
  @slow
end

#valid ⇒ Object

Returns the value of attribute valid.



11
12
13
# File 'lib/driller/main.rb', line 11

# Reader for the @valid instance variable.
#
# NOTE(review): neither #initialize nor #execute assigns @valid, so this
# returns nil unless it is set somewhere else — confirm where (or whether)
# it is populated.
#
# @return [Object] current value of @valid (nil when never assigned)
def valid
  @valid
end

Instance Method Details

#execute ⇒ Object



24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
# File 'lib/driller/main.rb', line 24

# Crawls @webpage with Anemone, sorts every fetched page into buckets and
# writes one report per bucket.
#
# Buckets:
# * valid          - pages answering 200
# * invalid        - pages answering anything else
# * slow           - 200 pages with response_time above 5000 (up to 10000)
# * extremely_slow - 200 pages with response_time above 10000
#
# The thresholds are compared against page.response_time as-is (Anemone
# reports it in milliseconds — confirm against the Anemone version in use).
#
# Progress is printed to stdout; every non-200 or slow page is printed as it
# is found, plus a running total every 100 pages.
#
# @return [Object] whatever the final generateReport call returns
def execute
    # Interpolation instead of String#+ so a non-String depth (e.g. an
    # Integer) does not raise TypeError.
    puts "Webpage   : #{@webpage}"
    puts "Depth     : #{@depth}"

    result = { valid: [], invalid: [], slow: [], extremely_slow: [] }

    Anemone.crawl(@webpage) do |anemone|

        unless @proxy_host.nil?
            anemone.proxy_host = @proxy_host
            anemone.proxy_port = @proxy_port
        end

        anemone.depth_limit = @depth.to_i
        puts "============= Driller is now checking your website links. If any of the link returned non 200, it will be displayed here========="

        # Only follow links that stay under the start URL. Links are
        # stringified first: they are URI objects, which do not respond to
        # start_with? (nor to ActiveSupport's String-only starts_with?).
        prefix = @webpage.to_s
        anemone.focus_crawl do |page|
            page.links.select { |url| url.to_s.start_with?(prefix) }
        end

        anemone.on_every_page do |page|

            pageObject = getPageObject(page)

            if page.code == 200
                result[:valid].push(pageObject)

                # Response time is only checked for 200 pages because there
                # is no point in optimizing error pages. The larger threshold
                # must be tested first, otherwise the > 5000 branch swallows
                # every extremely slow page.
                if page.response_time > 10000
                    result[:extremely_slow].push(pageObject)

                    puts "=======Very Slow Page======\n"
                    puts "Time: #{page.response_time} - #{page.url}"
                elsif page.response_time > 5000
                    result[:slow].push(pageObject)

                    puts "=======Slow Page======\n"
                    puts "Time: #{page.response_time} - #{page.url}"
                end

            else # 404, 301, 500, ...
                result[:invalid].push(pageObject)

                puts "======= NON-200 Page ======\n"
                puts "#{page.code} Response from : #{page.url}"
                puts

            end

            # Counted per page (inside the callback) so the progress message
            # reflects the number of pages actually checked.
            @pageCount = @pageCount + 1
            puts "Checked #{@pageCount} pages" if @pageCount % 100 == 0
        end
    end

    generateReport('valid_pages', result[:valid])
    generateReport('broken', result[:invalid])
    generateReport('slow_pages', result[:slow])
    generateReport('extremely_slow_pages', result[:extremely_slow])

end

#generateReport(reportName, data) ⇒ Object



112
113
114
115
# File 'lib/driller/main.rb', line 112

# Renders +data+ through Html_Report and hands the rendered output to a new
# File_Handler under the same report name.
#
# @param reportName [String] name passed to both Html_Report and File_Handler
# @param data [Object] payload passed to Html_Report
# @return [File_Handler] the handler instance that was created
def generateReport(reportName, data)
    rendered = Html_Report.new(reportName, data).getReport
    File_Handler.new(reportName, rendered)
end

#getPageObject(page) ⇒ Object



97
98
99
100
101
102
103
104
105
106
107
108
109
110
# File 'lib/driller/main.rb', line 97

# Summarises a crawled page as a plain Hash for the reports.
#
# Aborts the whole process when the page has no response code, which is
# treated as "no network access at all".
#
# @param page [#code, #url, #response_time] crawled page
# @return [Hash] with the string keys 'code', 'url' and 'response_time'
def getPageObject(page)
    # A nil code means we never got an access to internet
    abort("Error: Either you are offline or behind proxy.") if page.code.nil?

    {
        'code'          => page.code,
        'url'           => page.url.to_s,
        'response_time' => page.response_time
    }
end