arachni 0.4.0.4 → 0.4.1
Sign up to get free protection for your applications and to get access to all the features.
- data/ACKNOWLEDGMENTS.md +2 -2
- data/AUTHORS.md +1 -4
- data/CHANGELOG.md +102 -3
- data/CONTRIBUTORS.md +4 -1
- data/EXPLOITATION.md +6 -6
- data/Gemfile +3 -0
- data/HACKING.md +29 -10
- data/LICENSE.md +176 -339
- data/NOTICE +12 -0
- data/README.md +160 -119
- data/Rakefile +83 -45
- data/arachni.gemspec +124 -0
- data/bin/arachni +14 -8
- data/bin/arachni_console +52 -0
- data/bin/arachni_rpc +14 -8
- data/bin/arachni_rpcd +15 -9
- data/bin/arachni_rpcd_monitor +14 -8
- data/bin/arachni_script +41 -0
- data/bin/arachni_web +18 -19
- data/bin/arachni_web_autostart +17 -18
- data/external/metasploit/plugins/arachni.rb +7 -9
- data/external/metasploit/{LICENSE → plugins/arachni/LICENSE} +0 -0
- data/external/metasploit/{modules → plugins/arachni/modules}/exploits/unix/webapp/arachni_exec.rb +1 -1
- data/external/metasploit/{modules → plugins/arachni/modules}/exploits/unix/webapp/arachni_path_traversal.rb +2 -2
- data/external/metasploit/{modules → plugins/arachni/modules}/exploits/unix/webapp/arachni_php_eval.rb +1 -1
- data/external/metasploit/{modules → plugins/arachni/modules}/exploits/unix/webapp/arachni_php_include.rb +1 -1
- data/external/metasploit/{modules → plugins/arachni/modules}/exploits/unix/webapp/arachni_sqlmap.rb +2 -2
- data/external/scripts/LICENSE.tpl +174 -0
- data/external/scripts/README.md +95 -0
- data/external/scripts/README.tpl +30 -0
- data/external/scripts/build.sh +631 -0
- data/external/scripts/build_all.sh +29 -0
- data/external/scripts/build_and_package.sh +100 -0
- data/external/scripts/cross_build_and_package.sh +20 -0
- data/external/scripts/installer.sh.tpl +166 -0
- data/external/scripts/lib/readlink_f.sh +40 -0
- data/external/scripts/package.sh +134 -0
- data/external/scripts/push_nightlies.sh +125 -0
- data/extras/placeholder +0 -0
- data/gfx/README.md +18 -0
- data/gfx/compiled/banner.png +0 -0
- data/gfx/compiled/favicon.ico +0 -0
- data/gfx/compiled/icon.png +0 -0
- data/gfx/compiled/logo.png +0 -0
- data/gfx/compiled/spider.png +0 -0
- data/gfx/font/Beneath_the_Surface.ttf +0 -0
- data/gfx/font/bts_readme.txt +14 -0
- data/gfx/source/banner.svg +999 -0
- data/gfx/source/icon.svg +627 -0
- data/gfx/source/logo.svg +672 -0
- data/gfx/source/spider.png +0 -0
- data/gfx/source/spider.svg +277 -0
- data/lib/arachni.rb +30 -5
- data/lib/arachni/audit_store.rb +111 -143
- data/lib/arachni/banner.rb +37 -0
- data/lib/arachni/bloom_filter.rb +74 -0
- data/lib/arachni/cache.rb +21 -0
- data/lib/arachni/cache/base.rb +170 -0
- data/lib/arachni/cache/least_cost_replacement.rb +89 -0
- data/lib/arachni/cache/least_recently_used.rb +73 -0
- data/lib/arachni/cache/random_replacement.rb +52 -0
- data/lib/arachni/component/manager.rb +391 -0
- data/lib/arachni/component/options.rb +38 -0
- data/lib/arachni/component/options/address.rb +41 -0
- data/lib/arachni/component/options/base.rb +126 -0
- data/lib/arachni/component/options/bool.rb +55 -0
- data/lib/arachni/component/options/enum.rb +51 -0
- data/lib/arachni/component/options/float.rb +45 -0
- data/lib/arachni/component/options/int.rb +44 -0
- data/lib/arachni/component/options/path.rb +36 -0
- data/lib/arachni/component/options/port.rb +37 -0
- data/lib/arachni/component/options/string.rb +44 -0
- data/lib/arachni/component/options/url.rb +42 -0
- data/lib/arachni/crypto/rsa_aes_cbc.rb +14 -8
- data/lib/arachni/database.rb +4 -4
- data/lib/arachni/database/base.rb +14 -8
- data/lib/arachni/database/hash.rb +21 -12
- data/lib/arachni/database/queue.rb +15 -9
- data/lib/arachni/element/base.rb +147 -0
- data/lib/arachni/element/capabilities/auditable.rb +623 -0
- data/lib/arachni/element/capabilities/auditable/rdiff.rb +243 -0
- data/lib/arachni/element/capabilities/auditable/taint.rb +141 -0
- data/lib/arachni/element/capabilities/auditable/timeout.rb +330 -0
- data/lib/arachni/element/capabilities/body.rb +19 -0
- data/lib/arachni/element/capabilities/mutable.rb +286 -0
- data/lib/arachni/element/capabilities/path.rb +19 -0
- data/lib/arachni/element/capabilities/refreshable.rb +48 -0
- data/lib/arachni/element/capabilities/server.rb +19 -0
- data/lib/arachni/element/cookie.rb +1043 -0
- data/lib/arachni/element/form.rb +1364 -0
- data/lib/arachni/element/header.rb +87 -0
- data/lib/arachni/element/link.rb +227 -0
- data/lib/arachni/exceptions.rb +12 -34
- data/lib/arachni/framework.rb +345 -436
- data/lib/arachni/http.rb +445 -409
- data/lib/arachni/http/cookie_jar.rb +163 -0
- data/lib/arachni/issue.rb +102 -65
- data/lib/arachni/mixins/observable.rb +25 -28
- data/lib/arachni/mixins/progress_bar.rb +11 -5
- data/lib/arachni/mixins/terminal.rb +17 -11
- data/lib/arachni/module.rb +4 -4
- data/lib/arachni/module/auditor.rb +270 -793
- data/lib/arachni/module/base.rb +107 -101
- data/lib/arachni/module/element_db.rb +54 -59
- data/lib/arachni/module/key_filler.rb +35 -35
- data/lib/arachni/module/manager.rb +178 -68
- data/lib/arachni/module/output.rb +25 -30
- data/lib/arachni/module/trainer.rb +85 -156
- data/lib/arachni/module/utilities.rb +29 -138
- data/lib/arachni/options.rb +496 -162
- data/lib/arachni/page.rb +186 -0
- data/lib/arachni/parser.rb +392 -2
- data/lib/arachni/plugin.rb +4 -4
- data/lib/arachni/plugin/base.rb +113 -44
- data/lib/arachni/plugin/manager.rb +120 -54
- data/lib/arachni/report.rb +4 -4
- data/lib/arachni/report/base.rb +59 -44
- data/lib/arachni/report/manager.rb +33 -32
- data/lib/arachni/rpc/client.rb +2 -0
- data/lib/arachni/rpc/client/base.rb +31 -18
- data/lib/arachni/rpc/client/dispatcher.rb +24 -11
- data/lib/arachni/rpc/client/instance.rb +24 -11
- data/lib/arachni/rpc/server/base.rb +12 -9
- data/lib/arachni/rpc/server/dispatcher.rb +161 -164
- data/lib/arachni/rpc/server/dispatcher/handler.rb +164 -0
- data/lib/arachni/rpc/server/{node.rb → dispatcher/node.rb} +86 -104
- data/lib/arachni/rpc/server/distributor.rb +432 -0
- data/lib/arachni/rpc/server/framework.rb +266 -758
- data/lib/arachni/rpc/server/instance.rb +38 -53
- data/lib/arachni/rpc/server/module/manager.rb +17 -20
- data/lib/arachni/rpc/server/output.rb +73 -179
- data/lib/arachni/rpc/server/plugin/manager.rb +58 -24
- data/lib/arachni/ruby.rb +6 -4
- data/lib/arachni/ruby/array.rb +30 -9
- data/lib/arachni/ruby/enumerable.rb +29 -0
- data/lib/arachni/ruby/object.rb +47 -12
- data/lib/arachni/ruby/string.rb +69 -24
- data/lib/arachni/ruby/webrick.rb +31 -0
- data/lib/arachni/session.rb +279 -0
- data/lib/arachni/spider.rb +295 -149
- data/lib/arachni/typhoeus/hydra.rb +18 -4
- data/lib/arachni/typhoeus/request.rb +52 -65
- data/lib/arachni/typhoeus/response.rb +62 -22
- data/lib/arachni/typhoeus/utils.rb +25 -0
- data/lib/arachni/ui/cli/cli.rb +331 -298
- data/lib/arachni/ui/cli/output.rb +105 -77
- data/lib/arachni/ui/foo/output.rb +116 -0
- data/lib/arachni/ui/rpc/dispatcher_monitor.rb +5 -12
- data/lib/arachni/ui/rpc/rpc.rb +43 -48
- data/lib/arachni/ui/web/addon_manager.rb +18 -13
- data/lib/arachni/ui/web/addons/sample.rb +14 -8
- data/lib/arachni/ui/web/addons/scheduler.rb +14 -8
- data/lib/arachni/ui/web/addons/scheduler/views/index.erb +1 -1
- data/lib/arachni/ui/web/addons/scheduler/views/options.erb +0 -3
- data/lib/arachni/ui/web/dispatcher_manager.rb +14 -9
- data/lib/arachni/ui/web/instance_manager.rb +14 -8
- data/lib/arachni/ui/web/log.rb +14 -10
- data/lib/arachni/ui/web/output_stream.rb +11 -5
- data/lib/arachni/ui/web/report_manager.rb +14 -10
- data/lib/arachni/ui/web/scheduler.rb +16 -11
- data/lib/arachni/ui/web/server.rb +62 -56
- data/lib/arachni/ui/web/server/public/style.css +1 -1
- data/lib/arachni/ui/web/server/views/addon.erb +1 -1
- data/lib/arachni/ui/web/server/views/dispatchers.erb +3 -3
- data/lib/arachni/ui/web/server/views/dispatchers_edit.erb +2 -2
- data/lib/arachni/ui/web/server/views/error.erb +1 -1
- data/lib/arachni/ui/web/server/views/home.erb +2 -2
- data/lib/arachni/ui/web/server/views/instance.erb +6 -6
- data/lib/arachni/ui/web/server/views/layout.erb +4 -4
- data/lib/arachni/ui/web/server/views/settings.erb +13 -8
- data/lib/arachni/ui/web/server/views/welcome.erb +1 -1
- data/lib/arachni/ui/web/utilities.rb +24 -35
- data/lib/arachni/uri.rb +619 -0
- data/lib/arachni/utilities.rb +316 -0
- data/lib/arachni/version.rb +12 -6
- data/lib/version +1 -0
- data/modules/audit/code_injection.rb +64 -81
- data/modules/audit/code_injection_timing.rb +57 -75
- data/modules/audit/csrf.rb +87 -185
- data/modules/audit/ldapi.rb +42 -67
- data/modules/audit/os_cmd_injection.rb +53 -71
- data/modules/audit/os_cmd_injection/payloads.txt +1 -1
- data/modules/audit/os_cmd_injection_timing.rb +54 -75
- data/modules/audit/os_cmd_injection_timing/payloads.txt +1 -3
- data/modules/audit/path_traversal.rb +84 -110
- data/modules/audit/response_splitting.rb +41 -53
- data/modules/audit/rfi.rb +68 -76
- data/modules/audit/session_fixation.rb +86 -0
- data/modules/audit/sqli.rb +51 -77
- data/modules/audit/sqli/regexp_ids.txt +5 -19
- data/modules/audit/sqli/regexp_ignore.txt +2 -0
- data/modules/audit/sqli_blind_rdiff.rb +51 -62
- data/modules/audit/sqli_blind_timing.rb +53 -73
- data/modules/audit/trainer.rb +21 -58
- data/modules/audit/unvalidated_redirect.rb +41 -51
- data/modules/audit/xpath.rb +38 -69
- data/modules/audit/xpath/errors.txt +2 -3
- data/modules/audit/xss.rb +65 -69
- data/modules/audit/xss_event.rb +50 -69
- data/modules/audit/xss_path.rb +63 -89
- data/modules/audit/xss_script_tag.rb +53 -66
- data/modules/audit/xss_tag.rb +46 -65
- data/modules/audit/xss_uri.rb +22 -24
- data/modules/recon/allowed_methods.rb +46 -62
- data/modules/recon/backdoors.rb +39 -66
- data/modules/recon/backup_files.rb +49 -79
- data/modules/recon/common_directories.rb +39 -63
- data/modules/recon/common_directories/directories.txt +0 -5
- data/modules/recon/common_files.rb +34 -63
- data/modules/recon/directory_listing.rb +66 -116
- data/modules/recon/grep/captcha.rb +34 -41
- data/modules/recon/grep/credit_card.rb +57 -68
- data/modules/recon/grep/cvs_svn_users.rb +40 -50
- data/modules/recon/grep/emails.rb +34 -41
- data/modules/recon/grep/html_objects.rb +30 -33
- data/modules/recon/grep/http_only_cookies.rb +57 -0
- data/modules/recon/grep/insecure_cookies.rb +55 -0
- data/modules/recon/grep/mixed_resource.rb +93 -0
- data/modules/recon/grep/private_ip.rb +34 -32
- data/modules/recon/grep/ssn.rb +33 -31
- data/modules/recon/grep/unencrypted_password_forms.rb +84 -0
- data/modules/recon/htaccess_limit.rb +38 -54
- data/modules/recon/http_put.rb +48 -62
- data/modules/recon/interesting_responses.rb +77 -79
- data/modules/recon/webdav.rb +53 -79
- data/modules/recon/xst.rb +44 -63
- data/modules/test2.rb +46 -0
- data/path_extractors/anchors.rb +17 -15
- data/path_extractors/forms.rb +17 -15
- data/path_extractors/frames.rb +17 -18
- data/path_extractors/generic.rb +52 -55
- data/path_extractors/links.rb +16 -14
- data/path_extractors/meta_refresh.rb +33 -18
- data/path_extractors/scripts.rb +17 -15
- data/plugins/autologin.rb +60 -85
- data/plugins/beep_notify.rb +25 -27
- data/plugins/cookie_collector.rb +28 -45
- data/plugins/defaults/autothrottle.rb +43 -51
- data/plugins/defaults/content_types.rb +63 -52
- data/plugins/defaults/healthmap.rb +45 -62
- data/plugins/defaults/{metamodules → meta}/remedies/discovery.rb +34 -69
- data/plugins/defaults/meta/remedies/manual_verification.rb +61 -0
- data/plugins/defaults/meta/remedies/timing_attacks.rb +108 -0
- data/plugins/defaults/meta/uniformity.rb +81 -0
- data/plugins/defaults/profiler.rb +68 -115
- data/plugins/defaults/resolver.rb +33 -28
- data/plugins/email_notify.rb +60 -62
- data/plugins/form_dicattack.rb +67 -121
- data/plugins/http_dicattack.rb +51 -65
- data/plugins/libnotify.rb +37 -41
- data/plugins/proxy.rb +407 -152
- data/plugins/proxy/panel/403_forbidden.html.erb +11 -0
- data/plugins/proxy/panel/404_not_found.html.erb +6 -0
- data/plugins/proxy/panel/css/bootstrap.min.css +9 -0
- data/plugins/proxy/panel/css/panel.css +30 -0
- data/plugins/proxy/panel/help.html.erb +66 -0
- data/plugins/proxy/panel/img/glyphicons-halflings-white.png +0 -0
- data/plugins/proxy/panel/img/glyphicons-halflings.png +0 -0
- data/plugins/proxy/panel/img/record.png +0 -0
- data/plugins/proxy/panel/inspect.html.erb +7 -0
- data/plugins/proxy/panel/js/bootstrap.min.js +6 -0
- data/plugins/proxy/panel/js/jquery.min.js +2 -0
- data/plugins/proxy/panel/js/panel.js +39 -0
- data/plugins/proxy/panel/layout.html.erb +25 -0
- data/plugins/proxy/panel/page_accordion.html.erb +67 -0
- data/plugins/proxy/panel/page_twin_accordion.html.erb +18 -0
- data/plugins/proxy/panel/panel.html.erb +63 -0
- data/plugins/proxy/panel/shutdown_message.html.erb +7 -0
- data/plugins/proxy/panel/verify_login_check.html.erb +31 -0
- data/plugins/proxy/panel/verify_login_final.html.erb +26 -0
- data/plugins/proxy/panel/verify_login_sequence.html.erb +45 -0
- data/plugins/proxy/server.rb +175 -47
- data/plugins/proxy/ssl-interceptor-cert.pem +34 -0
- data/plugins/proxy/ssl-interceptor-pkey.pem +51 -0
- data/plugins/rescan.rb +27 -28
- data/plugins/script.rb +53 -0
- data/plugins/vector_feed.rb +226 -0
- data/plugins/waf_detector.rb +70 -73
- data/reports/afr.rb +23 -24
- data/reports/ap.rb +25 -36
- data/reports/html.rb +109 -163
- data/reports/html/default.erb +13 -12
- data/reports/html/default/configuration.erb +21 -21
- data/reports/html/default/css/main.css +350 -350
- data/reports/html/default/issues.erb +1 -1
- data/reports/html/default/js/charts.js +2 -2
- data/reports/html/default/js/helpers.js +0 -42
- data/reports/html/default/js/init.js +0 -1
- data/reports/html/default/sitemap.erb +2 -2
- data/reports/html/default/summary.erb +4 -4
- data/reports/html/default/summary_issue.erb +1 -1
- data/reports/json.rb +26 -28
- data/reports/marshal.rb +23 -25
- data/reports/metareport.rb +65 -98
- data/reports/plugin_formatters/html/autologin.rb +34 -41
- data/reports/plugin_formatters/html/content_types.rb +46 -52
- data/reports/plugin_formatters/html/cookie_collector.rb +41 -47
- data/reports/plugin_formatters/html/discovery.rb +36 -41
- data/reports/plugin_formatters/html/form_dicattack.rb +28 -34
- data/reports/plugin_formatters/html/healthmap.rb +48 -55
- data/reports/plugin_formatters/html/http_dicattack.rb +28 -34
- data/reports/plugin_formatters/html/profiler.rb +26 -30
- data/reports/plugin_formatters/html/profiler/template.erb +7 -7
- data/reports/plugin_formatters/html/resolver.rb +44 -52
- data/reports/plugin_formatters/html/timing_attacks.rb +42 -44
- data/reports/plugin_formatters/html/uniformity.rb +37 -42
- data/reports/plugin_formatters/html/waf_detector.rb +26 -34
- data/reports/plugin_formatters/stdout/autologin.rb +28 -40
- data/reports/plugin_formatters/stdout/content_types.rb +36 -53
- data/reports/plugin_formatters/stdout/cookie_collector.rb +28 -41
- data/reports/plugin_formatters/stdout/discovery.rb +27 -37
- data/reports/plugin_formatters/stdout/form_dicattack.rb +22 -35
- data/reports/plugin_formatters/stdout/healthmap.rb +40 -57
- data/reports/plugin_formatters/stdout/http_dicattack.rb +22 -36
- data/reports/plugin_formatters/stdout/profiler.rb +55 -74
- data/reports/plugin_formatters/stdout/resolver.rb +18 -34
- data/reports/plugin_formatters/stdout/timing_attacks.rb +27 -39
- data/reports/plugin_formatters/stdout/uniformity.rb +32 -44
- data/reports/plugin_formatters/stdout/waf_detector.rb +20 -32
- data/reports/plugin_formatters/xml/autologin.rb +27 -49
- data/reports/plugin_formatters/xml/content_types.rb +41 -66
- data/reports/plugin_formatters/xml/cookie_collector.rb +29 -49
- data/reports/plugin_formatters/xml/discovery.rb +23 -41
- data/reports/plugin_formatters/xml/form_dicattack.rb +22 -40
- data/reports/plugin_formatters/xml/healthmap.rb +44 -63
- data/reports/plugin_formatters/xml/http_dicattack.rb +22 -41
- data/reports/plugin_formatters/xml/profiler.rb +65 -89
- data/reports/plugin_formatters/xml/resolver.rb +21 -41
- data/reports/plugin_formatters/xml/timing_attacks.rb +27 -45
- data/reports/plugin_formatters/xml/uniformity.rb +36 -55
- data/reports/plugin_formatters/xml/waf_detector.rb +23 -42
- data/reports/stdout.rb +120 -121
- data/reports/txt.rb +29 -45
- data/reports/xml.rb +109 -148
- data/reports/xml/buffer.rb +66 -79
- data/reports/yaml.rb +26 -28
- data/rpcd_handlers/placeholder +0 -0
- data/spec/arachni/audit_store_spec.rb +223 -0
- data/spec/arachni/bloom_filter_spec.rb +76 -0
- data/spec/arachni/cache/base_spec.rb +275 -0
- data/spec/arachni/cache/least_cost_replacement_spec.rb +58 -0
- data/spec/arachni/cache/least_recently_used_spec.rb +91 -0
- data/spec/arachni/cache/random_replacement_spec.rb +43 -0
- data/spec/arachni/component/manager_spec.rb +448 -0
- data/spec/arachni/component/options/address_spec.rb +32 -0
- data/spec/arachni/component/options/base_spec.rb +105 -0
- data/spec/arachni/component/options/bool_spec.rb +67 -0
- data/spec/arachni/component/options/enum_spec.rb +51 -0
- data/spec/arachni/component/options/float_spec.rb +42 -0
- data/spec/arachni/component/options/int_spec.rb +46 -0
- data/spec/arachni/component/options/path_spec.rb +32 -0
- data/spec/arachni/component/options/port_spec.rb +38 -0
- data/spec/arachni/component/options/string_spec.rb +38 -0
- data/spec/arachni/component/options/url_spec.rb +36 -0
- data/spec/arachni/crypto/rsa_aes_cbc_spec.rb +31 -0
- data/spec/arachni/database/hash_spec.rb +217 -0
- data/spec/arachni/database/queue_spec.rb +52 -0
- data/spec/arachni/element/base_spec.rb +127 -0
- data/spec/arachni/element/body_spec.rb +9 -0
- data/spec/arachni/element/capabilities/auditable/rdiff_spec.rb +47 -0
- data/spec/arachni/element/capabilities/auditable/taint_spec.rb +110 -0
- data/spec/arachni/element/capabilities/auditable/timeout_spec.rb +107 -0
- data/spec/arachni/element/capabilities/mutable_spec.rb +261 -0
- data/spec/arachni/element/cookie_spec.rb +362 -0
- data/spec/arachni/element/form_spec.rb +668 -0
- data/spec/arachni/element/header_spec.rb +49 -0
- data/spec/arachni/element/link_spec.rb +220 -0
- data/spec/arachni/element/path_spec.rb +9 -0
- data/spec/arachni/element/server_spec.rb +9 -0
- data/spec/arachni/framework_spec.rb +860 -0
- data/spec/arachni/http/cookie_jar_spec.rb +267 -0
- data/spec/arachni/http_spec.rb +991 -0
- data/spec/arachni/issue_spec.rb +307 -0
- data/spec/arachni/mixins/observable_spec.rb +59 -0
- data/spec/arachni/mixins/progress_bar_spec.rb +41 -0
- data/spec/arachni/module/auditor_spec.rb +506 -0
- data/spec/arachni/module/element_db_spec.rb +131 -0
- data/spec/arachni/module/key_filler.rb +15 -0
- data/spec/arachni/module/manager_spec.rb +154 -0
- data/spec/arachni/module/trainer_spec.rb +102 -0
- data/spec/arachni/module/utilities_spec.rb +30 -0
- data/spec/arachni/module/utilities_spec/read_file.txt +3 -0
- data/spec/arachni/options_spec.rb +555 -0
- data/spec/arachni/page_spec.rb +290 -0
- data/spec/arachni/parser_spec.rb +508 -0
- data/spec/arachni/plugin/manager_spec.rb +174 -0
- data/spec/arachni/report/base_spec.rb +53 -0
- data/spec/arachni/report/manager_spec.rb +82 -0
- data/spec/arachni/rpc/client/base_spec.rb +157 -0
- data/spec/arachni/rpc/client/dispatcher_spec.rb +40 -0
- data/spec/arachni/rpc/client/instance_spec.rb +92 -0
- data/spec/arachni/rpc/server/base_spec.rb +40 -0
- data/spec/arachni/rpc/server/dispatcher/handler.rb +120 -0
- data/spec/arachni/rpc/server/dispatcher/node_spec.rb +220 -0
- data/spec/arachni/rpc/server/dispatcher_spec.rb +136 -0
- data/spec/arachni/rpc/server/distributor_spec.rb +628 -0
- data/spec/arachni/rpc/server/framework_hpg_spec.rb +321 -0
- data/spec/arachni/rpc/server/framework_simple_spec.rb +453 -0
- data/spec/arachni/rpc/server/instance_spec.rb +81 -0
- data/spec/arachni/rpc/server/modules/manager_spec.rb +79 -0
- data/spec/arachni/rpc/server/options_spec.rb +124 -0
- data/spec/arachni/rpc/server/output_spec.rb +238 -0
- data/spec/arachni/rpc/server/plugin/manager_spec.rb +86 -0
- data/spec/arachni/ruby/array_spec.rb +103 -0
- data/spec/arachni/ruby/enumerable_spec.rb +37 -0
- data/spec/arachni/ruby/object_spec.rb +38 -0
- data/spec/arachni/ruby/string_spec.rb +77 -0
- data/spec/arachni/ruby/webrick_spec.rb +15 -0
- data/spec/arachni/session_spec.rb +308 -0
- data/spec/arachni/spider_spec.rb +383 -0
- data/spec/arachni/typhoeus/hydra_spec.rb +14 -0
- data/spec/arachni/typhoeus/requrest_spec.rb +58 -0
- data/spec/arachni/typhoeus/response_spec.rb +78 -0
- data/spec/arachni/uri_spec.rb +462 -0
- data/spec/arachni/utilities_spec.rb +297 -0
- data/spec/fixtures/auditstore.afr +2959 -0
- data/spec/fixtures/cookies.txt +9 -0
- data/spec/fixtures/modules/test.rb +58 -0
- data/spec/fixtures/modules/test2.rb +46 -0
- data/spec/fixtures/modules/test3.rb +46 -0
- data/spec/fixtures/passwords.txt +17 -0
- data/spec/fixtures/plugins/bad.rb +46 -0
- data/spec/fixtures/plugins/defaults/default.rb +45 -0
- data/spec/fixtures/plugins/distributable.rb +42 -0
- data/spec/fixtures/plugins/loop.rb +32 -0
- data/spec/fixtures/plugins/wait.rb +34 -0
- data/spec/fixtures/plugins/with_options.rb +31 -0
- data/spec/fixtures/reports/base_spec/plugin_formatters/with_formatters/foobar.rb +21 -0
- data/spec/fixtures/reports/base_spec/with_formatters.rb +23 -0
- data/spec/fixtures/reports/base_spec/with_outfile.rb +24 -0
- data/spec/fixtures/reports/base_spec/without_outfile.rb +20 -0
- data/spec/fixtures/reports/manager_spec/afr.rb +21 -0
- data/spec/fixtures/reports/manager_spec/foo.rb +26 -0
- data/spec/fixtures/rescan.afr.tpl +145 -0
- data/spec/fixtures/rpcd_handlers/echo.rb +68 -0
- data/spec/fixtures/run_mod/body.rb +58 -0
- data/spec/fixtures/run_mod/cookies.rb +58 -0
- data/spec/fixtures/run_mod/empty.rb +58 -0
- data/spec/fixtures/run_mod/flch.rb +63 -0
- data/spec/fixtures/run_mod/forms.rb +58 -0
- data/spec/fixtures/run_mod/headers.rb +58 -0
- data/spec/fixtures/run_mod/links.rb +58 -0
- data/spec/fixtures/run_mod/nil.rb +57 -0
- data/spec/fixtures/run_mod/path.rb +58 -0
- data/spec/fixtures/run_mod/server.rb +58 -0
- data/spec/fixtures/script_plugin.rb +1 -0
- data/spec/fixtures/taint_module/taint.rb +48 -0
- data/spec/fixtures/usernames.txt +13 -0
- data/spec/fixtures/wait_module/wait.rb +48 -0
- data/spec/helpers/auditor.rb +9 -0
- data/spec/helpers/misc.rb +41 -0
- data/spec/helpers/processes.rb +112 -0
- data/spec/helpers/requires.rb +8 -0
- data/spec/helpers/server.rb +54 -0
- data/spec/logs/Dispatcher - 2752-13830.log +49 -0
- data/spec/logs/Dispatcher - 2766-8238.log +35 -0
- data/spec/logs/Dispatcher - 2808-9029.log +31 -0
- data/spec/logs/Dispatcher - 2854-8571.log +26 -0
- data/spec/logs/Dispatcher - 2888-10411.log +20 -0
- data/spec/logs/Dispatcher - 2922-14464.log +13 -0
- data/spec/logs/Dispatcher - 2957-15255.log +19 -0
- data/spec/logs/Dispatcher - 3216-14203.log +35 -0
- data/spec/logs/Dispatcher - 3305-8622.log +43 -0
- data/spec/logs/Dispatcher - 3340-15426.log +35 -0
- data/spec/logs/Dispatcher - 3399-12586.log +40 -0
- data/spec/logs/Dispatcher - 3433-14149.log +26 -0
- data/spec/logs/Dispatcher - 3582-6198.log +27 -0
- data/spec/logs/Dispatcher - 3616-11169.log +13 -0
- data/spec/logs/Dispatcher - 3849-9016.log +7 -0
- data/spec/logs/output_spec.log +4 -0
- data/spec/logs/placeholder +0 -0
- data/spec/modules/audit/code_injection_spec.rb +25 -0
- data/spec/modules/audit/code_injection_timing_spec.rb +24 -0
- data/spec/modules/audit/csrf_spec.rb +38 -0
- data/spec/modules/audit/ldapi_spec.rb +19 -0
- data/spec/modules/audit/os_cmd_injection_spec.rb +24 -0
- data/spec/modules/audit/os_cmd_injection_timing_spec.rb +24 -0
- data/spec/modules/audit/path_traversal_spec.rb +23 -0
- data/spec/modules/audit/response_splitting_spec.rb +19 -0
- data/spec/modules/audit/rfi_spec.rb +19 -0
- data/spec/modules/audit/session_fixation_spec.rb +23 -0
- data/spec/modules/audit/sqli_blind_rdiff_spec.rb +19 -0
- data/spec/modules/audit/sqli_blind_timing_spec.rb +23 -0
- data/spec/modules/audit/sqli_spec.rb +24 -0
- data/spec/modules/audit/trainer_spec.rb +25 -0
- data/spec/modules/audit/unvalidated_redirect_spec.rb +24 -0
- data/spec/modules/audit/xpath_spec.rb +25 -0
- data/spec/modules/audit/xss_event_spec.rb +19 -0
- data/spec/modules/audit/xss_path_spec.rb +19 -0
- data/spec/modules/audit/xss_script_tag_spec.rb +19 -0
- data/spec/modules/audit/xss_spec.rb +24 -0
- data/spec/modules/audit/xss_tag_spec.rb +19 -0
- data/spec/modules/recon/allowed_methods_spec.rb +19 -0
- data/spec/modules/recon/backdoors_spec.rb +19 -0
- data/spec/modules/recon/backup_files_spec.rb +19 -0
- data/spec/modules/recon/common_directories_spec.rb +19 -0
- data/spec/modules/recon/common_files_spec.rb +19 -0
- data/spec/modules/recon/directory_listing_spec.rb +19 -0
- data/spec/modules/recon/grep/captcha_spec.rb +19 -0
- data/spec/modules/recon/grep/credit_card_spec.rb +19 -0
- data/spec/modules/recon/grep/cvs_svn_users_spec.rb +19 -0
- data/spec/modules/recon/grep/emails_spec.rb +19 -0
- data/spec/modules/recon/grep/html_objects_spec.rb +19 -0
- data/spec/modules/recon/grep/http_only_cookies_spec.rb +19 -0
- data/spec/modules/recon/grep/insecure_cookies_spec.rb +19 -0
- data/spec/modules/recon/grep/mixed_resource_spec.rb +20 -0
- data/spec/modules/recon/grep/private_ip_spec.rb +26 -0
- data/spec/modules/recon/grep/ssn_spec.rb +19 -0
- data/spec/modules/recon/grep/unencrypted_password_forms_spec.rb +19 -0
- data/spec/modules/recon/htaccess_limit_spec.rb +19 -0
- data/spec/modules/recon/http_put_spec.rb +19 -0
- data/spec/modules/recon/interesting_responses_spec.rb +27 -0
- data/spec/modules/recon/webdav_spec.rb +19 -0
- data/spec/modules/recon/xst_spec.rb +19 -0
- data/spec/path_extractors/anchors_spec.rb +19 -0
- data/spec/path_extractors/forms_spec.rb +19 -0
- data/spec/path_extractors/frames_spec.rb +20 -0
- data/spec/path_extractors/generic_spec.rb +28 -0
- data/spec/path_extractors/links_spec.rb +19 -0
- data/spec/path_extractors/meta_refresh_spec.rb +24 -0
- data/spec/path_extractors/scripts_spec.rb +19 -0
- data/spec/pems/cacert.pem +39 -0
- data/spec/pems/client/cert.pem +39 -0
- data/spec/pems/client/foo-cert.pem +39 -0
- data/spec/pems/client/foo-key.pem +51 -0
- data/spec/pems/client/key.pem +51 -0
- data/spec/pems/server/cert.pem +39 -0
- data/spec/pems/server/key.pem +51 -0
- data/spec/plugins/autologin_spec.rb +76 -0
- data/spec/plugins/autothrottle_spec.rb +45 -0
- data/spec/plugins/content_types_spec.rb +93 -0
- data/spec/plugins/cookie_collector_spec.rb +32 -0
- data/spec/plugins/form_dicattack_spec.rb +60 -0
- data/spec/plugins/healthmap_spec.rb +40 -0
- data/spec/plugins/http_dicattack_spec.rb +40 -0
- data/spec/plugins/meta/remedies/discovery_spec.rb +15 -0
- data/spec/plugins/meta/remedies/manual_verification_spec.rb +28 -0
- data/spec/plugins/meta/remedies/timing_attacks_spec.rb +30 -0
- data/spec/plugins/meta/uniformity_spec.rb +83 -0
- data/spec/plugins/profiler_spec.rb +82 -0
- data/spec/plugins/rescan_spec.rb +26 -0
- data/spec/plugins/resolver_spec.rb +16 -0
- data/spec/plugins/script_spec.rb +12 -0
- data/spec/plugins/vector_feed_spec.rb +155 -0
- data/spec/plugins/waf_detector_spec.rb +41 -0
- data/spec/reports/afr_spec.rb +13 -0
- data/spec/reports/ap_spec.rb +9 -0
- data/spec/reports/html_spec.rb +13 -0
- data/spec/reports/json_spec.rb +17 -0
- data/spec/reports/marshal_spec.rb +13 -0
- data/spec/reports/stdout_spec.rb +9 -0
- data/spec/reports/txt_spec.rb +8 -0
- data/spec/reports/xml_spec.rb +13 -0
- data/spec/reports/yaml_spec.rb +13 -0
- data/spec/servers/arachni/element/capabilities/auditable/rdiff.rb +36 -0
- data/spec/servers/arachni/element/capabilities/auditable/taint.rb +10 -0
- data/spec/servers/arachni/element/capabilities/auditable/timeout.rb +30 -0
- data/spec/servers/arachni/element/cookie.rb +37 -0
- data/spec/servers/arachni/element/form.rb +93 -0
- data/spec/servers/arachni/element/header.rb +22 -0
- data/spec/servers/arachni/element/link.rb +26 -0
- data/spec/servers/arachni/framework.rb +54 -0
- data/spec/servers/arachni/http.rb +140 -0
- data/spec/servers/arachni/http_auth.rb +9 -0
- data/spec/servers/arachni/module/auditor.rb +135 -0
- data/spec/servers/arachni/module/trainer.rb +40 -0
- data/spec/servers/arachni/parser.rb +70 -0
- data/spec/servers/arachni/rpc/server/framework_hpg.rb +21 -0
- data/spec/servers/arachni/rpc/server/framework_simple.rb +30 -0
- data/spec/servers/arachni/session.rb +110 -0
- data/spec/servers/arachni/spider.rb +148 -0
- data/spec/servers/modules/audit/code_injection.rb +140 -0
- data/spec/servers/modules/audit/code_injection_timing.rb +110 -0
- data/spec/servers/modules/audit/csrf.rb +80 -0
- data/spec/servers/modules/audit/ldapi.rb +73 -0
- data/spec/servers/modules/audit/os_cmd_injection.rb +140 -0
- data/spec/servers/modules/audit/os_cmd_injection_timing.rb +111 -0
- data/spec/servers/modules/audit/path_traversal.rb +176 -0
- data/spec/servers/modules/audit/response_splitting.rb +114 -0
- data/spec/servers/modules/audit/rfi.rb +113 -0
- data/spec/servers/modules/audit/session_fixation.rb +87 -0
- data/spec/servers/modules/audit/sqli.rb +118 -0
- data/spec/servers/modules/audit/sqli/coldfusion +1 -0
- data/spec/servers/modules/audit/sqli/db2 +4 -0
- data/spec/servers/modules/audit/sqli/emc +2 -0
- data/spec/servers/modules/audit/sqli/informix +3 -0
- data/spec/servers/modules/audit/sqli/interbase +2 -0
- data/spec/servers/modules/audit/sqli/jdbc +0 -0
- data/spec/servers/modules/audit/sqli/mssql +26 -0
- data/spec/servers/modules/audit/sqli/mysql +13 -0
- data/spec/servers/modules/audit/sqli/oracle +6 -0
- data/spec/servers/modules/audit/sqli/postgresql +7 -0
- data/spec/servers/modules/audit/sqli/sqlite +4 -0
- data/spec/servers/modules/audit/sqli/sybase +0 -0
- data/spec/servers/modules/audit/sqli_blind_rdiff.rb +74 -0
- data/spec/servers/modules/audit/sqli_blind_timing.rb +121 -0
- data/spec/servers/modules/audit/trainer_module.rb +160 -0
- data/spec/servers/modules/audit/unvalidated_redirect.rb +115 -0
- data/spec/servers/modules/audit/xpath.rb +111 -0
- data/spec/servers/modules/audit/xpath/dotnet +5 -0
- data/spec/servers/modules/audit/xpath/general +13 -0
- data/spec/servers/modules/audit/xpath/java +3 -0
- data/spec/servers/modules/audit/xpath/libxml2 +2 -0
- data/spec/servers/modules/audit/xpath/php +2 -0
- data/spec/servers/modules/audit/xss.rb +152 -0
- data/spec/servers/modules/audit/xss_event.rb +80 -0
- data/spec/servers/modules/audit/xss_path.rb +44 -0
- data/spec/servers/modules/audit/xss_script_tag.rb +73 -0
- data/spec/servers/modules/audit/xss_tag.rb +139 -0
- data/spec/servers/modules/module_server.rb +14 -0
- data/spec/servers/modules/recon/allowed_methods.rb +5 -0
- data/spec/servers/modules/recon/backdoors.rb +4 -0
- data/spec/servers/modules/recon/backup_files.rb +28 -0
- data/spec/servers/modules/recon/common_directories.rb +6 -0
- data/spec/servers/modules/recon/common_files.rb +6 -0
- data/spec/servers/modules/recon/directory_listing.rb +30 -0
- data/spec/servers/modules/recon/grep/captcha.rb +27 -0
- data/spec/servers/modules/recon/grep/credit_card.rb +28 -0
- data/spec/servers/modules/recon/grep/cvs_svn_users.rb +23 -0
- data/spec/servers/modules/recon/grep/emails.rb +21 -0
- data/spec/servers/modules/recon/grep/html_objects.rb +7 -0
- data/spec/servers/modules/recon/grep/http_only_cookies.rb +21 -0
- data/spec/servers/modules/recon/grep/insecure_cookies.rb +21 -0
- data/spec/servers/modules/recon/grep/mixed_resource.rb +83 -0
- data/spec/servers/modules/recon/grep/private_ip.rb +18 -0
- data/spec/servers/modules/recon/grep/ssn.rb +5 -0
- data/spec/servers/modules/recon/grep/unencrypted_password_forms.rb +33 -0
- data/spec/servers/modules/recon/htaccess_limit.rb +8 -0
- data/spec/servers/modules/recon/http_put.rb +7 -0
- data/spec/servers/modules/recon/interesting_responses.rb +5 -0
- data/spec/servers/modules/recon/webdav.rb +25 -0
- data/spec/servers/modules/recon/xst.rb +6 -0
- data/spec/servers/plugins/autologin.rb +38 -0
- data/spec/servers/plugins/autothrottle.rb +8 -0
- data/spec/servers/plugins/content_types.rb +17 -0
- data/spec/servers/plugins/cookie_collector.rb +20 -0
- data/spec/servers/plugins/form_dicattack.rb +28 -0
- data/spec/servers/plugins/healthmap.rb +16 -0
- data/spec/servers/plugins/http_dicattack.rb +9 -0
- data/spec/servers/plugins/http_dicattack_secure.rb +9 -0
- data/spec/servers/plugins/http_dicattack_unprotected.rb +5 -0
- data/spec/servers/plugins/meta/remedies/discovery.rb +7 -0
- data/spec/servers/plugins/meta/remedies/timing_attacks.rb +29 -0
- data/spec/servers/plugins/profiler.rb +82 -0
- data/spec/servers/plugins/rescan.rb +31 -0
- data/spec/servers/plugins/waf_detector.rb +33 -0
- data/spec/shared/component.rb +43 -0
- data/spec/shared/element/capabilities/auditable.rb +729 -0
- data/spec/shared/element/capabilities/refreshable.rb +56 -0
- data/spec/shared/module.rb +162 -0
- data/spec/shared/path_extractor.rb +47 -0
- data/spec/shared/plugin.rb +50 -0
- data/spec/shared/reports.rb +47 -0
- data/spec/spec_helper.rb +53 -0
- metadata +870 -323
- data/extras/modules/recon/raft_dirs.rb +0 -108
- data/extras/modules/recon/raft_dirs/raft-large-directories.txt +0 -62290
- data/extras/modules/recon/raft_files.rb +0 -110
- data/extras/modules/recon/raft_files/raft-large-files.txt +0 -37037
- data/extras/modules/recon/svn_digger_dirs.rb +0 -108
- data/extras/modules/recon/svn_digger_dirs/Licence.txt +0 -674
- data/extras/modules/recon/svn_digger_dirs/ReadMe-Arachni.txt +0 -4
- data/extras/modules/recon/svn_digger_dirs/ReadMe.txt +0 -6
- data/extras/modules/recon/svn_digger_dirs/all-dirs.txt +0 -5960
- data/extras/modules/recon/svn_digger_files.rb +0 -114
- data/extras/modules/recon/svn_digger_files/Licence.txt +0 -674
- data/extras/modules/recon/svn_digger_files/ReadMe-Arachni.txt +0 -4
- data/extras/modules/recon/svn_digger_files/ReadMe.txt +0 -6
- data/extras/modules/recon/svn_digger_files/all-extensionless.txt +0 -25419
- data/extras/modules/recon/svn_digger_files/all.txt +0 -43135
- data/lib/arachni/component_manager.rb +0 -293
- data/lib/arachni/component_options.rb +0 -425
- data/lib/arachni/parser/auditable.rb +0 -606
- data/lib/arachni/parser/elements.rb +0 -315
- data/lib/arachni/parser/page.rb +0 -168
- data/lib/arachni/parser/parser.rb +0 -866
- data/lib/arachni/rpc/server/options.rb +0 -95
- data/lib/arachni/ui/web/addons/autodeploy.rb +0 -207
- data/lib/arachni/ui/web/addons/autodeploy/lib/manager.rb +0 -398
- data/lib/arachni/ui/web/addons/autodeploy/views/index.erb +0 -291
- data/modules/recon/mixed_resource.rb +0 -100
- data/modules/recon/unencrypted_password_forms.rb +0 -107
- data/path_extractors/sitemap.rb +0 -31
- data/plugins/defaults/metamodules/remedies/manual_verification.rb +0 -65
- data/plugins/defaults/metamodules/remedies/timing_attacks.rb +0 -134
- data/plugins/defaults/metamodules/uniformity.rb +0 -99
- data/reports/metareport/arachni_metareport.rb +0 -174
- data/reports/plugin_formatters/stdout/metamodules.rb +0 -82
@@ -0,0 +1,279 @@
|
|
1
|
+
=begin
|
2
|
+
Copyright 2010-2012 Tasos Laskos <tasos.laskos@gmail.com>
|
3
|
+
|
4
|
+
Licensed under the Apache License, Version 2.0 (the "License");
|
5
|
+
you may not use this file except in compliance with the License.
|
6
|
+
You may obtain a copy of the License at
|
7
|
+
|
8
|
+
http://www.apache.org/licenses/LICENSE-2.0
|
9
|
+
|
10
|
+
Unless required by applicable law or agreed to in writing, software
|
11
|
+
distributed under the License is distributed on an "AS IS" BASIS,
|
12
|
+
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
13
|
+
See the License for the specific language governing permissions and
|
14
|
+
limitations under the License.
|
15
|
+
=end
|
16
|
+
|
17
|
+
module Arachni
|
18
|
+
|
19
|
+
#
|
20
|
+
# Session management class
|
21
|
+
#
|
22
|
+
# Handles logins, provides log-out detection, stores and executes login sequences
|
23
|
+
# and provides general webapp session-related helpers.
|
24
|
+
#
|
25
|
+
# @author Tasos "Zapotek" Laskos <tasos.laskos@gmail.com>
|
26
|
+
#
|
27
|
+
class Session
|
28
|
+
include UI::Output
|
29
|
+
include Utilities
|
30
|
+
|
31
|
+
# @return [Options] options
|
32
|
+
attr_reader :opts
|
33
|
+
|
34
|
+
#
|
35
|
+
# A block used to login to the webapp.
|
36
|
+
#
|
37
|
+
# The block should log the framework into the webapp and return +true+ on
|
38
|
+
# success, +false+ on failure.
|
39
|
+
#
|
40
|
+
# @return [Block]
|
41
|
+
#
|
42
|
+
attr_accessor :login_sequence
|
43
|
+
|
44
|
+
#
|
45
|
+
# A block used to check whether or not we're logged in to the webapp.
|
46
|
+
#
|
47
|
+
# The block should return +true+ on success, +false+ on failure.
|
48
|
+
#
|
49
|
+
# The proc should expect 2 parameters, the first one being a hash of HTTP
|
50
|
+
# options and the second one an optional block.
|
51
|
+
#
|
52
|
+
# If a block has been set, the check should work async and pass the result
|
53
|
+
# to the block, otherwise it should simply return the result.
|
54
|
+
#
|
55
|
+
# The result of the check should be +true+ or +false+.
|
56
|
+
#
|
57
|
+
# A good example of this can be found in {#set_login_check}.
|
58
|
+
#
|
59
|
+
# @return [Block]
|
60
|
+
#
|
61
|
+
# @see #set_login_check
|
62
|
+
#
|
63
|
+
attr_accessor :login_check
|
64
|
+
|
65
|
+
#
|
66
|
+
# Sets a login form and generates a login sequence from it.
|
67
|
+
#
|
68
|
+
# The form must be kosher, best be generated by one of the {Arachni::Element::Form}
|
69
|
+
# helpers, {Parser} or {#find_login_form}.
|
70
|
+
#
|
71
|
+
# Once you get the right form you need to update it with the appropriate values
|
72
|
+
# before passing it to this accessor.
|
73
|
+
#
|
74
|
+
# @return [Element::Form]
|
75
|
+
#
|
76
|
+
attr_accessor :login_form
|
77
|
+
|
78
|
+
def initialize( opts = Arachni::Options.instance )
|
79
|
+
@opts = opts
|
80
|
+
end
|
81
|
+
|
82
|
+
# @return [Array<Element::Cookie>] session cookies
|
83
|
+
def cookies
|
84
|
+
http.cookies.select{ |c| c.session? }
|
85
|
+
end
|
86
|
+
|
87
|
+
#
|
88
|
+
# Tries to find the main session (login/ID) cookie.
|
89
|
+
#
|
90
|
+
# @param [Block] block block to be passed the cookie
|
91
|
+
#
|
92
|
+
def cookie( &block )
|
93
|
+
return block.call( @session_cookie ) if @session_cookie
|
94
|
+
fail 'No login-check has been configured.' if !has_login_check?
|
95
|
+
|
96
|
+
cookies.each do |cookie|
|
97
|
+
logged_in?( cookies: { cookie.name => '' } ) do |bool|
|
98
|
+
next if bool
|
99
|
+
block.call( @session_cookie = cookie )
|
100
|
+
end
|
101
|
+
end
|
102
|
+
end
|
103
|
+
|
104
|
+
#
|
105
|
+
# Finds a login form based on supplied location, collection and criteria.
|
106
|
+
#
|
107
|
+
# @param [Hash] opts
|
108
|
+
# @option opts [Bool] :requires_password Does the login form include a password field? (Defaults to +true+)
|
109
|
+
# @option opts [String, Regexp] :action Regexp to match or String to compare against the form action.
|
110
|
+
# @option opts [String, Array, Hash, Symbol] :inputs Inputs that the form must contain.
|
111
|
+
# @option opts [Array<Element::Form>] :forms Collection of forms to look through.
|
112
|
+
# @option opts [Page, Array<Page>] :pages Pages to look through.
|
113
|
+
# @option opts [String] :url URL to fetch and look for forms.
|
114
|
+
#
|
115
|
+
# @param [Block] block if a block and a :url are given, the request
|
116
|
+
# will run async and the block will be called
|
117
|
+
# with the result of this method.
|
118
|
+
#
|
119
|
+
def find_login_form( opts = {}, &block )
|
120
|
+
async = block_given?
|
121
|
+
|
122
|
+
requires_password = (opts[:requires_password].nil? ? true : opts[:requires_password])
|
123
|
+
|
124
|
+
find = proc do |cforms|
|
125
|
+
cforms.select do |f|
|
126
|
+
next if requires_password && !f.requires_password?
|
127
|
+
|
128
|
+
oks = []
|
129
|
+
|
130
|
+
if action = opts[:action]
|
131
|
+
oks << !!(action.is_a?( Regexp ) ? f.action =~ action : f.action == action)
|
132
|
+
end
|
133
|
+
|
134
|
+
if inputs = opts[:inputs]
|
135
|
+
oks << f.has_inputs?( inputs )
|
136
|
+
end
|
137
|
+
|
138
|
+
oks.count( true ) == oks.size
|
139
|
+
end.first
|
140
|
+
end
|
141
|
+
|
142
|
+
forms = if opts[:pages]
|
143
|
+
[opts[:pages]].flatten.map { |p| p.forms }.flatten
|
144
|
+
elsif opts[:forms]
|
145
|
+
opts[:forms]
|
146
|
+
elsif url = opts[:url]
|
147
|
+
if async
|
148
|
+
page_from_url( url ) { |p| block.call find.call( p.forms ) }
|
149
|
+
else
|
150
|
+
page_from_url( url ).forms
|
151
|
+
end
|
152
|
+
end
|
153
|
+
|
154
|
+
find.call( forms || [] ) if !async
|
155
|
+
end
|
156
|
+
|
157
|
+
# @return [Bool] +true+ if there is log-in capability, +false+ otherwise
|
158
|
+
def can_login?
    # Go through the predicates rather than the raw instance variables:
    # the #login_sequence and #login_check readers may build their blocks
    # lazily (from a configured login form / login-check options), so the
    # ivars can still be nil even though log-in capability exists.
    # The predicates also guarantee a strict true/false return value.
    has_login_sequence? && has_login_check?
end
|
161
|
+
|
162
|
+
# @return [Bool, nil] +true+ if logged-in, +false+ otherwise, +nil+ if
|
163
|
+
# there's no log-in capability
|
164
|
+
def ensure_logged_in
|
165
|
+
return if !can_login?
|
166
|
+
return true if logged_in?
|
167
|
+
|
168
|
+
print_bad 'The scanner has been logged out.'
|
169
|
+
print_info 'Trying to re-login...'
|
170
|
+
|
171
|
+
login
|
172
|
+
|
173
|
+
if !logged_in?
|
174
|
+
print_bad 'Could not re-login.'
|
175
|
+
false
|
176
|
+
else
|
177
|
+
print_ok 'Logged-in successfully.'
|
178
|
+
true
|
179
|
+
end
|
180
|
+
end
|
181
|
+
|
182
|
+
#
|
183
|
+
# Uses the block in {#login_sequence} to login to the webapp.
|
184
|
+
#
|
185
|
+
# @return [Bool, nil] +true+ if login was successful, +false+ if not,
|
186
|
+
# +nil+ if no {#login_sequence} has been set.
|
187
|
+
#
|
188
|
+
def login
|
189
|
+
login_sequence.call if has_login_sequence?
|
190
|
+
end
|
191
|
+
|
192
|
+
# @return [Bool] +true+ if a login sequence exists, +false+ otherwise
|
193
|
+
def has_login_sequence?
|
194
|
+
!!login_sequence
|
195
|
+
end
|
196
|
+
|
197
|
+
#
|
198
|
+
# Uses the block in {#login_check} to check if we're logged in to the webapp.
|
199
|
+
#
|
200
|
+
# @param [Hash] http_opts extra HTTP options to use for the check
|
201
|
+
# @param [Block] block if a block has been provided the check
|
202
|
+
# will be async and the result will be passed
|
203
|
+
# to it, otherwise the method will return
|
204
|
+
# the result.
|
205
|
+
#
|
206
|
+
#
|
207
|
+
# @return [Bool, nil] +true+ if we're logged-in, +false+ if not,
|
208
|
+
# +nil+ if no {#login_check} has been set.
|
209
|
+
#
|
210
|
+
def logged_in?( http_opts = {}, &block )
|
211
|
+
login_check.call( http_opts, block ) if has_login_check?
|
212
|
+
end
|
213
|
+
|
214
|
+
# @return [Bool] +true+ if a login check exists, +false+ otherwise
|
215
|
+
def has_login_check?
|
216
|
+
!!login_check
|
217
|
+
end
|
218
|
+
|
219
|
+
def login_check( &block )
|
220
|
+
return @login_check = block if block_given?
|
221
|
+
|
222
|
+
if @opts.login_check_url && @opts.login_check_pattern
|
223
|
+
set_login_check( @opts.login_check_url, @opts.login_check_pattern )
|
224
|
+
end
|
225
|
+
|
226
|
+
@login_check
|
227
|
+
end
|
228
|
+
|
229
|
+
#
|
230
|
+
# A block used to login to the webapp.
|
231
|
+
#
|
232
|
+
# The block should log the framework into the webapp and return +true+ on
|
233
|
+
# success, +false+ on failure.
|
234
|
+
#
|
235
|
+
# @param [Block] block if a block has been given it will be set as
|
236
|
+
# the login sequence
|
237
|
+
#
|
238
|
+
# @return [Block]
|
239
|
+
#
|
240
|
+
def login_sequence( &block )
|
241
|
+
if @login_form && !block_given?
|
242
|
+
@login_sequence = proc do
|
243
|
+
@login_form.refresh( update_cookies: true ).
|
244
|
+
submit( async: false,
|
245
|
+
update_cookies: true,
|
246
|
+
follow_location: false ).
|
247
|
+
response
|
248
|
+
end
|
249
|
+
end
|
250
|
+
|
251
|
+
return @login_sequence if !block_given?
|
252
|
+
@login_sequence = block
|
253
|
+
end
|
254
|
+
|
255
|
+
#
|
256
|
+
# Sets a login check using the provided +url+ and +regexp+.
|
257
|
+
#
|
258
|
+
# @param [String, #to_s] url URL to request
|
259
|
+
# @param [String, Regexp] pattern pattern to match against the body of the response
|
260
|
+
#
|
261
|
+
def set_login_check( url, pattern )
|
262
|
+
login_check do |opts, block|
|
263
|
+
bool = nil
|
264
|
+
http.get( url.to_s, opts.merge( async: !!block ) ) do |res|
|
265
|
+
bool = !!res.body.match( pattern )
|
266
|
+
block.call( bool ) if block
|
267
|
+
end
|
268
|
+
|
269
|
+
bool
|
270
|
+
end
|
271
|
+
end
|
272
|
+
|
273
|
+
# @return [HTTP] http interface
|
274
|
+
def http
|
275
|
+
HTTP
|
276
|
+
end
|
277
|
+
|
278
|
+
end
|
279
|
+
end
|
data/lib/arachni/spider.rb
CHANGED
@@ -1,231 +1,377 @@
|
|
1
1
|
=begin
|
2
|
-
|
3
|
-
Copyright (c) 2010-2012 Tasos "Zapotek" Laskos <tasos.laskos@gmail.com>
|
2
|
+
Copyright 2010-2012 Tasos Laskos <tasos.laskos@gmail.com>
|
4
3
|
|
5
|
-
|
6
|
-
|
7
|
-
|
4
|
+
Licensed under the Apache License, Version 2.0 (the "License");
|
5
|
+
you may not use this file except in compliance with the License.
|
6
|
+
You may obtain a copy of the License at
|
8
7
|
|
9
|
-
|
8
|
+
http://www.apache.org/licenses/LICENSE-2.0
|
10
9
|
|
11
|
-
|
12
|
-
|
13
|
-
|
10
|
+
Unless required by applicable law or agreed to in writing, software
|
11
|
+
distributed under the License is distributed on an "AS IS" BASIS,
|
12
|
+
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
13
|
+
See the License for the specific language governing permissions and
|
14
|
+
limitations under the License.
|
15
|
+
=end
|
14
16
|
|
15
17
|
module Arachni
|
16
18
|
|
19
|
+
lib = Options.dir['lib']
|
20
|
+
|
21
|
+
require lib + 'bloom_filter'
|
22
|
+
require lib + 'module/utilities'
|
23
|
+
require 'nokogiri'
|
24
|
+
require lib + 'nokogiri/xml/node'
|
25
|
+
|
17
26
|
#
|
18
|
-
#
|
19
|
-
#
|
20
|
-
# Crawls the URL in opts[:url] and grabs the HTML code and headers.
|
27
|
+
# Crawls the target webapp until there are no new paths left.
|
21
28
|
#
|
22
|
-
# @author
|
23
|
-
# <tasos.laskos@gmail.com>
|
24
|
-
# <zapotek@segfault.gr>
|
25
|
-
# @version: 0.2.3
|
29
|
+
# @author Tasos "Zapotek" Laskos <tasos.laskos@gmail.com>
|
26
30
|
#
|
27
31
|
class Spider
|
32
|
+
include UI::Output
|
33
|
+
include Utilities
|
28
34
|
|
29
|
-
|
30
|
-
include Arachni::Module::Utilities
|
31
|
-
|
32
|
-
#
|
33
|
-
#
|
34
|
-
# @return [Options]
|
35
|
-
#
|
35
|
+
# @return [Arachni::Options]
|
36
36
|
attr_reader :opts
|
37
37
|
|
38
|
-
#
|
39
|
-
# Discovered paths
|
40
|
-
#
|
41
|
-
# @return [Array]
|
42
|
-
#
|
43
|
-
attr_reader :sitemap
|
44
|
-
|
45
|
-
#
|
46
|
-
# URLs that caused redirects
|
47
|
-
#
|
48
|
-
# @return [Array]
|
49
|
-
#
|
38
|
+
# @return [Array<String>] URLs that caused redirects
|
50
39
|
attr_reader :redirects
|
51
40
|
|
52
41
|
#
|
53
|
-
# Constructor <br/>
|
54
42
|
# Instantiates Spider class with user options.
|
55
43
|
#
|
56
|
-
# @param [Options] opts
|
44
|
+
# @param [Arachni::Options] opts
|
57
45
|
#
|
58
|
-
def initialize( opts )
|
46
|
+
def initialize( opts = Options.instance )
|
59
47
|
@opts = opts
|
60
48
|
|
61
|
-
@sitemap =
|
49
|
+
@sitemap = {}
|
62
50
|
@redirects = []
|
63
|
-
@
|
51
|
+
@paths = []
|
52
|
+
@visited = Set.new
|
64
53
|
|
65
|
-
@
|
54
|
+
@on_each_page_blocks = []
|
55
|
+
@on_each_response_blocks = []
|
56
|
+
@on_complete_blocks = []
|
66
57
|
|
67
|
-
@
|
68
|
-
@
|
58
|
+
@pass_pages = true
|
59
|
+
@pending_requests = 0
|
69
60
|
|
70
|
-
|
61
|
+
seed_paths
|
62
|
+
end
|
71
63
|
|
72
|
-
|
73
|
-
|
74
|
-
|
75
|
-
|
76
|
-
|
64
|
+
def url
|
65
|
+
@opts.url
|
66
|
+
end
|
67
|
+
|
68
|
+
# @return [Array<String>] Working paths, paths that haven't yet been followed.
|
69
|
+
# You'll actually get a copy of the working paths
|
70
|
+
# and not the actual object itself;
|
71
|
+
# if you want to add more paths use {#push}.
|
72
|
+
def paths
|
73
|
+
@paths.clone
|
74
|
+
end
|
77
75
|
|
78
|
-
|
79
|
-
|
80
|
-
@
|
76
|
+
# @return [Array<String>] list of crawled URLs
|
77
|
+
def sitemap
|
78
|
+
@sitemap.keys
|
81
79
|
end
|
82
80
|
|
83
|
-
|
84
|
-
|
81
|
+
# @return [Hash<String, Integer>] list of crawled URLs with their HTTP codes
|
82
|
+
def fancy_sitemap
|
83
|
+
@sitemap
|
85
84
|
end
|
86
85
|
|
87
86
|
#
|
88
|
-
# Runs the Spider and passes
|
87
|
+
# Runs the Spider and passes the requested object to the block.
|
89
88
|
#
|
90
|
-
# @param [
|
89
|
+
# @param [Bool] pass_pages_to_block decides whether the block should be passed [Arachni::Page]s
|
90
|
+
# or [Typhoeus::Response]s
|
91
|
+
# @param [Block] block to be passed each page as visited
|
91
92
|
#
|
92
|
-
# @return [
|
93
|
+
# @return [Array<String>] sitemap
|
93
94
|
#
|
94
|
-
def run(
|
95
|
-
return if
|
95
|
+
def run( pass_pages_to_block = true, &block )
|
96
|
+
return if !@opts.crawl?
|
96
97
|
|
97
|
-
|
98
|
+
# options could have changed so reseed
|
99
|
+
seed_paths
|
98
100
|
|
99
|
-
|
100
|
-
:
|
101
|
-
|
102
|
-
:follow_location => true,
|
103
|
-
:update_cookies => true
|
104
|
-
}
|
101
|
+
if block_given?
|
102
|
+
pass_pages_to_block ? on_each_page( &block ) : on_each_response( &block )
|
103
|
+
end
|
105
104
|
|
106
|
-
|
107
|
-
|
108
|
-
|
105
|
+
while !done?
|
106
|
+
wait_if_paused
|
107
|
+
while !done? && url = @paths.shift
|
108
|
+
wait_if_paused
|
109
109
|
|
110
|
-
|
110
|
+
visit( url ) do |res|
|
111
|
+
obj = if pass_pages_to_block
|
112
|
+
Page.from_response( res, @opts )
|
113
|
+
else
|
114
|
+
Parser.new( res, @opts )
|
115
|
+
end
|
111
116
|
|
112
|
-
|
113
|
-
|
114
|
-
|
117
|
+
if @on_each_response_blocks.any?
|
118
|
+
call_on_each_response_blocks( res )
|
119
|
+
end
|
115
120
|
|
116
|
-
|
117
|
-
|
118
|
-
|
121
|
+
if @on_each_page_blocks.any?
|
122
|
+
call_on_each_page_blocks( pass_pages_to_block ? obj : Page.from_response( res, @opts ) )
|
123
|
+
end
|
119
124
|
|
120
|
-
|
125
|
+
push( obj.paths )
|
126
|
+
end
|
127
|
+
end
|
121
128
|
|
122
|
-
|
129
|
+
http.run
|
130
|
+
end
|
123
131
|
|
124
|
-
|
125
|
-
|res|
|
132
|
+
http.run
|
126
133
|
|
127
|
-
|
134
|
+
call_on_complete_blocks
|
128
135
|
|
129
|
-
|
136
|
+
sitemap
|
137
|
+
end
|
130
138
|
|
131
|
-
|
132
|
-
|
133
|
-
|
134
|
-
|
135
|
-
|
136
|
-
|
137
|
-
|
138
|
-
|
139
|
-
|
139
|
+
#
|
140
|
+
# Sets blocks to be called every time a page is visited.
|
141
|
+
#
|
142
|
+
# @param [Block] block
|
143
|
+
#
|
144
|
+
def on_each_page( &block )
|
145
|
+
fail 'Block is mandatory!' if !block_given?
|
146
|
+
@on_each_page_blocks << block
|
147
|
+
self
|
148
|
+
end
|
140
149
|
|
141
|
-
|
142
|
-
|
150
|
+
#
|
151
|
+
# Sets blocks to be called every time a response is received.
|
152
|
+
#
|
153
|
+
# @param [Block] block
|
154
|
+
#
|
155
|
+
def on_each_response( &block )
|
156
|
+
fail 'Block is mandatory!' if !block_given?
|
157
|
+
@on_each_response_blocks << block
|
158
|
+
self
|
159
|
+
end
|
143
160
|
|
144
|
-
|
145
|
-
|
146
|
-
|
161
|
+
#
|
162
|
+
# Sets blocks to be called once the crawler is done.
|
163
|
+
#
|
164
|
+
# @param [Block] block
|
165
|
+
#
|
166
|
+
def on_complete( &block )
|
167
|
+
fail 'Block is mandatory!' if !block_given?
|
168
|
+
@on_complete_blocks << block
|
169
|
+
self
|
170
|
+
end
|
147
171
|
|
148
|
-
|
149
|
-
|
172
|
+
#
|
173
|
+
# Pushes new paths for the crawler to follow; if the crawler has finished
|
174
|
+
# it will be awakened when new paths are pushed.
|
175
|
+
#
|
176
|
+
# The paths will be sanitized and normalized (cleaned up and converted to absolute ones).
|
177
|
+
#
|
178
|
+
# @param [String, Array<String>] paths
|
179
|
+
#
|
180
|
+
# @return [Bool] true if push was successful,
|
181
|
+
# false otherwise (provided empty or paths that must be skipped)
|
182
|
+
#
|
183
|
+
def push( paths )
|
184
|
+
paths = dedup( paths )
|
185
|
+
return false if paths.empty?
|
150
186
|
|
151
|
-
|
152
|
-
|
153
|
-
exception_jail{
|
154
|
-
if !skip?( check_url )
|
155
|
-
block.call( parse ? page.clone : res )
|
156
|
-
else
|
157
|
-
print_info( 'Matched skip rule.' )
|
158
|
-
end
|
159
|
-
}
|
160
|
-
end
|
161
|
-
}
|
162
|
-
|
163
|
-
# make sure we obey the link count limit and
|
164
|
-
# return if we have exceeded it.
|
165
|
-
if( @opts.link_count_limit &&
|
166
|
-
@opts.link_count_limit > 0 &&
|
167
|
-
visited.size >= @opts.link_count_limit )
|
168
|
-
http.run
|
169
|
-
return @sitemap.uniq
|
170
|
-
end
|
187
|
+
@paths |= paths
|
188
|
+
@paths.uniq!
|
171
189
|
|
172
|
-
|
190
|
+
# REVIEW: This may cause segfaults, Typhoeus::Hydra doesn't like threads.
|
191
|
+
#Thread.new { run } if idle? # wake up the crawler
|
192
|
+
true
|
193
|
+
end
|
173
194
|
|
174
|
-
|
175
|
-
|
195
|
+
# @return [TrueClass, FalseClass] true if crawl is done, false otherwise
|
196
|
+
def done?
|
197
|
+
idle? || limit_reached?
|
198
|
+
end
|
199
|
+
|
200
|
+
# @return [TrueClass, FalseClass] true if the queue is empty and no
|
201
|
+
# requests are pending, false otherwise
|
202
|
+
def idle?
|
203
|
+
@paths.empty? && @pending_requests == 0
|
204
|
+
end
|
205
|
+
|
206
|
+
# @return [TrueClass] pauses the system on a best effort basis
|
207
|
+
def pause
|
208
|
+
@pause = true
|
209
|
+
end
|
210
|
+
|
211
|
+
# @return [TrueClass] resumes the system on a best effort basis
|
212
|
+
def resume
|
213
|
+
@pause = false
|
214
|
+
true
|
215
|
+
end
|
216
|
+
|
217
|
+
# @return [Bool] true if the system is paused, false otherwise
|
218
|
+
def paused?
|
219
|
+
@pause ||= false
|
220
|
+
end
|
221
|
+
|
222
|
+
private
|
223
|
+
|
224
|
+
def seed_paths
|
225
|
+
push url
|
226
|
+
push @opts.extend_paths
|
227
|
+
end
|
176
228
|
|
177
|
-
|
229
|
+
def call_on_each_page_blocks( obj )
|
230
|
+
@on_each_page_blocks.each { |b| exception_jail( false ) { b.call( obj ) } }
|
178
231
|
end
|
179
232
|
|
233
|
+
def call_on_each_response_blocks( obj )
|
234
|
+
@on_each_response_blocks.each { |b| exception_jail( false ) { b.call( obj ) } }
|
235
|
+
end
|
236
|
+
|
237
|
+
def call_on_complete_blocks
|
238
|
+
@on_complete_blocks.each { |b| exception_jail( false ) { b.call } }
|
239
|
+
end
|
240
|
+
|
241
|
+
# @return [Arachni::HTTP] HTTP interface
|
180
242
|
def http
|
181
|
-
|
243
|
+
HTTP
|
182
244
|
end
|
183
245
|
|
246
|
+
#
|
247
|
+
# Decides if a URL should be skipped based on whether it:
|
248
|
+
# * has previously been {#visited?}
|
249
|
+
# * matches a {#redundant?} filter
|
250
|
+
# * matches universal {#skip_path?} options like inclusion and exclusion filters
|
251
|
+
#
|
252
|
+
# @param [String] url to check
|
253
|
+
#
|
254
|
+
# @return [Bool] true if any of the 3 filters returns true, false otherwise
|
255
|
+
#
|
184
256
|
def skip?( url )
|
185
|
-
|
257
|
+
visited?( url ) || skip_path?( url )
|
258
|
+
end
|
259
|
+
|
260
|
+
def remove_path_params( url )
|
261
|
+
uri = URI( url ).dup
|
262
|
+
uri.path = uri.path.split( ';' ).first.to_s
|
263
|
+
uri.to_s
|
264
|
+
end
|
265
|
+
|
266
|
+
#
|
267
|
+
# @param [String] url
|
268
|
+
#
|
269
|
+
# @return [Bool] true if the url has already been visited, false otherwise
|
270
|
+
#
|
271
|
+
def visited?( url )
|
272
|
+
@visited.include?( remove_path_params( url ) )
|
186
273
|
end
|
187
274
|
|
275
|
+
# @return [Bool] true if the link-count-limit has been exceeded, false otherwise
|
276
|
+
def limit_reached?
    # A missing (nil) limit is treated like 0, i.e. "no limit", instead of
    # raising NoMethodError on the comparison.
    limit = @opts.link_count_limit.to_i
    limit > 0 && @visited.size >= limit
end
|
279
|
+
|
280
|
+
#
|
281
|
+
# Checks if the provided URL matches a redundant filter
|
282
|
+
# and decreases its counter if so.
|
283
|
+
#
|
284
|
+
# If a filter's counter has reached 0 the method returns true.
|
285
|
+
#
|
286
|
+
# @param [String] url
|
287
|
+
#
|
288
|
+
# @return [Bool] true if the url is redundant, false otherwise
|
289
|
+
#
|
188
290
|
def redundant?( url )
|
189
|
-
@opts.redundant
|
190
|
-
|
291
|
+
redundant = @opts.redundant?( url ) do |count, regexp, path|
|
292
|
+
print_info "Matched redundancy rule: #{regexp} for #{path}"
|
293
|
+
print_info "Count-down: #{count}"
|
294
|
+
end
|
191
295
|
|
192
|
-
|
296
|
+
print_verbose "Discarding redundant page: #{url}" if redundant
|
297
|
+
redundant
|
298
|
+
end
|
193
299
|
|
194
|
-
|
195
|
-
|
196
|
-
|
197
|
-
end
|
300
|
+
def auto_redundant?( url )
|
301
|
+
return false if !@opts.auto_redundant?
|
302
|
+
@auto_redundant ||= Hash.new( 0 )
|
198
303
|
|
199
|
-
|
200
|
-
redundant['regexp'].to_s + ' for page \'' +
|
201
|
-
url + '\'' )
|
304
|
+
h = "#{url.split( '?' ).first}#{parse_query( url ).keys.sort}".hash
|
202
305
|
|
203
|
-
|
306
|
+
if @auto_redundant[h] >= @opts.auto_redundant
|
307
|
+
print_verbose "Discarding auto-redundant page: #{url}"
|
308
|
+
return true
|
309
|
+
end
|
204
310
|
|
205
|
-
|
206
|
-
|
207
|
-
}
|
208
|
-
return false
|
311
|
+
@auto_redundant[h] += 1
|
312
|
+
false
|
209
313
|
end
|
210
314
|
|
315
|
+
def dedup( paths )
|
316
|
+
return [] if !paths || paths.empty?
|
317
|
+
|
318
|
+
[paths].flatten.uniq.compact.map { |p| to_absolute( p, url ) }.
|
319
|
+
reject { |p| skip?( p ) }.uniq.compact
|
320
|
+
end
|
211
321
|
|
212
322
|
def wait_if_paused
|
213
|
-
while( paused? )
|
214
|
-
::IO::select( nil, nil, nil, 1 )
|
215
|
-
end
|
323
|
+
::IO::select( nil, nil, nil, 1 ) while( paused? )
|
216
324
|
end
|
217
325
|
|
218
|
-
def
|
219
|
-
@
|
326
|
+
# @return [Bool] true if a positive redirect limit is configured and the
#                   number of redirects followed so far has reached it,
#                   false otherwise (a limit of 0 means "no limit")
def hit_redirect_limit?
    # The counter is compared *against* the limit: the limit is hit once we
    # have followed at least that many redirects. (The operands used to be
    # the other way around, which reported the limit as hit immediately.)
    @opts.redirect_limit > 0 && (@followed_redirects || 0) >= @opts.redirect_limit
end
|
221
329
|
|
222
|
-
def
|
223
|
-
|
330
|
+
#
# Requests +url+ unless it should be skipped or is (auto-)redundant, and
# hands the response to +block+.
#
# @param    [String]    url     URL to request
# @param    [Hash]      opts    extra HTTP options, merged over the defaults below
# @param    [Block]     block   called with each response
#
# @return   [nil]   when the URL was filtered out or an exception was raised
#
def visit( url, opts = {}, &block )
    # Tracks whether this call has incremented @pending_requests, so that
    # the rescue clause only undoes an increment that actually happened.
    # Decrementing unconditionally could push the counter below zero, after
    # which #idle? would never report true again.
    counted = false

    return if skip?( url ) || redundant?( url ) || auto_redundant?( url )
    visited( url )

    @followed_redirects ||= 0
    @pending_requests   += 1
    counted = true

    opts = {
        timeout:         nil,
        follow_location: false,
        update_cookies:  true
    }.merge( opts )

    wrap = proc do |res|
        effective_url = normalize_url( res.effective_url )

        if res.redirection?
            @redirects << res.request.url
            if hit_redirect_limit? || skip?( res.location )
                decrease_pending
                next
            end
            @followed_redirects += 1
            # queue the redirect target instead of letting the client follow it
            push res.location
        end

        print_status( "[HTTP: #{res.code}] " + effective_url )
        @sitemap[effective_url] = res.code
        block.call( res )

        decrease_pending
    end

    http.get( url, opts, &wrap )
rescue
    decrease_pending if counted
    nil
end
|
225
368
|
|
226
|
-
def
|
227
|
-
@
|
228
|
-
|
369
|
+
def decrease_pending
|
370
|
+
@pending_requests -= 1
|
371
|
+
end
|
372
|
+
|
373
|
+
def visited( url )
|
374
|
+
@visited << remove_path_params( url )
|
229
375
|
end
|
230
376
|
|
231
377
|
end
|