# -*- coding: utf-8 -*- # ------------------------------------------------------------------------------- # Name: sfp_pageinfo # Purpose: SpiderFoot plug-in for scanning retrieved content by other # modules (such as sfp_spider) and building up information about # the page, such as whether it uses Javascript, has forms, and more. # # Author: Steve Micallef # # Created: 02/05/2012 # Copyright: (c) Steve Micallef 2012 # Licence: MIT # ------------------------------------------------------------------------------- import re from spiderfoot import SpiderFootEvent, SpiderFootPlugin # Identify pages that use Javascript libs, handle passwords, have forms, # permit file uploads and more to come. regexps = dict({ 'URL_JAVASCRIPT': list(['text/javascript', '