o [NSE] Added a new httpspider library and the script http-email-harvest that
collects e-mail addresses by spidering a website. [Patrik]
@@ -1,5 +1,8 @@
# Nmap Changelog ($Id$); -*-text-*-

o [NSE] Added a new httpspider library and the script http-email-harvest that
  collects e-mail addresses by spidering a website. [Patrik]

o [NSE] Added support for detecting whether a http connection was established
  using SSL or not by the http.lua library [Patrik]
nselib/httpspider.lua (new file, 583 lines)
@@ -0,0 +1,583 @@
---
-- A smallish httpspider library providing basic spidering capabilities
-- It consists of the following classes:
--
-- * <code>Options</code>
-- ** This class is responsible for handling library options.
--
-- * <code>LinkExtractor</code>
-- ** This class contains code responsible for extracting urls from web pages.
--
-- * <code>URL</code>
-- ** This class contains code to parse and process URLs.
--
-- * <code>UrlQueue</code>
-- ** This class contains a queue of the next links to process.
--
-- * <code>Crawler</code>
-- ** This class is responsible for the actual crawling.
--
-- @author Patrik Karlsson <patrik@cqure.net>
--
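-- @usage
-- -- A minimal usage sketch (illustrative only; the option names follow the
-- -- fields used by the Crawler below, and scripts/http-email-harvest.nse in
-- -- this commit shows the complete pattern):
-- local crawler = httpspider.Crawler:new( host, port, '/', { maxdepth = 3, maxpagecount = 20 } )
-- crawler:set_timeout(10000)
-- while ( true ) do
--   local status, r = crawler:crawl()
--   if ( not(status) ) then break end
--   -- r.url holds the fetched URL and r.response the http response table
-- end
--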

module(... or "httpspider", package.seeall)

require 'http'
require 'stdnse'

local LIBRARY_NAME = "httpspider"

-- The Options class, handling all spidering options
Options = {

  new = function(self, options)
    local o = { }

    -- copy all options as class members
    for k, v in pairs(options) do o[k] = v end

    -- set a few default values
    o.timeout = options.timeout or 10000
    o.withindomain = o.withindomain or false

    -- we default to withinhost, unless withindomain is set
    if ( o.withindomain ) then
      o.withinhost = o.withinhost or false
    else
      o.withinhost = o.withinhost or true
    end

    o.whitelist = o.whitelist or {}
    o.blacklist = o.blacklist or {}

    if ( o.withinhost or o.withindomain ) then
      local host_match, domain_match
      if ( ( o.base_url:getProto() == 'https' and o.base_url:getPort() == 443 ) or
           ( o.base_url:getProto() == 'http' and o.base_url:getPort() == 80 ) ) then
        if ( o.withinhost ) then
          host_match = ("%s://%s"):format(o.base_url:getProto(), o.base_url:getHost())
        elseif ( o.withindomain ) then
          domain_match = ("%s://.*%s/"):format(o.base_url:getProto(), o.base_url:getDomain())
        end
      else
        if ( o.withinhost ) then
          host_match = ("%s://%s:%d"):format(o.base_url:getProto(), o.base_url:getHost(), o.base_url:getPort() )
        elseif ( o.withindomain ) then
          domain_match = ("%s://.*%s/"):format(o.base_url:getProto(), o.base_url:getDomain() )
        end
      end

      -- set up the appropriate matching functions
      if ( o.withinhost ) then
        o.withinhost = function(url) return string.match(tostring(url), host_match) end
      else
        o.withindomain = function(url) return string.match(tostring(url), domain_match) end
      end
    end
    setmetatable(o, self)
    self.__index = self
    return o
  end,

  addWhitelist = function(self, func) table.insert(self.whitelist, func) end,
  addBlacklist = function(self, func) table.insert(self.blacklist, func) end,

}
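
-- Illustrative only (not part of the library): a script holding an Options
-- instance could restrict or extend filtering with its own match functions,
-- e.g. whitelisting .php pages and blacklisting a /logout directory:
--   opts:addWhitelist( function(url) return url:getPath():match("%.php$") end )
--   opts:addBlacklist( function(url) return url:getPath():match("^/logout/") end )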

-- Placeholder for form extraction code
FormExtractor = {

}

LinkExtractor = {

  -- Creates a new instance of LinkExtractor
  -- @return o instance of LinkExtractor
  new = function(self, url, html, options)
    local o = {
      url = url,
      html = html,
      links = {},
      options = options,
    }
    setmetatable(o, self)
    self.__index = self
    o:parse()
    return o
  end,

  -- is the link absolute or not?
  isAbsolute = function(url)
    -- at this point we don't care about the protocol
    -- also, we don't add // to cover stuff like:
    -- feed:http://example.com/rss.xml
    return ( url:match('^%w*:') ~= nil )
  end,

  -- Creates an absolute link from a relative one based on the base_url
  -- The functionality is very simple and does not take any ../../ in
  -- consideration.
  --
  -- @param base_url URL containing the page url from which the links were
  --        extracted
  -- @param rel_url string containing the relative portion of the URL
  -- @return link string containing the absolute link
  createAbsolute = function(base_url, rel_url, base_href)

    -- is relative with leading slash? ie /dir1/foo.html
    local leading_slash = rel_url:match("^/")
    rel_url = rel_url:match("^/?(.*)") or '/'

    -- check for trailing slash
    if ( base_href and not(base_href:match("/$") ) ) then
      base_href = base_href .. '/'
    end

    if ( ( base_url:getProto() == 'https' and base_url:getPort() == 443 ) or
         ( base_url:getProto() == 'http' and base_url:getPort() == 80 ) ) then

      if ( leading_slash ) then
        return ("%s://%s/%s"):format(base_url:getProto(), base_url:getHost(), rel_url)
      else
        if ( base_href ) then
          return ("%s%s"):format(base_href, rel_url)
        else
          return ("%s://%s%s%s"):format(base_url:getProto(), base_url:getHost(), base_url:getDir(), rel_url)
        end
      end
    else
      if ( leading_slash ) then
        return ("%s://%s:%d/%s"):format(base_url:getProto(), base_url:getHost(), base_url:getPort(), rel_url)
      else
        if ( base_href ) then
          return ("%s%s"):format(base_href, rel_url)
        else
          return ("%s://%s:%d%s%s"):format(base_url:getProto(), base_url:getHost(), base_href or base_url:getPort(), base_url:getDir(), rel_url)
        end
      end
    end
  end,
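
  -- A worked example (illustrative only): with base_url http://example.com/dir/page.html
  -- and no <base href>, createAbsolute resolves "img/a.png" to
  -- http://example.com/dir/img/a.png, while "/top.html" resolves to
  -- http://example.com/top.html.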

  -- Gets the depth of the link, relative to our base url eg.
  -- base_url = http://www.cqure.net/wp/
  -- url = http://www.cqure.net/wp/ - depth: 0
  -- url = http://www.cqure.net/wp/index.php - depth: 0
  -- url = http://www.cqure.net/wp/2011/index.php - depth: 1
  -- url = http://www.cqure.net/index.html - depth: -1
  --
  -- @param url instance of URL
  -- @return depth number containing the depth relative to the base_url
  getDepth = function(self, url)
    local base_dir, url_dir = self.options.base_url:getDir(), url:getDir()
    if ( url_dir and base_dir ) then
      local m = url_dir:match(base_dir.."(.*)")
      if ( not(m) ) then
        return -1
      else
        local _, depth = m:gsub("/", "/")
        return depth
      end
    end
  end,

  -- Parses an HTML response and extracts all links it can find
  -- The function currently supports href, src and action links
  -- Also, all behaviour options, such as depth and white- and black-lists, are
  -- processed in here.
  parse = function(self)
    local links = {}
    local patterns = {
      '[hH][rR][eE][fF]%s*=%s*[\'"](%s*[^"^\']+%s*)[\'"]',
      '[hH][rR][eE][fF]%s*=%s*([^\'\"][^%s>]+)',
      '[sS][rR][cC]%s*=%s*[\'"](%s*[^"^\']+%s*)[\'"]',
      '[sS][rR][cC]%s*=%s*([^\'\"][^%s>]+)',
      '[aA][cC][tT][iI][oO][nN]%s*=%s*[\'"](%s*[^"^\']+%s*)[\'"]',
    }

    local base_hrefs = {
      '[Bb][Aa][Ss][Ee]%s*[Hh][Rr][Ee][Ff]%s*=%s*[\'"](%s*[^"^\']+%s*)[\'"]',
      '[Bb][Aa][Ss][Ee]%s*[Hh][Rr][Ee][Ff]%s*=%s*([^\'\"][^%s>]+)'
    }

    local base_href
    for _, pattern in ipairs(base_hrefs) do
      base_href = self.html:match(pattern)
      if ( base_href ) then
        break
      end
    end

    for _, pattern in ipairs(patterns) do
      for l in self.html:gfind(pattern) do
        local link = l
        if ( not(LinkExtractor.isAbsolute(l)) ) then
          link = LinkExtractor.createAbsolute(self.url, l, base_href)
        end

        local url = URL:new(link)

        local function validate_link()
          local valid = true

          -- if our url is nil, abort, this could be due to a number of
          -- reasons such as unsupported protocols: javascript, mail ... or
          -- that the URL failed to parse for some reason
          if ( url == nil or tostring(url) == nil ) then
            return false
          end

          -- linkdepth trumps whitelisting
          if ( self.options.maxdepth ) then
            local depth = self:getDepth( url )
            if ( -1 == depth or depth > self.options.maxdepth ) then
              stdnse.print_debug(3, "%s: Skipping link depth: %d; b_url=%s; url=%s", LIBRARY_NAME, depth, tostring(self.options.base_url), tostring(url))
              return false
            end
          end

          -- withindomain trumps any whitelisting
          if ( self.options.withindomain ) then
            if ( not(self.options.withindomain(url)) ) then
              stdnse.print_debug(2, "%s: Link is not within domain: %s", LIBRARY_NAME, tostring(url))
              return false
            end
          end

          -- withinhost trumps any whitelisting
          if ( self.options.withinhost ) then
            if ( not(self.options.withinhost(url)) ) then
              stdnse.print_debug(2, "%s: Link is not within host: %s", LIBRARY_NAME, tostring(url))
              return false
            end
          end

          -- run through all blacklists
          if ( #self.options.blacklist > 0 ) then
            for _, func in ipairs(self.options.blacklist) do
              if ( func(url) ) then
                stdnse.print_debug(2, "%s: Blacklist match: %s", LIBRARY_NAME, tostring(url))
                valid = false
                break
              end
            end
          end

          -- check the url against our whitelist
          if ( #self.options.whitelist > 0 ) then
            for _, func in ipairs(self.options.whitelist) do
              if ( func(url) ) then
                stdnse.print_debug(2, "%s: Whitelist match: %s", LIBRARY_NAME, tostring(url))
                valid = true
                break
              end
            end
          end
          return valid
        end

        local valid = validate_link()

        if ( valid ) then
          stdnse.print_debug(3, "%s: Adding link: %s", LIBRARY_NAME, tostring(url))
          links[tostring(url)] = true
        elseif ( tostring(url) ) then
          stdnse.print_debug(3, "%s: Skipping url: %s", LIBRARY_NAME, link)
        end
      end
    end

    for link in pairs(links) do
      table.insert(self.links, link)
    end

  end,

  -- Gets a table containing all of the retrieved URLs, after filtering
  -- has been applied.
  getLinks = function(self) return self.links end,


}
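
-- Illustrative only: given an already fetched page, the extractor can be used
-- on its own, provided the options table carries at least a base_url and the
-- matching functions set up by Options:new, e.g.:
--   local le = LinkExtractor:new(url, response.body, opts)
--   for _, link in ipairs(le:getLinks()) do stdnse.print_debug(1, "found: %s", link) end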

-- The URL class, containing code to process URLs
-- This class is heavily inspired by the Java URL class
URL = {

  -- Creates a new instance of URL
  -- @param url string containing the text representation of a URL
  -- @return o instance of URL, in case of parsing being successful
  --         nil in case parsing fails
  new = function(self, url)
    local o = {
      raw = url,
    }

    setmetatable(o, self)
    self.__index = self
    if ( o:parse() ) then
      return o
    end
  end,

  -- Parses the string representation of the URL and splits it into different
  -- URL components
  -- @return status true on success, false on failure
  parse = function(self)
    self.proto, self.host, self.port, self.file = self.raw:match("^(http[s]?)://([^:/]*)[:]?(%d*)")
    if ( self.proto and self.host ) then
      self.file = self.raw:match("^http[s]?://[^:/]*[:]?%d*(/[^#]*)") or '/'
      self.port = tonumber(self.port)
      if ( not(self.port) ) then
        if ( self.proto:match("https") ) then
          self.port = 443
        elseif ( self.proto:match("http") ) then
          self.port = 80
        end
      end

      self.path = self.file:match("^([^?]*)[%?]?")
      self.dir = self.path:match("^(.+%/)") or "/"
      self.domain = self.host:match("^[^%.]-%.(.*)")
      return true
    elseif ( self.raw:match("^javascript:") ) then
      stdnse.print_debug(2, "%s: Skipping javascript url: %s", LIBRARY_NAME, self.raw)
    elseif ( self.raw:match("^mailto:") ) then
      stdnse.print_debug(2, "%s: Skipping mailto link: %s", LIBRARY_NAME, self.raw)
    else
      stdnse.print_debug(2, "%s: WARNING: Failed to parse url: %s", LIBRARY_NAME, self.raw)
    end
    return false
  end,

  -- Gets the host portion of the URL
  -- @return host string containing the hostname
  getHost = function(self) return self.host end,

  -- Gets the protocol representation of the URL
  -- @return proto string containing the protocol (ie. http, https)
  getProto = function(self) return self.proto end,

  -- Returns the filename component of the URL.
  -- @return file string containing the path and query components of the url
  getFile = function(self) return self.file end,

  -- Gets the port component of the URL
  -- @return port number containing the port of the URL
  getPort = function(self) return self.port end,

  -- Gets the path component of the URL
  -- @return the full path and filename of the URL
  getPath = function(self) return self.path end,

  -- Gets the directory component of the URL
  -- @return directory string containing the directory part of the URL
  getDir = function(self) return self.dir end,

  -- Gets the domain component of the URL
  -- @return domain string containing the hosts domain
  getDomain = function(self) return self.domain end,

  -- Converts the URL to a string
  -- @return url string containing the string representation of the url
  __tostring = function(self) return self.raw end,
}
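
-- Illustrative example of the parser above: URL:new("https://www.example.com/a/b.html?x=1")
-- yields getProto() == "https", getHost() == "www.example.com", getPort() == 443,
-- getPath() == "/a/b.html", getDir() == "/a/" and getDomain() == "example.com".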

-- The UrlQueue class, holding the queue of URLs waiting to be processed
UrlQueue = {

  -- creates a new instance of UrlQueue
  -- @param options table containing options
  -- @return o new instance of UrlQueue
  new = function(self, options)
    local o = {
      urls = {},
      options = options
    }
    setmetatable(o, self)
    self.__index = self
    return o
  end,

  -- gets the next available url in the queue
  getNext = function(self)
    return table.remove(self.urls, 1)
  end,

  -- adds a new url to the queue
  -- @param url can be either a string or a URL or a table of URLs
  add = function(self, url)
    assert( type(url) == 'string' or type(url) == 'table', "url was neither a string nor a table")
    local urls = ( 'string' == type(url) ) and { url } or url

    -- if it's a table, it can be either a single URL or an array of URLs
    if ( 'table' == type(url) and url.raw ) then
      urls = { url }
    end

    for _, u in ipairs(urls) do
      u = ( 'string' == type(u) ) and URL:new(u) or u
      if ( u ) then
        table.insert(self.urls, u)
      else
        stdnse.print_debug("ERROR: Invalid URL: %s", url)
      end
    end
  end,

  -- dumps the contents of the UrlQueue
  dump = function(self)
    for _, url in ipairs(self.urls) do
      print("url:", url)
    end
  end,

}
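
-- Illustrative only: a script could seed the queue manually before crawling,
-- e.g. with a table of links as produced by LinkExtractor:getLinks():
--   local queue = UrlQueue:new(opts)
--   queue:add( { "http://example.com/", "http://example.com/about.html" } )
--   local next_url = queue:getNext()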


-- The Crawler class
Crawler = {

  -- creates a new instance of the Crawler
  -- @param host table as received by the action method
  -- @param port table as received by the action method
  -- @param url string containing the relative URL
  -- @param options table of options
  -- @return o new instance of Crawler or nil on failure
  new = function(self, host, port, url, options)
    local o = {
      host = host,
      port = port,
      url = url,
      options = options or {},
    }

    setmetatable(o, self)
    self.__index = self

    local response = http.get(o.host, o.port, '/', { timeout = o.options.timeout } )

    if ( not(response) or 'table' ~= type(response) ) then
      return
    end

    o.url = o.url:match("/?(.*)")

    local u_host = o.host.targetname or o.host.name
    if ( not(u_host) or 0 == #u_host ) then
      u_host = o.host.ip
    end
    local u = ("%s://%s:%d/%s"):format(response.ssl and "https" or "http", u_host, o.port.number, o.url)
    o.options.base_url = URL:new(u)
    o.options = Options:new(o.options)
    o.urlqueue = UrlQueue:new(o.options)
    o.urlqueue:add(o.options.base_url)

    o.options.timeout = o.options.timeout or 10000
    o.processed = {}

    -- options passed to the Crawler take precedence over the httpspider.* script arguments
    if ( not(o.options.maxdepth) ) then
      o.options.maxdepth = tonumber(stdnse.get_script_args("httpspider.maxdepth"))
    end

    -- options passed to the Crawler take precedence over the httpspider.* script arguments
    if ( not(o.options.maxpagecount) ) then
      o.options.maxpagecount = tonumber(stdnse.get_script_args("httpspider.maxpagecount"))
    end

    if ( not(o.options.noblacklist) ) then
      o:addDefaultBlacklist()
    end

    return o
  end,

  -- Sets the timeout used by the http library
  -- @param timeout number containing the timeout in ms.
  set_timeout = function(self, timeout)
    self.options.timeout = timeout
  end,

  -- Gets the number of pages that have been retrieved
  -- @return count number of pages retrieved by the instance
  getPageCount = function(self)
    local count = 1
    for url in pairs(self.processed) do
      count = count + 1
    end
    return count
  end,

  -- Adds a default blacklist blocking binary files such as images,
  -- compressed archives and executable files
  addDefaultBlacklist = function(self)

    self.options:addBlacklist( function(url)
      local image_extensions = {"png","jpg","jpeg","gif","bmp"}
      local archive_extensions = {"zip", "tar.gz", "gz", "rar", "7z", "sit", "sitx"}
      local exe_extensions = {"exe", "com"}
      local extensions = { image_extensions, archive_extensions, exe_extensions }

      for _, cat in ipairs(extensions) do
        for _, ext in ipairs(cat) do
          if ( url:getPath():match(ext.."$") ) then
            return true
          end
        end
      end
    end )

  end,
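
  -- Illustrative only: a script holding a Crawler instance could register
  -- additional filters the same way, e.g. to skip PDF documents:
  --   crawler.options:addBlacklist( function(url) return url:getPath():match("%.pdf$") end )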

  -- does the heavy crawling
  --
  -- The crawler may exit due to a number of different reasons, including
  -- invalid options, reaching the max page count or simply running out of links.
  -- We return a false status for all of these and, in case the error was
  -- unexpected or requires attention, we set the error property accordingly.
  -- This way the script can alert the user of the details by inspecting the
  -- returned table.
  crawl = function(self)

    if ( self.options.withinhost and self.options.withindomain ) then
      return false, { err = true, reason = "Invalid options: withinhost and withindomain can't both be true" }
    end

    -- in case the user set a max page count to retrieve check how many
    -- pages we have retrieved so far
    local count = self:getPageCount()
    if ( self.options.maxpagecount and
         ( count > self.options.maxpagecount ) ) then
      return false, { err = false, msg = "Reached max page count" }
    end

    -- pull links from the queue until we get a valid one
    local url
    repeat
      url = self.urlqueue:getNext()
    until( not(url) or not(self.processed[tostring(url)]) )

    -- if no url could be retrieved from the queue, abort ...
    if ( not(url) ) then
      return false, { err = false, msg = "No more urls" }
    end

    if ( self.options.maxpagecount ) then
      stdnse.print_debug(2, "%s: Fetching url [%d of %d]: %s", LIBRARY_NAME, count, self.options.maxpagecount, tostring(url))
    else
      stdnse.print_debug(2, "%s: Fetching url: %s", LIBRARY_NAME, tostring(url))
    end

    -- fetch the url, and then push it to the processed table
    local response = http.get(url:getHost(), url:getPort(), url:getFile(), { timeout = self.options.timeout } )
    self.processed[tostring(url)] = true

    -- if we have a response, proceed scraping it
    if ( response and response.body ) then
      local links = LinkExtractor:new(url, response.body, self.options):getLinks()
      self.urlqueue:add(links)
    end
    return true, { url = url, response = response }
  end,


}
scripts/http-email-harvest.nse (new file, 110 lines)
@@ -0,0 +1,110 @@
description = [[
Spiders a web site and collects e-mail addresses.
]]

---
-- @usage
-- nmap --script=http-email-harvest <target>
--
-- @output
-- PORT   STATE SERVICE REASON
-- 80/tcp open  http    syn-ack
-- | http-email-harvest:
-- |   Spidering limited to: maxdepth=3; maxpagecount=20
-- |     root@example.com
-- |_    postmaster@example.com
--
-- @args http-email-harvest.maxdepth the maximum number of directories beneath
--       the initial url to spider. A negative value disables the limit.
--       (default: 3)
-- @args http-email-harvest.maxpagecount the maximum number of pages to visit.
--       A negative value disables the limit (default: 20)
-- @args http-email-harvest.url the url to start spidering. This is a URL
--       relative to the scanned host eg. /default.html (default: /)
-- @args http-email-harvest.withinhost only spider URLs within the same host.
--       (default: true)
-- @args http-email-harvest.withindomain only spider URLs within the same
--       domain. This widens the scope from <code>withinhost</code> and
--       cannot be used in combination with it. (default: false)
--

author = "Patrik Karlsson"
categories = {"discovery", "safe"}

require "httpspider"
require "shortport"
require "stdnse"

portrule = shortport.http

function action(host, port)
  local EMAIL_PATTERN = "[A-Za-z0-9%.%%%+%-]+@[A-Za-z0-9%.%%%+%-]+%.%w%w%w?%w?"
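  -- The pattern above matches a simple user@host form ending in a two- to
  -- four-character top-level domain; it is deliberately loose and may yield
  -- the occasional false positive.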

  -- by default, we cap the script at a maximum depth of 3
  local maxdepth = tonumber(stdnse.get_script_args("http-email-harvest.maxdepth")) or 3
  -- by default, we cap the script at a maximum pagecount of 20
  local maxpagecount = tonumber(stdnse.get_script_args("http-email-harvest.maxpagecount")) or 20

  local url = stdnse.get_script_args("http-email-harvest.url") or "/"
  local withinhost = stdnse.get_script_args("http-email-harvest.withinhost")
  local withindomain = stdnse.get_script_args("http-email-harvest.withindomain")

  if ( maxdepth < 0 ) then maxdepth = nil end
  if ( maxpagecount < 0 ) then maxpagecount = nil end

  stdnse.print_debug(2, "%s: Running crawler maxdepth: %s; maxpagecount: %s",
    SCRIPT_NAME, maxdepth or "[none]", maxpagecount or "[none]")

  local crawler = httpspider.Crawler:new(host, port, url or '/', {
      maxdepth = maxdepth,
      maxpagecount = maxpagecount,
      withinhost = withinhost,
      withindomain = withindomain,
    }
  )

  -- the Crawler constructor returns nil if the initial request failed
  if ( not(crawler) ) then
    return
  end

  crawler:set_timeout(10000)

  local emails = {}
  while(true) do
    local status, r = crawler:crawl()
    -- if the crawler fails it can be due to a number of different reasons
    -- most of them are "legitimate" and should not be reason to abort
    if ( not(status) ) then
      if ( r.err ) then
        return stdnse.format_output(true, ("ERROR: %s"):format(r.reason))
      else
        break
      end
    end

    -- Collect each e-mail address and build a unique index of them
    if ( r.response and r.response.body ) then
      for email in r.response.body:gmatch(EMAIL_PATTERN) do
        emails[email] = true
      end
    end
  end

  -- if no email addresses were collected abort
  if ( not(next(emails)) ) then return end

  local results = {}
  for email, _ in pairs(emails) do
    table.insert(results, email)
  end

  -- Inform the user of the limitations that were used
  if ( ( maxdepth and maxdepth > 0 ) or ( maxpagecount and maxpagecount > 0 ) ) then
    local limit = "Spidering limited to: "
    if ( maxdepth and maxdepth > 0 ) then
      limit = limit .. ("maxdepth=%d; "):format(maxdepth)
    end
    if ( maxpagecount and maxpagecount > 0 ) then
      limit = limit .. ("maxpagecount=%d"):format(maxpagecount)
    end
    if ( #results == 0 ) then
      table.insert(results, limit)
    else
      results.name = limit
    end
  end
  return stdnse.format_output(true, results)
end
@@ -94,6 +94,7 @@ Entry { filename = "http-cors.nse", categories = { "default", "discovery", "safe
Entry { filename = "http-date.nse", categories = { "discovery", "safe", } }
Entry { filename = "http-default-accounts.nse", categories = { "auth", "discovery", "safe", } }
Entry { filename = "http-domino-enum-passwords.nse", categories = { "auth", "intrusive", } }
Entry { filename = "http-email-harvest.nse", categories = { "discovery", "safe", } }
Entry { filename = "http-enum.nse", categories = { "discovery", "intrusive", "vuln", } }
Entry { filename = "http-favicon.nse", categories = { "default", "discovery", "safe", } }
Entry { filename = "http-form-brute.nse", categories = { "brute", "intrusive", } }