1
0
mirror of https://github.com/nmap/nmap.git synced 2025-12-06 12:41:29 +00:00
Files
nmap/zenmap/zenmapCore/NmapParser.py

1428 lines
55 KiB
Python

#!/usr/bin/env python
# -*- coding: utf-8 -*-
# ***********************IMPORTANT NMAP LICENSE TERMS************************
# * *
# * The Nmap Security Scanner is (C) 1996-2019 Insecure.Com LLC ("The Nmap *
# * Project"). Nmap is also a registered trademark of the Nmap Project. *
# * This program is free software; you may redistribute and/or modify it *
# * under the terms of the GNU General Public License as published by the *
# * Free Software Foundation; Version 2 ("GPL"), BUT ONLY WITH ALL OF THE *
# * CLARIFICATIONS AND EXCEPTIONS DESCRIBED HEREIN. This guarantees your *
# * right to use, modify, and redistribute this software under certain *
# * conditions. If you wish to embed Nmap technology into proprietary *
# * software, we sell alternative licenses (contact sales@nmap.com). *
# * Dozens of software vendors already license Nmap technology such as *
# * host discovery, port scanning, OS detection, version detection, and *
# * the Nmap Scripting Engine. *
# * *
# * Note that the GPL places important restrictions on "derivative works", *
# * yet it does not provide a detailed definition of that term. To avoid *
# * misunderstandings, we interpret that term as broadly as copyright law *
# * allows. For example, we consider an application to constitute a *
# * derivative work for the purpose of this license if it does any of the *
# * following with any software or content covered by this license *
# * ("Covered Software"): *
# * *
# * o Integrates source code from Covered Software. *
# * *
# * o Reads or includes copyrighted data files, such as Nmap's nmap-os-db *
# * or nmap-service-probes. *
# * *
# * o Is designed specifically to execute Covered Software and parse the *
# * results (as opposed to typical shell or execution-menu apps, which will *
# * execute anything you tell them to). *
# * *
# * o Includes Covered Software in a proprietary executable installer. The *
# * installers produced by InstallShield are an example of this. Including *
# * Nmap with other software in compressed or archival form does not *
# * trigger this provision, provided appropriate open source decompression *
# * or de-archiving software is widely available for no charge. For the *
# * purposes of this license, an installer is considered to include Covered *
# * Software even if it actually retrieves a copy of Covered Software from *
# * another source during runtime (such as by downloading it from the *
# * Internet). *
# * *
# * o Links (statically or dynamically) to a library which does any of the *
# * above. *
# * *
# * o Executes a helper program, module, or script to do any of the above. *
# * *
# * This list is not exclusive, but is meant to clarify our interpretation *
# * of derived works with some common examples. Other people may interpret *
# * the plain GPL differently, so we consider this a special exception to *
# * the GPL that we apply to Covered Software. Works which meet any of *
# * these conditions must conform to all of the terms of this license, *
# * particularly including the GPL Section 3 requirements of providing *
# * source code and allowing free redistribution of the work as a whole. *
# * *
# * As another special exception to the GPL terms, the Nmap Project grants *
# * permission to link the code of this program with any version of the *
# * OpenSSL library which is distributed under a license identical to that *
# * listed in the included docs/licenses/OpenSSL.txt file, and distribute *
# * linked combinations including the two. *
# * *
# * The Nmap Project has permission to redistribute Npcap, a packet *
# * capturing driver and library for the Microsoft Windows platform. *
# * Npcap is a separate work with it's own license rather than this Nmap *
# * license. Since the Npcap license does not permit redistribution *
# * without special permission, our Nmap Windows binary packages which *
# * contain Npcap may not be redistributed without special permission. *
# * *
# * Any redistribution of Covered Software, including any derived works, *
# * must obey and carry forward all of the terms of this license, including *
# * obeying all GPL rules and restrictions. For example, source code of *
# * the whole work must be provided and free redistribution must be *
# * allowed. All GPL references to "this License", are to be treated as *
# * including the terms and conditions of this license text as well. *
# * *
# * Because this license imposes special exceptions to the GPL, Covered *
# * Work may not be combined (even as part of a larger work) with plain GPL *
# * software. The terms, conditions, and exceptions of this license must *
# * be included as well. This license is incompatible with some other open *
# * source licenses as well. In some cases we can relicense portions of *
# * Nmap or grant special permissions to use it in other open source *
# * software. Please contact fyodor@nmap.org with any such requests. *
# * Similarly, we don't incorporate incompatible open source software into *
# * Covered Software without special permission from the copyright holders. *
# * *
# * If you have any questions about the licensing restrictions on using *
# * Nmap in other works, we are happy to help. As mentioned above, we also *
# * offer an alternative license to integrate Nmap into proprietary *
# * applications and appliances. These contracts have been sold to dozens *
# * of software vendors, and generally include a perpetual license as well *
# * as providing support and updates. They also fund the continued *
# * development of Nmap. Please email sales@nmap.com for further *
# * information. *
# * *
# * If you have received a written license agreement or contract for *
# * Covered Software stating terms other than these, you may choose to use *
# * and redistribute Covered Software under those terms instead of these. *
# * *
# * Source is provided to this software because we believe users have a *
# * right to know exactly what a program is going to do before they run it. *
# * This also allows you to audit the software for security holes. *
# * *
# * Source code also allows you to port Nmap to new platforms, fix bugs, *
# * and add new features. You are highly encouraged to send your changes *
# * to the dev@nmap.org mailing list for possible incorporation into the *
# * main distribution. By sending these changes to Fyodor or one of the *
# * Insecure.Org development mailing lists, or checking them into the Nmap *
# * source code repository, it is understood (unless you specify *
# * otherwise) that you are offering the Nmap Project the unlimited, *
# * non-exclusive right to reuse, modify, and relicense the code. Nmap *
# * will always be available Open Source, but this is important because *
# * the inability to relicense code has caused devastating problems for *
# * other Free Software projects (such as KDE and NASM). We also *
# * occasionally relicense the code to third parties as discussed above. *
# * If you wish to specify special license conditions of your *
# * contributions, just say so when you send them. *
# * *
# * This program is distributed in the hope that it will be useful, but *
# * WITHOUT ANY WARRANTY; without even the implied warranty of *
# * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the Nmap *
# * license file for more details (it's in a COPYING file included with *
# * Nmap, and also available from https://svn.nmap.org/nmap/COPYING) *
# * *
# ***************************************************************************/
import locale
import time
import socket
import copy
# Use the faster cStringIO if available, fallback on StringIO if not
try:
from cStringIO import StringIO
except ImportError:
from StringIO import StringIO
# Prevent loading PyXML
import xml
xml.__path__ = [x for x in xml.__path__ if "_xmlplus" not in x]
from xml.sax import make_parser
from xml.sax import SAXException
from xml.sax.handler import ContentHandler, EntityResolver
from xml.sax.saxutils import XMLGenerator
from xml.sax.xmlreader import AttributesImpl as Attributes
import zenmapCore.I18N # lgtm[py/unused-import]
from zenmapCore.NmapOptions import NmapOptions, join_quoted
from zenmapCore.StringPool import unique
# The version of the Nmap DTD this file understands and emits.
XML_OUTPUT_VERSION = "1.04"
class HostInfo(object):
    """Everything Nmap reported about a single scanned host.

    The data is kept in the loosely typed dicts and lists of strings that
    the XML parser produces; the expected shape of each value is described
    in the comment above its accessors. Each get_*/set_* pair is also
    exposed as a property at the bottom of the class.
    """

    # Instance attributes that hold host data; make_clone copies each one.
    _CLONED_ATTRIBUTES = (
        "_tcpsequence", "_osmatches", "_ports", "_ports_used", "_extraports",
        "_uptime", "_hostnames", "_tcptssequence", "_ipidsequence", "_ip",
        "_ipv6", "_mac", "_state", "_comment", "_trace")

    def __init__(self):
        self._tcpsequence = {}
        self._osmatches = []
        self._ports = []
        self._ports_used = []
        self._extraports = []
        self._uptime = {}
        self._hostnames = []
        self._tcptssequence = {}
        self._ipidsequence = {}
        self._ip = None
        self._ipv6 = None
        self._mac = None
        self._state = ''
        self._comment = ''
        self._trace = {}

    def make_clone(self):
        """Return a new HostInfo holding deep copies of all of this host's
        data, so that modifying the clone never affects the original."""
        clone = HostInfo()
        for attr_name in self._CLONED_ATTRIBUTES:
            # Every container is deep-copied, including the ports_used and
            # extraports lists, so that no mutable state is shared.
            setattr(clone, attr_name,
                    copy.deepcopy(getattr(self, attr_name)))
        return clone

    # tcpsequence is a dict of the form
    # {'index': u'203',
    #  'values': u'3637785D,35B440D1,35E9FC3B,3640DB42,355F5931,3601AE14',
    #  'difficulty': u'Good luck!'}
    def set_tcpsequence(self, sequence):
        self._tcpsequence = sequence

    def get_tcpsequence(self):
        """Return the tcpsequence dict, or an empty dict if there is none."""
        return self._tcpsequence or {}

    # tcptssequence is a dict of the form
    # {'values': u'71D0483C,71D048A3,71D0490C,71D04973,71D049DB,71D04A45',
    #  'class': u'1000HZ'}
    def set_tcptssequence(self, sequence):
        self._tcptssequence = sequence

    def get_tcptssequence(self):
        """Return the tcptssequence dict, or an empty dict if there is
        none."""
        return self._tcptssequence or {}

    # ipidsequence is a dict of the form
    # {'values': u'0,0,0,0,0,0', 'class': u'All zeros'}
    def set_ipidsequence(self, sequence):
        self._ipidsequence = sequence

    def get_ipidsequence(self):
        """Return the ipidsequence dict, or an empty dict if there is
        none."""
        return self._ipidsequence or {}

    # osmatches is a list of dicts of the form
    # {'name': u'Linux 2.6.24', 'accuracy': u'98', 'line': u'1000',
    #  'osclasses': ...}
    # where each 'osclasses' element is a dict of the form
    # {'vendor': u'Linux', 'osfamily': u'Linux', 'type': u'general purpose',
    #  'osgen': u'2.6.X', 'accuracy': u'98'}
    def set_osmatches(self, matches):
        self._osmatches = matches

    def get_osmatches(self):
        return self._osmatches

    def get_best_osmatch(self):
        """Return the OS match with the highest accuracy, or None if there
        are no OS matches. Ties go to the match that was recorded first."""
        if not self._osmatches:
            return None

        def osmatch_key(osmatch):
            # Negated so that the highest accuracy is the minimum. A match
            # whose accuracy is missing or not a number gets key 0, which
            # ranks it after every match with a positive accuracy.
            try:
                return -float(osmatch["accuracy"])
            except (KeyError, TypeError, ValueError):
                return 0

        return min(self._osmatches, key=osmatch_key)

    # ports_used is a list like
    # [{'state': u'open', 'portid': u'22', 'proto': u'tcp'},
    #  {'state': u'closed', 'portid': u'25', 'proto': u'tcp'},
    #  {'state': u'closed', 'portid': u'44054', 'proto': u'udp'}]
    # but not all three elements are necessarily present.
    def set_ports_used(self, ports):
        self._ports_used = ports

    def get_ports_used(self):
        return self._ports_used

    # uptime is a dict of the form
    # {'seconds': u'1909493', 'lastboot': u'Wed Jul 2 06:48:31 2008'}
    def set_uptime(self, uptime):
        self._uptime = uptime

    def get_uptime(self):
        """Return the uptime dict; when there is none, return a dict with
        empty 'seconds' and 'lastboot' values rather than an empty dict."""
        return self._uptime or {"seconds": "", "lastboot": ""}

    # ports is an array containing dicts of the form
    # {'port_state': u'open', 'portid': u'22', 'protocol': u'tcp',
    #  'service_conf': u'10', 'service_extrainfo': u'protocol 2.0',
    #  'service_method': u'probed', 'service_name': u'ssh',
    #  'service_product': u'OpenSSH', 'service_version': u'4.3'}
    def set_ports(self, ports):
        self._ports = ports

    def get_ports(self):
        return self._ports

    # extraports is an array of dicts of the form
    # {'count': u'1709', 'state': u'filtered'}
    def set_extraports(self, port_list):
        self._extraports = port_list

    def get_extraports(self):
        return self._extraports

    # hostnames is a list containing dicts of the form
    # [{'hostname': u'scanme.nmap.org', 'hostname_type': u'PTR'}]
    def set_hostnames(self, hostname_list):
        self._hostnames = hostname_list

    def get_hostnames(self):
        return self._hostnames

    # ip, ipv6, and mac are either None or dicts of the form
    # {'vendor': u'', 'type': u'ipv4', 'addr': u'64.13.134.52'}
    def set_ip(self, addr):
        self._ip = addr

    def get_ip(self):
        return self._ip

    def set_mac(self, addr):
        self._mac = addr

    def get_mac(self):
        return self._mac

    def set_ipv6(self, addr):
        self._ipv6 = addr

    def get_ipv6(self):
        return self._ipv6

    def get_addrs_for_sort(self):
        """Return a list of addresses as opaque values sorted such that
        1) IPv4 comes before IPv6 comes before MAC, and
        2) addresses are sorted according to their binary values, not their
           string representation.
        Use this function to get the comparison key when sorting a list of
        hosts by address."""
        addrs = []
        if self.ip:
            addrs.append((1, socket.inet_aton(self.ip["addr"])))
        if self.ipv6:
            try:
                packed = socket.inet_pton(
                    socket.AF_INET6, self.ipv6["addr"])
            except AttributeError:
                # Windows doesn't have socket.inet_pton. Go alphabetical.
                # Encode to a byte string for possible comparison with binary
                # address strings (which can't be converted to unicode).
                packed = self.ipv6["addr"].encode("utf-8")
            # Rank 2 keeps every IPv6 address after every IPv4 address
            # (rank 1) and before every MAC address (rank 3).
            addrs.append((2, packed))
        if self.mac:
            addrs.append((3, "".join(
                chr(int(x, 16)) for x in self.mac["addr"].split(":"))))
        addrs.sort()
        return addrs

    # comment is a string.
    def get_comment(self):
        return self._comment

    def set_comment(self, comment):
        self._comment = comment

    # state is a string like u'up' or u'down'.
    def set_state(self, status):
        self._state = status

    def get_state(self):
        return self._state

    def get_hostname(self):
        """Return a display name for this host: "hostname (address)" when
        both are known, else whichever one is known, else a translated
        "Unknown Host". The address is the first available of the IPv4,
        IPv6 and MAC addresses."""
        hostname = None
        if self._hostnames:
            hostname = self._hostnames[0]["hostname"]

        address = self.ip or self.ipv6 or self.mac
        if address is not None:
            address = address["addr"]

        if hostname is not None and address is not None:
            return "%s (%s)" % (hostname, address)
        if hostname is not None:
            return hostname
        if address is not None:
            return address
        return _("Unknown Host")

    def get_port_count_by_states(self, states):
        """Return how many ports are in one of the given states, counting
        both the individually listed ports and the extraports summaries."""
        listed = sum(
            1 for p in self.ports if p.get('port_state') in states)
        summarized = sum(
            int(extra['count']) for extra in self.get_extraports()
            if extra['state'] in states)
        return listed + summarized

    def get_open_ports(self):
        return self.get_port_count_by_states(('open', 'open|filtered'))

    def get_filtered_ports(self):
        return self.get_port_count_by_states(
                ('filtered', 'open|filtered', 'closed|filtered'))

    def get_closed_ports(self):
        return self.get_port_count_by_states(('closed', 'closed|filtered'))

    def get_scanned_ports(self):
        """Return the total number of ports scanned: the listed ports plus
        the counts of all extraports entries."""
        return len(self.ports) + sum(
            int(extra["count"]) for extra in self.get_extraports())

    def get_services(self):
        """Return a list with one dict per listed port, holding the
        service-related fields with placeholders for missing values."""
        return [{
                "service_name": p.get("service_name", _("unknown")),
                "portid": p.get("portid", ""),
                "service_version": p.get("service_version",
                    _("Unknown version")),
                "service_product": p.get("service_product", ""),
                "service_extrainfo": p.get("service_extrainfo", ""),
                "port_state": p.get("port_state", _("Unknown")),
                "protocol": p.get("protocol", "")
            } for p in self.ports]

    def get_trace(self):
        return self._trace

    def set_trace(self, trace):
        self._trace = trace

    def append_trace_hop(self, hop):
        """Add hop to the trace's "hops" list, creating the list if this is
        the first hop."""
        self._trace.setdefault("hops", []).append(hop)

    def set_trace_error(self, errorstr):
        self._trace["error"] = errorstr

    # Properties
    tcpsequence = property(get_tcpsequence, set_tcpsequence)
    osmatches = property(get_osmatches, set_osmatches)
    ports = property(get_ports, set_ports)
    ports_used = property(get_ports_used, set_ports_used)
    extraports = property(get_extraports, set_extraports)
    uptime = property(get_uptime, set_uptime)
    hostnames = property(get_hostnames, set_hostnames)
    tcptssequence = property(get_tcptssequence, set_tcptssequence)
    ipidsequence = property(get_ipidsequence, set_ipidsequence)
    ip = property(get_ip, set_ip)
    ipv6 = property(get_ipv6, set_ipv6)
    mac = property(get_mac, set_mac)
    state = property(get_state, set_state)
    comment = property(get_comment, set_comment)
    services = property(get_services)
    trace = property(get_trace, set_trace)
class ParserBasics(object):
    """Storage and accessors for the data of one Nmap scan.

    All parsed scan data lives in the self.nmap dict; the command line is
    kept in an NmapOptions object (self.ops) and the text output in a
    StringIO buffer. Most get_*/set_* pairs are also exposed as properties
    at the bottom of the class.
    """

    # Memoized results of get_num_services and get_services_scanned. None
    # means "neither computed nor explicitly set yet".
    _num_services = None
    _services_scanned = None

    def __init__(self):
        # This flag informs us whether the XML output file is temporary (True),
        # or user specified (False). If any of them is user-specified, it
        # doesn't get stripped out of the command string in set_nmap_command.
        self.xml_is_temp = True

        self.nmap = {
                'nmaprun': {},
                'scaninfo': [],
                'verbose': '',
                'debugging': '',
                'hosts': [],
                'runstats': {}
                }

        self.ops = NmapOptions()
        self._nmap_output = StringIO()

    def set_xml_is_temp(self, xml_is_temp):
        # This flag is False if a user has specified his own -oX option - in
        # which case we should not remove the -oX option from the command
        # string. A value of True means that we're using a temporary file which
        # should be removed from the command string (see set_nmap_command).
        self.xml_is_temp = xml_is_temp

    def get_profile_name(self):
        return self.nmap['nmaprun'].get('profile_name', '')

    def set_profile_name(self, name):
        self.nmap['nmaprun']['profile_name'] = name

    def get_targets(self):
        return self.ops.target_specs

    def set_targets(self, targets):
        self.ops.target_specs = targets

    def get_nmap_output(self):
        return self._nmap_output.getvalue()

    def set_nmap_output(self, nmap_output):
        """Replace the stored Nmap text output with nmap_output."""
        self._nmap_output.close()
        self._nmap_output = StringIO()
        self._nmap_output.write(nmap_output)

    def del_nmap_output(self):
        self._nmap_output.close()
        del self._nmap_output

    def get_debugging_level(self):
        return self.nmap.get('debugging', '')

    def set_debugging_level(self, level):
        self.nmap['debugging'] = level

    def get_verbose_level(self):
        return self.nmap.get('verbose', '')

    def set_verbose_level(self, level):
        self.nmap['verbose'] = level

    def get_scaninfo(self):
        return self.nmap.get('scaninfo', '')

    def set_scaninfo(self, info):
        self.nmap['scaninfo'] = info

    def get_services_scanned(self):
        """Return the comma-separated 'services' strings of all scaninfo
        entries. The value is computed on first use and then remembered; a
        value given to set_services_scanned takes precedence."""
        if self._services_scanned is not None:
            return self._services_scanned

        self._services_scanned = ','.join(
            scan['services'] for scan in self.nmap.get('scaninfo', []))
        return self._services_scanned

    def set_services_scanned(self, services_scanned):
        self._services_scanned = services_scanned

    def get_nmap_command(self):
        return self.ops.render_string()

    def set_nmap_command(self, command):
        """Parse command into self.ops and store the rendered result as the
        run's 'args'. The -oX option is dropped first when the XML output
        file is only a temporary one."""
        self.ops.parse_string(command)
        if self.xml_is_temp:
            self.ops["-oX"] = None
        self.nmap['nmaprun']['args'] = self.ops.render_string()

    def get_scan_type(self):
        return [info['type'] for info in self.nmap.get('scaninfo', [])]

    def get_protocol(self):
        return [info['protocol'] for info in self.nmap.get('scaninfo', [])]

    def get_num_services(self):
        """Return the sum of 'numservices' over all scaninfo entries. The
        value is computed on first use and then remembered; a value given
        to set_num_services takes precedence."""
        if self._num_services is not None:
            return self._num_services

        self._num_services = sum(
            int(info['numservices'])
            for info in self.nmap.get('scaninfo', []))
        return self._num_services

    def set_num_services(self, num_services):
        self._num_services = num_services

    def get_date(self):
        """Return the scan start time as a local struct_time."""
        epoch = int(self.nmap['nmaprun'].get('start', '0'))
        return time.localtime(epoch)

    def get_start(self):
        return self.nmap['nmaprun'].get('start', '0')

    def set_start(self, start):
        self.nmap['nmaprun']['start'] = start

    def set_date(self, date):
        """Store date, an integer number of seconds since the epoch, as the
        scan start time. Raise Exception for any other type."""
        if isinstance(date, int):
            self.nmap['nmaprun']['start'] = date
        else:
            raise Exception("Wrong date format. Date should be saved "
                    "in epoch format!")

    def get_open_ports(self):
        return sum(h.get_open_ports() for h in self.nmap.get('hosts', []))

    def get_filtered_ports(self):
        return sum(
            h.get_filtered_ports() for h in self.nmap.get('hosts', []))

    def get_closed_ports(self):
        return sum(h.get_closed_ports() for h in self.nmap.get('hosts', []))

    def get_formatted_date(self):
        try:
            return time.strftime("%B %d, %Y - %H:%M", self.get_date()).decode(
                    locale.getpreferredencoding())
        except LookupError:
            # encoding or locale not found
            return time.asctime(self.get_date()).decode('ascii')

    def get_scanner(self):
        return self.nmap['nmaprun'].get('scanner', '')

    def set_scanner(self, scanner):
        self.nmap['nmaprun']['scanner'] = scanner

    def get_scanner_version(self):
        return self.nmap['nmaprun'].get('version', '')

    def set_scanner_version(self, version):
        self.nmap['nmaprun']['version'] = version

    # IPv4
    def get_ipv4(self):
        hosts = self.nmap.get('hosts')
        if hosts is None:
            return []
        return [host.ip for host in hosts if host.ip is not None]

    # MAC
    def get_mac(self):
        hosts = self.nmap.get('hosts')
        if hosts is None:
            return []
        return [host.mac for host in hosts if host.mac is not None]

    # IPv6
    def get_ipv6(self):
        hosts = self.nmap.get('hosts')
        if hosts is None:
            return []
        return [host.ipv6 for host in hosts if host.ipv6 is not None]

    def get_hostnames(self):
        """Return the hostname entries of all hosts in one flat list."""
        hostnames = []
        for host in self.nmap.get('hosts', []):
            hostnames += host.get_hostnames()
        return hostnames

    def get_hosts(self):
        return self.nmap.get('hosts', None)

    def get_runstats(self):
        return self.nmap.get('runstats', None)

    def set_runstats(self, stats):
        self.nmap['runstats'] = stats

    def get_hosts_down(self):
        return int(self.nmap['runstats'].get('hosts_down', '0'))

    def set_hosts_down(self, down):
        self.nmap['runstats']['hosts_down'] = int(down)

    def get_hosts_up(self):
        return int(self.nmap['runstats'].get('hosts_up', '0'))

    def set_hosts_up(self, up):
        self.nmap['runstats']['hosts_up'] = int(up)

    def get_hosts_scanned(self):
        return int(self.nmap['runstats'].get('hosts_scanned', '0'))

    def set_hosts_scanned(self, scanned):
        self.nmap['runstats']['hosts_scanned'] = int(scanned)

    def get_finish_time(self):
        """Return the scan finish time as a local struct_time."""
        return time.localtime(int(self.nmap['runstats'].get('finished_time',
                                                            '0')))

    def set_finish_time(self, finish):
        self.nmap['runstats']['finished_time'] = int(finish)

    def get_finish_epoc_time(self):
        return int(self.nmap['runstats'].get('finished_time', '0'))

    # The parameter name shadows the time module inside this method only; it
    # is kept because callers may pass it by keyword.
    def set_finish_epoc_time(self, time):
        self.nmap['runstats']['finished_time'] = time

    def get_scan_name(self):
        """Get a human-readable string representing this scan."""
        scan_name = self.nmap.get("scan_name")
        if scan_name:
            return scan_name
        if self.profile_name and self.get_targets():
            return _("%s on %s") % (self.profile_name,
                                    join_quoted(self.get_targets()))
        return self.get_nmap_command()

    def set_scan_name(self, scan_name):
        self.nmap["scan_name"] = scan_name

    def get_formatted_finish_date(self):
        return time.strftime("%B %d, %Y - %H:%M", self.get_finish_time())

    def get_port_protocol_dict(self):
        """Return a dict mapping each scanned port number (int) to the list
        of protocols it was scanned with, built from the 'services' and
        'protocol' values of every scaninfo entry."""
        ports = {}
        for scaninfo in self.scaninfo:
            services_string = scaninfo['services'].strip()
            if services_string == "":
                continue
            for item in services_string.split(','):
                if '-' in item:
                    # A range such as "80-90" covers both of its endpoints.
                    begin, end = item.split('-')
                    port_numbers = range(int(begin), int(end) + 1)
                else:
                    port_numbers = [int(item)]
                for port in port_numbers:
                    ports.setdefault(port, []).append(scaninfo['protocol'])
        return ports

    profile_name = property(get_profile_name, set_profile_name)
    nmap_output = property(get_nmap_output, set_nmap_output, del_nmap_output)
    debugging_level = property(get_debugging_level, set_debugging_level)
    verbose_level = property(get_verbose_level, set_verbose_level)
    scaninfo = property(get_scaninfo, set_scaninfo)
    services_scanned = property(get_services_scanned, set_services_scanned)
    nmap_command = property(get_nmap_command, set_nmap_command)
    scan_type = property(get_scan_type)
    protocol = property(get_protocol)
    num_services = property(get_num_services, set_num_services)
    date = property(get_date, set_date)
    open_ports = property(get_open_ports)
    filtered_ports = property(get_filtered_ports)
    closed_ports = property(get_closed_ports)
    formatted_date = property(get_formatted_date)
    scanner = property(get_scanner, set_scanner)
    scanner_version = property(get_scanner_version, set_scanner_version)
    ipv4 = property(get_ipv4)
    mac = property(get_mac)
    ipv6 = property(get_ipv6)
    hostnames = property(get_hostnames)
    hosts = property(get_hosts)
    runstats = property(get_runstats, set_runstats)
    hosts_down = property(get_hosts_down, set_hosts_down)
    hosts_up = property(get_hosts_up, set_hosts_up)
    hosts_scanned = property(get_hosts_scanned, set_hosts_scanned)
    finish_time = property(get_finish_time, set_finish_time)
    finish_epoc_time = property(get_finish_epoc_time, set_finish_epoc_time)
    formatted_finish_date = property(get_formatted_finish_date)
    start = property(get_start, set_start)
    scan_name = property(get_scan_name, set_scan_name)
class NmapParserSAX(ParserBasics, ContentHandler):
def __init__(self):
    """Set up the scan storage and the parser's bookkeeping state."""
    ParserBasics.__init__(self)

    # Flags recording which XML elements the parser is currently inside.
    for flag_name in ("in_interactive_output", "in_run_stats", "in_host",
                      "in_hostnames", "in_ports", "in_port", "in_os",
                      "in_trace"):
        setattr(self, flag_name, False)

    # The text inside an xml-stylesheet processing instruction, like
    # 'href="file:///usr/share/nmap/nmap.xsl" type="text/xsl"'.
    self.xml_stylesheet_data = None

    self.list_extraports = []

    # Set by parse_file to the name of the file that was parsed.
    self.filename = None

    self.unsaved = False
def set_parser(self, parser):
    """Remember the parser object that parse() will later call.

    The only requirement visible here is that it has a parse(f) method.
    """
    self.parser = parser
def parse(self, f):
    """Parse an Nmap XML file from the file-like object f, using the parser
    previously given to set_parser."""
    xml_parser = self.parser
    xml_parser.parse(f)
def parse_file(self, filename):
    """Parse an Nmap XML file from the named file.

    self.filename is updated only if parsing completes without raising;
    the file is closed in either case.
    """
    with open(filename, "r") as xml_file:
        self.parse(xml_file)
        self.filename = filename
def _parse_nmaprun(self, attrs):
run_tag = "nmaprun"
if self.nmap_output == "" and "nmap_output" in attrs:
self.nmap_output = attrs["nmap_output"]
self.nmap[run_tag]["profile_name"] = attrs.get("profile_name", "")
self.nmap[run_tag]["start"] = attrs.get("start", "")
self.nmap[run_tag]["args"] = attrs.get("args", "")
self.nmap[run_tag]["scanner"] = attrs.get("scanner", "")
self.nmap[run_tag]["version"] = attrs.get("version", "")
self.nmap[run_tag]["xmloutputversion"] = attrs.get(
"xmloutputversion", "")
self.nmap_command = self.nmap[run_tag]["args"]
def _parse_output(self, attrs):
if attrs.get("type") != "interactive":
return
if self.in_interactive_output:
raise SAXException("Unexpected nested \"output\" element.")
self.in_interactive_output = True
self.nmap_output = ""
def _parse_scaninfo(self, attrs):
    """Append a dict describing one <scaninfo> element to
    self.nmap["scaninfo"]. Missing attributes become empty strings; the
    type and protocol values are passed through unique()."""
    self.nmap["scaninfo"].append({
        "type": unique(attrs.get("type", "")),
        "protocol": unique(attrs.get("protocol", "")),
        "numservices": attrs.get("numservices", ""),
        "services": attrs.get("services", ""),
    })
def _parse_verbose(self, attrs):
self.nmap["verbose"] = attrs.get("level", "")
def _parse_debugging(self, attrs):
self.nmap["debugging"] = attrs.get("level", "")
def _parse_runstats_finished(self, attrs):
self.nmap["runstats"]["finished_time"] = attrs.get("time", "")
def _parse_runstats_hosts(self, attrs):
self.nmap["runstats"]["hosts_up"] = attrs.get("up", "")
self.nmap["runstats"]["hosts_down"] = attrs.get("down", "")
self.nmap["runstats"]["hosts_scanned"] = attrs.get("total", "")
def _parse_host(self, attrs):
    """Begin a new HostInfo for a <host> element, taking its comment from
    the "comment" attribute ("" if it is absent)."""
    host = HostInfo()
    host.comment = attrs.get("comment", "")
    self.host_info = host
def _parse_host_status(self, attrs):
    """Set the current host's state from the "state" attribute of
    <status>."""
    state = unique(attrs.get("state", ""))
    self.host_info.set_state(state)
def _parse_host_address(self, attrs):
    """Store an <address> element on the current host as its IPv4, IPv6 or
    MAC address, according to the "addrtype" attribute. Addresses of any
    other type are ignored."""
    addr_type = unique(attrs.get("addrtype", ""))
    address = {"type": addr_type,
               "vendor": attrs.get("vendor", ""),
               "addr": attrs.get("addr", "")}

    host = self.host_info
    setters = {"ipv4": host.set_ip,
               "ipv6": host.set_ipv6,
               "mac": host.set_mac}
    store = setters.get(addr_type)
    if store is not None:
        store(address)
def _parse_host_hostname(self, attrs):
self.list_hostnames.append({"hostname": attrs.get("name", ""),
"hostname_type": attrs.get("type", "")})
def _parse_host_extraports(self, attrs):
    """Append the state and count of an <extraports> element to
    self.list_extraports."""
    entry = {"state": unique(attrs.get("state", "")),
             "count": attrs.get("count", "")}
    self.list_extraports.append(entry)
def _parse_host_port(self, attrs):
    """Start a new port dict (self.dic_port) from the protocol and portid
    attributes of a <port> element."""
    protocol = unique(attrs.get("protocol", ""))
    portid = unique(attrs.get("portid", ""))
    self.dic_port = {"protocol": protocol, "portid": portid}
def _parse_host_port_state(self, attrs):
    """Add the state, reason and reason_ttl attributes of a <state> element
    to the port dict currently being built."""
    port = self.dic_port
    for key, attr_name in (("port_state", "state"),
                           ("reason", "reason"),
                           ("reason_ttl", "reason_ttl")):
        port[key] = unique(attrs.get(attr_name, ""))
def _parse_host_port_service(self, attrs):
    """Add the attributes of a <service> element to the port dict currently
    being built, under keys prefixed with "service_"."""
    port = self.dic_port
    port["service_name"] = attrs.get("name", "")
    # Only the detection method is passed through unique().
    port["service_method"] = unique(attrs.get("method", ""))
    for attr_name in ("conf", "product", "version", "extrainfo"):
        port["service_" + attr_name] = attrs.get(attr_name, "")
def _parse_host_osmatch(self, attrs):
    """Append a dict for an <osmatch> element to self.list_osmatch, with
    its name, accuracy and line plus an initially empty 'osclasses'
    list."""
    match = self._parsing(attrs, [], ['name', 'accuracy', 'line'])
    match['osclasses'] = []
    self.list_osmatch.append(match)
def _parse_host_portused(self, attrs):
    """Append the state, proto and portid of a <portused> element to
    self.list_portused."""
    port_used = self._parsing(attrs, ['state', 'proto', 'portid'], [])
    self.list_portused.append(port_used)
def _parse_host_osclass(self, attrs):
    """Append the attributes of an <osclass> element to
    self.list_osclass."""
    os_class = self._parsing(
        attrs, ['type', 'vendor', 'osfamily', 'osgen'], ['accuracy'])
    self.list_osclass.append(os_class)
def _parsing(self, attrs, unique_names, other_names):
    """Return a dict of the named attributes of a tag.

    The keys are the attribute names and the values are taken from attrs,
    with "" standing in for missing attributes. Values named in
    unique_names are passed through unique(); those in other_names are
    stored as they are. A name present in both lists ends up with the
    other_names value.
    """
    dic = dict((at, unique(attrs.get(at, ""))) for at in unique_names)
    dic.update((at, attrs.get(at, "")) for at in other_names)
    return dic
def _parse_host_uptime(self, attrs):
    """Set the current host's uptime from the seconds and lastboot
    attributes of an <uptime> element."""
    uptime = self._parsing(attrs, [], ["seconds", "lastboot"])
    self.host_info.set_uptime(uptime)
def _parse_host_tcpsequence(self, attrs):
    """Set the current host's tcpsequence from the difficulty, index and
    values attributes of a <tcpsequence> element."""
    sequence = self._parsing(attrs, ['difficulty'], ['index', 'values'])
    self.host_info.set_tcpsequence(sequence)
def _parse_host_tcptssequence(self, attrs):
    """Set the current host's tcptssequence from the class and values
    attributes of a <tcptssequence> element."""
    sequence = self._parsing(attrs, ['class'], ['values'])
    self.host_info.set_tcptssequence(sequence)
def _parse_host_ipidsequence(self, attrs):
    """Set the current host's ipidsequence from the class and values
    attributes of an <ipidsequence> element."""
    sequence = self._parsing(attrs, ['class'], ['values'])
    self.host_info.set_ipidsequence(sequence)
def _parse_host_trace(self, attrs):
    """Replace the current host's trace with a new dict holding the proto
    and port attributes of a <trace> element."""
    self.host_info.set_trace({
        "proto": unique(attrs.get("proto", "")),
        "port": unique(attrs.get("port", "")),
    })
def _parse_host_trace_hop(self, attrs):
    """Append the ttl, rtt, ipaddr and host attributes of a <hop> element
    to the current host's trace."""
    hop_attrs = ["ttl", "rtt", "ipaddr", "host"]
    self.host_info.append_trace_hop(self._parsing(attrs, [], hop_attrs))
def _parse_host_trace_error(self, attrs):
    """Record the errorstr attribute of a trace <error> element on the
    current host's trace."""
    message = unique(attrs.get("errorstr", ""))
    self.host_info.set_trace_error(message)
def processingInstruction(self, target, data):
    """Remember the data of an xml-stylesheet processing instruction;
    processing instructions with any other target are ignored."""
    if target != "xml-stylesheet":
        return
    self.xml_stylesheet_data = data
def startElement(self, name, attrs):
    """Handle an opening tag by calling the matching _parse_* method.

    name is the element name and attrs its attributes. Elements are only
    acted on in the context where they are expected, which is tracked with
    the in_* flags; everything else is silently ignored.
    """
    if name == "nmaprun":
        self._parse_nmaprun(attrs)
    elif name == "output":
        self._parse_output(attrs)
    elif name == "scaninfo":
        self._parse_scaninfo(attrs)
    elif name == "verbose":
        self._parse_verbose(attrs)
    elif name == "debugging":
        self._parse_debugging(attrs)
    elif name == "runstats":
        self.in_run_stats = True
    elif self.in_run_stats and name == "finished":
        self._parse_runstats_finished(attrs)
    elif self.in_run_stats and name == "hosts":
        self._parse_runstats_hosts(attrs)
    elif name == "host":
        self.in_host = True
        self._parse_host(attrs)
        # Ports and extraports are collected per host.
        self.list_ports = []
        self.list_extraports = []
    elif self.in_host and name == "status":
        self._parse_host_status(attrs)
    elif self.in_host and name == "address":
        self._parse_host_address(attrs)
    elif self.in_host and name == "hostnames":
        self.in_hostnames = True
        self.list_hostnames = []
    elif self.in_host and self.in_hostnames and name == "hostname":
        self._parse_host_hostname(attrs)
    elif self.in_host and name == "ports":
        self.in_ports = True
    elif self.in_host and self.in_ports and name == "extraports":
        self._parse_host_extraports(attrs)
    elif self.in_host and self.in_ports and name == "port":
        self.in_port = True
        self._parse_host_port(attrs)
    elif self.in_host and self.in_ports and \
            self.in_port and name == "state":
        self._parse_host_port_state(attrs)
    elif self.in_host and self.in_ports and \
            self.in_port and name == "service":
        self._parse_host_port_service(attrs)
    elif self.in_host and name == "os":
        self.in_os = True
        self.list_portused = []
        self.list_osmatch = []
        # Start with no pending OS classes. The list is attached to its
        # osmatch and emptied again when that osmatch element ends.
        self.list_osclass = []
    elif self.in_host and self.in_os and name == "osmatch":
        self._parse_host_osmatch(attrs)
    elif self.in_host and self.in_os and name == "portused":
        self._parse_host_portused(attrs)
    elif self.in_host and self.in_os and name == "osclass":
        # Accumulate: one osmatch may contain several osclass elements, so
        # the list must not be reset here.
        self._parse_host_osclass(attrs)
    elif self.in_host and name == "uptime":
        self._parse_host_uptime(attrs)
    elif self.in_host and name == "tcpsequence":
        self._parse_host_tcpsequence(attrs)
    elif self.in_host and name == "tcptssequence":
        self._parse_host_tcptssequence(attrs)
    elif self.in_host and name == "ipidsequence":
        self._parse_host_ipidsequence(attrs)
    elif self.in_host and name == "trace":
        self.in_trace = True
        self._parse_host_trace(attrs)
    elif self.in_host and self.in_trace and name == "hop":
        self._parse_host_trace_hop(attrs)
    elif self.in_host and self.in_trace and name == "error":
        self._parse_host_trace_error(attrs)
def endElement(self, name):
    """SAX callback invoked when the closing tag of element *name* is read.

    Clears the in_* flag that tracks the element being left and hands the
    lists collected while inside it over to the current host_info. When a
    <host> closes, host_info itself is appended to self.nmap["hosts"].

    name -- tag name of the element that has just ended.
    """
    if name == "output":
        self.in_interactive_output = False
    elif name == "runstats":
        self.in_run_stats = False
    elif name == "host":
        self.in_host = False
        self.host_info.set_extraports(self.list_extraports)
        self.host_info.set_ports(self.list_ports)
        self.nmap["hosts"].append(self.host_info)
    elif self.in_host and name == "hostnames":
        self.in_hostnames = False
        self.host_info.set_hostnames(self.list_hostnames)
    elif self.in_host and name == "ports":
        self.in_ports = False
    elif self.in_host and self.in_ports and name == "port":
        self.in_port = False
        self.list_ports.append(self.dic_port)
        # Drop the per-port dict so a stale one cannot be reused.
        del self.dic_port
    elif self.in_host and self.in_os and name == "osmatch":
        # list_osclass is only assigned when an <osclass> start tag is seen
        # or after a previous </osmatch>; an <osmatch> without any
        # <osclass> must not fail with AttributeError.
        pending_osclasses = getattr(self, "list_osclass", [])
        self.list_osmatch[-1]['osclasses'].extend(pending_osclasses)
        self.list_osclass = []
    elif self.in_host and self.in_os and name == "os":
        self.in_os = False
        self.host_info.set_ports_used(self.list_portused)
        self.host_info.set_osmatches(self.list_osmatch)
        del self.list_portused
        del self.list_osmatch
    elif self.in_host and self.in_trace and name == "trace":
        self.in_trace = False
def characters(self, content):
    """SAX callback receiving a chunk of character data.

    The text is appended to self._nmap_output only while the
    in_interactive_output flag is set; otherwise it is discarded.
    """
    if not self.in_interactive_output:
        return
    self._nmap_output.write(content)
def write_text(self, f):
    """Write the Nmap text output of this object to the file-like object
    f. Nothing is written when the output is the empty string."""
    text = self.nmap_output
    if text != "":
        f.write(text)
def write_xml(self, f):
    """Write the XML representation of this object to the file-like object
    f.

    An xml-stylesheet processing instruction is emitted first when
    self.xml_stylesheet_data is not None.
    """
    generator = XMLGenerator(f)
    generator.startDocument()
    stylesheet = self.xml_stylesheet_data
    if stylesheet is not None:
        generator.processingInstruction("xml-stylesheet", stylesheet)
    # _write_nmaprun opens the root <nmaprun> element without closing it;
    # the remaining sections are written inside it and it is closed below.
    section_writers = (
        self._write_nmaprun,
        self._write_scaninfo,
        self._write_verbose,
        self._write_debugging,
        self._write_output,
        self._write_hosts,
        self._write_runstats,
    )
    for emit_section in section_writers:
        emit_section(generator)
    generator.endElement("nmaprun")
    generator.endDocument()
def get_xml(self):
    """Return a string containing the XML representation of this scan.

    The document is produced by write_xml() into an in-memory buffer.
    """
    xml_buffer = StringIO()
    self.write_xml(xml_buffer)
    xml_text = xml_buffer.getvalue()
    xml_buffer.close()
    return xml_text
def write_xml_to_file(self, filename):
    """Write the XML representation of this scan to the file whose name is
    given.

    The file is opened in binary write mode, so any existing content is
    replaced. Exceptions raised by open() or write_xml() propagate to the
    caller.
    """
    fd = open(filename, "wb")
    try:
        self.write_xml(fd)
    finally:
        # Close the handle even when serialization fails, so the file
        # descriptor is not leaked.
        fd.close()
def _write_output(self, writer):
if self.nmap_output == "":
return
writer.startElement("output", Attributes({"type": "interactive"}))
writer.characters(self.nmap_output)
writer.endElement("output")
def _write_runstats(self, writer):
##################
# Runstats element
writer.startElement("runstats", Attributes(dict()))
## Finished element
writer.startElement("finished",
Attributes(dict(time=str(self.finish_epoc_time),
timestr=time.ctime(time.mktime(
self.get_finish_time())))))
writer.endElement("finished")
## Hosts element
writer.startElement("hosts",
Attributes(dict(up=str(self.hosts_up),
down=str(self.hosts_down),
total=str(self.hosts_scanned))))
writer.endElement("hosts")
writer.endElement("runstats")
# End of Runstats element
#########################
def _write_hosts(self, writer):
for host in self.hosts:
# Start host element
writer.startElement("host",
Attributes(dict(comment=host.comment)))
# Status element
writer.startElement("status",
Attributes(dict(state=host.state)))
writer.endElement("status")
##################
# Address elements
## IPv4
if host.ip is not None:
writer.startElement("address",
Attributes(dict(addr=host.ip.get("addr", ""),
vendor=host.ip.get("vendor", ""),
addrtype=host.ip.get("type", ""))))
writer.endElement("address")
## IPv6
if host.ipv6 is not None:
writer.startElement("address",
Attributes(dict(addr=host.ipv6.get("addr", ""),
vendor=host.ipv6.get("vendor", ""),
addrtype=host.ipv6.get("type", ""))))
writer.endElement("address")
## MAC
if host.mac is not None:
writer.startElement("address",
Attributes(dict(addr=host.mac.get("addr", ""),
vendor=host.mac.get("vendor", ""),
addrtype=host.mac.get("type", ""))))
writer.endElement("address")
# End of Address elements
#########################
###################
# Hostnames element
writer.startElement("hostnames", Attributes({}))
for hname in host.hostnames:
writer.startElement("hostname",
Attributes(dict(name=hname.get("hostname", ""),
type=hname.get("hostname_type", ""))))
writer.endElement("hostname")
writer.endElement("hostnames")
# End of Hostnames element
##########################
###############
# Ports element
writer.startElement("ports", Attributes({}))
## Extraports elements
for ext in host.get_extraports():
writer.startElement("extraports",
Attributes(dict(count=ext.get("count", ""),
state=ext.get("state", ""))))
writer.endElement("extraports")
## Port elements
for p in host.ports:
writer.startElement("port",
Attributes(dict(portid=p.get("portid", ""),
protocol=p.get("protocol", ""))))
### Port state
writer.startElement("state",
Attributes(dict(state=p.get("port_state", ""),
reason=p.get("reason", ""),
reason_ttl=p.get("reason_ttl", ""))))
writer.endElement("state")
### Port service info
d = {}
for xml_attr, member in (("conf", "service_conf"),
("method", "service_method"),
("name", "service_name"),
("product", "service_product"),
("version", "service_version"),
("extrainfo", "service_extrainfo")):
if p.get(member):
d[xml_attr] = p.get(member)
writer.startElement("service", Attributes(d))
writer.endElement("service")
writer.endElement("port")
writer.endElement("ports")
# End of Ports element
######################
############
# OS element
writer.startElement("os", Attributes({}))
## Ports used elements
for pu in host.ports_used:
writer.startElement("portused",
Attributes(dict(state=pu.get("state", ""),
proto=pu.get("proto", ""),
portid=pu.get("portid", ""))))
writer.endElement("portused")
## Osmatch elements
for om in host.osmatches:
writer.startElement("osmatch",
Attributes(dict(name=om.get("name", ""),
accuracy=om.get("accuracy", ""),
line=om.get("line", ""))))
## Osclass elements
for oc in om['osclasses']:
writer.startElement("osclass",
Attributes(dict(vendor=oc.get("vendor", ""),
osfamily=oc.get("osfamily", ""),
type=oc.get("type", ""),
osgen=oc.get("osgen", ""),
accuracy=oc.get("accuracy", ""))))
writer.endElement("osclass")
writer.endElement("osmatch")
writer.endElement("os")
# End of OS element
###################
# Uptime element
writer.startElement("uptime",
Attributes(dict(seconds=host.uptime.get("seconds", ""),
lastboot=host.uptime.get("lastboot", ""))))
writer.endElement("uptime")
#####################
# Sequences elements
## TCP Sequence element
# Cannot use dict() here, because of the 'class' attribute.
writer.startElement("tcpsequence",
Attributes({"index": host.tcpsequence.get("index", ""),
"difficulty": host.tcpsequence.get("difficulty", ""),
"values": host.tcpsequence.get("values", "")}))
writer.endElement("tcpsequence")
## IP ID Sequence element
writer.startElement("ipidsequence",
Attributes({"class": host.ipidsequence.get("class", ""),
"values": host.ipidsequence.get("values", "")}))
writer.endElement("ipidsequence")
## TCP TS Sequence element
writer.startElement("tcptssequence",
Attributes({"class": host.tcptssequence.get("class", ""),
"values": host.tcptssequence.get("values", "")}))
writer.endElement("tcptssequence")
# End of sequences elements
###########################
## Trace element
if len(host.trace) > 0:
writer.startElement("trace",
Attributes({"proto": host.trace.get("proto", ""),
"port": host.trace.get("port", "")}))
if "hops" in host.trace:
for hop in host.trace["hops"]:
writer.startElement("hop",
Attributes({"ttl": hop["ttl"],
"rtt": hop["rtt"],
"ipaddr": hop["ipaddr"],
"host": hop["host"]}))
writer.endElement("hop")
if "error" in host.trace:
writer.startElement("error",
Attributes({"errorstr": host.trace["error"]}))
writer.endElement("error")
writer.endElement("trace")
# End of trace element
###########################
# End host element
writer.endElement("host")
def _write_debugging(self, writer):
writer.startElement("debugging", Attributes(dict(
level=str(self.debugging_level))))
writer.endElement("debugging")
def _write_verbose(self, writer):
writer.startElement("verbose", Attributes(dict(
level=str(self.verbose_level))))
writer.endElement("verbose")
def _write_scaninfo(self, writer):
for scan in self.scaninfo:
writer.startElement("scaninfo",
Attributes(dict(type=scan.get("type", ""),
protocol=scan.get("protocol", ""),
numservices=scan.get("numservices", ""),
services=scan.get("services", ""))))
writer.endElement("scaninfo")
def _write_nmaprun(self, writer):
    """Open the root <nmaprun> element.

    The element is deliberately left open here: only startElement() is
    called, so the caller has to emit the matching end tag. Every
    attribute value is converted to a string; startstr is the ctime()
    rendering of self.get_date().
    """
    root_attrs = {
        "args": str(self.nmap_command),
        "profile_name": str(self.profile_name),
        "scanner": str(self.scanner),
        "start": str(self.start),
        "startstr": time.ctime(time.mktime(self.get_date())),
        "version": str(self.scanner_version),
        "xmloutputversion": str(XML_OUTPUT_VERSION),
    }
    writer.startElement("nmaprun", Attributes(root_attrs))
def set_unsaved(self):
    """Flag this scan as unsaved by setting self.unsaved to True."""
    self.unsaved = True
def is_unsaved(self):
    """Return the current value of the self.unsaved flag."""
    return self.unsaved
class OverrideEntityResolver(EntityResolver):
    """Entity resolver that overrides the default xml.sax behavior of
    downloading remote DTDs: every entity resolves to an empty stream
    instead."""

    # One empty stream, shared by the class and returned for every lookup.
    empty = StringIO()

    def resolveEntity(self, publicId, systemId):
        """Return the shared empty stream; both identifiers are ignored."""
        blank_source = OverrideEntityResolver.empty
        return blank_source
def nmap_parser_sax():
    """Build an NmapParserSAX handler wired to a fresh SAX parser.

    The SAX parser gets the handler as its content handler and an
    OverrideEntityResolver as its entity resolver; the handler is in turn
    given the parser through set_parser(). The handler is returned.
    """
    sax_reader = make_parser()
    handler = NmapParserSAX()

    sax_reader.setContentHandler(handler)
    sax_reader.setEntityResolver(OverrideEntityResolver())
    handler.set_parser(sax_reader)

    return handler


# NmapParser is an alias for the SAX-based factory above.
NmapParser = nmap_parser_sax
if __name__ == '__main__':
    # Debugging aid: parse the Nmap XML file named by the first command-line
    # argument and dump what was extracted for every host.
    #
    # Every print below uses a single parenthesised, %-formatted argument so
    # the output is the same as with the Python 2 print statement while the
    # block also parses on Python 3.
    import sys

    file_to_parse = sys.argv[1]

    np = NmapParser()
    np.parse_file(file_to_parse)

    for host in np.hosts:
        # host.ip can be None (a host need not have an IPv4 address), so
        # fall back to the IPv6 or MAC address for the heading instead of
        # failing with a TypeError.
        heading = host.ip or host.ipv6 or host.mac or {}
        print("%s:" % heading.get("addr", "(no address)"))
        print("  Comment: %s" % repr(host.comment))
        print("  TCP sequence: %s" % repr(host.tcpsequence))
        print("  TCP TS sequence: %s" % repr(host.tcptssequence))
        print("  IP ID sequence: %s" % repr(host.ipidsequence))
        print("  Uptime: %s" % repr(host.uptime))
        print("  OS Match: %s" % repr(host.osmatches))
        print("  Ports:")
        for p in host.ports:
            print("\t%s" % repr(p))
        print("  Ports used: %s" % repr(host.ports_used))
        print("  OS Matches: %s" % repr(host.osmatches))
        print("  Hostnames: %s" % repr(host.hostnames))
        print("  IP: %s" % repr(host.ip))
        print("  IPv6: %s" % repr(host.ipv6))
        print("  MAC: %s" % repr(host.mac))
        print("  State: %s" % repr(host.state))
        if "hops" in host.trace:
            print("  Trace:")
            for hop in host.trace["hops"]:
                print("    %s" % repr(hop))
            # Blank line after the hop list.
            print("")