# bandit/bandit/core/result_store.py
# -*- coding:utf-8 -*-
#
# Copyright 2014 Hewlett-Packard Development Company, L.P.
#
# Licensed under the Apache License, Version 2.0 (the "License"); you may
# not use this file except in compliance with the License. You may obtain
# a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS, WITHOUT
# WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. See the
# License for the specific language governing permissions and limitations
# under the License.
"""An object to store/access results associated with Bandit tests."""
from collections import OrderedDict
from datetime import datetime
import json
import linecache
from operator import itemgetter
import re

# Bandit-local sibling modules (Python 2 implicit relative imports)
import constants
import utils


class BanditResultStore(object):
    def __init__(self, logger, config, agg_type):
        # per-instance state; a class-level OrderedDict would be shared
        # across all instances
        self.resstore = OrderedDict()
        self._count = 0
        self.skipped = []
        self.logger = logger
        self.config = config
        self.agg_type = agg_type

    @property
    def count(self):
        '''Count property - used to get the current number of test results
        :return: The current count of test results
        '''
        return self._count

    def skip(self, filename, reason):
'''Indicates that the specified file was skipped and why
:param filename: The file that was skipped
:param reason: Why the file was skipped
:return: -
'''
self.skipped.append((filename, reason))

    def add(self, context, test, issue):
'''Adds a result, with the context and the issue that was found
:param context: Context of the node
:param test: The type (function name) of the test
:param issue: Which issue was found
:return: -
'''
filename, lineno = context['filename'], context['lineno']
(issue_type, issue_text) = issue
# XXX(fletcher): tuple usage is fragile because ordering changes on
# agg_type; ordering is important for reporting
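        # For illustration (examples taken from the report_json() notes
        # below), after one add() call resstore holds e.g.:
        #   agg_type == 'vuln':
        #     {'random_lib_imports': [('examples/random.py', 1, 'INFO',
        #                              'Random library should...')]}
        #   any other agg_type (aggregate by file):
        #     {'examples/imports-telnetlib.py': [(1, 'blacklist_imports',
        #                                         'ERROR', 'Telnet...')]}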
        if self.agg_type == 'vuln':
            self.resstore.setdefault(test, []).append(
                (filename, lineno, issue_type, issue_text))
        else:
            self.resstore.setdefault(filename, []).append(
                (lineno, test, issue_type, issue_text))
        self._count += 1

    def report_json(self, output_filename, stats=None, lines=1):
        '''Returns warnings in JSON format
        :param output_filename: File the results are destined for (unused
            here; the actual write happens in report())
        :param stats: dictionary of stats for each file (optional)
        :param lines: number of lines of context to include around the issue
        :return: JSON string
        '''
        machine_output = {'results': [], 'errors': [], 'stats': []}
        collector = []
        for (fname, reason) in self.skipped:
            machine_output['errors'].append({'filename': fname,
                                             'reason': reason})
        if stats:
            for fname, score in stats.iteritems():
                machine_output['stats'].append({'filename': fname,
                                                'score': score})
        # array indices are determined by the order of tuples built in add()
        if self.agg_type != 'vuln':
            # XXX(fletcher): We currently pass around tuples whose order
            # changes depending on agg_type, which leads to confusing code
            # like what's below.
            # In this context an item in resstore looks like:
            #   ('examples/imports-telnetlib.py', [(1, 'blacklist_imports',
            #    'ERROR', 'Telnet...other encrypted protocol.')])
            # So the tuple associated with the file
            # 'examples/imports-telnetlib.py' looks like:
            #   (1, 'blacklist_imports', 'ERROR',
            #    'Telnet...other encrypted protocol.')
            # This means:
            #   line number = [0] = 1
            #   error label = [1] = 'blacklist_imports'
            #   error type  = [2] = 'ERROR'
            #   reason      = [3] = 'Telnet...other encrypted protocol.'
            for filename, issues in self.resstore.items():
                for lineno, label, err_type, reason in issues:
                    code = ""
                    for i in utils.mid_range(lineno, lines):
                        code += linecache.getline(filename, i)
                    collector.append({"filename": filename,
                                      "line_num": str(lineno),
                                      "error_label": str(label).strip(),
                                      "error_type": str(err_type).strip(),
                                      "code": code,
                                      "reason": str(reason).strip()})
        else:
            # XXX(fletcher): see the note above; with agg_type == 'vuln' an
            # item in resstore looks like:
            #   ('random_lib_imports', [('examples/random.py', 1, 'INFO',
            #    'Random library should...cryptographic purposes')])
            # So the tuple associated with the error label
            # 'random_lib_imports' looks like:
            #   ('examples/random.py', 1, 'INFO',
            #    'Random library should...cryptographic purposes')
            # This means:
            #   filename    = [0] = 'examples/random.py'
            #   line number = [1] = 1
            #   error type  = [2] = 'INFO'
            #   reason      = [3] = 'Random library should...cryptographic
            #                       purposes'
            for vuln_label, issues in self.resstore.items():
                for filename, lineno, err_type, reason in issues:
                    code = ""
                    for i in utils.mid_range(lineno, lines):
                        code += linecache.getline(filename, i)
                    collector.append({"filename": str(filename),
                                      "line_num": str(lineno),
                                      "error_label": vuln_label.strip(),
                                      "error_type": str(err_type).strip(),
                                      "code": code,
                                      "reason": str(reason).strip()})
if self.agg_type == 'vuln':
machine_output['results'] = sorted(collector,
key=itemgetter('error_type'))
else:
machine_output['results'] = sorted(collector,
key=itemgetter('filename'))
return json.dumps(machine_output, sort_keys=True,
indent=2, separators=(',', ': '))
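    # Illustrative shape of the JSON document built above (values are
    # examples only; the keys match the dicts assembled in the loops):
    #   {"errors": [{"filename": "missing.py", "reason": "File not found"}],
    #    "results": [{"filename": "examples/random.py", "line_num": "1",
    #                 "error_label": "random_lib_imports",
    #                 "error_type": "INFO", "code": "import random\n",
    #                 "reason": "Random library should..."}],
    #    "stats": [{"filename": "examples/random.py", "score": 1}]}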

    def report_txt(self, scope, scores, lines=0, level=1):
'''Returns TXT string of results
:param scope: Which files were inspected
:param scores: The scores awarded to each file in the scope
:param lines: # of lines around the issue line to display (optional)
:param level: What level of severity to display (optional)
:return: TXT string
'''
if level >= len(constants.SEVERITY):
level = len(constants.SEVERITY) - 1
tmpstr_list = []
# print header
tmpstr_list.append("Run started:\n\t%s\n" % datetime.utcnow())
# print which files were inspected
tmpstr_list.append("Files in scope (%s):\n" % (len(scope)))
for item in zip(scope, scores):
tmpstr_list.append("\t%s (score: %i)\n" % item)
# print which files were skipped and why
tmpstr_list.append("Files skipped (%s):" % len(self.skipped))
for (fname, reason) in self.skipped:
tmpstr_list.append("\n\t%s (%s)" % (fname, reason))
# print the results
tmpstr_list.append("\nTest results:\n")
if self.count == 0:
tmpstr_list.append("\tNo issues identified.\n")
# if aggregating by vulnerability type
elif self.agg_type == 'vuln':
for test, issues in self.resstore.items():
for filename, lineno, issue_type, issue_text in issues:
issue_line = linecache.getline(filename, lineno)
                # skip this result if the line carries one of the skip tags
                if re.search(constants.SKIP_RE, issue_line):
                    continue
                # report the result unless filtered out by severity level
if constants.SEVERITY.index(issue_type) >= level:
tmpstr_list.append(">> %s\n - %s::%s\n" % (
issue_text, filename, lineno
))
                    for i in utils.mid_range(lineno, lines):
                        line = linecache.getline(filename, i)
                        # linecache returns '' if the line does not exist
                        if line != '':
                            tmpstr_list.append("\t%3d %s" % (i, line))
# otherwise, aggregating by filename
else:
for filename, issues in self.resstore.items():
for lineno, test, issue_type, issue_text in issues:
issue_line = linecache.getline(filename, lineno)
                # skip this result if the line carries one of the skip tags
                if re.search(constants.SKIP_RE, issue_line):
                    continue
                # report the result unless filtered out by severity level
if constants.SEVERITY.index(issue_type) >= level:
tmpstr_list.append(">> %s\n - %s::%s\n" % (
issue_text, filename, lineno
))
                    for i in utils.mid_range(lineno, lines):
                        line = linecache.getline(filename, i)
                        # linecache returns '' if the line does not exist
                        if line != '':
                            tmpstr_list.append("\t%3d %s" % (i, line))
return "".join(tmpstr_list)

    def report_tty(self, scope, scores, lines=0, level=1):
        '''Returns the contents of the result store, colored for TTY display
:param scope: Which files were inspected
:param scores: The scores awarded to each file in the scope
:param lines: # of lines around the issue line to display (optional)
:param level: What level of severity to display (optional)
:return: TXT string with appropriate TTY coloring for terminals
'''
if level >= len(constants.SEVERITY):
level = len(constants.SEVERITY) - 1
tmpstr_list = []
# get text colors from settings
get_setting = self.config.get_setting
color = {'HEADER': get_setting('color_HEADER'),
'DEFAULT': get_setting('color_DEFAULT'),
'INFO': get_setting('color_INFO'),
'WARN': get_setting('color_WARN'),
'ERROR': get_setting('color_ERROR')
}
# print header
tmpstr_list.append("%sRun started:%s\n\t%s\n" % (
color['HEADER'],
color['DEFAULT'],
datetime.utcnow()
))
# print which files were inspected
tmpstr_list.append("%sFiles in scope (%s):%s\n" % (
color['HEADER'], len(scope),
color['DEFAULT']
))
for item in zip(scope, scores):
tmpstr_list.append("\t%s (score: %i)\n" % item)
# print which files were skipped and why
tmpstr_list.append("%sFiles skipped (%s):%s" % (
color['HEADER'], len(self.skipped),
color['DEFAULT']
))
for (fname, reason) in self.skipped:
tmpstr_list.append("\n\t%s (%s)" % (fname, reason))
# print the results
tmpstr_list.append("\n%sTest results:%s\n" % (
color['HEADER'], color['DEFAULT']
))
if self.count == 0:
tmpstr_list.append("\tNo issues identified.\n")
# if aggregating by vulnerability type
elif self.agg_type == 'vuln':
for test, issues in self.resstore.items():
for filename, lineno, issue_type, issue_text in issues:
issue_line = linecache.getline(filename, lineno)
                # skip this result if the line carries one of the skip tags
                if re.search(constants.SKIP_RE, issue_line):
                    continue
                # report the result unless filtered out by severity level
if constants.SEVERITY.index(issue_type) >= level:
tmpstr_list.append("%s>> %s\n - %s::%s%s\n" % (
color.get(issue_type, color['DEFAULT']),
issue_text, filename, lineno,
color['DEFAULT']
))
                    for i in utils.mid_range(lineno, lines):
                        line = linecache.getline(filename, i)
                        # linecache returns '' if the line does not exist
                        if line != '':
                            tmpstr_list.append("\t%3d %s" % (i, line))
# otherwise, aggregating by filename
else:
for filename, issues in self.resstore.items():
for lineno, test, issue_type, issue_text in issues:
issue_line = linecache.getline(filename, lineno)
                # skip this result if the line carries one of the skip tags
                if re.search(constants.SKIP_RE, issue_line):
                    continue
                # report the result unless filtered out by severity level
if constants.SEVERITY.index(issue_type) >= level:
tmpstr_list.append("%s>> %s\n - %s::%s%s\n" % (
color.get(
issue_type, color['DEFAULT']
),
issue_text, filename, lineno,
color['DEFAULT']
))
                    for i in utils.mid_range(lineno, lines):
                        line = linecache.getline(filename, i)
                        # linecache returns '' if the line does not exist
                        if line != '':
                            tmpstr_list.append("\t%3d %s" % (i, line))
return ''.join(tmpstr_list)

    def report(self, scope, scores, lines=0, level=1, output_filename=None,
               output_format=None):
        '''Reports the contents of the result store
        :param scope: Which files were inspected
        :param scores: The scores awarded to each file in the scope
        :param lines: # of lines around the issue line to display (optional)
        :param level: What level of severity to display (optional)
        :param output_filename: File to output the results (optional)
        :param output_format: File type to output (json|txt)
        :return: -
        '''
        scores_dict = dict(zip(scope, scores))
        if output_format == 'txt':
            if output_filename is None:
                print self.report_tty(scope, scores, lines, level)  # noqa
                return
            outer = self.report_txt(scope, scores, lines, level)
            with open(output_filename, 'w') as fout:
                fout.write(outer)
            print("TXT output written to file: %s" % output_filename)
        else:
            # anything other than 'txt' is reported as JSON; this also
            # avoids calling open(None) when neither a filename nor a valid
            # format is given
            if output_filename is None:
                print self.report_json(output_filename, scores_dict)  # noqa
                return
            outer = self.report_json(output_filename, scores_dict)
            with open(output_filename, 'w') as fout:
                fout.write(outer)
            print("JSON output written to file: %s" % output_filename)
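

if __name__ == '__main__':
    # Minimal usage sketch, not part of Bandit itself: the logger and the
    # config object below are stand-ins (a real run wires in Bandit's own
    # logger and config, whose get_setting() supplies the TTY colors), and
    # it assumes the sibling constants/utils modules are importable.
    import logging

    class _StubConfig:
        def get_setting(self, name):
            return ''  # disable TTY coloring in this sketch

    store = BanditResultStore(logging.getLogger(__name__), _StubConfig(),
                              'file')
    store.skip('missing.py', 'File not found')
    print store.report_tty(scope=[], scores=[])  # noqa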