From 0bfee91edaaf243111e35e9252d955665437ef53 Mon Sep 17 00:00:00 2001
From: Jeff Wallace <jwallace@basistech.com>
Date: Fri, 12 Jul 2013 14:38:12 -0400
Subject: [PATCH 01/13] Cleaned up and refactored TestResultsDiffer to redesign
 specification.

---
 test/script/regression.py | 206 +++++++++++++++++---------------------
 1 file changed, 91 insertions(+), 115 deletions(-)

diff --git a/test/script/regression.py b/test/script/regression.py
index ddaade4ec1..e15197a518 100644
--- a/test/script/regression.py
+++ b/test/script/regression.py
@@ -843,26 +843,33 @@ class TestResultsDiffer(object):
             databaseDiff: TskDbDiff object created based off test_data
         """
         try:
-            # Extract gold archive file to output/gold/tmp/
-            extrctr = zipfile.ZipFile(test_data.gold_archive, 'r', compression=zipfile.ZIP_DEFLATED)
-            extrctr.extractall(test_data.main_config.gold)
-            extrctr.close
-            time.sleep(2)
 
-            # Lists of tests to run
-            TestResultsDiffer._compare_errors(test_data)
-
-            # Compare database count to gold
+            # Diff the gold and output databases
             test_data.db_diff_results = TskDbDiff(test_data).run_diff()
 
+            # Compare Exceptions
+            replace = lambda file: re.sub(re.compile("\d"), "d", file)
+            output_errors = test_data.get_sorted_errors_path(DBType.OUTPUT)
+            gold_errors = test_data.get_sorted_errors_path(DBType.GOLD)
+
+            TestResultsDiffer._compare_text(output_errors, gold_errors,
+            test_data, replace)
+
             # Compare smart blackboard results
-            TestResultsDiffer._compare_text(test_data.get_sorted_data_path(DBType.OUTPUT), "SortedData", test_data)
+            output_data = test_data.get_sorted_data_path(DBType.OUTPUT)
+            gold_data = test_data.get_sorted_data_path(DBType.GOLD)
+            TestResultsDiffer._compare_text(output_data, gold_data, test_data)
 
             # Compare the rest of the database (non-BB)
-            TestResultsDiffer._compare_text(test_data.test_dbdump, "DBDump", test_data)
+            output_dump = test_data.get_db_dump_path(DBType.OUTPUT)
+            gold_dump = test_data.get_db_dump_path(DBType.GOLD)
+            TestResultsDiffer._compare_text(output_dump, gold_dump, test_data)
 
             # Compare html output
-            TestResultsDiffer._compare_to_gold_html(test_data)
+            gold_report_path = test_data.get_html_report_path(DBType.GOLD)
+            output_report_path = test_data.get_html_report_path(DBType.OUTPUT)
+            TestResultsDiffer._html_report_diff(test_data, gold_report_path,
+            output_report_path)
 
             # Clean up tmp folder
             del_dir(test_data.gold_data_dir)
@@ -873,124 +880,84 @@ class TestResultsDiffer(object):
             print(traceback.format_exc())
 
 
-
     # TODO: _compare_text could be made more generic with how it forms the paths (i.e. not add ".txt" in the method) and probably merged with
     # compare_errors since they both do basic comparison of text files
 
-    def _compare_text(output_file, gold_file, test_data):
+    def _compare_text(output_file, gold_file, test_data, process=None):
         """Compare two text files.
 
         Args:
             output_file: a pathto_File, the output text file
             gold_file: a pathto_File, the input text file
             test_data: the TestData of the test being performed
+            pre-process: (optional) a function of String -> String that will be
+            called on each input file before the diff, if specified.
         """
-        gold_dir = Emailer.make_path(test_config.img_gold, test_data.image_name, test_data.image_name + gold_file + ".txt")
         if(not Emailer.file_exists(output_file)):
             return
-        srtd_data = codecs.open(output_file, "r", "utf_8")
-        gold_data = codecs.open(gold_dir, "r", "utf_8")
-        gold_dat = gold_data.read()
-        srtd_dat = srtd_data.read()
-        if (not(gold_dat == srtd_dat)):
-            diff_dir = Emailer.make_local_path(test_config.output_dir, test_data.image_name, test_data.image_name+gold_file+"-Diff.txt")
-            diff_file = codecs.open(diff_dir, "wb", "utf_8")
-            dffcmdlst = ["diff", test_data.get_sorted_data_path(DBType.OUTPUT), gold_dir]
+        output_data = codecs.open(output_file, "r", "utf_8").read()
+        gold_data = codecs.open(gold_file, "r", "utf_8").read()
+
+        if process is not None:
+            output_data = process(output_data)
+            gold_data = process(gold_data)
+
+        if (not(gold_data == output_data)):
+            filename = os.path.basename(output_file)
+            diff_path = os.path.join(test_data.output_path, filename +
+            "-Diff.txt")
+            diff_file = codecs.open(diff_path, "wb", "utf_8")
+            dffcmdlst = ["diff", output_file, gold_file]
             subprocess.call(dffcmdlst, stdout = diff_file)
             global attachl
             global errorem
             global failedbool
             attachl.append(diff_dir)
-            errorem += test_data.image_name + ":There was a  difference in the database file " + gold_file + ".\n"
-            printerror(test_data, "There was a database difference for " + test_data.image_name + " versus " + gold_file + ".\n")
+            msg = test_data.image_name + ":There was a difference in "
+            msg += os.path.basename(output_file) + ".\n"
+            errorem += msg
+            printerror(test_data, msg)
             failedbool = True
             global imgfail
             imgfail = True
 
-    def _compare_errors(test_data):
-        """Compare merged error log files.
-
-        Args:
-            test_data: the TestData of the test being performed
-        """
-        gold_dir = test_data.get_sorted_errors_path(DBType.GOLD)
-        common_log = codecs.open(test_data.sorted_log, "r", "utf_8")
-        gold_log = codecs.open(gold_dir, "r", "utf_8")
-        gold_dat = gold_log.read()
-        common_dat = common_log.read()
-        patrn = re.compile("\d")
-        if (not((re.sub(patrn, 'd', gold_dat)) == (re.sub(patrn, 'd', common_dat)))):
-            diff_dir = Emailer.make_local_path(test_config.output_dir, test_data.image_name, test_data.image_name+"AutopsyErrors-Diff.txt")
-            diff_file = open(diff_dir, "w")
-            dffcmdlst = ["diff", test_data.sorted_log, gold_dir]
-            subprocess.call(dffcmdlst, stdout = diff_file)
-            global attachl
-            global errorem
-            global failedbool
-            attachl.append(test_data.sorted_log)
-            attachl.append(diff_dir)
-            errorem += test_data.image_name + ":There was a difference in the exceptions Log.\n"
-            printerror(test_data, "Exceptions didn't match.\n")
-            failedbool = True
-            global imgfail
-            imgfail = True
-
-    def _compare_to_gold_html(test_data):
+    # TODO: get rid of test_data by changing the error reporting
+    def _html_report_diff(test_data, gold_report_path, output_report_path):
         """Compare the output and gold html reports.
 
         Args:
             test_data: the TestData of the test being performed.
+            gold_report_path: a pathto_Dir, the gold HTML report directory
+            output_report_path: a pathto_Dir, the output HTML report directory
         """
-        gold_html_file = Emailer.make_path(test_config.img_gold, test_data.image_name, "Report", "index.html")
-        htmlfolder = ""
-        for fs in os.listdir(Emailer.make_path(test_config.output_dir, test_data.image_name, AUTOPSY_TEST_CASE, "Reports")):
-            if os.path.isdir(Emailer.make_path(test_config.output_dir, test_data.image_name, AUTOPSY_TEST_CASE, "Reports", fs)):
-                htmlfolder = fs
-        autopsy_html_path = Emailer.make_path(test_config.output_dir, test_data.image_name, AUTOPSY_TEST_CASE, "Reports", htmlfolder, "HTML Report")
-
-
         try:
-            autopsy_html_file = get_file_in_dir(autopsy_html_path, "index.html")
-            if not Emailer.file_exists(gold_html_file):
-                printerror(test_data, "Error: No gold html report exists at:")
-                printerror(test_data, gold_html_file + "\n")
-                return
-            if not Emailer.file_exists(autopsy_html_file):
-                printerror(test_data, "Error: No test_config html report exists at:")
-                printerror(test_data, autopsy_html_file + "\n")
-                return
-            #Find all gold .html files belonging to this test_config
-            ListGoldHTML = []
-            for fs in os.listdir(Emailer.make_path(test_config.output_dir, test_data.image_name, AUTOPSY_TEST_CASE, "Reports", htmlfolder)):
-                if(fs.endswith(".html")):
-                    ListGoldHTML.append(Emailer.make_path(test_config.output_dir, test_data.image_name, AUTOPSY_TEST_CASE, "Reports", htmlfolder, fs))
-            #Find all new .html files belonging to this test_config
-            ListNewHTML = []
-            if(os.path.exists(Emailer.make_path(test_config.img_gold, test_data.image_name))):
-                for fs in os.listdir(Emailer.make_path(test_config.img_gold, test_data.image_name)):
-                    if (fs.endswith(".html")):
-                        ListNewHTML.append(Emailer.make_path(test_config.img_gold, test_data.image_name, fs))
+            gold_html_files = get_files_by_ext(gold_report_path, ".html")
+            output_html_files = get_files_by_ext(output_report_path, ".html")
+
             #ensure both reports have the same number of files and are in the same order
-            if(len(ListGoldHTML) != len(ListNewHTML)):
-                printerror(test_data, "The reports did not have the same number of files. One of the reports may have been corrupted")
+            if(len(gold_html_files) != len(output_html_files)):
+                msg = "The reports did not have the same number or files."
+                msg += "One of the reports may have been corrupted."
+                printerror(test_data, msg)
             else:
-                ListGoldHTML.sort()
-                ListNewHTML.sort()
+                gold_html_files.sort()
+                output_html_files.sort()
 
             total = {"Gold": 0, "New": 0}
-            for x in range(0, len(ListGoldHTML)):
-                count = TestResultsDiffer._compare_report_files(ListGoldHTML[x], ListNewHTML[x])
-                total["Gold"]+=count[0]
-                total["New"]+=count[1]
+            for gold, output in zip(gold_html_files, output_html_files):
+                count = TestResultsDiffer._compare_report_files(gold, output)
+                total["Gold"] += count[0]
+                total["New"] += count[1]
+
             okay = "The test report matches the gold report."
             errors=["Gold report had " + str(total["Gold"]) +" errors", "New report had " + str(total["New"]) + " errors."]
             print_report(test_data, errors, "REPORT COMPARISON", okay)
+
             if total["Gold"] == total["New"]:
                 test_data.report_passed = True
             else:
                 printerror(test_data, "The reports did not match each other.\n " + errors[0] +" and the " + errors[1])
-        except FileNotFoundException as e:
-            e.print_error()
+
         except DirNotFoundException as e:
             e.print_error()
         except Exception as e:
@@ -1029,6 +996,17 @@ class TestResultsDiffer(object):
     def _split(input, size):
         return [input[start:start+size] for start in range(0, len(input), size)]
 
+
+def get_files_by_ext(dir_path, ext):
+    """Get a list of all the files with a given extenstion in the directory.
+
+    Args:
+        dir: a pathto_Dir, the directory to search.
+        ext: a String, the extension to search for. i.e. ".html"
+    """
+    return [ os.path.join(dir_path, file) for file in os.listdir(dir_path) if
+    file.endswith(ext) ]
+
 class TestData(object):
     """Container for the input and output of a single image.
 
@@ -1160,7 +1138,7 @@ class TestData(object):
                 html_path = Emailer.make_path(self.reports_dir, fs)
                 if os.path.isdir(html_path):
                     break
-            return Emailer.make_path(html_path, "HTML Report")
+            return Emailer.make_path(html_path, os.listdir(html_path)[0])
 
     def get_sorted_data_path(self, file_type):
         """Get the path to the SortedData file that corresponds to the given DBType.
@@ -1981,12 +1959,18 @@ class TestRunner(object):
         global html
         global attachl
 
-        test_data_list = TestRunner._generate_test_data()
+        test_data_list = [ TestData(image, test_config) for image in test_config.images ]
 
         Reports.html_add_images(test_config.images)
 
         logres =[]
         for test_data in test_data_list:
+            if not (test_config.args.rebuild or
+                os.path.exists(test_data.gold_archive)):
+                msg = "Gold standard doesn't exist, skipping image:"
+                printerror(test_data, msg)
+                printerror(test_data, test_data.gold_archive)
+                continue
             TestRunner._run_autopsy_ingest(test_data)
 
             if test_config.args.rebuild:
@@ -2020,19 +2004,6 @@ class TestRunner(object):
         except NameError:
             printerror(test_data, "Could not send e-mail because of no XML file --maybe");
 
-    def _generate_test_data():
-        """Create TestData objects for each image in the TestConfiguration object.
-
-        Returns:
-            listof_TestData, the TestData object generated.
-        """
-        return [ TestData(image, test_config) for image in test_config.images ]
-        #test_data_list = []
-        #for img in test_config.images:
-        #    test_data = TestData(test_config)
-        #    test_data_list.append(test_data)
-        #return test_data_list
-
     def _run_autopsy_ingest(test_data):
         """Run Autopsy ingest for the image in the given TestData.
 
@@ -2076,6 +2047,8 @@ class TestRunner(object):
         Returns:
             logres?
         """
+        TestRunner._extract_gold(test_data)
+
         # Look for core exceptions
         # @@@ Should be moved to TestResultsDiffer, but it didn't know about logres -- need to look into that
         logres = Logs.search_common_log("TskCoreException", test_data)
@@ -2090,6 +2063,17 @@ class TestRunner(object):
             attachl.append(test_data.common_log_path)
         return logres
 
+    def _extract_gold(test_data):
+        """Extract gold archive file to output/gold/tmp/
+
+        Args:
+            test_data: the TestData
+        """
+        extrctr = zipfile.ZipFile(test_data.gold_archive, 'r', compression=zipfile.ZIP_DEFLATED)
+        extrctr.extractall(test_data.main_config.gold)
+        extrctr.close
+        time.sleep(2)
+
     def _handle_solr(test_data):
         """Clean up SOLR index if in keep mode (-k).
 
@@ -2224,23 +2208,15 @@ class TestRunner(object):
 def main():
     # Global variables
     global failedbool
-    global inform
-    global fl
     global test_config
     global errorem
     global attachl
-    global daycount
-    global redo
-    global passed
-    daycount = 0
     failedbool = False
-    redo = False
     errorem = ""
     args = Args()
     parse_result = args.parse()
     test_config = TestConfiguration(args)
     attachl = []
-    passed = False
     # The arguments were given wrong:
     if not parse_result:
         test_config.reset()

From ba50b7fbad5af7dff041f9453eff3b348ffeb416 Mon Sep 17 00:00:00 2001
From: Jeff Wallace <jwallace@basistech.com>
Date: Fri, 12 Jul 2013 15:25:32 -0400
Subject: [PATCH 02/13] Reorganized regression.py and Emailer.py. Moved util
 functions to a new file, regression_utils.py

---
 test/script/Emailer.py          | 179 ++++-------
 test/script/regression.py       | 508 +++++++++++++-------------------
 test/script/regression_utils.py | 154 ++++++++++
 3 files changed, 412 insertions(+), 429 deletions(-)
 create mode 100644 test/script/regression_utils.py

diff --git a/test/script/Emailer.py b/test/script/Emailer.py
index d1accc0e6a..7be20d406e 100644
--- a/test/script/Emailer.py
+++ b/test/script/Emailer.py
@@ -1,124 +1,55 @@
-import smtplib
-from email.mime.image import MIMEImage
-from email.mime.multipart import MIMEMultipart
-from email.mime.text import MIMEText
-from email.mime.base import MIMEBase
-from email import encoders
-import xml
-from time import localtime, strftime
-from xml.dom.minidom import parse, parseString
-import subprocess
-import sys
-import os
-
-def send_email(parsed, errorem, attachl, passFail):
-	element = parsed.getElementsByTagName("email")
-	if(len(element)<=0):
-		return
-	element = element[0]
-	toval = element.getAttribute("value").encode().decode("utf_8")
-	if(toval==None):
-		return
-	element = parsed.getElementsByTagName("mail_server")[0]
-	serverval = element.getAttribute("value").encode().decode("utf_8")
-	# Create the container (outer) email message.
-	msg = MIMEMultipart()
-	element = parsed.getElementsByTagName("subject")[0]
-	subval = element.getAttribute("value").encode().decode("utf_8")
-	if(passFail):
-		msg['Subject'] = '[Test]Autopsy ' + subval + ' test passed.'
-	else:
-		msg['Subject'] = '[Test]Autopsy ' + subval + ' test failed.'
-	# me == the sender's email address
-	# family = the list of all recipients' email addresses
-	msg['From'] = 'AutopsyTest'
-	msg['To'] = toval
-	msg.preamble = 'This is a test'
-	container = MIMEText(errorem, 'plain')
-	msg.attach(container)
-	Build_email(msg, attachl)
-	s = smtplib.SMTP(serverval)
-	try:
-		print('Sending Email')
-		s.sendmail(msg['From'], msg['To'], msg.as_string())
-	except Exception as e:
-		print(str(e))
-	s.quit()
-	
-def Build_email(msg, attachl):
-	for file in attachl:
-		part = MIMEBase('application', "octet-stream")
-		atach = open(file, "rb")
-		attch = atach.read()
-		noml = file.split("\\")
-		nom = noml[len(noml)-1]
-		part.set_payload(attch)
-		encoders.encode_base64(part)
-		part.add_header('Content-Disposition', 'attachment; filename="' + nom + '"')
-		msg.attach(part)
-		
-# Returns a Windows style path starting with the cwd and
-# ending with the list of directories given
-def make_local_path(*dirs):
-	path = wgetcwd().decode("utf-8")
-	for dir in dirs:
-		path += ("\\" + str(dir))
-	return path_fix(path)
-
-# Returns a Windows style path based only off the given directories
-def make_path(*dirs):
-	path = dirs[0]
-	for dir in dirs[1:]:
-		path += ("\\" + str(dir))
-	return path_fix(path)
-	
-# Fix a standard os.path by making it Windows format
-def path_fix(path):
-	return path.replace("/", "\\")
-	
-# Gets the true current working directory instead of Cygwin's
-def wgetcwd():
-	proc = subprocess.Popen(("cygpath", "-m", os.getcwd()), stdout=subprocess.PIPE)
-	out,err = proc.communicate()
-	tst = out.rstrip()
-	if os.getcwd == tst:
-		return os.getcwd
-	else:
-		proc = subprocess.Popen(("cygpath", "-m", os.getcwd()), stdout=subprocess.PIPE)
-		out,err = proc.communicate()
-		return out.rstrip()
-# Verifies a file's existance
-def file_exists(file):
-	try:
-		if os.path.exists(file):
-			return os.path.isfile(file)
-	except:
-		return False
-		
-# Verifies a directory's existance
-def dir_exists(dir):
-	try:
-		return os.path.exists(dir)
-	except:
-		return False
-
-
-
-# Returns the nth word in the given string or "" if n is out of bounds
-# n starts at 0 for the first word
-def get_word_at(string, n):
-	words = string.split(" ")
-	if len(words) >= n:
-		return words[n]
-	else:
-		return ""
-
-# Returns true if the given file is one of the required input files
-# for ingest testing
-def required_input_file(name):
-	if ((name == "notablehashes.txt-md5.idx") or
-	   (name == "notablekeywords.xml") or
-	   (name == "nsrl.txt-md5.idx")): 
-	   return True
-	else:
-		return False
\ No newline at end of file
+import smtplib
+from email.mime.image import MIMEImage
+from email.mime.multipart import MIMEMultipart
+from email.mime.text import MIMEText
+from email.mime.base import MIMEBase
+from email import encoders
+import xml
+from xml.dom.minidom import parse, parseString
+
+def send_email(parsed, errorem, attachl, passFail):
+	element = parsed.getElementsByTagName("email")
+	if(len(element)<=0):
+		return
+	element = element[0]
+	toval = element.getAttribute("value").encode().decode("utf_8")
+	if(toval==None):
+		return
+	element = parsed.getElementsByTagName("mail_server")[0]
+	serverval = element.getAttribute("value").encode().decode("utf_8")
+	# Create the container (outer) email message.
+	msg = MIMEMultipart()
+	element = parsed.getElementsByTagName("subject")[0]
+	subval = element.getAttribute("value").encode().decode("utf_8")
+	if(passFail):
+		msg['Subject'] = '[Test]Autopsy ' + subval + ' test passed.'
+	else:
+		msg['Subject'] = '[Test]Autopsy ' + subval + ' test failed.'
+	# me == the sender's email address
+	# family = the list of all recipients' email addresses
+	msg['From'] = 'AutopsyTest'
+	msg['To'] = toval
+	msg.preamble = 'This is a test'
+	container = MIMEText(errorem, 'plain')
+	msg.attach(container)
+	Build_email(msg, attachl)
+	s = smtplib.SMTP(serverval)
+	try:
+		print('Sending Email')
+		s.sendmail(msg['From'], msg['To'], msg.as_string())
+	except Exception as e:
+		print(str(e))
+	s.quit()
+
+def Build_email(msg, attachl):
+	for file in attachl:
+		part = MIMEBase('application', "octet-stream")
+		atach = open(file, "rb")
+		attch = atach.read()
+		noml = file.split("\\")
+		nom = noml[len(noml)-1]
+		part.set_payload(attch)
+		encoders.encode_base64(part)
+		part.add_header('Content-Disposition', 'attachment; filename="' + nom + '"')
+		msg.attach(part)
+
diff --git a/test/script/regression.py b/test/script/regression.py
index e15197a518..b6a802c0d2 100644
--- a/test/script/regression.py
+++ b/test/script/regression.py
@@ -42,6 +42,7 @@ import zipfile
 import zlib
 import Emailer
 import srcupdater
+from regression_utils import *
 
 #
 # Please read me...
@@ -76,14 +77,6 @@ import srcupdater
 # Image:        An image
 #
 
-#####
-# Enumeration definition (python 3.2 doesn't have enumerations, this is a common solution
-# that allows you to access a named enum in a Java-like style, i.e. Numbers.ONE)
-#####
-def enum(*seq, **named):
-    enums = dict(zip(seq, range(len(seq))), **named)
-    return type('Enum', (), enums)
-
 # Enumeration of database types used for the simplification of generating database paths
 DBType = enum('OUTPUT', 'GOLD', 'BACKUP')
 
@@ -148,9 +141,9 @@ class Args(object):
                 #try: @@@ Commented out until a more specific except statement is added
                     arg = sys.argv.pop(0)
                     print("Running on a single file:")
-                    print(Emailer.path_fix(arg) + "\n")
+                    print(path_fix(arg) + "\n")
                     self.single = True
-                    self.single_file = Emailer.path_fix(arg)
+                    self.single_file = path_fix(arg)
                 #except:
                 #   print("Error: No single file given.\n")
             #       return False
@@ -239,9 +232,9 @@ class TestConfiguration(object):
         self.args = args
         # Paths:
         self.output_dir = ""
-        self.input_dir = Emailer.make_local_path("..","input")
-        self.gold = Emailer.make_path("..", "output", "gold")
-        self.img_gold = Emailer.make_path(self.gold, 'tmp')
+        self.input_dir = make_local_path("..","input")
+        self.gold = make_path("..", "output", "gold")
+        self.img_gold = make_path(self.gold, 'tmp')
         # Logs:
         self.csv = ""
         self.global_csv = ""
@@ -296,14 +289,14 @@ class TestConfiguration(object):
             return
         # If working from a configuration file
         if self.args.list:
-           if not Emailer.file_exists(self.args.config_file):
+           if not file_exists(self.args.config_file):
                msg = "Configuration file does not exist at:" + self.args.config_file
                self._print_error(msg)
                return
            self._load_config_file(self.args.config_file)
         # Else if working on a single file
         elif self.args.single:
-           if not Emailer.file_exists(self.args.single_file):
+           if not file_exists(self.args.single_file):
                msg = "Image file does not exist at: " + self.args.single_file
                self._print_error(msg)
                return
@@ -313,7 +306,7 @@ class TestConfiguration(object):
         #  the input directory, continue on to parsing ../input
         if (not self.args.single) and (not self.args.ignore) and (not self.args.list):
            self.args.config_file = "config.xml"
-           if not Emailer.file_exists(self.args.config_file):
+           if not file_exists(self.args.config_file):
                msg = "Configuration file does not exist at: " + self.args.config_file
                self._print_error(msg)
                return
@@ -321,12 +314,12 @@ class TestConfiguration(object):
 
     def _init_logs(self):
         """Setup output folder, logs, and reporting infrastructure."""
-        if(not Emailer.dir_exists(Emailer.make_path("..", "output", "results"))):
-            os.makedirs(Emailer.make_path("..", "output", "results",))
-        self.output_dir = Emailer.make_path("..", "output", "results", time.strftime("%Y.%m.%d-%H.%M.%S"))
+        if(not dir_exists(make_path("..", "output", "results"))):
+            os.makedirs(make_path("..", "output", "results",))
+        self.output_dir = make_path("..", "output", "results", time.strftime("%Y.%m.%d-%H.%M.%S"))
         os.makedirs(self.output_dir)
-        self.csv = Emailer.make_local_path(self.output_dir, "CSV.txt")
-        self.html_log = Emailer.make_path(self.output_dir, "AutopsyTestCase.html")
+        self.csv = make_local_path(self.output_dir, "CSV.txt")
+        self.html_log = make_path(self.output_dir, "AutopsyTestCase.html")
         log_name = self.output_dir + "\\regression.log"
         logging.basicConfig(filename=log_name, level=logging.DEBUG)
 
@@ -336,18 +329,18 @@ class TestConfiguration(object):
         if(self.args.list):
             build_elements = parsed.getElementsByTagName("build")
             if(len(build_elements) <= 0):
-                build_path = Emailer.make_path("..", "build.xml")
+                build_path = make_path("..", "build.xml")
             else:
                 build_element = build_elements[0]
                 build_path = build_element.getAttribute("value").encode().decode("utf_8")
                 if(build_path == None):
-                    build_path = Emailer.make_path("..", "build.xml")
+                    build_path = make_path("..", "build.xml")
         else:
-            build_path = Emailer.make_path("..", "build.xml")
+            build_path = make_path("..", "build.xml")
         self.build_path = build_path
-        self.known_bad_path = Emailer.make_path(self.input_dir, "notablehashes.txt-md5.idx")
-        self.keyword_path = Emailer.make_path(self.input_dir, "notablekeywords.xml")
-        self.nsrl_path = Emailer.make_path(self.input_dir, "nsrl.txt-md5.idx")
+        self.known_bad_path = make_path(self.input_dir, "notablehashes.txt-md5.idx")
+        self.keyword_path = make_path(self.input_dir, "notablekeywords.xml")
+        self.nsrl_path = make_path(self.input_dir, "nsrl.txt-md5.idx")
 
     def _load_config_file(self, config_file):
         """Updates this TestConfiguration's attributes from the config file.
@@ -370,17 +363,17 @@ class TestConfiguration(object):
                 self.input_dir = parsed.getElementsByTagName("indir")[0].getAttribute("value").encode().decode("utf_8")
             if parsed.getElementsByTagName("global_csv"):
                 self.global_csv = parsed.getElementsByTagName("global_csv")[0].getAttribute("value").encode().decode("utf_8")
-                self.global_csv = Emailer.make_local_path(self.global_csv)
+                self.global_csv = make_local_path(self.global_csv)
             if parsed.getElementsByTagName("golddir"):
                 self.gold = parsed.getElementsByTagName("golddir")[0].getAttribute("value").encode().decode("utf_8")
-                self.img_gold = Emailer.make_path(self.gold, 'tmp')
+                self.img_gold = make_path(self.gold, 'tmp')
 
             # Generate the top navbar of the HTML for easy access to all images
             images = []
             for element in parsed.getElementsByTagName("image"):
                 value = element.getAttribute("value").encode().decode("utf_8")
                 print ("Image in Config File: " + value)
-                if Emailer.file_exists(value):
+                if file_exists(value):
                     self.images.append(value)
                 else:
                     msg = "File: " + value + " doesn't exist"
@@ -591,11 +584,11 @@ class TskDbDiff(object):
         Note: SQLITE needs unix style pathing
         """
         # Check to make sure both db files exist
-        if not Emailer.file_exists(self.autopsy_db_file):
+        if not file_exists(self.autopsy_db_file):
             printerror(self.test_data, "Error: TskDbDiff file does not exist at:")
             printerror(self.test_data, self.autopsy_db_file + "\n")
             return
-        if not Emailer.file_exists(self.gold_db_file):
+        if not file_exists(self.gold_db_file):
             printerror(self.test_data, "Error: Gold database file does not exist at:")
             printerror(self.test_data, self.gold_db_file + "\n")
             return
@@ -828,6 +821,7 @@ class DiffResults(object):
         for error in self.attribute_comp:
             list.append(error)
         return ";".join(list)
+
 #-------------------------------------------------#
 #     Functions relating to comparing outputs     #
 #-------------------------------------------------#
@@ -893,7 +887,7 @@ class TestResultsDiffer(object):
             pre-process: (optional) a function of String -> String that will be
             called on each input file before the diff, if specified.
         """
-        if(not Emailer.file_exists(output_file)):
+        if(not file_exists(output_file)):
             return
         output_data = codecs.open(output_file, "r", "utf_8").read()
         gold_data = codecs.open(gold_file, "r", "utf_8").read()
@@ -996,17 +990,6 @@ class TestResultsDiffer(object):
     def _split(input, size):
         return [input[start:start+size] for start in range(0, len(input), size)]
 
-
-def get_files_by_ext(dir_path, ext):
-    """Get a list of all the files with a given extenstion in the directory.
-
-    Args:
-        dir: a pathto_Dir, the directory to search.
-        ext: a String, the extension to search for. i.e. ".html"
-    """
-    return [ os.path.join(dir_path, file) for file in os.listdir(dir_path) if
-    file.endswith(ext) ]
-
 class TestData(object):
     """Container for the input and output of a single image.
 
@@ -1056,20 +1039,20 @@ class TestData(object):
         # TODO: This 0 should be be refactored out, but it will require rebuilding and changing of outputs.
         self.image = get_image_name(self.image_file)
         self.image_name = self.image + "(0)"
-        self.output_path = Emailer.make_path(self.main_config.output_dir, self.image_name)
-        self.autopsy_data_file = Emailer.make_path(self.output_path, self.image_name + "Autopsy_data.txt")
-        self.warning_log = Emailer.make_local_path(self.output_path, "AutopsyLogs.txt")
-        self.antlog_dir = Emailer.make_local_path(self.output_path, "antlog.txt")
-        self.test_dbdump = Emailer.make_path(self.output_path, self.image_name +
+        self.output_path = make_path(self.main_config.output_dir, self.image_name)
+        self.autopsy_data_file = make_path(self.output_path, self.image_name + "Autopsy_data.txt")
+        self.warning_log = make_local_path(self.output_path, "AutopsyLogs.txt")
+        self.antlog_dir = make_local_path(self.output_path, "antlog.txt")
+        self.test_dbdump = make_path(self.output_path, self.image_name +
         "DBDump.txt")
-        self.common_log_path = Emailer.make_local_path(self.output_path, self.image_name + COMMON_LOG)
-        self.sorted_log = Emailer.make_local_path(self.output_path, self.image_name + "SortedErrors.txt")
-        self.reports_dir = Emailer.make_path(self.output_path, AUTOPSY_TEST_CASE, "Reports")
-        self.gold_data_dir = Emailer.make_path(self.main_config.img_gold, self.image_name)
-        self.gold_archive = Emailer.make_path(self.main_config.gold,
+        self.common_log_path = make_local_path(self.output_path, self.image_name + COMMON_LOG)
+        self.sorted_log = make_local_path(self.output_path, self.image_name + "SortedErrors.txt")
+        self.reports_dir = make_path(self.output_path, AUTOPSY_TEST_CASE, "Reports")
+        self.gold_data_dir = make_path(self.main_config.img_gold, self.image_name)
+        self.gold_archive = make_path(self.main_config.gold,
         self.image_name + "-archive.zip")
-        self.logs_dir = Emailer.make_path(self.output_path, "logs")
-        self.solr_index = Emailer.make_path(self.output_path, AUTOPSY_TEST_CASE,
+        self.logs_dir = make_path(self.output_path, "logs")
+        self.solr_index = make_path(self.output_path, AUTOPSY_TEST_CASE,
         "ModuleOutput", "KeywordSearch")
         self.db_diff_results = None
         self.total_test_time = ""
@@ -1085,28 +1068,6 @@ class TestData(object):
         self.printerror = []
         self.printout = []
 
-    def reset(self):
-        self.image = ""
-        self.image_file = ""
-        self.image_name = ""
-        self.sorted_log = ""
-        self.warning_log = ""
-        self.autopsy_data_file = ""
-        self.common_log_path = ""
-        self.antlog_dir = ""
-        self.test_dbdump = ""
-        self.total_test_time = ""
-        self.start_date = ""
-        self.end_date = ""
-        self.total_ingest_time = ""
-        self.artifact_count = 0
-        self.artifact_fail = 0
-        self.heap_space = ""
-        self.service_times = ""
-        # Error tracking
-        self.printerror = []
-        self.printout = []
-
     def get_db_path(self, db_type):
         """Get the path to the database file that corresponds to the given DBType.
 
@@ -1114,11 +1075,11 @@ class TestData(object):
             DBType: the DBType of the path to be generated.
         """
         if(db_type == DBType.GOLD):
-            db_path = Emailer.make_path(self.gold_data_dir, DB_FILENAME)
+            db_path = make_path(self.gold_data_dir, DB_FILENAME)
         elif(db_type == DBType.OUTPUT):
-            db_path = Emailer.make_path(self.main_config.output_dir, self.image_name, AUTOPSY_TEST_CASE, DB_FILENAME)
+            db_path = make_path(self.main_config.output_dir, self.image_name, AUTOPSY_TEST_CASE, DB_FILENAME)
         else:
-            db_path = Emailer.make_path(self.main_config.output_dir, self.image_name, AUTOPSY_TEST_CASE, BACKUP_DB_FILENAME)
+            db_path = make_path(self.main_config.output_dir, self.image_name, AUTOPSY_TEST_CASE, BACKUP_DB_FILENAME)
         return db_path
 
     def get_html_report_path(self, html_type):
@@ -1128,17 +1089,17 @@ class TestData(object):
             DBType: the DBType of the path to be generated.
         """
         if(html_type == DBType.GOLD):
-            return Emailer.make_path(self.gold_data_dir, "Report")
+            return make_path(self.gold_data_dir, "Report")
         else:
             # Autopsy creates an HTML report folder in the form AutopsyTestCase DATE-TIME
             # It's impossible to get the exact time the folder was created, but the folder
             # we are looking for is the only one in the self.reports_dir folder
             html_path = ""
             for fs in os.listdir(self.reports_dir):
-                html_path = Emailer.make_path(self.reports_dir, fs)
+                html_path = make_path(self.reports_dir, fs)
                 if os.path.isdir(html_path):
                     break
-            return Emailer.make_path(html_path, os.listdir(html_path)[0])
+            return make_path(html_path, os.listdir(html_path)[0])
 
     def get_sorted_data_path(self, file_type):
         """Get the path to the SortedData file that corresponds to the given DBType.
@@ -1174,9 +1135,9 @@ class TestData(object):
         """
         full_filename = self.image_name + file_name
         if(file_type == DBType.GOLD):
-            return Emailer.make_path(self.gold_data_dir, full_filename)
+            return make_path(self.gold_data_dir, full_filename)
         else:
-            return Emailer.make_path(self.output_path, full_filename)
+            return make_path(self.output_path, full_filename)
 
 class Reports(object):
     def generate_reports(csv_path, test_data):
@@ -1197,7 +1158,7 @@ class Reports(object):
         # If the file doesn't exist yet, this is the first test_config to run for
         # this test, so we need to make the start of the html log
         global imgfail
-        if not Emailer.file_exists(test_config.html_log):
+        if not file_exists(test_config.html_log):
             Reports.write_html_head()
         try:
             global html
@@ -1234,7 +1195,7 @@ class Reports(object):
                     <hr color='#282828'>"
             logs_path = test_data.logs_dir
             for file in os.listdir(logs_path):
-                logs += "<p><a href='file:\\" + Emailer.make_path(logs_path, file) + "' target='_blank'>" + file + "</a></p>"
+                logs += "<p><a href='file:\\" + make_path(logs_path, file) + "' target='_blank'>" + file + "</a></p>"
             logs += "</div>"
 
             # All the testing information
@@ -1358,7 +1319,7 @@ class Reports(object):
         """
         # If the file doesn't exist yet, this is the first test_config to run for
         # this test, so we need to make the start of the html log
-        if not Emailer.file_exists(test_config.html_log):
+        if not file_exists(test_config.html_log):
             Reports.write_html_head()
         html = open(test_config.html_log, "a")
         links = []
@@ -1373,7 +1334,7 @@ class Reports(object):
         try:
             # If the CSV file hasn't already been generated, this is the
             # first run, and we need to add the column names
-            if not Emailer.file_exists(csv_path):
+            if not file_exists(csv_path):
                 Reports.csv_header(csv_path)
             # Now add on the fields to a new row
             csv = open(csv_path, "a")
@@ -1404,10 +1365,10 @@ class Reports(object):
             vars.append( str(test_data.db_diff_results.output_objs) )
             vars.append( str(test_data.db_diff_results.output_artifacts) )
             vars.append( str(test_data.db_diff_results.output_objs) )
-            vars.append( Emailer.make_local_path("gold", test_data.image_name, DB_FILENAME) )
+            vars.append( make_local_path("gold", test_data.image_name, DB_FILENAME) )
             vars.append( test_data.db_diff_results.get_artifact_comparison() )
             vars.append( test_data.db_diff_results.get_attribute_comparison() )
-            vars.append( Emailer.make_local_path("gold", test_data.image_name, "standard.html") )
+            vars.append( make_local_path("gold", test_data.image_name, "standard.html") )
             vars.append( str(test_data.report_passed) )
             vars.append( test_config.ant_to_string() )
             # Join it together with a ", "
@@ -1496,10 +1457,10 @@ class Logs(object):
             common_log.write("--------------------------------------------------\n")
             common_log.write(test_data.image_name + "\n")
             common_log.write("--------------------------------------------------\n")
-            rep_path = Emailer.make_local_path(test_config.output_dir)
+            rep_path = make_local_path(test_config.output_dir)
             rep_path = rep_path.replace("\\\\", "\\")
             for file in os.listdir(logs_path):
-                log = codecs.open(Emailer.make_path(logs_path, file), "r", "utf_8")
+                log = codecs.open(make_path(logs_path, file), "r", "utf_8")
                 for line in log:
                     line = line.replace(rep_path, "test_data")
                     if line.startswith("Exception"):
@@ -1526,7 +1487,7 @@ class Logs(object):
         """Fill the global test config's variables that require the log files."""
         try:
             # Open autopsy.log.0
-            log_path = Emailer.make_path(test_data.logs_dir, "autopsy.log.0")
+            log_path = make_path(test_data.logs_dir, "autopsy.log.0")
             log = open(log_path)
 
             # Set the test_config starting time based off the first line of autopsy.log.0
@@ -1551,12 +1512,12 @@ class Logs(object):
             # Set Autopsy version, heap space, ingest time, and service times
 
             version_line = search_logs("INFO: Application name: Autopsy, version:", test_data)[0]
-            test_config.autopsy_version = Emailer.get_word_at(version_line, 5).rstrip(",")
+            test_config.autopsy_version = get_word_at(version_line, 5).rstrip(",")
 
             test_data.heap_space = search_logs("Heap memory usage:", test_data)[0].rstrip().split(": ")[1]
 
             ingest_line = search_logs("Ingest (including enqueue)", test_data)[0]
-            test_data.total_ingest_time = Emailer.get_word_at(ingest_line, 6).rstrip()
+            test_data.total_ingest_time = get_word_at(ingest_line, 6).rstrip()
 
             message_line = search_log_set("autopsy", "Ingest messages count:", test_data)[0]
             test_config.ingest_messages = int(message_line.rstrip().split(": ")[2])
@@ -1622,91 +1583,6 @@ class Logs(object):
         log.close()
         return results
 
-# Returns the type of image file, based off extension
-class IMGTYPE:
-    RAW, ENCASE, SPLIT, UNKNOWN = range(4)
-
-def image_type(image_file):
-    ext_start = image_file.rfind(".")
-    if (ext_start == -1):
-        return IMGTYPE.UNKNOWN
-    ext = image_file[ext_start:].lower()
-    if (ext == ".img" or ext == ".dd"):
-        return IMGTYPE.RAW
-    elif (ext == ".e01"):
-        return IMGTYPE.ENCASE
-    elif (ext == ".aa" or ext == ".001"):
-        return IMGTYPE.SPLIT
-    else:
-        return IMGTYPE.UNKNOWN
-
-def search_logs(string, test_data):
-    """Search through all the known log files for a given string.
-
-    Args:
-        string: the String to search for.
-        test_data: the TestData that holds the logs to search.
-
-    Returns:
-        a listof_String, the lines that contained the given String.
-    """
-    logs_path = test_data.logs_dir
-    results = []
-    for file in os.listdir(logs_path):
-        log = codecs.open(Emailer.make_path(logs_path, file), "r", "utf_8")
-        for line in log:
-            if string in line:
-                results.append(line)
-        log.close()
-    return results
-
-def search_log(log, string, test_data):
-    """Search the given log for any instances of a given string.
-
-    Args:
-        log: a pathto_File, the log to search in
-        string: the String to search for.
-        test_data: the TestData that holds the log to search.
-
-    Returns:
-        a listof_String, all the lines that the string is found on
-    """
-    logs_path = Emailer.make_path(test_data.logs_dir, log)
-    try:
-        results = []
-        log = codecs.open(logs_path, "r", "utf_8")
-        for line in log:
-            if string in line:
-                results.append(line)
-        log.close()
-        if results:
-            return results
-    except:
-        raise FileNotFoundException(logs_path)
-
-# Search through all the the logs of the given type
-# Types include autopsy, tika, and solr
-def search_log_set(type, string, test_data):
-    """Search through all logs to the given type for the given string.
-
-    Args:
-        type: the type of log to search in.
-        string: the String to search for.
-        test_data: the TestData containing the logs to search.
-
-    Returns:
-        a listof_String, the lines on which the String was found.
-    """
-    logs_path = test_data.logs_dir
-    results = []
-    for file in os.listdir(logs_path):
-        if type in file:
-            log = codecs.open(Emailer.make_path(logs_path, file), "r", "utf_8")
-            for line in log:
-                if string in line:
-                    results.append(line)
-            log.close()
-    return results
 
 def print_report(test_data, errors, name, okay):
     """Print a report with the specified information.
@@ -1737,28 +1613,6 @@ def printout(test_data, string):
     print(string)
     test_data.printout.append(string)
 
-#----------------------------------#
-#        Helper functions          #
-#----------------------------------#
-
-def get_image_name(image_file):
-    path_end = image_file.rfind("/")
-    path_end2 = image_file.rfind("\\")
-    ext_start = image_file.rfind(".")
-    if(ext_start == -1):
-        name = image_file
-    if(path_end2 != -1):
-        name = image_file[path_end2+1:ext_start]
-    elif(ext_start == -1):
-        name = image_file[path_end+1:]
-    elif(path_end == -1):
-        name = image_file[:ext_start]
-    elif(path_end!=-1 and ext_start!=-1):
-        name = image_file[path_end+1:ext_start]
-    else:
-        name = image_file[path_end2+1:ext_start]
-    return name
-
 def get_exceptions(test_data):
     """Get a list of the exceptions in the autopsy logs.
 
@@ -1770,7 +1624,7 @@ def get_exceptions(test_data):
     results = []
     for file in os.listdir(logs_path):
         if "autopsy.log" in file:
-            log = codecs.open(Emailer.make_path(logs_path, file), "r", "utf_8")
+            log = codecs.open(make_path(logs_path, file), "r", "utf_8")
             ex = re.compile("\SException")
             er = re.compile("\SError")
             for line in log:
@@ -1802,67 +1656,6 @@ def copy_logs(test_data):
         printerror(test_data,str(e) + "\n")
         logging.warning(traceback.format_exc())
 
-def clear_dir(dir):
-    """Clears all files from a directory and remakes it."""
-    try:
-        if Emailer.dir_exists(dir):
-            shutil.rmtree(dir)
-        os.makedirs(dir)
-        return True;
-    except Exception as e:
-        printerror(test_data,"Error: Cannot clear the given directory:")
-        printerror(test_data,dir + "\n")
-        print(str(e))
-        return False;
-
-def del_dir(dir):
-    try:
-        if Emailer.dir_exists(dir):
-            shutil.rmtree(dir)
-        return True;
-    except:
-        printerror(test_data,"Error: Cannot delete the given directory:")
-        printerror(test_data,dir + "\n")
-        return False;
-
-def copy_file(ffrom, to):
-    """Copies a given file from "ffrom" to "to"."""
-    try :
-        shutil.copy(ffrom, to)
-    except Exception as e:
-        print(str(e))
-        print(traceback.format_exc())
-
-def copy_dir(ffrom, to):
-    """Copies a directory file from "ffrom" to "to"."""
-    try :
-        if not os.path.isdir(ffrom):
-            raise FileNotFoundException(ffrom)
-        shutil.copytree(ffrom, to)
-    except:
-        raise FileNotFoundException(to)
-
-def get_file_in_dir(dir, ext):
-    """Returns the first file in the given directory with the given extension."""
-    try:
-        for file in os.listdir(dir):
-            if file.endswith(ext):
-                return Emailer.make_path(dir, file)
-        # If nothing has been found, raise an exception
-        raise FileNotFoundException(dir)
-    except:
-        raise DirNotFoundException(dir)
-
-def find_file_in_dir(dir, name, ext):
-    try:
-        for file in os.listdir(dir):
-            if file.startswith(name):
-                if file.endswith(ext):
-                    return Emailer.make_path(dir, file)
-        raise FileNotFoundException(dir)
-    except:
-        raise DirNotFoundException(dir)
-
 def setDay():
     global Day
     Day = int(strftime("%d", localtime()))
@@ -1876,34 +1669,6 @@ def getDay():
 def newDay():
     return getLastDay() != getDay()
 
-def usage():
-    """Return the usage description of the test script."""
-    return """
-Usage:  ./regression.py [-f FILE] [OPTIONS]
-
-        Run RegressionTest.java, and compare the result with a gold standard.
-        By default, the script tests every image in ../input
-        When the -f flag is set, this script only tests a single given image.
-        When the -l flag is set, the script looks for a configuration file,
-        which may outsource to a new input directory and to individual images.
-
-        Expected files:
-          An NSRL database at:          ../input/nsrl.txt-md5.idx
-          A notable hash database at:    ../input/notablehashes.txt-md5.idx
-          A notable keyword file at:      ../input/notablekeywords.xml
-
-Options:
-  -r            Rebuild the gold standards for the image(s) tested.
-  -i            Ignores the ../input directory and all files within it.
-  -u            Tells Autopsy not to ingest unallocated space.
-  -k            Keeps each image's Solr index instead of deleting it.
-  -v            Verbose mode; prints all errors to the screen.
-  -e ex      Prints out all errors containing ex.
-  -l cfg        Runs from configuration file cfg.
-  -c            Runs in a loop over the configuration file until canceled. Must be used in conjunction with -l
-  -fr           Will not try download gold standard images
-    """
-
 #------------------------------------------------------------#
 # Exception classes to manage "acceptable" thrown exceptions #
 #         versus unexpected and fatal exceptions            #
@@ -2107,22 +1872,22 @@ class TestRunner(object):
         # Delete the current gold standards
         gold_dir = test_config.img_gold
         clear_dir(test_config.img_gold)
-        tmpdir = Emailer.make_path(gold_dir, test_data.image_name)
+        tmpdir = make_path(gold_dir, test_data.image_name)
         dbinpth = test_data.get_db_path(DBType.OUTPUT)
-        dboutpth = Emailer.make_path(tmpdir, DB_FILENAME)
-        dataoutpth = Emailer.make_path(tmpdir, test_data.image_name + "SortedData.txt")
+        dboutpth = make_path(tmpdir, DB_FILENAME)
+        dataoutpth = make_path(tmpdir, test_data.image_name + "SortedData.txt")
         dbdumpinpth = test_data.get_db_dump_path(DBType.OUTPUT)
-        dbdumpoutpth = Emailer.make_path(tmpdir, test_data.image_name + "DBDump.txt")
+        dbdumpoutpth = make_path(tmpdir, test_data.image_name + "DBDump.txt")
         if not os.path.exists(test_config.img_gold):
             os.makedirs(test_config.img_gold)
         if not os.path.exists(tmpdir):
             os.makedirs(tmpdir)
         try:
             copy_file(dbinpth, dboutpth)
-            if Emailer.file_exists(test_data.get_sorted_data_path(DBType.OUTPUT)):
+            if file_exists(test_data.get_sorted_data_path(DBType.OUTPUT)):
                 copy_file(test_data.get_sorted_data_path(DBType.OUTPUT), dataoutpth)
             copy_file(dbdumpinpth, dbdumpoutpth)
-            error_pth = Emailer.make_path(tmpdir, test_data.image_name+"SortedErrors.txt")
+            error_pth = make_path(tmpdir, test_data.image_name+"SortedErrors.txt")
             copy_file(test_data.sorted_log, error_pth)
         except Exception as e:
             printerror(test_data, str(e))
@@ -2130,7 +1895,7 @@ class TestRunner(object):
             print(traceback.format_exc())
         # Rebuild the HTML report
         output_html_report_dir = test_data.get_html_report_path(DBType.OUTPUT)
-        gold_html_report_dir = Emailer.make_path(tmpdir, "Report")
+        gold_html_report_dir = make_path(tmpdir, "Report")
 
         try:
             copy_dir(output_html_report_dir, gold_html_report_dir)
@@ -2145,7 +1910,7 @@ class TestRunner(object):
         os.chdir(zpdir)
         os.chdir("..")
         img_gold = "tmp"
-        img_archive = Emailer.make_path(test_data.image_name+"-archive.zip")
+        img_archive = make_path(test_data.image_name+"-archive.zip")
         comprssr = zipfile.ZipFile(img_archive, 'w',compression=zipfile.ZIP_DEFLATED)
         TestRunner.zipdir(img_gold, comprssr)
         comprssr.close()
@@ -2169,7 +1934,7 @@ class TestRunner(object):
         """
         # Set up the directories
         test_config_path = os.path.join(test_config.output_dir, test_data.image_name)
-        if Emailer.dir_exists(test_config_path):
+        if dir_exists(test_config_path):
             shutil.rmtree(test_config_path)
         os.makedirs(test_config_path)
         test_config.ant = ["ant"]
@@ -2186,14 +1951,14 @@ class TestRunner(object):
         test_config.ant.append("-Dnsrl_path=" + test_config.nsrl_path)
         test_config.ant.append("-Dgold_path=" + test_config.gold)
         test_config.ant.append("-Dout_path=" +
-        Emailer.make_local_path(test_data.output_path))
+        make_local_path(test_data.output_path))
         test_config.ant.append("-Dignore_unalloc=" + "%s" % test_config.args.unallocated)
         test_config.ant.append("-Dtest.timeout=" + str(test_config.timeout))
 
         printout(test_data, "Ingesting Image:\n" + test_data.image_file + "\n")
         printout(test_data, "CMD: " + " ".join(test_config.ant))
         printout(test_data, "Starting test...\n")
-        antoutpth = Emailer.make_local_path(test_config.output_dir, "antRunOutput.txt")
+        antoutpth = make_local_path(test_config.output_dir, "antRunOutput.txt")
         antout = open(antoutpth, "a")
         if SYS is OS.CYGWIN:
             subprocess.call(test_config.ant, stdout=subprocess.PIPE)
@@ -2202,6 +1967,139 @@ class TestRunner(object):
             theproc.communicate()
         antout.close()
 
+####
+# Helper Functions
+####
+def search_logs(string, test_data):
+    """Search through all the known log files for a given string.
+
+    Args:
+        string: the String to search for.
+        test_data: the TestData that holds the logs to search.
+
+    Returns:
+        a listof_String, the lines that contained the given String.
+    """
+    logs_path = test_data.logs_dir
+    results = []
+    for file in os.listdir(logs_path):
+        log = codecs.open(make_path(logs_path, file), "r", "utf_8")
+        for line in log:
+            if string in line:
+                results.append(line)
+        log.close()
+    return results
+
+def search_log(log, string, test_data):
+    """Search the given log for any instances of a given string.
+
+    Args:
+        log: a pathto_File, the log to search in
+        string: the String to search for.
+        test_data: the TestData that holds the log to search.
+
+    Returns:
+        a listof_String, all the lines that the string is found on
+    """
+    logs_path = make_path(test_data.logs_dir, log)
+    try:
+        results = []
+        log = codecs.open(logs_path, "r", "utf_8")
+        for line in log:
+            if string in line:
+                results.append(line)
+        log.close()
+        if results:
+            return results
+    except:
+        raise FileNotFoundException(logs_path)
+
+# Search through all the the logs of the given type
+# Types include autopsy, tika, and solr
+def search_log_set(type, string, test_data):
+    """Search through all logs to the given type for the given string.
+
+    Args:
+        type: the type of log to search in.
+        string: the String to search for.
+        test_data: the TestData containing the logs to search.
+
+    Returns:
+        a listof_String, the lines on which the String was found.
+    """
+    logs_path = test_data.logs_dir
+    results = []
+    for file in os.listdir(logs_path):
+        if type in file:
+            log = codecs.open(make_path(logs_path, file), "r", "utf_8")
+            for line in log:
+                if string in line:
+                    results.append(line)
+            log.close()
+    return results
+
+
+def clear_dir(dir):
+    """Clears all files from a directory and remakes it."""
+    try:
+        if dir_exists(dir):
+            shutil.rmtree(dir)
+        os.makedirs(dir)
+        return True;
+    except Exception as e:
+        printerror(test_data,"Error: Cannot clear the given directory:")
+        printerror(test_data,dir + "\n")
+        print(str(e))
+        return False;
+
+def del_dir(dir):
+    try:
+        if dir_exists(dir):
+            shutil.rmtree(dir)
+        return True;
+    except:
+        printerror(test_data,"Error: Cannot delete the given directory:")
+        printerror(test_data,dir + "\n")
+        return False;
+
+def copy_file(ffrom, to):
+    """Copies a given file from "ffrom" to "to"."""
+    try :
+        shutil.copy(ffrom, to)
+    except Exception as e:
+        print(str(e))
+        print(traceback.format_exc())
+
+def copy_dir(ffrom, to):
+    """Copies a directory file from "ffrom" to "to"."""
+    try :
+        if not os.path.isdir(ffrom):
+            raise FileNotFoundException(ffrom)
+        shutil.copytree(ffrom, to)
+    except:
+        raise FileNotFoundException(to)
+
+def get_file_in_dir(dir, ext):
+    """Returns the first file in the given directory with the given extension."""
+    try:
+        for file in os.listdir(dir):
+            if file.endswith(ext):
+                return make_path(dir, file)
+        # If nothing has been found, raise an exception
+        raise FileNotFoundException(dir)
+    except:
+        raise DirNotFoundException(dir)
+
+def find_file_in_dir(dir, name, ext):
+    try:
+        for file in os.listdir(dir):
+            if file.startswith(name):
+                if file.endswith(ext):
+                    return make_path(dir, file)
+        raise FileNotFoundException(dir)
+    except:
+        raise DirNotFoundException(dir)
+
 #----------------------#
 #        Main          #
 #----------------------#
diff --git a/test/script/regression_utils.py b/test/script/regression_utils.py
new file mode 100644
index 0000000000..cf3c117df4
--- /dev/null
+++ b/test/script/regression_utils.py
@@ -0,0 +1,154 @@
+import os
+import sys
+import subprocess
+from time import localtime, strftime
+import traceback
+
+# Returns a Windows style path starting with the cwd and
+# ending with the list of directories given
+def make_local_path(*dirs):
+	path = wgetcwd().decode("utf-8")
+	for dir in dirs:
+		path += ("\\" + str(dir))
+	return path_fix(path)
+
+# Returns a Windows style path based only off the given directories
+def make_path(*dirs):
+	path = dirs[0]
+	for dir in dirs[1:]:
+		path += ("\\" + str(dir))
+	return path_fix(path)
+
+# Fix a standard os.path by making it Windows format
+def path_fix(path):
+	return path.replace("/", "\\")
+
+# Gets the true current working directory instead of Cygwin's
+def wgetcwd():
+	proc = subprocess.Popen(("cygpath", "-m", os.getcwd()), stdout=subprocess.PIPE)
+	out,err = proc.communicate()
+	tst = out.rstrip()
+	if os.getcwd == tst:
+		return os.getcwd
+	else:
+		proc = subprocess.Popen(("cygpath", "-m", os.getcwd()), stdout=subprocess.PIPE)
+		out,err = proc.communicate()
+		return out.rstrip()
+# Verifies a file's existance
+def file_exists(file):
+	try:
+		if os.path.exists(file):
+			return os.path.isfile(file)
+	except:
+		return False
+
+# Verifies a directory's existance
+def dir_exists(dir):
+	try:
+		return os.path.exists(dir)
+	except:
+		return False
+
+
+
+# Returns the nth word in the given string or "" if n is out of bounds
+# n starts at 0 for the first word
+def get_word_at(string, n):
+	words = string.split(" ")
+	if len(words) >= n:
+		return words[n]
+	else:
+		return ""
+
+# Returns true if the given file is one of the required input files
+# for ingest testing
+def required_input_file(name):
+	if ((name == "notablehashes.txt-md5.idx") or
+	   (name == "notablekeywords.xml") or
+	   (name == "nsrl.txt-md5.idx")):
+	   return True
+	else:
+		return False
+
+def image_type(image_file):
+    ext_start = image_file.rfind(".")
+    if (ext_start == -1):
+        return IMGTYPE.UNKNOWN
+    ext = image_file[ext_start:].lower()
+    if (ext == ".img" or ext == ".dd"):
+        return IMGTYPE.RAW
+    elif (ext == ".e01"):
+        return IMGTYPE.ENCASE
+    elif (ext == ".aa" or ext == ".001"):
+        return IMGTYPE.SPLIT
+    else:
+        return IMGTYPE.UNKNOWN
+
+# Returns the type of image file, based off extension
+class IMGTYPE:
+    RAW, ENCASE, SPLIT, UNKNOWN = range(4)
+
+def get_image_name(image_file):
+    path_end = image_file.rfind("/")
+    path_end2 = image_file.rfind("\\")
+    ext_start = image_file.rfind(".")
+    if(ext_start == -1):
+        name = image_file
+    if(path_end2 != -1):
+        name = image_file[path_end2+1:ext_start]
+    elif(ext_start == -1):
+        name = image_file[path_end+1:]
+    elif(path_end == -1):
+        name = image_file[:ext_start]
+    elif(path_end!=-1 and ext_start!=-1):
+        name = image_file[path_end+1:ext_start]
+    else:
+        name = image_file[path_end2+1:ext_start]
+    return name
+
+def usage():
+    """Return the usage description of the test script."""
+    return """
+Usage:  ./regression.py [-f FILE] [OPTIONS]
+
+        Run RegressionTest.java, and compare the result with a gold standard.
+        By default, the script tests every image in ../input
+        When the -f flag is set, this script only tests a single given image.
+        When the -l flag is set, the script looks for a configuration file,
+        which may outsource to a new input directory and to individual images.
+
+        Expected files:
+          An NSRL database at:          ../input/nsrl.txt-md5.idx
+          A notable hash database at:    ../input/notablehashes.txt-md5.idx
+          A notable keyword file at:      ../input/notablekeywords.xml
+
+Options:
+  -r            Rebuild the gold standards for the image(s) tested.
+  -i            Ignores the ../input directory and all files within it.
+  -u            Tells Autopsy not to ingest unallocated space.
+  -k            Keeps each image's Solr index instead of deleting it.
+  -v            Verbose mode; prints all errors to the screen.
+  -e ex      Prints out all errors containing ex.
+  -l cfg        Runs from configuration file cfg.
+  -c            Runs in a loop over the configuration file until canceled. Must be used in conjunction with -l
+  -fr           Will not try download gold standard images
+    """
+
+#####
+# Enumeration definition (python 3.2 doesn't have enumerations, this is a common solution
+# that allows you to access a named enum in a Java-like style, i.e. Numbers.ONE)
+#####
+def enum(*seq, **named):
+    enums = dict(zip(seq, range(len(seq))), **named)
+    return type('Enum', (), enums)
+
+
+def get_files_by_ext(dir_path, ext):
+    """Get a list of all the files with a given extenstion in the directory.
+
+    Args:
+        dir: a pathto_Dir, the directory to search.
+        ext: a String, the extension to search for. i.e. ".html"
+    """
+    return [ os.path.join(dir_path, file) for file in os.listdir(dir_path) if
+    file.endswith(ext) ]

From d87b0972b1ff4ad873d6ff35cb891317bd7f77c2 Mon Sep 17 00:00:00 2001
From: Jeff Wallace <jwallace@basistech.com>
Date: Mon, 15 Jul 2013 12:30:08 -0400
Subject: [PATCH 03/13] Moved error reporting to a central class

---
 test/script/regression.py | 234 ++++++++++++++++++++------------------
 1 file changed, 124 insertions(+), 110 deletions(-)

diff --git a/test/script/regression.py b/test/script/regression.py
index b6a802c0d2..158fbf1fbd 100644
--- a/test/script/regression.py
+++ b/test/script/regression.py
@@ -285,20 +285,20 @@ class TestConfiguration(object):
         # If user wants to do a single file and a list (contradictory?)
         if self.args.single and self.args.list:
             msg = "Cannot run both from config file and on a single file."
-            self._print_error(msg)
+            Errors.add_email_msg(msg)
             return
         # If working from a configuration file
         if self.args.list:
            if not file_exists(self.args.config_file):
                msg = "Configuration file does not exist at:" + self.args.config_file
-               self._print_error(msg)
+               Errors.add_email_msg(msg)
                return
            self._load_config_file(self.args.config_file)
         # Else if working on a single file
         elif self.args.single:
            if not file_exists(self.args.single_file):
                msg = "Image file does not exist at: " + self.args.single_file
-               self._print_error(msg)
+               Errors.add_email_msg(msg)
                return
            test_config.images.append(self.args.single_file)
 
@@ -308,7 +308,7 @@ class TestConfiguration(object):
            self.args.config_file = "config.xml"
            if not file_exists(self.args.config_file):
                msg = "Configuration file does not exist at: " + self.args.config_file
-               self._print_error(msg)
+               Errors.add_email_msg(msg)
                return
            self._load_config_file(self.args.config_file)
 
@@ -353,7 +353,6 @@ class TestConfiguration(object):
         """
         try:
             global parsed
-            global errorem
             global attachl
             count = 0
             parsed = parse(config_file)
@@ -377,7 +376,7 @@ class TestConfiguration(object):
                     self.images.append(value)
                 else:
                     msg = "File: " + value + " doesn't exist"
-                    self._print_error(msg)
+                    Errors.add_email_msg(msg)
             image_count = len(images)
 
             # Sanity check to see if there are obvious gold images that we are not testing
@@ -394,21 +393,10 @@ class TestConfiguration(object):
         except Exception as e:
             msg = "There was an error running with the configuration file.\n"
             msg += "\t" + str(e)
-            self._print_error(msg)
+            Errors.add_email_msg(msg)
             logging.critical(traceback.format_exc())
             print(traceback.format_exc())
 
-    def _print_error(self, msg):
-        """Append the given error message to the global error message and print the message to the screen.
-
-        Args:
-            msg: String - the error message to print
-        """
-        global errorem
-        error_msg = "Configuration: " + msg
-        print(error_msg)
-        errorem += error_msg + "\n"
-
 class TskDbDiff(object):
     """Represents the differences between the gold and output databases.
 
@@ -492,12 +480,12 @@ class TskDbDiff(object):
         exceptions = []
         try:
             global failedbool
-            global errorem
             if self.gold_artifacts != self.autopsy_artifacts:
                 failedbool = True
                 global imgfail
                 imgfail = True
-                errorem += self.test_data.image + ":There was a difference in the number of artifacts.\n"
+                msg = "There was a difference in the number of artifacts.\n"
+                Errors.add_email_msg(msg)
             rner = len(self.gold_artifacts)
             for type_id in range(1, rner):
                 if self.gold_artifacts[type_id] != self.autopsy_artifacts[type_id]:
@@ -521,11 +509,11 @@ class TskDbDiff(object):
                 error += str("Gold: %d, Test: %d" % (self.gold_attributes, self.autopsy_attributes))
                 exceptions.append(error)
                 global failedbool
-                global errorem
                 failedbool = True
                 global imgfail
                 imgfail = True
-                errorem += self.test_data.image + ":There was a difference in the number of attributes.\n"
+                msg = "There was a difference in the number of attributes.\n"
+                Errors.add_email_msg(msg)
                 return exceptions
         except Exception as e:
             exceptions.append("Error: Unable to compare blackboard_attributes.\n")
@@ -540,11 +528,11 @@ class TskDbDiff(object):
                 error += str("Gold: %d, Test: %d" % (self.gold_objects, self.autopsy_objects))
                 exceptions.append(error)
                 global failedbool
-                global errorem
                 failedbool = True
                 global imgfail
                 imgfail = True
-                errorem += self.test_data.image + ":There was a difference between the tsk object counts.\n"
+                msg ="There was a difference between the tsk object counts.\n"
+                Errors.add_email_msg(msg)
                 return exceptions
         except Exception as e:
             exceptions.append("Error: Unable to compare tsk_objects.\n")
@@ -617,9 +605,9 @@ class TskDbDiff(object):
         self.attribute_comparison = exceptions[2]
 
         okay = "All counts match."
-        print_report(self.test_data, exceptions[0], "COMPARE TSK OBJECTS", okay)
-        print_report(self.test_data, exceptions[1], "COMPARE ARTIFACTS", okay)
-        print_report(self.test_data, exceptions[2], "COMPARE ATTRIBUTES", okay)
+        print_report(exceptions[0], "COMPARE TSK OBJECTS", okay)
+        print_report(exceptions[1], "COMPARE ARTIFACTS", okay)
+        print_report(exceptions[2], "COMPARE ATTRIBUTES", okay)
 
         return DiffResults(self)
 
@@ -635,7 +623,6 @@ class TskDbDiff(object):
             test_data: the TestData that corresponds with this dump.
         """
         autopsy_cur2 = autopsy_con.cursor()
-        global errorem
         global attachl
         global failedbool
         # Get the list of all artifacts
@@ -665,10 +652,11 @@ class TskDbDiff(object):
                     autopsy_cur1.execute("SELECT blackboard_attributes.source, blackboard_attribute_types.display_name, blackboard_attributes.value_type, blackboard_attributes.value_text, blackboard_attributes.value_int32, blackboard_attributes.value_int64, blackboard_attributes.value_double FROM blackboard_attributes INNER JOIN blackboard_attribute_types ON blackboard_attributes.attribute_type_id = blackboard_attribute_types.attribute_type_id WHERE artifact_id =? ORDER BY blackboard_attributes.source, blackboard_attribute_types.display_name, blackboard_attributes.value_type, blackboard_attributes.value_text, blackboard_attributes.value_int32, blackboard_attributes.value_int64, blackboard_attributes.value_double", key)
                     attributes = autopsy_cur1.fetchall()
                 except Exception as e:
-                    printerror(test_data, str(e))
-                    printerror(test_data, str(rw[3]))
+                    Errors.print_error(str(e))
+                    Errors.print_error(str(rw[3]))
                     print(test_data.image_name)
-                    errorem += test_data.image_name + ":Attributes in artifact id (in output DB)# " + str(rw[3]) + " encountered an error: " + str(e) +" .\n"
+                    msg ="Attributes in artifact id (in output DB)# " + str(rw[3]) + " encountered an error: " + str(e) +" .\n"
+                    Errors.add_email_msg(msg)
                     looptry = False
                     print(test_data.artifact_fail)
                     test_data.artifact_fail += 1
@@ -685,15 +673,17 @@ class TskDbDiff(object):
                             if(attr[x] != None):
                                 numvals += 1
                         if(numvals > 1):
-                            errorem += test_data.image_name + ":There were too many values for attribute type: " + attr[1] + " for artifact with id #" + str(rw[3]) + ".\n"
-                            printerror(test_data, "There were too many values for attribute type: " + attr[1] + " for artifact with id #" + str(rw[3]) + " for image " + test_data.image_name + ".")
+                            msg = "There were too many values for attribute type: " + attr[1] + " for artifact with id #" + str(rw[3]) + ".\n"
+                            Errors.add_email_msg(msg)
+                            Errors.print_error(msg)
                             failedbool = True
                             if(not appnd):
                                 attachl.append(autopsy_db_file)
                                 appnd = True
                         if(not attr[0] == src):
-                            errorem += test_data.image_name + ":There were inconsistent sources for artifact with id #" + str(rw[3]) + ".\n"
-                            printerror(test_data, "There were inconsistent sources for artifact with id #" + str(rw[3]) + " for image " + test_data.image_name + ".")
+                            msg ="There were inconsistent sources for artifact with id #" + str(rw[3]) + ".\n"
+                            Errors.add_email_msg(msg)
+                            Errors.print_error(msg)
                             failedbool = True
                             if(not appnd):
                                 attachl.append(autopsy_db_file)
@@ -708,9 +698,9 @@ class TskDbDiff(object):
                             try:
                                 database_log.write(inpval)
                             except Exception as e:
-                                printerror(test_data, "Inner exception" + outp)
+                                Errors.print_error("Inner exception" + outp)
                         except Exception as e:
-                                printerror(test_data, str(e))
+                                Errors.print_error(str(e))
                         database_log.write('" />')
                 database_log.write(' <artifact/>\n')
                 rw = autopsy_cur2.fetchone()
@@ -720,9 +710,10 @@ class TskDbDiff(object):
             subprocess.call(srtcmdlst)
             print(test_data.artifact_fail)
             if(test_data.artifact_fail > 0):
-                errorem += test_data.image_name + ":There were " + str(test_data.artifact_count) + " artifacts and " + str(test_data.artifact_fail) + " threw an exception while loading.\n"
+                msg ="There were " + str(test_data.artifact_count) + " artifacts and " + str(test_data.artifact_fail) + " threw an exception while loading.\n"
+                Errors.add_email_msg(msg)
         except Exception as e:
-            printerror(test_data, 'outer exception: ' + str(e))
+            Errors.print_error('outer exception: ' + str(e))
 
     def _dump_output_db_nonbb(test_data):
         """Dumps a database to a text file.
@@ -749,9 +740,9 @@ class TskDbDiff(object):
                 try:
                     database_log.write(line + "\n")
                 except Exception as e:
-                    printerror(test_data, "dump_output_db_nonbb: Inner dump Exception:" + str(e))
+                    Errors.print_error("dump_output_db_nonbb: Inner dump Exception:" + str(e))
         except Exception as e:
-            printerror(test_data, "dump_output_db_nonbb: Outer dump Exception:" + str(e))
+            Errors.print_error("dump_output_db_nonbb: Outer dump Exception:" + str(e))
 
 
     def dump_output_db(test_data):
@@ -803,7 +794,6 @@ class DiffResults(object):
             return "All counts matched"
         else:
             global failedbool
-            global errorem
             failedbool = True
             global imgfail
             imgfail = True
@@ -813,7 +803,6 @@ class DiffResults(object):
         if not self.attribute_comp:
             return "All counts matched"
         global failedbool
-        global errorem
         failedbool = True
         global imgfail
         imgfail = True
@@ -869,8 +858,8 @@ class TestResultsDiffer(object):
             del_dir(test_data.gold_data_dir)
 
         except Exception as e:
-            printerror(test_data, "Tests failed due to an error, try rebuilding or creating gold standards.\n")
-            printerror(test_data, str(e) + "\n")
+            Errors.print_error("Tests failed due to an error, try rebuilding or creating gold standards.\n")
+            Errors.print_error(str(e) + "\n")
             print(traceback.format_exc())
 
 
@@ -897,20 +886,18 @@ class TestResultsDiffer(object):
             gold_data = process(gold_data)
 
         if (not(gold_data == output_data)):
-            filename = os.path.basename(output_file)
-            diff_path = os.path.join(test_data.output_path, filename +
-            "-Diff.txt")
+            diff_path = os.path.splitext(os.path.basename(output_file))[0]
+            diff_path += "-Diff.txt"
             diff_file = codecs.open(diff_path, "wb", "utf_8")
             dffcmdlst = ["diff", output_file, gold_file]
             subprocess.call(dffcmdlst, stdout = diff_file)
             global attachl
-            global errorem
             global failedbool
-            attachl.append(diff_dir)
+            attachl.append(diff_path)
             msg = test_data.image_name + ":There was a difference in "
             msg += os.path.basename(output_file) + ".\n"
-            errorem += msg
-            printerror(test_data, msg)
+            Errors.add_email_msg(msg)
+            Errors.print_error(msg)
             failedbool = True
             global imgfail
             imgfail = True
@@ -932,7 +919,7 @@ class TestResultsDiffer(object):
             if(len(gold_html_files) != len(output_html_files)):
                 msg = "The reports did not have the same number or files."
                 msg += "One of the reports may have been corrupted."
-                printerror(test_data, msg)
+                Errors.print_error(msg)
             else:
                 gold_html_files.sort()
                 output_html_files.sort()
@@ -945,18 +932,18 @@ class TestResultsDiffer(object):
 
             okay = "The test report matches the gold report."
             errors=["Gold report had " + str(total["Gold"]) +" errors", "New report had " + str(total["New"]) + " errors."]
-            print_report(test_data, errors, "REPORT COMPARISON", okay)
+            print_report(errors, "REPORT COMPARISON", okay)
 
             if total["Gold"] == total["New"]:
                 test_data.report_passed = True
             else:
-                printerror(test_data, "The reports did not match each other.\n " + errors[0] +" and the " + errors[1])
+                Errors.print_error("The reports did not match each other.\n " + errors[0] +" and the " + errors[1])
 
         except DirNotFoundException as e:
             e.print_error()
         except Exception as e:
-            printerror(test_data, "Error: Unknown fatal error comparing reports.")
-            printerror(test_data, str(e) + "\n")
+            Errors.print_error("Error: Unknown fatal error comparing reports.")
+            Errors.print_error(str(e) + "\n")
             logging.critical(traceback.format_exc())
 
     def _compare_report_files(a_path, b_path):
@@ -1272,9 +1259,9 @@ class Reports(object):
             html.write(output)
             html.close()
         except Exception as e:
-            printerror(test_data, "Error: Unknown fatal error when creating HTML log at:")
-            printerror(test_data, test_config.html_log)
-            printerror(test_data, str(e) + "\n")
+            Errors.print_error("Error: Unknown fatal error when creating HTML log at:")
+            Errors.print_error(test_config.html_log)
+            Errors.print_error(str(e) + "\n")
             logging.critical(traceback.format_exc())
 
     def write_html_head():
@@ -1378,9 +1365,9 @@ class Reports(object):
             csv.write(output)
             csv.close()
         except Exception as e:
-            printerror(test_data, "Error: Unknown fatal error when creating CSV file at:")
-            printerror(test_data, csv_path)
-            printerror(test_data, str(e) + "\n")
+            Errors.print_error("Error: Unknown fatal error when creating CSV file at:")
+            Errors.print_error(csv_path)
+            Errors.print_error(str(e) + "\n")
             print(traceback.format_exc())
             logging.critical(traceback.format_exc())
 
@@ -1439,14 +1426,14 @@ class Logs(object):
         try:
             Logs._fill_test_config_data(test_data)
         except Exception as e:
-            printerror(test_data, "Error: Unknown fatal error when filling test_config data.")
-            printerror(test_data, str(e) + "\n")
+            Errors.print_error("Error: Unknown fatal error when filling test_config data.")
+            Errors.print_error(str(e) + "\n")
             logging.critical(traceback.format_exc())
         # If running in verbose mode (-v)
         if test_config.args.verbose:
             errors = Logs._report_all_errors()
             okay = "No warnings or errors in any log files."
-            print_report(test_data, errors, "VERBOSE", okay)
+            print_report(errors, "VERBOSE", okay)
     # Generate the "common log": a log of all exceptions and warnings
     # from each log file generated by Autopsy
     def _generate_common_log(test_data):
@@ -1478,9 +1465,9 @@ class Logs(object):
             srtcmdlst = ["sort", test_data.common_log_path, "-o", test_data.sorted_log]
             subprocess.call(srtcmdlst)
         except Exception as e:
-            printerror(test_data, "Error: Unable to generate the common log.")
-            printerror(test_data, str(e) + "\n")
-            printerror(test_data, traceback.format_exc())
+            Errors.print_error("Error: Unable to generate the common log.")
+            Errors.print_error(str(e) + "\n")
+            Errors.print_error(traceback.format_exc())
             logging.critical(traceback.format_exc())
 
     def _fill_test_config_data(test_data):
@@ -1497,8 +1484,8 @@ class Logs(object):
             # Set the test_config ending time based off the "create" time (when the file was copied)
             test_data.end_date = time.ctime(os.path.getmtime(log_path))
         except Exception as e:
-            printerror(test_data, "Error: Unable to open autopsy.log.0.")
-            printerror(test_data, str(e) + "\n")
+            Errors.print_error("Error: Unable to open autopsy.log.0.")
+            Errors.print_error(str(e) + "\n")
             logging.warning(traceback.format_exc())
         # Set the test_config total test time
         # Start date must look like: "Jul 16, 2012 12:57:53 PM"
@@ -1528,8 +1515,8 @@ class Logs(object):
             chunks_line = search_log_set("autopsy", "Indexed file chunks count:", test_data)[0]
             test_config.indexed_chunks = int(chunks_line.rstrip().split(": ")[2])
         except Exception as e:
-            printerror(test_data, "Error: Unable to find the required information to fill test_config data.")
-            printerror(test_data, str(e) + "\n")
+            Errors.print_error("Error: Unable to find the required information to fill test_config data.")
+            Errors.print_error(str(e) + "\n")
             logging.critical(traceback.format_exc())
             print(traceback.format_exc())
         try:
@@ -1548,8 +1535,8 @@ class Logs(object):
                 service_list.append(times)
             test_data.service_times = "; ".join(service_list)
         except Exception as e:
-            printerror(test_data, "Error: Unknown fatal error when finding service times.")
-            printerror(test_data, str(e) + "\n")
+            Errors.print_error("Error: Unknown fatal error when finding service times.")
+            Errors.print_error(str(e) + "\n")
             logging.critical(traceback.format_exc())
 
     def _report_all_errors():
@@ -1561,8 +1548,8 @@ class Logs(object):
         try:
             return get_warnings() + get_exceptions()
         except Exception as e:
-            printerror(test_data, "Error: Unknown fatal error when reporting all errors.")
-            printerror(test_data, str(e) + "\n")
+            Errors.print_error("Error: Unknown fatal error when reporting all errors.")
+            Errors.print_error(str(e) + "\n")
             logging.warning(traceback.format_exc())
 
     def search_common_log(string, test_data):
@@ -1584,32 +1571,31 @@ class Logs(object):
         return results
 
 
-def print_report(test_data, errors, name, okay):
+def print_report(errors, name, okay):
     """Print a report with the specified information.
 
     Args:
-        test_data: the TestData to report about.
         errors: a listof_String, the errors to report.
         name: a String, the name of the report.
         okay: the String to print when there are no errors.
     """
     if errors:
-        printerror(test_data, "--------< " + name + " >----------")
+        Errors.print_error("--------< " + name + " >----------")
         for error in errors:
-            printerror(test_data, str(error))
-        printerror(test_data, "--------< / " + name + " >--------\n")
+            Errors.print_error(str(error))
+        Errors.print_error("--------< / " + name + " >--------\n")
     else:
-        printout(test_data, "-----------------------------------------------------------------")
-        printout(test_data, "< " + name + " - " + okay + " />")
-        printout(test_data, "-----------------------------------------------------------------\n")
+        Errors.print_out("-----------------------------------------------------------------")
+        Errors.print_out("< " + name + " - " + okay + " />")
+        Errors.print_out("-----------------------------------------------------------------\n")
 
 # Used instead of the print command when printing out an error
-def printerror(test_data, string):
+def print_error(string):
     print(string)
     test_data.printerror.append(string)
 
 # Used instead of the print command when printing out anything besides errors
-def printout(test_data, string):
+def print_out(string):
     print(string)
     test_data.printout.append(string)
 
@@ -1701,8 +1687,8 @@ class DirNotFoundException(Exception):
         self.strerror = "DirNotFoundException: " + dir
 
     def print_error(self):
-        printerror(test_data, "Error: Directory could not be found at:")
-        printerror(test_data, self.dir + "\n")
+        Errors.print_error("Error: Directory could not be found at:")
+        Errors.print_error(self.dir + "\n")
     def error(self):
         error = "Error: Directory could not be found at:\n" + self.dir + "\n"
         return error
@@ -1719,7 +1705,6 @@ class TestRunner(object):
         the mode (rebuild or testing)
         """
         global parsed
-        global errorem
         global failedbool
         global html
         global attachl
@@ -1730,11 +1715,13 @@ class TestRunner(object):
 
         logres =[]
         for test_data in test_data_list:
+            Errors.clear_print_logs()
+            Errors.set_testing_phase(test_data.image)
             if not (test_config.args.rebuild or
                 os.path.exists(test_data.gold_archive)):
                 msg = "Gold standard doesn't exist, skipping image:"
-                printerror(test_data, msg)
-                printerror(test_data, test_data.gold_archive)
+                Errors.print_error(msg)
+                Errors.print_error(test_data.gold_archive)
                 continue
             TestRunner._run_autopsy_ingest(test_data)
 
@@ -1742,6 +1729,8 @@ class TestRunner(object):
                 TestRunner.rebuild(test_data)
             else:
                 logres.append(TestRunner._run_test(test_data))
+            test_data.printout = Errors.printout
+            test_data.printerror = Errors.printerror
 
         Reports.write_html_foot()
         if (len(logres)>0):
@@ -1750,24 +1739,25 @@ class TestRunner(object):
             passFail = False
             for lm in logres:
                 for ln in lm:
-                    errorem += ln
+                    Errors.add_email_msg(ln)
         if failedbool:
             passFail = False
-            errorem += "The test output didn't match the gold standard.\n"
-            errorem += "Autopsy test failed.\n"
+            msg = "The test output didn't match the gold standard.\n"
+            msg += "autopsy test failed.\n"
+            Errors.add_email_msg(msg)
             html = open(test_config.html_log)
             attachl.insert(0, html.name)
             html.close()
         else:
-            errorem += "Autopsy test passed.\n"
+            Errors.add_email_msg("Autopsy test passed.\n")
             passFail = True
             attachl = []
 
         # @@@ This fails here if we didn't parse an XML file
         try:
-            Emailer.send_email(parsed, errorem, attachl, passFail)
+            Emailer.send_email(parsed, Errors.email_body, attachl, passFail)
         except NameError:
-            printerror(test_data, "Could not send e-mail because of no XML file --maybe");
+            Errors.print_error("Could not send e-mail because of no XML file --maybe");
 
     def _run_autopsy_ingest(test_data):
         """Run Autopsy ingest for the image in the given TestData.
@@ -1782,8 +1772,8 @@ class TestRunner(object):
         global failedbool
         imgfail = False
         if image_type(test_data.image_file) == IMGTYPE.UNKNOWN:
-            printerror(test_data, "Error: Image type is unrecognized:")
-            printerror(test_data, test_data.image_file + "\n")
+            Errors.print_error("Error: Image type is unrecognized:")
+            Errors.print_error(test_data.image_file + "\n")
             return
 
         logging.debug("--------------------")
@@ -1847,9 +1837,9 @@ class TestRunner(object):
         """
         if not test_config.args.keep:
             if clear_dir(test_data.solr_index):
-                print_report(test_data, [], "DELETE SOLR INDEX", "Solr index deleted.")
+                print_report([], "DELETE SOLR INDEX", "Solr index deleted.")
         else:
-            print_report(test_data, [], "KEEP SOLR INDEX", "Solr index has been kept.")
+            print_report([], "KEEP SOLR INDEX", "Solr index has been kept.")
 
     def _handle_exception(test_data):
         """If running in exception mode, print exceptions to log.
@@ -1860,7 +1850,7 @@ class TestRunner(object):
         if test_config.args.exception:
             exceptions = search_logs(test_config.args.exception_string, test_data)
             okay = "No warnings or exceptions found containing text '" + test_config.args.exception_string + "'."
-            print_report(test_data, exceptions, "EXCEPTION", okay)
+            print_report(exceptions, "EXCEPTION", okay)
 
     def rebuild(test_data):
         """Rebuild the gold standard with the given TestData.
@@ -1890,7 +1880,7 @@ class TestRunner(object):
             error_pth = make_path(tmpdir, test_data.image_name+"SortedErrors.txt")
             copy_file(test_data.sorted_log, error_pth)
         except Exception as e:
-            printerror(test_data, str(e))
+            Errors.print_error(str(e))
             print(str(e))
             print(traceback.format_exc())
         # Rebuild the HTML report
@@ -1917,7 +1907,7 @@ class TestRunner(object):
         os.chdir(oldcwd)
         del_dir(test_config.img_gold)
         okay = "Sucessfully rebuilt all gold standards."
-        print_report(test_data, errors, "REBUILDING", okay)
+        print_report(errors, "REBUILDING", okay)
 
     def zipdir(path, zip):
         for root, dirs, files in os.walk(path):
@@ -1955,9 +1945,9 @@ class TestRunner(object):
         test_config.ant.append("-Dignore_unalloc=" + "%s" % test_config.args.unallocated)
         test_config.ant.append("-Dtest.timeout=" + str(test_config.timeout))
 
-        printout(test_data, "Ingesting Image:\n" + test_data.image_file + "\n")
-        printout(test_data, "CMD: " + " ".join(test_config.ant))
-        printout(test_data, "Starting test...\n")
+        Errors.print_out("Ingesting Image:\n" + test_data.image_file + "\n")
+        Errors.print_out("CMD: " + " ".join(test_config.ant))
+        Errors.print_out("Starting test...\n")
         antoutpth = make_local_path(test_config.output_dir, "antRunOutput.txt")
         antout = open(antoutpth, "a")
         if SYS is OS.CYGWIN:
@@ -1967,6 +1957,32 @@ class TestRunner(object):
             theproc.communicate()
         antout.close()
 
+class Errors:
+    """
+    """
+    printout = []
+    printerror = []
+    email_body = ""
+    email_msg_prefix = "Configuration"
+
+    def set_testing_phase(image_name):
+        Errors.email_msg_prefix = image_name
+
+    def print_out(msg):
+        print(msg)
+        Errors.printout.append(msg)
+
+    def print_error(msg):
+        print(msg)
+        Errors.printerror.append(msg)
+
+    def clear_print_logs():
+        Errors.printout = []
+        Errors.printerror = []
+
+    def add_email_msg(msg):
+        Errors.email_body += Errors.email_msg_prefix + ":" + msg
+
 ####
 # Helper Functions
 ####
@@ -2107,10 +2123,8 @@ def main():
     # Global variables
     global failedbool
     global test_config
-    global errorem
     global attachl
     failedbool = False
-    errorem = ""
     args = Args()
     parse_result = args.parse()
     test_config = TestConfiguration(args)

From 3e1ef3712f58e722be216b350b7f2c25bc88b32b Mon Sep 17 00:00:00 2001
From: Jeff Wallace <jwallace@basistech.com>
Date: Mon, 15 Jul 2013 12:51:30 -0400
Subject: [PATCH 04/13] Email attachments are now stored in Errors class. Added
 documentation to Errors class.

---
 test/script/regression.py | 59 +++++++++++++++++++++++++++++----------
 1 file changed, 45 insertions(+), 14 deletions(-)

diff --git a/test/script/regression.py b/test/script/regression.py
index 158fbf1fbd..f2ecec355b 100644
--- a/test/script/regression.py
+++ b/test/script/regression.py
@@ -353,7 +353,6 @@ class TestConfiguration(object):
         """
         try:
             global parsed
-            global attachl
             count = 0
             parsed = parse(config_file)
             logres = []
@@ -623,7 +622,6 @@ class TskDbDiff(object):
             test_data: the TestData that corresponds with this dump.
         """
         autopsy_cur2 = autopsy_con.cursor()
-        global attachl
         global failedbool
         # Get the list of all artifacts
         # @@@ Could add a SORT by parent_path in here since that is how we are going to later sort it.
@@ -678,7 +676,7 @@ class TskDbDiff(object):
                             Errors.print_error(msg)
                             failedbool = True
                             if(not appnd):
-                                attachl.append(autopsy_db_file)
+                                Errors.add_email_attachment(autopsy_db_file)
                                 appnd = True
                         if(not attr[0] == src):
                             msg ="There were inconsistent sources for artifact with id #" + str(rw[3]) + ".\n"
@@ -686,7 +684,7 @@ class TskDbDiff(object):
                             Errors.print_error(msg)
                             failedbool = True
                             if(not appnd):
-                                attachl.append(autopsy_db_file)
+                                Errors.add_email_attachment(autopsy_db_file)
                                 appnd = True
                         try:
                             database_log.write('<attribute source="' + attr[0] + '" type="' + attr[1] + '" value="')
@@ -891,9 +889,8 @@ class TestResultsDiffer(object):
             diff_file = codecs.open(diff_path, "wb", "utf_8")
             dffcmdlst = ["diff", output_file, gold_file]
             subprocess.call(dffcmdlst, stdout = diff_file)
-            global attachl
             global failedbool
-            attachl.append(diff_path)
+            Errors.add_email_attachment(diff_path)
             msg = test_data.image_name + ":There was a difference in "
             msg += os.path.basename(output_file) + ".\n"
             Errors.add_email_msg(msg)
@@ -1707,7 +1704,6 @@ class TestRunner(object):
         global parsed
         global failedbool
         global html
-        global attachl
 
         test_data_list = [ TestData(image, test_config) for image in test_config.images ]
 
@@ -1746,16 +1742,15 @@ class TestRunner(object):
             msg += "autopsy test failed.\n"
             Errors.add_email_msg(msg)
             html = open(test_config.html_log)
-            attachl.insert(0, html.name)
+            Errors.add_email_attachment(html.name)
             html.close()
         else:
             Errors.add_email_msg("Autopsy test passed.\n")
             passFail = True
-            attachl = []
 
         # @@@ This fails here if we didn't parse an XML file
         try:
-            Emailer.send_email(parsed, Errors.email_body, attachl, passFail)
+            Emailer.send_email(parsed, Errors.email_body, Errors.email_attachs, passFail)
         except NameError:
             Errors.print_error("Could not send e-mail because of no XML file --maybe");
 
@@ -1815,7 +1810,7 @@ class TestRunner(object):
         Reports.generate_reports(test_config.csv, test_data)
         # Reset the test_config and return the tests sucessfully finished
         if(failedbool):
-            attachl.append(test_data.common_log_path)
+            Errors.add_email_attachment(test_data.common_log_path)
         return logres
 
     def _extract_gold(test_data):
@@ -1958,31 +1953,69 @@ class TestRunner(object):
         antout.close()
 
 class Errors:
-    """
+    """A class used to manage error reporting.
+
+    Attributes:
+        printout: a listof_String, the non-error messages that were printed
+        printerror: a listof_String, the error messages that were printed
+        email_body: a String, the body of the report email
+        email_msg_prefix: a String, the prefix for lines added to the email
+        email_attchs: a listof_pathto_File, the files to be attached to the
+        report email
     """
     printout = []
     printerror = []
     email_body = ""
     email_msg_prefix = "Configuration"
+    email_attachs = []
 
     def set_testing_phase(image_name):
+        """Change the email message prefix to be the given testing phase.
+
+        Args:
+            image_name: a String, representing the current image being tested
+        """
         Errors.email_msg_prefix = image_name
 
     def print_out(msg):
+        """Print out an informational message.
+
+        Args:
+            msg: a String, the message to be printed
+        """
         print(msg)
         Errors.printout.append(msg)
 
     def print_error(msg):
+        """Print out an error message.
+
+        Args:
+            msg: a String, the error message to be printed.
+        """
         print(msg)
         Errors.printerror.append(msg)
 
     def clear_print_logs():
+        """Reset the image-specific attributes of the Errors class."""
         Errors.printout = []
         Errors.printerror = []
 
     def add_email_msg(msg):
+        """Add the given message to the body of the report email.
+
+        Args:
+            msg: a String, the message to be added to the email
+        """
         Errors.email_body += Errors.email_msg_prefix + ":" + msg
 
+    def add_email_attachment(path):
+        """Add the given file to be an attachment for the report email
+
+        Args:
+            file: a pathto_File, the file to add
+        """
+        Errors.email_attachs.append(path)
+
 ####
 # Helper Functions
 ####
@@ -2123,12 +2156,10 @@ def main():
     # Global variables
     global failedbool
     global test_config
-    global attachl
     failedbool = False
     args = Args()
     parse_result = args.parse()
     test_config = TestConfiguration(args)
-    attachl = []
     # The arguments were given wrong:
     if not parse_result:
         test_config.reset()

From 151d35b8f20463ddd906f283e69bf2018a73a8fe Mon Sep 17 00:00:00 2001
From: Jeff Wallace <jwallace@basistech.com>
Date: Mon, 15 Jul 2013 13:18:57 -0400
Subject: [PATCH 05/13] Reorganized script. TskDbDiff no longer relies on
 TestData.

---
 test/script/regression.py | 1204 ++++++++++++++++++-------------------
 1 file changed, 600 insertions(+), 604 deletions(-)

diff --git a/test/script/regression.py b/test/script/regression.py
index f2ecec355b..2996ff5a0e 100644
--- a/test/script/regression.py
+++ b/test/script/regression.py
@@ -95,103 +95,442 @@ AUTOPSY_TEST_CASE = "AutopsyTestCase"
 COMMON_LOG = "AutopsyErrors.txt"
 
 Day = 0
-#-------------------------------------------------------------#
-# Parses argv and stores booleans to match command line input #
-#-------------------------------------------------------------#
-class Args(object):
-    """A container for command line options and arguments.
+
+#----------------------#
+#        Main          #
+#----------------------#
+def main():
+    # Global variables
+    global failedbool
+    global test_config
+    failedbool = False
+    args = Args()
+    parse_result = args.parse()
+    test_config = TestConfiguration(args)
+    # The arguments were given wrong:
+    if not parse_result:
+        return
+    if(not args.fr):
+        antin = ["ant"]
+        antin.append("-f")
+        antin.append(os.path.join("..","..","build.xml"))
+        antin.append("test-download-imgs")
+        if SYS is OS.CYGWIN:
+            subprocess.call(antin)
+        elif SYS is OS.WIN:
+            theproc = subprocess.Popen(antin, shell = True, stdout=subprocess.PIPE)
+            theproc.communicate()
+    # Otherwise test away!
+    TestRunner.run_tests()
+
+class TestRunner(object):
+
+    def run_tests():
+        """Run the tests specified by the main TestConfiguration.
+
+        Executes the AutopsyIngest for each image and dispatches the results based on
+        the mode (rebuild or testing)
+        """
+        global parsed
+        global failedbool
+        global html
+
+        test_data_list = [ TestData(image, test_config) for image in test_config.images ]
+
+        Reports.html_add_images(test_config.images)
+
+        logres =[]
+        for test_data in test_data_list:
+            Errors.clear_print_logs()
+            Errors.set_testing_phase(test_data.image)
+            if not (test_config.args.rebuild or
+                os.path.exists(test_data.gold_archive)):
+                msg = "Gold standard doesn't exist, skipping image:"
+                Errors.print_error(msg)
+                Errors.print_error(test_data.gold_archive)
+                continue
+            TestRunner._run_autopsy_ingest(test_data)
+
+            if test_config.args.rebuild:
+                TestRunner.rebuild(test_data)
+            else:
+                logres.append(TestRunner._run_test(test_data))
+            test_data.printout = Errors.printout
+            test_data.printerror = Errors.printerror
+
+        Reports.write_html_foot()
+        if (len(logres)>0):
+            failedbool = True
+            imgfail = True
+            passFail = False
+            for lm in logres:
+                for ln in lm:
+                    Errors.add_email_msg(ln)
+        if failedbool:
+            passFail = False
+            msg = "The test output didn't match the gold standard.\n"
+            msg += "autopsy test failed.\n"
+            Errors.add_email_msg(msg)
+            html = open(test_config.html_log)
+            Errors.add_email_attachment(html.name)
+            html.close()
+        else:
+            Errors.add_email_msg("Autopsy test passed.\n")
+            passFail = True
+
+        # @@@ This fails here if we didn't parse an XML file
+        try:
+            Emailer.send_email(parsed, Errors.email_body, Errors.email_attachs, passFail)
+        except NameError:
+            Errors.print_error("Could not send e-mail because of no XML file --maybe");
+
+    def _run_autopsy_ingest(test_data):
+        """Run Autopsy ingest for the image in the given TestData.
+
+        Also generates the necessary logs for rebuilding or diff.
+
+        Args:
+            test_data: the TestData to run the ingest on.
+        """
+        global parsed
+        global imgfail
+        global failedbool
+        imgfail = False
+        if image_type(test_data.image_file) == IMGTYPE.UNKNOWN:
+            Errors.print_error("Error: Image type is unrecognized:")
+            Errors.print_error(test_data.image_file + "\n")
+            return
+
+        logging.debug("--------------------")
+        logging.debug(test_data.image_name)
+        logging.debug("--------------------")
+        TestRunner._run_ant(test_data)
+        time.sleep(2) # Give everything a second to process
+
+        # Dump the database before we diff or use it for rebuild
+        TskDbDiff.dump_output_db(test_data)
+
+        # merges logs into a single log for later diff / rebuild
+        copy_logs(test_data)
+        Logs.generate_log_data(test_data)
+
+        TestRunner._handle_solr(test_data)
+        TestRunner._handle_exception(test_data)
+
+    #TODO: figure out return type of _run_test (logres)
+    def _run_test(test_data):
+        """Compare the results of the output to the gold standard.
+
+        Args:
+            test_data: the TestData
+
+        Returns:
+            logres?
+        """
+        TestRunner._extract_gold(test_data)
+
+        # Look for core exceptions
+        # @@@ Should be moved to TestResultsDiffer, but it didn't know about logres -- need to look into that
+        logres = Logs.search_common_log("TskCoreException", test_data)
+
+        TestResultsDiffer.run_diff(test_data)
+
+        # @@@ COnsider if we want to do this for a rebuild.
+        # Make the CSV log and the html log viewer
+        Reports.generate_reports(test_config.csv, test_data)
+        # Reset the test_config and return the tests sucessfully finished
+        if(failedbool):
+            Errors.add_email_attachment(test_data.common_log_path)
+        return logres
+
+    def _extract_gold(test_data):
+        """Extract gold archive file to output/gold/tmp/
+
+        Args:
+            test_data: the TestData
+        """
+        extrctr = zipfile.ZipFile(test_data.gold_archive, 'r', compression=zipfile.ZIP_DEFLATED)
+        extrctr.extractall(test_data.main_config.gold)
+        extrctr.close
+        time.sleep(2)
+
+    def _handle_solr(test_data):
+        """Clean up SOLR index if in keep mode (-k).
+
+        Args:
+            test_data: the TestData
+        """
+        if not test_config.args.keep:
+            if clear_dir(test_data.solr_index):
+                print_report([], "DELETE SOLR INDEX", "Solr index deleted.")
+        else:
+            print_report([], "KEEP SOLR INDEX", "Solr index has been kept.")
+
+    def _handle_exception(test_data):
+        """If running in exception mode, print exceptions to log.
+
+        Args:
+            test_data: the TestData
+        """
+        if test_config.args.exception:
+            exceptions = search_logs(test_config.args.exception_string, test_data)
+            okay = "No warnings or exceptions found containing text '" + test_config.args.exception_string + "'."
+            print_report(exceptions, "EXCEPTION", okay)
+
+    def rebuild(test_data):
+        """Rebuild the gold standard with the given TestData.
+
+        Copies the test-generated database and html report files into the gold directory.
+        """
+        # Errors to print
+        errors = []
+        # Delete the current gold standards
+        gold_dir = test_config.img_gold
+        clear_dir(test_config.img_gold)
+        tmpdir = make_path(gold_dir, test_data.image_name)
+        dbinpth = test_data.get_db_path(DBType.OUTPUT)
+        dboutpth = make_path(tmpdir, DB_FILENAME)
+        dataoutpth = make_path(tmpdir, test_data.image_name + "SortedData.txt")
+        dbdumpinpth = test_data.get_db_dump_path(DBType.OUTPUT)
+        dbdumpoutpth = make_path(tmpdir, test_data.image_name + "DBDump.txt")
+        if not os.path.exists(test_config.img_gold):
+            os.makedirs(test_config.img_gold)
+        if not os.path.exists(tmpdir):
+            os.makedirs(tmpdir)
+        try:
+            copy_file(dbinpth, dboutpth)
+            if file_exists(test_data.get_sorted_data_path(DBType.OUTPUT)):
+                copy_file(test_data.get_sorted_data_path(DBType.OUTPUT), dataoutpth)
+            copy_file(dbdumpinpth, dbdumpoutpth)
+            error_pth = make_path(tmpdir, test_data.image_name+"SortedErrors.txt")
+            copy_file(test_data.sorted_log, error_pth)
+        except Exception as e:
+            Errors.print_error(str(e))
+            print(str(e))
+            print(traceback.format_exc())
+        # Rebuild the HTML report
+        output_html_report_dir = test_data.get_html_report_path(DBType.OUTPUT)
+        gold_html_report_dir = make_path(tmpdir, "Report")
+
+        try:
+            copy_dir(output_html_report_dir, gold_html_report_dir)
+        except FileNotFoundException as e:
+            errors.append(e.error())
+        except Exception as e:
+            errors.append("Error: Unknown fatal error when rebuilding the gold html report.")
+            errors.append(str(e) + "\n")
+            print(traceback.format_exc())
+        oldcwd = os.getcwd()
+        zpdir = gold_dir
+        os.chdir(zpdir)
+        os.chdir("..")
+        img_gold = "tmp"
+        img_archive = make_path(test_data.image_name+"-archive.zip")
+        comprssr = zipfile.ZipFile(img_archive, 'w',compression=zipfile.ZIP_DEFLATED)
+        TestRunner.zipdir(img_gold, comprssr)
+        comprssr.close()
+        os.chdir(oldcwd)
+        del_dir(test_config.img_gold)
+        okay = "Sucessfully rebuilt all gold standards."
+        print_report(errors, "REBUILDING", okay)
+
+    def zipdir(path, zip):
+        for root, dirs, files in os.walk(path):
+            for file in files:
+                zip.write(os.path.join(root, file))
+
+    def _run_ant(test_data):
+        """Construct and run the ant build command for the given TestData.
+
+        Tests Autopsy by calling RegressionTest.java via the ant build file.
+
+        Args:
+            test_data: the TestData
+        """
+        # Set up the directories
+        test_config_path = os.path.join(test_config.output_dir, test_data.image_name)
+        if dir_exists(test_config_path):
+            shutil.rmtree(test_config_path)
+        os.makedirs(test_config_path)
+        test_config.ant = ["ant"]
+        test_config.ant.append("-v")
+        test_config.ant.append("-f")
+    #   case.ant.append(case.build_path)
+        test_config.ant.append(os.path.join("..","..","Testing","build.xml"))
+        test_config.ant.append("regression-test")
+        test_config.ant.append("-l")
+        test_config.ant.append(test_data.antlog_dir)
+        test_config.ant.append("-Dimg_path=" + test_data.image_file)
+        test_config.ant.append("-Dknown_bad_path=" + test_config.known_bad_path)
+        test_config.ant.append("-Dkeyword_path=" + test_config.keyword_path)
+        test_config.ant.append("-Dnsrl_path=" + test_config.nsrl_path)
+        test_config.ant.append("-Dgold_path=" + test_config.gold)
+        test_config.ant.append("-Dout_path=" +
+        make_local_path(test_data.output_path))
+        test_config.ant.append("-Dignore_unalloc=" + "%s" % test_config.args.unallocated)
+        test_config.ant.append("-Dtest.timeout=" + str(test_config.timeout))
+
+        Errors.print_out("Ingesting Image:\n" + test_data.image_file + "\n")
+        Errors.print_out("CMD: " + " ".join(test_config.ant))
+        Errors.print_out("Starting test...\n")
+        antoutpth = make_local_path(test_config.output_dir, "antRunOutput.txt")
+        antout = open(antoutpth, "a")
+        if SYS is OS.CYGWIN:
+            subprocess.call(test_config.ant, stdout=subprocess.PIPE)
+        elif SYS is OS.WIN:
+            theproc = subprocess.Popen(test_config.ant, shell = True, stdout=subprocess.PIPE)
+            theproc.communicate()
+        antout.close()
+
+
+class TestData(object):
+    """Container for the input and output of a single image.
+
+    Represents data for the test of a single image, including path to the image,
+    database paths, etc.
 
     Attributes:
-        single: a boolean indicating whether to run in single file mode
-        single_file: an Image to run the test on
-        rebuild: a boolean indicating whether to run in rebuild mode
-        list: a boolean indicating a config file was specified
-        unallocated: a boolean indicating unallocated space should be ignored
-        ignore: a boolean indicating the input directory should be ingnored
-        keep: a boolean indicating whether to keep the SOLR index
-        verbose: a boolean indicating whether verbose output should be printed
-        exeception: a boolean indicating whether errors containing exception
-                    exception_string should be printed
-        exception_sring: a String representing and exception name
-        fr: a boolean indicating whether gold standard images will be downloaded
+        main_config: the global TestConfiguration
+        image_file: a pathto_Image, the image for this TestData
+        image: a String, the image file's name
+        image_name: a String, the image file's name with a trailing (0)
+        output_path: pathto_Dir, the output directory for this TestData
+        autopsy_data_file: a pathto_File, the IMAGE_NAMEAutopsy_data.txt file
+        warning_log: a pathto_File, the AutopsyLogs.txt file
+        antlog_dir: a pathto_File, the antlog.txt file
+        test_dbdump: a pathto_File, the database dump, IMAGENAMEDump.txt
+        common_log_path: a pathto_File, the IMAGE_NAMECOMMON_LOG file
+        sorted_log: a pathto_File, the IMAGENAMESortedErrors.txt file
+        reports_dir: a pathto_Dir, the AutopsyTestCase/Reports folder
+        gold_data_dir: a pathto_Dir, the gold standard directory
+        gold_archive: a pathto_File, the gold standard archive
+        logs_dir: a pathto_Dir, the location where autopsy logs are stored
+        solr_index: a pathto_Dir, the locatino of the solr index
+        db_diff_results: a DiffResults, the results of the database comparison
+        total_test_time: a String representation of the test duration
+        start_date: a String representation of this TestData's start date
+        end_date: a String representation of the TestData's end date
+        total_ingest_time: a String representation of the total ingest time
+        artifact_count: a Nat, the number of artifacts
+        artifact_fail: a Nat, the number of artifact failures
+        heap_space: a String representation of TODO
+        service_times: a String representation of TODO
+        report_passed: a boolean, indicating if the reports passed
+        printerror: a listof_String, the error messages printed during this TestData's test
+        printout: a listof_String, the messages pritned during this TestData's test
     """
-    def __init__(self):
-        self.single = False
-        self.single_file = ""
-        self.rebuild = False
-        self.list = False
-        self.config_file = ""
-        self.unallocated = False
-        self.ignore = False
-        self.keep = False
-        self.verbose = False
-        self.exception = False
-        self.exception_string = ""
-        self.fr = False
 
-    def parse(self):
-        global nxtproc
-        nxtproc = []
-        nxtproc.append("python3")
-        nxtproc.append(sys.argv.pop(0))
-        while sys.argv:
-            arg = sys.argv.pop(0)
-            nxtproc.append(arg)
-            if(arg == "-f"):
-                #try: @@@ Commented out until a more specific except statement is added
-                    arg = sys.argv.pop(0)
-                    print("Running on a single file:")
-                    print(path_fix(arg) + "\n")
-                    self.single = True
-                    self.single_file = path_fix(arg)
-                #except:
-                #   print("Error: No single file given.\n")
-            #       return False
-            elif(arg == "-r" or arg == "--rebuild"):
-                print("Running in rebuild mode.\n")
-                self.rebuild = True
-            elif(arg == "-l" or arg == "--list"):
-                try:
-                    arg = sys.argv.pop(0)
-                    nxtproc.append(arg)
-                    print("Running from configuration file:")
-                    print(arg + "\n")
-                    self.list = True
-                    self.config_file = arg
-                except:
-                    print("Error: No configuration file given.\n")
-                    return False
-            elif(arg == "-u" or arg == "--unallocated"):
-               print("Ignoring unallocated space.\n")
-               self.unallocated = True
-            elif(arg == "-k" or arg == "--keep"):
-                print("Keeping the Solr index.\n")
-                self.keep = True
-            elif(arg == "-v" or arg == "--verbose"):
-                print("Running in verbose mode:")
-                print("Printing all thrown exceptions.\n")
-                self.verbose = True
-            elif(arg == "-e" or arg == "--exception"):
-                try:
-                    arg = sys.argv.pop(0)
-                    nxtproc.append(arg)
-                    print("Running in exception mode: ")
-                    print("Printing all exceptions with the string '" + arg + "'\n")
-                    self.exception = True
-                    self.exception_string = arg
-                except:
-                    print("Error: No exception string given.")
-            elif arg == "-h" or arg == "--help":
-                print(usage())
-                return False
-            elif arg == "-fr" or arg == "--forcerun":
-                print("Not downloading new images")
-                self.fr = True
-            else:
-                print(usage())
-                return False
-        # Return the args were sucessfully parsed
-        return True
+    def __init__(self, image, main_config):
+        """Init this TestData with it's image and the test configuration.
+
+        Args:
+            image: the Image to be tested.
+            main_config: the global TestConfiguration.
+        """
+        self.main_config = main_config
+        self.image_file = str(image)
+        # TODO: This 0 should be be refactored out, but it will require rebuilding and changing of outputs.
+        self.image = get_image_name(self.image_file)
+        self.image_name = self.image + "(0)"
+        self.output_path = make_path(self.main_config.output_dir, self.image_name)
+        self.autopsy_data_file = make_path(self.output_path, self.image_name + "Autopsy_data.txt")
+        self.warning_log = make_local_path(self.output_path, "AutopsyLogs.txt")
+        self.antlog_dir = make_local_path(self.output_path, "antlog.txt")
+        self.test_dbdump = make_path(self.output_path, self.image_name +
+        "DBDump.txt")
+        self.common_log_path = make_local_path(self.output_path, self.image_name + COMMON_LOG)
+        self.sorted_log = make_local_path(self.output_path, self.image_name + "SortedErrors.txt")
+        self.reports_dir = make_path(self.output_path, AUTOPSY_TEST_CASE, "Reports")
+        self.gold_data_dir = make_path(self.main_config.img_gold, self.image_name)
+        self.gold_archive = make_path(self.main_config.gold,
+        self.image_name + "-archive.zip")
+        self.logs_dir = make_path(self.output_path, "logs")
+        self.solr_index = make_path(self.output_path, AUTOPSY_TEST_CASE,
+        "ModuleOutput", "KeywordSearch")
+        self.db_diff_results = None
+        self.total_test_time = ""
+        self.start_date = ""
+        self.end_date = ""
+        self.total_ingest_time = ""
+        self.artifact_count = 0
+        self.artifact_fail = 0
+        self.heap_space = ""
+        self.service_times = ""
+        self.report_passed = False
+        # Error tracking
+        self.printerror = []
+        self.printout = []
+
+    def get_db_path(self, db_type):
+        """Get the path to the database file that corresponds to the given DBType.
+
+        Args:
+            DBType: the DBType of the path to be generated.
+        """
+        if(db_type == DBType.GOLD):
+            db_path = make_path(self.gold_data_dir, DB_FILENAME)
+        elif(db_type == DBType.OUTPUT):
+            db_path = make_path(self.main_config.output_dir, self.image_name, AUTOPSY_TEST_CASE, DB_FILENAME)
+        else:
+            db_path = make_path(self.main_config.output_dir, self.image_name, AUTOPSY_TEST_CASE, BACKUP_DB_FILENAME)
+        return db_path
+
+    def get_html_report_path(self, html_type):
+        """Get the path to the HTML Report folder that corresponds to the given DBType.
+
+        Args:
+            DBType: the DBType of the path to be generated.
+        """
+        if(html_type == DBType.GOLD):
+            return make_path(self.gold_data_dir, "Report")
+        else:
+            # Autopsy creates an HTML report folder in the form AutopsyTestCase DATE-TIME
+            # It's impossible to get the exact time the folder was created, but the folder
+            # we are looking for is the only one in the self.reports_dir folder
+            html_path = ""
+            for fs in os.listdir(self.reports_dir):
+                html_path = make_path(self.reports_dir, fs)
+                if os.path.isdir(html_path):
+                    break
+            return make_path(html_path, os.listdir(html_path)[0])
+
+    def get_sorted_data_path(self, file_type):
+        """Get the path to the SortedData file that corresponds to the given DBType.
+
+        Args:
+            file_type: the DBType of the path to be generated
+        """
+        return self._get_path_to_file(file_type, "SortedData.txt")
+
+    def get_sorted_errors_path(self, file_type):
+        """Get the path to the SortedErrors file that correspodns to the given
+        DBType.
+
+        Args:
+            file_type: the DBType of the path to be generated
+        """
+        return self._get_path_to_file(file_type, "SortedErrors.txt")
+
+    def get_db_dump_path(self, file_type):
+        """Get the path to the DBDump file that corresponds to the given DBType.
+
+        Args:
+            file_type: the DBType of the path to be generated
+        """
+        return self._get_path_to_file(file_type, "DBDump.txt")
+
+    def _get_path_to_file(self, file_type, file_name):
+        """Get the path to the specified file with the specified type.
+
+        Args:
+            file_type: the DBType of the path to be generated
+            file_name: a String, the filename of the path to be generated
+        """
+        full_filename = self.image_name + file_name
+        if(file_type == DBType.GOLD):
+            return make_path(self.gold_data_dir, full_filename)
+        else:
+            return make_path(self.output_path, full_filename)
 
 
 class TestConfiguration(object):
@@ -399,8 +738,7 @@ class TestConfiguration(object):
 class TskDbDiff(object):
     """Represents the differences between the gold and output databases.
 
-    Contains methods to compare two databases and internally
-    store some of the results
+    Contains methods to compare two databases.
 
     Attributes:
         gold_artifacts:
@@ -415,7 +753,7 @@ class TskDbDiff(object):
         autopsy_db_file:
         gold_db_file:
     """
-    def __init__(self, test_data):
+    def __init__(self, output_db_path, gold_db_path):
         """Constructor for TskDbDiff.
 
         Args:
@@ -429,9 +767,8 @@ class TskDbDiff(object):
         self.autopsy_objects = 0
         self.artifact_comparison = []
         self.attribute_comparison = []
-        self.test_data = test_data
-        self.autopsy_db_file = self.test_data.get_db_path(DBType.OUTPUT)
-        self.gold_db_file = self.test_data.get_db_path(DBType.GOLD)
+        self.autopsy_db_file = output_db_path
+        self.gold_db_file = gold_db_path
 
     def _get_artifacts(self, cursor):
         """Get a list of artifacts from the given SQLCursor.
@@ -495,7 +832,7 @@ class TskDbDiff(object):
                     exceptions.append(error)
             return exceptions
         except Exception as e:
-            printerror(self.test_data, str(e))
+            Errors.print_error(str(e))
             exceptions.append("Error: Unable to compare blackboard_artifacts.\n")
             return exceptions
 
@@ -562,7 +899,7 @@ class TskDbDiff(object):
             self.gold_attributes = self._count_attributes(gold_cur)
             self.autopsy_attributes = self._count_attributes(autopsy_cur)
         except Exception as e:
-            printerror(self.test_data, "Way out:" + str(e))
+            Errors.print_error("Way out:" + str(e))
 
     def run_diff(self):
         """Basic test between output and gold databases.
@@ -572,12 +909,12 @@ class TskDbDiff(object):
         """
         # Check to make sure both db files exist
         if not file_exists(self.autopsy_db_file):
-            printerror(self.test_data, "Error: TskDbDiff file does not exist at:")
-            printerror(self.test_data, self.autopsy_db_file + "\n")
+            Errors.print_error("Error: TskDbDiff file does not exist at:")
+            Errors.print_error(self.autopsy_db_file + "\n")
             return
         if not file_exists(self.gold_db_file):
-            printerror(self.test_data, "Error: Gold database file does not exist at:")
-            printerror(self.test_data, self.gold_db_file + "\n")
+            Errors.print_error("Error: Gold database file does not exist at:")
+            Errors.print_error(self.gold_db_file + "\n")
             return
 
         # Get connections and cursors to output / gold databases
@@ -758,63 +1095,11 @@ class TskDbDiff(object):
         TskDbDiff._dump_output_db_nonbb(test_data)
         autopsy_con.close()
 
-class DiffResults(object):
-    """Container for the results of the database diff tests.
-
-    Stores artifact, object, and attribute counts and comparisons generated by
-    TskDbDiff.
-
-    Attributes:
-        gold_attrs: a Nat, the number of gold attributes
-        output_attrs: a Nat, the number of output attributes
-        gold_objs: a Nat, the number of gold objects
-        output_objs: a Nat, the number of output objects
-        artifact_comp: a listof_String, describing the differences
-        attribute_comp: a listof_String, describing the differences
-    """
-    def __init__(self, tsk_diff):
-        """Inits a DiffResults
-
-        Args:
-            tsk_diff: a TskDBDiff
-        """
-        self.gold_attrs = tsk_diff.gold_attributes
-        self.output_attrs = tsk_diff.autopsy_attributes
-        self.gold_objs = tsk_diff.gold_objects
-        self.output_objs = tsk_diff.autopsy_objects
-        self.artifact_comp = tsk_diff.artifact_comparison
-        self.attribute_comp = tsk_diff.attribute_comparison
-        self.gold_artifacts = len(tsk_diff.gold_artifacts)
-        self.output_artifacts = len(tsk_diff.autopsy_artifacts)
-
-    def get_artifact_comparison(self):
-        if not self.artifact_comp:
-            return "All counts matched"
-        else:
-            global failedbool
-            failedbool = True
-            global imgfail
-            imgfail = True
-            return "; ".join(self.artifact_comp)
-
-    def get_attribute_comparison(self):
-        if not self.attribute_comp:
-            return "All counts matched"
-        global failedbool
-        failedbool = True
-        global imgfail
-        imgfail = True
-        list = []
-        for error in self.attribute_comp:
-            list.append(error)
-        return ";".join(list)
-
 #-------------------------------------------------#
 #     Functions relating to comparing outputs     #
 #-------------------------------------------------#
 class TestResultsDiffer(object):
-    """Compares results for a single test.
-    """
+    """Compares results for a single test."""
 
     def run_diff(test_data):
         """Compares results for a single test.
@@ -826,9 +1111,14 @@ class TestResultsDiffer(object):
         try:
 
             # Diff the gold and output databases
-            test_data.db_diff_results = TskDbDiff(test_data).run_diff()
+            output_db_path = test_data.get_db_path(DBType.OUTPUT)
+            gold_db_path = test_data.get_db_path(DBType.GOLD)
+            db_diff = TskDbDiff(output_db_path, gold_db_path)
+            test_data.db_diff_results = db_diff.run_diff()
 
             # Compare Exceptions
+            # replace is a fucntion that replaces strings of digits with 'd'
+            # this is needed so dates and times will not cause the diff to fail
             replace = lambda file: re.sub(re.compile("\d"), "d", file)
             output_errors = test_data.get_sorted_errors_path(DBType.OUTPUT)
             gold_errors = test_data.get_sorted_errors_path(DBType.GOLD)
@@ -974,154 +1264,6 @@ class TestResultsDiffer(object):
     def _split(input, size):
         return [input[start:start+size] for start in range(0, len(input), size)]
 
-class TestData(object):
-    """Container for the input and output of a single image.
-
-    Represents data for the test of a single image, including path to the image,
-    database paths, etc.
-
-    Attributes:
-        main_config: the global TestConfiguration
-        image_file: a pathto_Image, the image for this TestData
-        image: a String, the image file's name
-        image_name: a String, the image file's name with a trailing (0)
-        output_path: pathto_Dir, the output directory for this TestData
-        autopsy_data_file: a pathto_File, the IMAGE_NAMEAutopsy_data.txt file
-        warning_log: a pathto_File, the AutopsyLogs.txt file
-        antlog_dir: a pathto_File, the antlog.txt file
-        test_dbdump: a pathto_File, the database dump, IMAGENAMEDump.txt
-        common_log_path: a pathto_File, the IMAGE_NAMECOMMON_LOG file
-        sorted_log: a pathto_File, the IMAGENAMESortedErrors.txt file
-        reports_dir: a pathto_Dir, the AutopsyTestCase/Reports folder
-        gold_data_dir: a pathto_Dir, the gold standard directory
-        gold_archive: a pathto_File, the gold standard archive
-        logs_dir: a pathto_Dir, the location where autopsy logs are stored
-        solr_index: a pathto_Dir, the locatino of the solr index
-        db_diff_results: a DiffResults, the results of the database comparison
-        total_test_time: a String representation of the test duration
-        start_date: a String representation of this TestData's start date
-        end_date: a String representation of the TestData's end date
-        total_ingest_time: a String representation of the total ingest time
-        artifact_count: a Nat, the number of artifacts
-        artifact_fail: a Nat, the number of artifact failures
-        heap_space: a String representation of TODO
-        service_times: a String representation of TODO
-        report_passed: a boolean, indicating if the reports passed
-        printerror: a listof_String, the error messages printed during this TestData's test
-        printout: a listof_String, the messages pritned during this TestData's test
-    """
-
-    def __init__(self, image, main_config):
-        """Init this TestData with it's image and the test configuration.
-
-        Args:
-            image: the Image to be tested.
-            main_config: the global TestConfiguration.
-        """
-        self.main_config = main_config
-        self.image_file = str(image)
-        # TODO: This 0 should be be refactored out, but it will require rebuilding and changing of outputs.
-        self.image = get_image_name(self.image_file)
-        self.image_name = self.image + "(0)"
-        self.output_path = make_path(self.main_config.output_dir, self.image_name)
-        self.autopsy_data_file = make_path(self.output_path, self.image_name + "Autopsy_data.txt")
-        self.warning_log = make_local_path(self.output_path, "AutopsyLogs.txt")
-        self.antlog_dir = make_local_path(self.output_path, "antlog.txt")
-        self.test_dbdump = make_path(self.output_path, self.image_name +
-        "DBDump.txt")
-        self.common_log_path = make_local_path(self.output_path, self.image_name + COMMON_LOG)
-        self.sorted_log = make_local_path(self.output_path, self.image_name + "SortedErrors.txt")
-        self.reports_dir = make_path(self.output_path, AUTOPSY_TEST_CASE, "Reports")
-        self.gold_data_dir = make_path(self.main_config.img_gold, self.image_name)
-        self.gold_archive = make_path(self.main_config.gold,
-        self.image_name + "-archive.zip")
-        self.logs_dir = make_path(self.output_path, "logs")
-        self.solr_index = make_path(self.output_path, AUTOPSY_TEST_CASE,
-        "ModuleOutput", "KeywordSearch")
-        self.db_diff_results = None
-        self.total_test_time = ""
-        self.start_date = ""
-        self.end_date = ""
-        self.total_ingest_time = ""
-        self.artifact_count = 0
-        self.artifact_fail = 0
-        self.heap_space = ""
-        self.service_times = ""
-        self.report_passed = False
-        # Error tracking
-        self.printerror = []
-        self.printout = []
-
-    def get_db_path(self, db_type):
-        """Get the path to the database file that corresponds to the given DBType.
-
-        Args:
-            DBType: the DBType of the path to be generated.
-        """
-        if(db_type == DBType.GOLD):
-            db_path = make_path(self.gold_data_dir, DB_FILENAME)
-        elif(db_type == DBType.OUTPUT):
-            db_path = make_path(self.main_config.output_dir, self.image_name, AUTOPSY_TEST_CASE, DB_FILENAME)
-        else:
-            db_path = make_path(self.main_config.output_dir, self.image_name, AUTOPSY_TEST_CASE, BACKUP_DB_FILENAME)
-        return db_path
-
-    def get_html_report_path(self, html_type):
-        """Get the path to the HTML Report folder that corresponds to the given DBType.
-
-        Args:
-            DBType: the DBType of the path to be generated.
-        """
-        if(html_type == DBType.GOLD):
-            return make_path(self.gold_data_dir, "Report")
-        else:
-            # Autopsy creates an HTML report folder in the form AutopsyTestCase DATE-TIME
-            # It's impossible to get the exact time the folder was created, but the folder
-            # we are looking for is the only one in the self.reports_dir folder
-            html_path = ""
-            for fs in os.listdir(self.reports_dir):
-                html_path = make_path(self.reports_dir, fs)
-                if os.path.isdir(html_path):
-                    break
-            return make_path(html_path, os.listdir(html_path)[0])
-
-    def get_sorted_data_path(self, file_type):
-        """Get the path to the SortedData file that corresponds to the given DBType.
-
-        Args:
-            file_type: the DBType of the path to be generated
-        """
-        return self._get_path_to_file(file_type, "SortedData.txt")
-
-    def get_sorted_errors_path(self, file_type):
-        """Get the path to the SortedErrors file that correspodns to the given
-        DBType.
-
-        Args:
-            file_type: the DBType of the path to be generated
-        """
-        return self._get_path_to_file(file_type, "SortedErrors.txt")
-
-    def get_db_dump_path(self, file_type):
-        """Get the path to the DBDump file that corresponds to the given DBType.
-
-        Args:
-            file_type: the DBType of the path to be generated
-        """
-        return self._get_path_to_file(file_type, "DBDump.txt")
-
-    def _get_path_to_file(self, file_type, file_name):
-        """Get the path to the specified file with the specified type.
-
-        Args:
-            file_type: the DBType of the path to be generated
-            file_name: a String, the filename of the path to be generated
-        """
-        full_filename = self.image_name + file_name
-        if(file_type == DBType.GOLD):
-            return make_path(self.gold_data_dir, full_filename)
-        else:
-            return make_path(self.output_path, full_filename)
 
 class Reports(object):
     def generate_reports(csv_path, test_data):
@@ -1586,15 +1728,6 @@ def print_report(errors, name, okay):
         Errors.print_out("< " + name + " - " + okay + " />")
         Errors.print_out("-----------------------------------------------------------------\n")
 
-# Used instead of the print command when printing out an error
-def print_error(string):
-    print(string)
-    test_data.printerror.append(string)
-
-# Used instead of the print command when printing out anything besides errors
-def print_out(string):
-    print(string)
-    test_data.printout.append(string)
 
 def get_exceptions(test_data):
     """Get a list of the exceptions in the autopsy logs.
@@ -1690,267 +1823,6 @@ class DirNotFoundException(Exception):
         error = "Error: Directory could not be found at:\n" + self.dir + "\n"
         return error
 
-#############################
-#   Main Testing Functions  #
-#############################
-class TestRunner(object):
-
-    def run_tests():
-        """Run the tests specified by the main TestConfiguration.
-
-        Executes the AutopsyIngest for each image and dispatches the results based on
-        the mode (rebuild or testing)
-        """
-        global parsed
-        global failedbool
-        global html
-
-        test_data_list = [ TestData(image, test_config) for image in test_config.images ]
-
-        Reports.html_add_images(test_config.images)
-
-        logres =[]
-        for test_data in test_data_list:
-            Errors.clear_print_logs()
-            Errors.set_testing_phase(test_data.image)
-            if not (test_config.args.rebuild or
-                os.path.exists(test_data.gold_archive)):
-                msg = "Gold standard doesn't exist, skipping image:"
-                Errors.print_error(msg)
-                Errors.print_error(test_data.gold_archive)
-                continue
-            TestRunner._run_autopsy_ingest(test_data)
-
-            if test_config.args.rebuild:
-                TestRunner.rebuild(test_data)
-            else:
-                logres.append(TestRunner._run_test(test_data))
-            test_data.printout = Errors.printout
-            test_data.printerror = Errors.printerror
-
-        Reports.write_html_foot()
-        if (len(logres)>0):
-            failedbool = True
-            imgfail = True
-            passFail = False
-            for lm in logres:
-                for ln in lm:
-                    Errors.add_email_msg(ln)
-        if failedbool:
-            passFail = False
-            msg = "The test output didn't match the gold standard.\n"
-            msg += "autopsy test failed.\n"
-            Errors.add_email_msg(msg)
-            html = open(test_config.html_log)
-            Errors.add_email_attachment(html.name)
-            html.close()
-        else:
-            Errors.add_email_msg("Autopsy test passed.\n")
-            passFail = True
-
-        # @@@ This fails here if we didn't parse an XML file
-        try:
-            Emailer.send_email(parsed, Errors.email_body, Errors.email_attachs, passFail)
-        except NameError:
-            Errors.print_error("Could not send e-mail because of no XML file --maybe");
-
-    def _run_autopsy_ingest(test_data):
-        """Run Autopsy ingest for the image in the given TestData.
-
-        Also generates the necessary logs for rebuilding or diff.
-
-        Args:
-            test_data: the TestData to run the ingest on.
-        """
-        global parsed
-        global imgfail
-        global failedbool
-        imgfail = False
-        if image_type(test_data.image_file) == IMGTYPE.UNKNOWN:
-            Errors.print_error("Error: Image type is unrecognized:")
-            Errors.print_error(test_data.image_file + "\n")
-            return
-
-        logging.debug("--------------------")
-        logging.debug(test_data.image_name)
-        logging.debug("--------------------")
-        TestRunner._run_ant(test_data)
-        time.sleep(2) # Give everything a second to process
-
-        # Dump the database before we diff or use it for rebuild
-        TskDbDiff.dump_output_db(test_data)
-
-        # merges logs into a single log for later diff / rebuild
-        copy_logs(test_data)
-        Logs.generate_log_data(test_data)
-
-        TestRunner._handle_solr(test_data)
-        TestRunner._handle_exception(test_data)
-
-    #TODO: figure out return type of _run_test (logres)
-    def _run_test(test_data):
-        """Compare the results of the output to the gold standard.
-
-        Args:
-            test_data: the TestData
-
-        Returns:
-            logres?
-        """
-        TestRunner._extract_gold(test_data)
-
-        # Look for core exceptions
-        # @@@ Should be moved to TestResultsDiffer, but it didn't know about logres -- need to look into that
-        logres = Logs.search_common_log("TskCoreException", test_data)
-
-        TestResultsDiffer.run_diff(test_data)
-
-        # @@@ COnsider if we want to do this for a rebuild.
-        # Make the CSV log and the html log viewer
-        Reports.generate_reports(test_config.csv, test_data)
-        # Reset the test_config and return the tests sucessfully finished
-        if(failedbool):
-            Errors.add_email_attachment(test_data.common_log_path)
-        return logres
-
-    def _extract_gold(test_data):
-        """Extract gold archive file to output/gold/tmp/
-
-        Args:
-            test_data: the TestData
-        """
-        extrctr = zipfile.ZipFile(test_data.gold_archive, 'r', compression=zipfile.ZIP_DEFLATED)
-        extrctr.extractall(test_data.main_config.gold)
-        extrctr.close
-        time.sleep(2)
-
-    def _handle_solr(test_data):
-        """Clean up SOLR index if in keep mode (-k).
-
-        Args:
-            test_data: the TestData
-        """
-        if not test_config.args.keep:
-            if clear_dir(test_data.solr_index):
-                print_report([], "DELETE SOLR INDEX", "Solr index deleted.")
-        else:
-            print_report([], "KEEP SOLR INDEX", "Solr index has been kept.")
-
-    def _handle_exception(test_data):
-        """If running in exception mode, print exceptions to log.
-
-        Args:
-            test_data: the TestData
-        """
-        if test_config.args.exception:
-            exceptions = search_logs(test_config.args.exception_string, test_data)
-            okay = "No warnings or exceptions found containing text '" + test_config.args.exception_string + "'."
-            print_report(exceptions, "EXCEPTION", okay)
-
-    def rebuild(test_data):
-        """Rebuild the gold standard with the given TestData.
-
-        Copies the test-generated database and html report files into the gold directory.
-        """
-        # Errors to print
-        errors = []
-        # Delete the current gold standards
-        gold_dir = test_config.img_gold
-        clear_dir(test_config.img_gold)
-        tmpdir = make_path(gold_dir, test_data.image_name)
-        dbinpth = test_data.get_db_path(DBType.OUTPUT)
-        dboutpth = make_path(tmpdir, DB_FILENAME)
-        dataoutpth = make_path(tmpdir, test_data.image_name + "SortedData.txt")
-        dbdumpinpth = test_data.get_db_dump_path(DBType.OUTPUT)
-        dbdumpoutpth = make_path(tmpdir, test_data.image_name + "DBDump.txt")
-        if not os.path.exists(test_config.img_gold):
-            os.makedirs(test_config.img_gold)
-        if not os.path.exists(tmpdir):
-            os.makedirs(tmpdir)
-        try:
-            copy_file(dbinpth, dboutpth)
-            if file_exists(test_data.get_sorted_data_path(DBType.OUTPUT)):
-                copy_file(test_data.get_sorted_data_path(DBType.OUTPUT), dataoutpth)
-            copy_file(dbdumpinpth, dbdumpoutpth)
-            error_pth = make_path(tmpdir, test_data.image_name+"SortedErrors.txt")
-            copy_file(test_data.sorted_log, error_pth)
-        except Exception as e:
-            Errors.print_error(str(e))
-            print(str(e))
-            print(traceback.format_exc())
-        # Rebuild the HTML report
-        output_html_report_dir = test_data.get_html_report_path(DBType.OUTPUT)
-        gold_html_report_dir = make_path(tmpdir, "Report")
-
-        try:
-            copy_dir(output_html_report_dir, gold_html_report_dir)
-        except FileNotFoundException as e:
-            errors.append(e.error())
-        except Exception as e:
-            errors.append("Error: Unknown fatal error when rebuilding the gold html report.")
-            errors.append(str(e) + "\n")
-            print(traceback.format_exc())
-        oldcwd = os.getcwd()
-        zpdir = gold_dir
-        os.chdir(zpdir)
-        os.chdir("..")
-        img_gold = "tmp"
-        img_archive = make_path(test_data.image_name+"-archive.zip")
-        comprssr = zipfile.ZipFile(img_archive, 'w',compression=zipfile.ZIP_DEFLATED)
-        TestRunner.zipdir(img_gold, comprssr)
-        comprssr.close()
-        os.chdir(oldcwd)
-        del_dir(test_config.img_gold)
-        okay = "Sucessfully rebuilt all gold standards."
-        print_report(errors, "REBUILDING", okay)
-
-    def zipdir(path, zip):
-        for root, dirs, files in os.walk(path):
-            for file in files:
-                zip.write(os.path.join(root, file))
-
-    def _run_ant(test_data):
-        """Construct and run the ant build command for the given TestData.
-
-        Tests Autopsy by calling RegressionTest.java via the ant build file.
-
-        Args:
-            test_data: the TestData
-        """
-        # Set up the directories
-        test_config_path = os.path.join(test_config.output_dir, test_data.image_name)
-        if dir_exists(test_config_path):
-            shutil.rmtree(test_config_path)
-        os.makedirs(test_config_path)
-        test_config.ant = ["ant"]
-        test_config.ant.append("-v")
-        test_config.ant.append("-f")
-    #   case.ant.append(case.build_path)
-        test_config.ant.append(os.path.join("..","..","Testing","build.xml"))
-        test_config.ant.append("regression-test")
-        test_config.ant.append("-l")
-        test_config.ant.append(test_data.antlog_dir)
-        test_config.ant.append("-Dimg_path=" + test_data.image_file)
-        test_config.ant.append("-Dknown_bad_path=" + test_config.known_bad_path)
-        test_config.ant.append("-Dkeyword_path=" + test_config.keyword_path)
-        test_config.ant.append("-Dnsrl_path=" + test_config.nsrl_path)
-        test_config.ant.append("-Dgold_path=" + test_config.gold)
-        test_config.ant.append("-Dout_path=" +
-        make_local_path(test_data.output_path))
-        test_config.ant.append("-Dignore_unalloc=" + "%s" % test_config.args.unallocated)
-        test_config.ant.append("-Dtest.timeout=" + str(test_config.timeout))
-
-        Errors.print_out("Ingesting Image:\n" + test_data.image_file + "\n")
-        Errors.print_out("CMD: " + " ".join(test_config.ant))
-        Errors.print_out("Starting test...\n")
-        antoutpth = make_local_path(test_config.output_dir, "antRunOutput.txt")
-        antout = open(antoutpth, "a")
-        if SYS is OS.CYGWIN:
-            subprocess.call(test_config.ant, stdout=subprocess.PIPE)
-        elif SYS is OS.WIN:
-            theproc = subprocess.Popen(test_config.ant, shell = True, stdout=subprocess.PIPE)
-            theproc.communicate()
-        antout.close()
 
 class Errors:
     """A class used to manage error reporting.
@@ -2016,6 +1888,157 @@ class Errors:
         """
         Errors.email_attachs.append(path)
 
+
+class DiffResults(object):
+    """Container for the results of the database diff tests.
+
+    Stores artifact, object, and attribute counts and comparisons generated by
+    TskDbDiff.
+
+    Attributes:
+        gold_attrs: a Nat, the number of gold attributes
+        output_attrs: a Nat, the number of output attributes
+        gold_objs: a Nat, the number of gold objects
+        output_objs: a Nat, the number of output objects
+        artifact_comp: a listof_String, describing the differences
+        attribute_comp: a listof_String, describing the differences
+    """
+    def __init__(self, tsk_diff):
+        """Inits a DiffResults
+
+        Args:
+            tsk_diff: a TskDBDiff
+        """
+        self.gold_attrs = tsk_diff.gold_attributes
+        self.output_attrs = tsk_diff.autopsy_attributes
+        self.gold_objs = tsk_diff.gold_objects
+        self.output_objs = tsk_diff.autopsy_objects
+        self.artifact_comp = tsk_diff.artifact_comparison
+        self.attribute_comp = tsk_diff.attribute_comparison
+        self.gold_artifacts = len(tsk_diff.gold_artifacts)
+        self.output_artifacts = len(tsk_diff.autopsy_artifacts)
+
+    def get_artifact_comparison(self):
+        if not self.artifact_comp:
+            return "All counts matched"
+        else:
+            global failedbool
+            failedbool = True
+            global imgfail
+            imgfail = True
+            return "; ".join(self.artifact_comp)
+
+    def get_attribute_comparison(self):
+        if not self.attribute_comp:
+            return "All counts matched"
+        global failedbool
+        failedbool = True
+        global imgfail
+        imgfail = True
+        list = []
+        for error in self.attribute_comp:
+            list.append(error)
+        return ";".join(list)
+
+
+#-------------------------------------------------------------#
+# Parses argv and stores booleans to match command line input #
+#-------------------------------------------------------------#
+class Args(object):
+    """A container for command line options and arguments.
+
+    Attributes:
+        single: a boolean indicating whether to run in single file mode
+        single_file: an Image to run the test on
+        rebuild: a boolean indicating whether to run in rebuild mode
+        list: a boolean indicating a config file was specified
+        unallocated: a boolean indicating unallocated space should be ignored
+        ignore: a boolean indicating the input directory should be ingnored
+        keep: a boolean indicating whether to keep the SOLR index
+        verbose: a boolean indicating whether verbose output should be printed
+        exeception: a boolean indicating whether errors containing exception
+                    exception_string should be printed
+        exception_sring: a String representing and exception name
+        fr: a boolean indicating whether gold standard images will be downloaded
+    """
+    def __init__(self):
+        self.single = False
+        self.single_file = ""
+        self.rebuild = False
+        self.list = False
+        self.config_file = ""
+        self.unallocated = False
+        self.ignore = False
+        self.keep = False
+        self.verbose = False
+        self.exception = False
+        self.exception_string = ""
+        self.fr = False
+
+    def parse(self):
+        global nxtproc
+        nxtproc = []
+        nxtproc.append("python3")
+        nxtproc.append(sys.argv.pop(0))
+        while sys.argv:
+            arg = sys.argv.pop(0)
+            nxtproc.append(arg)
+            if(arg == "-f"):
+                #try: @@@ Commented out until a more specific except statement is added
+                    arg = sys.argv.pop(0)
+                    print("Running on a single file:")
+                    print(path_fix(arg) + "\n")
+                    self.single = True
+                    self.single_file = path_fix(arg)
+                #except:
+                #   print("Error: No single file given.\n")
+            #       return False
+            elif(arg == "-r" or arg == "--rebuild"):
+                print("Running in rebuild mode.\n")
+                self.rebuild = True
+            elif(arg == "-l" or arg == "--list"):
+                try:
+                    arg = sys.argv.pop(0)
+                    nxtproc.append(arg)
+                    print("Running from configuration file:")
+                    print(arg + "\n")
+                    self.list = True
+                    self.config_file = arg
+                except:
+                    print("Error: No configuration file given.\n")
+                    return False
+            elif(arg == "-u" or arg == "--unallocated"):
+               print("Ignoring unallocated space.\n")
+               self.unallocated = True
+            elif(arg == "-k" or arg == "--keep"):
+                print("Keeping the Solr index.\n")
+                self.keep = True
+            elif(arg == "-v" or arg == "--verbose"):
+                print("Running in verbose mode:")
+                print("Printing all thrown exceptions.\n")
+                self.verbose = True
+            elif(arg == "-e" or arg == "--exception"):
+                try:
+                    arg = sys.argv.pop(0)
+                    nxtproc.append(arg)
+                    print("Running in exception mode: ")
+                    print("Printing all exceptions with the string '" + arg + "'\n")
+                    self.exception = True
+                    self.exception_string = arg
+                except:
+                    print("Error: No exception string given.")
+            elif arg == "-h" or arg == "--help":
+                print(usage())
+                return False
+            elif arg == "-fr" or arg == "--forcerun":
+                print("Not downloading new images")
+                self.fr = True
+            else:
+                print(usage())
+                return False
+        # Return the args were sucessfully parsed
+        return True
+
 ####
 # Helper Functions
 ####
@@ -2149,33 +2172,6 @@ def find_file_in_dir(dir, name, ext):
     except:
         raise DirNotFoundException(dir)
 
-#----------------------#
-#        Main          #
-#----------------------#
-def main():
-    # Global variables
-    global failedbool
-    global test_config
-    failedbool = False
-    args = Args()
-    parse_result = args.parse()
-    test_config = TestConfiguration(args)
-    # The arguments were given wrong:
-    if not parse_result:
-        test_config.reset()
-        return
-    if(not args.fr):
-        antin = ["ant"]
-        antin.append("-f")
-        antin.append(os.path.join("..","..","build.xml"))
-        antin.append("test-download-imgs")
-        if SYS is OS.CYGWIN:
-            subprocess.call(antin)
-        elif SYS is OS.WIN:
-            theproc = subprocess.Popen(antin, shell = True, stdout=subprocess.PIPE)
-            theproc.communicate()
-    # Otherwise test away!
-    TestRunner.run_tests()
 
 class OS:
   LINUX, MAC, WIN, CYGWIN = range(4)

From e89fb445231a17e6706f5bd7df9eaadad5882056 Mon Sep 17 00:00:00 2001
From: Jeff Wallace <jwallace@basistech.com>
Date: Mon, 15 Jul 2013 13:54:09 -0400
Subject: [PATCH 06/13] TestData now stores pass/fail flags for the different
 'diffs': html report, database, and logs.

---
 test/script/regression.py | 61 +++++++++++++++++++++++++--------------
 1 file changed, 40 insertions(+), 21 deletions(-)

diff --git a/test/script/regression.py b/test/script/regression.py
index 2996ff5a0e..33bc4f101c 100644
--- a/test/script/regression.py
+++ b/test/script/regression.py
@@ -192,10 +192,6 @@ class TestRunner(object):
         Args:
             test_data: the TestData to run the ingest on.
         """
-        global parsed
-        global imgfail
-        global failedbool
-        imgfail = False
         if image_type(test_data.image_file) == IMGTYPE.UNKNOWN:
             Errors.print_error("Error: Image type is unrecognized:")
             Errors.print_error(test_data.image_file + "\n")
@@ -234,12 +230,14 @@ class TestRunner(object):
         logres = Logs.search_common_log("TskCoreException", test_data)
 
         TestResultsDiffer.run_diff(test_data)
+        test_data.overall_passed = (test_data.html_report_passed and
+        test_data.errors_diff_passed and test_data.sorted_data_passed and
+        test_data.db_dump_passed)
 
         # @@@ COnsider if we want to do this for a rebuild.
         # Make the CSV log and the html log viewer
         Reports.generate_reports(test_config.csv, test_data)
-        # Reset the test_config and return the tests sucessfully finished
-        if(failedbool):
+        if(not test_data.overall_passed):
             Errors.add_email_attachment(test_data.common_log_path)
         return logres
 
@@ -407,6 +405,10 @@ class TestData(object):
         logs_dir: a pathto_Dir, the location where autopsy logs are stored
         solr_index: a pathto_Dir, the locatino of the solr index
         db_diff_results: a DiffResults, the results of the database comparison
+        html_report_passed: a boolean, did the HTML report diff pass?
+        errors_diff_passed: a boolean, did the error diff pass?
+        db_dump_passed: a boolean, did the db dump diff pass?
+        overall_passed: a boolean, did the test pass?
         total_test_time: a String representation of the test duration
         start_date: a String representation of this TestData's start date
         end_date: a String representation of the TestData's end date
@@ -415,7 +417,6 @@ class TestData(object):
         artifact_fail: a Nat, the number of artifact failures
         heap_space: a String representation of TODO
         service_times: a String representation of TODO
-        report_passed: a boolean, indicating if the reports passed
         printerror: a listof_String, the error messages printed during this TestData's test
         printout: a listof_String, the messages pritned during this TestData's test
     """
@@ -427,11 +428,13 @@ class TestData(object):
             image: the Image to be tested.
             main_config: the global TestConfiguration.
         """
+        # Configuration Data
         self.main_config = main_config
         self.image_file = str(image)
         # TODO: This 0 should be be refactored out, but it will require rebuilding and changing of outputs.
         self.image = get_image_name(self.image_file)
         self.image_name = self.image + "(0)"
+        # Directory structure and files
         self.output_path = make_path(self.main_config.output_dir, self.image_name)
         self.autopsy_data_file = make_path(self.output_path, self.image_name + "Autopsy_data.txt")
         self.warning_log = make_local_path(self.output_path, "AutopsyLogs.txt")
@@ -447,7 +450,13 @@ class TestData(object):
         self.logs_dir = make_path(self.output_path, "logs")
         self.solr_index = make_path(self.output_path, AUTOPSY_TEST_CASE,
         "ModuleOutput", "KeywordSearch")
+        # Results and Info
         self.db_diff_results = None
+        self.html_report_passed = False
+        self.errors_diff_passed = False
+        self.sorted_data_passed = False
+        self.db_dump_passed = False
+        self.overall_passed = False
         self.total_test_time = ""
         self.start_date = ""
         self.end_date = ""
@@ -456,7 +465,7 @@ class TestData(object):
         self.artifact_fail = 0
         self.heap_space = ""
         self.service_times = ""
-        self.report_passed = False
+
         # Error tracking
         self.printerror = []
         self.printout = []
@@ -1122,25 +1131,28 @@ class TestResultsDiffer(object):
             replace = lambda file: re.sub(re.compile("\d"), "d", file)
             output_errors = test_data.get_sorted_errors_path(DBType.OUTPUT)
             gold_errors = test_data.get_sorted_errors_path(DBType.GOLD)
-
-            TestResultsDiffer._compare_text(output_errors, gold_errors,
-            test_data, replace)
+            passed = TestResultsDiffer._compare_text(output_errors, gold_errors,
+            replace)
+            test_data.errors_diff_passed = passed
 
             # Compare smart blackboard results
             output_data = test_data.get_sorted_data_path(DBType.OUTPUT)
             gold_data = test_data.get_sorted_data_path(DBType.GOLD)
-            TestResultsDiffer._compare_text(output_data, gold_data, test_data)
+            passed = TestResultsDiffer._compare_text(output_data, gold_data)
+            test_data.sorted_data_passed = passed
 
             # Compare the rest of the database (non-BB)
             output_dump = test_data.get_db_dump_path(DBType.OUTPUT)
             gold_dump = test_data.get_db_dump_path(DBType.GOLD)
-            TestResultsDiffer._compare_text(output_dump, gold_dump, test_data)
+            passed = TestResultsDiffer._compare_text(output_dump, gold_dump)
+            test_data.db_dump_passed = passed
 
             # Compare html output
             gold_report_path = test_data.get_html_report_path(DBType.GOLD)
             output_report_path = test_data.get_html_report_path(DBType.OUTPUT)
-            TestResultsDiffer._html_report_diff(test_data, gold_report_path,
+            passed = TestResultsDiffer._html_report_diff(test_data, gold_report_path,
             output_report_path)
+            test_data.html_report_passed = passed
 
             # Clean up tmp folder
             del_dir(test_data.gold_data_dir)
@@ -1154,18 +1166,17 @@ class TestResultsDiffer(object):
     # TODO: _compare_text could be made more generic with how it forms the paths (i.e. not add ".txt" in the method) and probably merged with
     # compare_errors since they both do basic comparison of text files
 
-    def _compare_text(output_file, gold_file, test_data, process=None):
+    def _compare_text(output_file, gold_file, process=None):
         """Compare two text files.
 
         Args:
             output_file: a pathto_File, the output text file
             gold_file: a pathto_File, the input text file
-            test_data: the TestData of the test being performed
             pre-process: (optional) a function of String -> String that will be
             called on each input file before the diff, if specified.
         """
         if(not file_exists(output_file)):
-            return
+            return False
         output_data = codecs.open(output_file, "r", "utf_8").read()
         gold_data = codecs.open(gold_file, "r", "utf_8").read()
 
@@ -1181,13 +1192,16 @@ class TestResultsDiffer(object):
             subprocess.call(dffcmdlst, stdout = diff_file)
             global failedbool
             Errors.add_email_attachment(diff_path)
-            msg = test_data.image_name + ":There was a difference in "
+            msg = "There was a difference in "
             msg += os.path.basename(output_file) + ".\n"
             Errors.add_email_msg(msg)
             Errors.print_error(msg)
             failedbool = True
             global imgfail
             imgfail = True
+            return False
+        else:
+            return True
 
     # TODO: get rid of test_data by changing the error reporting
     def _html_report_diff(test_data, gold_report_path, output_report_path):
@@ -1197,6 +1211,9 @@ class TestResultsDiffer(object):
             test_data: the TestData of the test being performed.
             gold_report_path: a pathto_Dir, the gold HTML report directory
             output_report_path: a pathto_Dir, the output HTML report directory
+
+        Returns:
+            true, if the reports match, false otherwise.
         """
         try:
             gold_html_files = get_files_by_ext(gold_report_path, ".html")
@@ -1222,16 +1239,18 @@ class TestResultsDiffer(object):
             print_report(errors, "REPORT COMPARISON", okay)
 
             if total["Gold"] == total["New"]:
-                test_data.report_passed = True
+                return True
             else:
                 Errors.print_error("The reports did not match each other.\n " + errors[0] +" and the " + errors[1])
-
+                return False
         except DirNotFoundException as e:
             e.print_error()
+            return False
         except Exception as e:
             Errors.print_error("Error: Unknown fatal error comparing reports.")
             Errors.print_error(str(e) + "\n")
             logging.critical(traceback.format_exc())
+            return False
 
     def _compare_report_files(a_path, b_path):
         """Compares the two specified report html files.
@@ -1495,7 +1514,7 @@ class Reports(object):
             vars.append( test_data.db_diff_results.get_artifact_comparison() )
             vars.append( test_data.db_diff_results.get_attribute_comparison() )
             vars.append( make_local_path("gold", test_data.image_name, "standard.html") )
-            vars.append( str(test_data.report_passed) )
+            vars.append( str(test_data.html_report_passed) )
             vars.append( test_config.ant_to_string() )
             # Join it together with a ", "
             output = "|".join(vars)

From c03872b5d9484bf85bfe850fe3b49cb065c681e9 Mon Sep 17 00:00:00 2001
From: Jeff Wallace <jwallace@basistech.com>
Date: Mon, 15 Jul 2013 14:14:56 -0400
Subject: [PATCH 07/13] Replaced accidental deletion in previous commit.

---
 test/script/regression.py | 2 ++
 1 file changed, 2 insertions(+)

diff --git a/test/script/regression.py b/test/script/regression.py
index 33bc4f101c..203698d93b 100644
--- a/test/script/regression.py
+++ b/test/script/regression.py
@@ -103,6 +103,8 @@ def main():
     # Global variables
     global failedbool
     global test_config
+    global imgfail
+    imgfail = False
     failedbool = False
     args = Args()
     parse_result = args.parse()

From c103c1ac6245a90975af5528a152ae6e0064662d Mon Sep 17 00:00:00 2001
From: Jeff Wallace <jwallace@basistech.com>
Date: Tue, 16 Jul 2013 10:03:54 -0400
Subject: [PATCH 08/13] Replaced imgfail globabl variable with a TestData
 attribute.

---
 test/script/regression.py | 101 ++++++++++++++++++++------------------
 1 file changed, 52 insertions(+), 49 deletions(-)

diff --git a/test/script/regression.py b/test/script/regression.py
index 203698d93b..4180a051a4 100644
--- a/test/script/regression.py
+++ b/test/script/regression.py
@@ -103,8 +103,6 @@ def main():
     # Global variables
     global failedbool
     global test_config
-    global imgfail
-    imgfail = False
     failedbool = False
     args = Args()
     parse_result = args.parse()
@@ -125,6 +123,7 @@ def main():
     # Otherwise test away!
     TestRunner.run_tests()
 
+
 class TestRunner(object):
 
     def run_tests():
@@ -163,7 +162,6 @@ class TestRunner(object):
         Reports.write_html_foot()
         if (len(logres)>0):
             failedbool = True
-            imgfail = True
             passFail = False
             for lm in logres:
                 for ln in lm:
@@ -234,7 +232,7 @@ class TestRunner(object):
         TestResultsDiffer.run_diff(test_data)
         test_data.overall_passed = (test_data.html_report_passed and
         test_data.errors_diff_passed and test_data.sorted_data_passed and
-        test_data.db_dump_passed)
+        test_data.db_dump_passed and test_data.db_diff_results.passed)
 
         # @@@ COnsider if we want to do this for a rebuild.
         # Make the CSV log and the html log viewer
@@ -717,7 +715,6 @@ class TestConfiguration(object):
                 self.img_gold = make_path(self.gold, 'tmp')
 
             # Generate the top navbar of the HTML for easy access to all images
-            images = []
             for element in parsed.getElementsByTagName("image"):
                 value = element.getAttribute("value").encode().decode("utf_8")
                 print ("Image in Config File: " + value)
@@ -725,8 +722,9 @@ class TestConfiguration(object):
                     self.images.append(value)
                 else:
                     msg = "File: " + value + " doesn't exist"
+                    Errors.print_error(msg)
                     Errors.add_email_msg(msg)
-            image_count = len(images)
+            image_count = len(self.images)
 
             # Sanity check to see if there are obvious gold images that we are not testing
             gold_count = 0
@@ -760,7 +758,9 @@ class TskDbDiff(object):
         autopsy_objects:
         artifact_comparison:
         attribute_comparision:
-        test_data:
+        report_errors: a listof_listof_String, the error messages that will be
+        printed to screen in the run_diff method
+        passed: a boolean, did the diff pass?
         autopsy_db_file:
         gold_db_file:
     """
@@ -778,6 +778,7 @@ class TskDbDiff(object):
         self.autopsy_objects = 0
         self.artifact_comparison = []
         self.attribute_comparison = []
+        self.report_errors = []
         self.autopsy_db_file = output_db_path
         self.gold_db_file = gold_db_path
 
@@ -823,14 +824,15 @@ class TskDbDiff(object):
         return cursor.fetchone()[0]
 
     def _compare_bb_artifacts(self):
-        """Compares the blackboard artifact counts of two databases."""
+        """Compares the blackboard artifact counts of two databases.
+
+        Returns:
+            True if the artifacts are the same, false otherwise.
+        """
         exceptions = []
+        passed = True
         try:
-            global failedbool
             if self.gold_artifacts != self.autopsy_artifacts:
-                failedbool = True
-                global imgfail
-                imgfail = True
                 msg = "There was a difference in the number of artifacts.\n"
                 Errors.add_email_msg(msg)
             rner = len(self.gold_artifacts)
@@ -841,49 +843,59 @@ class TskDbDiff(object):
                                 (self.gold_artifacts[type_id],
                                  self.autopsy_artifacts[type_id]))
                     exceptions.append(error)
-            return exceptions
+                    passed = False
+            self.report_errors.append(exceptions)
+            return passed
         except Exception as e:
             Errors.print_error(str(e))
             exceptions.append("Error: Unable to compare blackboard_artifacts.\n")
-            return exceptions
+            self.report_errors.append(exceptions)
+            return False
 
     def _compare_bb_attributes(self):
-        """Compares the blackboard attribute counts of two databases."""
+        """Compares the blackboard attribute counts of two databases.
+
+        Updates this TskDbDiff's report_errors with the error messages from the
+        attribute diff
+
+        Returns:
+            True is the attributes are the same, False otherwise.
+        """
         exceptions = []
+        passed = True
         try:
             if self.gold_attributes != self.autopsy_attributes:
                 error = "Attribute counts do not match. "
                 error += str("Gold: %d, Test: %d" % (self.gold_attributes, self.autopsy_attributes))
                 exceptions.append(error)
-                global failedbool
-                failedbool = True
-                global imgfail
-                imgfail = True
                 msg = "There was a difference in the number of attributes.\n"
                 Errors.add_email_msg(msg)
-                return exceptions
+                passed = False
+            self.report_errors.append(exceptions)
+            return passed
         except Exception as e:
             exceptions.append("Error: Unable to compare blackboard_attributes.\n")
-            return exceptions
+            self.report_errors.append(exceptions)
+            return False
 
     def _compare_tsk_objects(self):
         """Compares the TSK object counts of two databases."""
         exceptions = []
+        passed = True
         try:
             if self.gold_objects != self.autopsy_objects:
                 error = "TSK Object counts do not match. "
                 error += str("Gold: %d, Test: %d" % (self.gold_objects, self.autopsy_objects))
                 exceptions.append(error)
-                global failedbool
-                failedbool = True
-                global imgfail
-                imgfail = True
                 msg ="There was a difference between the tsk object counts.\n"
                 Errors.add_email_msg(msg)
-                return exceptions
+                passed = False
+            self.report_errors.append(exceptions)
+            return passed
         except Exception as e:
             exceptions.append("Error: Unable to compare tsk_objects.\n")
-            return exceptions
+            self.report_errors.append(exceptions)
+            return False
 
     def _get_basic_counts(self, autopsy_cur, gold_cur):
         """Count the items necessary to compare the databases.
@@ -941,20 +953,20 @@ class TskDbDiff(object):
         autopsy_con.close()
         gold_con.close()
 
-        exceptions = []
-
         # Compare counts
-        exceptions.append(self._compare_tsk_objects())
-        exceptions.append(self._compare_bb_artifacts())
-        exceptions.append(self._compare_bb_attributes())
+        objects_passed = self._compare_tsk_objects()
+        artifacts_passed = self._compare_bb_artifacts()
+        attributes_passed = self._compare_bb_attributes()
 
-        self.artifact_comparison = exceptions[1]
-        self.attribute_comparison = exceptions[2]
+        self.passed = objects_passed and artifacts_passed and attributes_passed
+
+        self.artifact_comparison = self.report_errors[1]
+        self.attribute_comparison = self.report_errors[2]
 
         okay = "All counts match."
-        print_report(exceptions[0], "COMPARE TSK OBJECTS", okay)
-        print_report(exceptions[1], "COMPARE ARTIFACTS", okay)
-        print_report(exceptions[2], "COMPARE ATTRIBUTES", okay)
+        print_report(self.report_errors[0], "COMPARE TSK OBJECTS", okay)
+        print_report(self.report_errors[1], "COMPARE ARTIFACTS", okay)
+        print_report(self.report_errors[2], "COMPARE ATTRIBUTES", okay)
 
         return DiffResults(self)
 
@@ -1199,8 +1211,6 @@ class TestResultsDiffer(object):
             Errors.add_email_msg(msg)
             Errors.print_error(msg)
             failedbool = True
-            global imgfail
-            imgfail = True
             return False
         else:
             return True
@@ -1304,7 +1314,6 @@ class Reports(object):
         """Generate the HTML log file."""
         # If the file doesn't exist yet, this is the first test_config to run for
         # this test, so we need to make the start of the html log
-        global imgfail
         if not file_exists(test_config.html_log):
             Reports.write_html_head()
         try:
@@ -1320,7 +1329,7 @@ class Reports(object):
                      <a href='#" + test_data.image_name + "-logs'>Logs</a>\
                      </h2>"
             # The script errors found
-            if imgfail:
+            if not test_data.overall_passed:
                 ids = 'errors1'
             else:
                 ids = 'errors'
@@ -1923,6 +1932,7 @@ class DiffResults(object):
         output_objs: a Nat, the number of output objects
         artifact_comp: a listof_String, describing the differences
         attribute_comp: a listof_String, describing the differences
+        passed: a boolean, did the diff pass?
     """
     def __init__(self, tsk_diff):
         """Inits a DiffResults
@@ -1938,24 +1948,17 @@ class DiffResults(object):
         self.attribute_comp = tsk_diff.attribute_comparison
         self.gold_artifacts = len(tsk_diff.gold_artifacts)
         self.output_artifacts = len(tsk_diff.autopsy_artifacts)
+        self.passed = tsk_diff.passed
 
     def get_artifact_comparison(self):
         if not self.artifact_comp:
             return "All counts matched"
         else:
-            global failedbool
-            failedbool = True
-            global imgfail
-            imgfail = True
             return "; ".join(self.artifact_comp)
 
     def get_attribute_comparison(self):
         if not self.attribute_comp:
             return "All counts matched"
-        global failedbool
-        failedbool = True
-        global imgfail
-        imgfail = True
         list = []
         for error in self.attribute_comp:
             list.append(error)

From 625c7c8c3b839f1a60fb30f89ea640a107fba572 Mon Sep 17 00:00:00 2001
From: Jeff Wallace <jwallace@basistech.com>
Date: Tue, 16 Jul 2013 11:38:50 -0400
Subject: [PATCH 09/13] Database dump function now takes paths as arguments
 intstead of TestData

---
 test/script/regression.py | 38 +++++++++++++++++++++-----------------
 1 file changed, 21 insertions(+), 17 deletions(-)

diff --git a/test/script/regression.py b/test/script/regression.py
index 4180a051a4..7d26202139 100644
--- a/test/script/regression.py
+++ b/test/script/regression.py
@@ -970,26 +970,29 @@ class TskDbDiff(object):
 
         return DiffResults(self)
 
-    def _dump_output_db_bb(autopsy_con, autopsy_db_file, test_data):
-        """Dumps sorted text results to the output location stored in test_data.
+    def _dump_output_db_bb(autopsy_con, db_file, data_file, sorted_data_file):
+        """Dumps sorted text results to the given output location.
 
         Smart method that deals with a blackboard comparison to avoid issues
         with different IDs based on when artifacts were created.
 
         Args:
             autopsy_con: a SQLConn to the autopsy database.
-            autopsy_db_file: a pathto_File, the output database.
-            test_data: the TestData that corresponds with this dump.
+            db_file: a pathto_File, the output database.
+            data_file: a pathto_File, the dump file to write to
+            sorted_data_file: a pathto_File, the sorted dump file to write to
         """
         autopsy_cur2 = autopsy_con.cursor()
         global failedbool
         # Get the list of all artifacts
         # @@@ Could add a SORT by parent_path in here since that is how we are going to later sort it.
         autopsy_cur2.execute("SELECT tsk_files.parent_path, tsk_files.name, blackboard_artifact_types.display_name, blackboard_artifacts.artifact_id FROM blackboard_artifact_types INNER JOIN blackboard_artifacts ON blackboard_artifact_types.artifact_type_id = blackboard_artifacts.artifact_type_id INNER JOIN tsk_files ON tsk_files.obj_id = blackboard_artifacts.obj_id")
-        database_log = codecs.open(test_data.autopsy_data_file, "wb", "utf_8")
+        database_log = codecs.open(data_file, "wb", "utf_8")
         rw = autopsy_cur2.fetchone()
         appnd = False
         counter = 0
+        artifact_count = 0
+        artifact_fail = 0
         # Cycle through artifacts
         try:
             while (rw != None):
@@ -1002,7 +1005,7 @@ class TskDbDiff(object):
                 # Get attributes for this artifact
                 autopsy_cur1 = autopsy_con.cursor()
                 looptry = True
-                test_data.artifact_count += 1
+                artifact_count += 1
                 try:
                     key = ""
                     key = str(rw[3])
@@ -1012,13 +1015,12 @@ class TskDbDiff(object):
                 except Exception as e:
                     Errors.print_error(str(e))
                     Errors.print_error(str(rw[3]))
-                    print(test_data.image_name)
                     msg ="Attributes in artifact id (in output DB)# " + str(rw[3]) + " encountered an error: " + str(e) +" .\n"
                     Errors.add_email_msg(msg)
                     looptry = False
-                    print(test_data.artifact_fail)
-                    test_data.artifact_fail += 1
-                    print(test_data.artifact_fail)
+                    print(artifact_fail)
+                    artifact_fail += 1
+                    print(artifact_fail)
                     database_log.write('Error Extracting Attributes');
 
                 # Print attributes
@@ -1036,7 +1038,7 @@ class TskDbDiff(object):
                             Errors.print_error(msg)
                             failedbool = True
                             if(not appnd):
-                                Errors.add_email_attachment(autopsy_db_file)
+                                Errors.add_email_attachment(db_file)
                                 appnd = True
                         if(not attr[0] == src):
                             msg ="There were inconsistent sources for artifact with id #" + str(rw[3]) + ".\n"
@@ -1044,7 +1046,7 @@ class TskDbDiff(object):
                             Errors.print_error(msg)
                             failedbool = True
                             if(not appnd):
-                                Errors.add_email_attachment(autopsy_db_file)
+                                Errors.add_email_attachment(db_file)
                                 appnd = True
                         try:
                             database_log.write('<attribute source="' + attr[0] + '" type="' + attr[1] + '" value="')
@@ -1064,11 +1066,11 @@ class TskDbDiff(object):
                 rw = autopsy_cur2.fetchone()
 
             # Now sort the file
-            srtcmdlst = ["sort", test_data.autopsy_data_file, "-o", test_data.get_sorted_data_path(DBType.OUTPUT)]
+            srtcmdlst = ["sort", data_file, "-o", sorted_data_file]
             subprocess.call(srtcmdlst)
-            print(test_data.artifact_fail)
-            if(test_data.artifact_fail > 0):
-                msg ="There were " + str(test_data.artifact_count) + " artifacts and " + str(test_data.artifact_fail) + " threw an exception while loading.\n"
+            print(artifact_fail)
+            if(artifact_fail > 0):
+                msg ="There were " + str(artifact_count) + " artifacts and " + str(artifact_fail) + " threw an exception while loading.\n"
                 Errors.add_email_msg(msg)
         except Exception as e:
             Errors.print_error('outer exception: ' + str(e))
@@ -1114,7 +1116,9 @@ class TskDbDiff(object):
         autopsy_cur = autopsy_con.cursor()
         # Try to query the databases. Ignore any exceptions, the function will
         # return an error later on if these do fail
-        TskDbDiff._dump_output_db_bb(autopsy_con, autopsy_db_file, test_data)
+        TskDbDiff._dump_output_db_bb(autopsy_con, autopsy_db_file,
+        test_data.autopsy_data_file,
+        test_data.get_sorted_data_path(DBType.OUTPUT))
         TskDbDiff._dump_output_db_nonbb(test_data)
         autopsy_con.close()
 

From 62087cdc5b95d67dc5258a753226021c5088bb27 Mon Sep 17 00:00:00 2001
From: Jeff Wallace <jwallace@basistech.com>
Date: Tue, 16 Jul 2013 12:54:01 -0400
Subject: [PATCH 10/13] Added email data to test configuration, modified
 Emailer.py so it doesn't need a configuration file to send an email.

---
 test/script/Emailer.py    |  82 ++++++-------
 test/script/regression.py | 240 +++++++++++++++++++-------------------
 2 files changed, 159 insertions(+), 163 deletions(-)

diff --git a/test/script/Emailer.py b/test/script/Emailer.py
index 7be20d406e..5d12e6afa3 100644
--- a/test/script/Emailer.py
+++ b/test/script/Emailer.py
@@ -7,49 +7,43 @@ from email import encoders
 import xml
 from xml.dom.minidom import parse, parseString
 
-def send_email(parsed, errorem, attachl, passFail):
-	element = parsed.getElementsByTagName("email")
-	if(len(element)<=0):
-		return
-	element = element[0]
-	toval = element.getAttribute("value").encode().decode("utf_8")
-	if(toval==None):
-		return
-	element = parsed.getElementsByTagName("mail_server")[0]
-	serverval = element.getAttribute("value").encode().decode("utf_8")
-	# Create the container (outer) email message.
-	msg = MIMEMultipart()
-	element = parsed.getElementsByTagName("subject")[0]
-	subval = element.getAttribute("value").encode().decode("utf_8")
-	if(passFail):
-		msg['Subject'] = '[Test]Autopsy ' + subval + ' test passed.'
-	else:
-		msg['Subject'] = '[Test]Autopsy ' + subval + ' test failed.'
-	# me == the sender's email address
-	# family = the list of all recipients' email addresses
-	msg['From'] = 'AutopsyTest'
-	msg['To'] = toval
-	msg.preamble = 'This is a test'
-	container = MIMEText(errorem, 'plain')
-	msg.attach(container)
-	Build_email(msg, attachl)
-	s = smtplib.SMTP(serverval)
-	try:
-		print('Sending Email')
-		s.sendmail(msg['From'], msg['To'], msg.as_string())
-	except Exception as e:
-		print(str(e))
-	s.quit()
+def send_email(to, server, subj, body, attachments):
+    """Send an email with the given information.
 
-def Build_email(msg, attachl):
-	for file in attachl:
-		part = MIMEBase('application', "octet-stream")
-		atach = open(file, "rb")
-		attch = atach.read()
-		noml = file.split("\\")
-		nom = noml[len(noml)-1]
-		part.set_payload(attch)
-		encoders.encode_base64(part)
-		part.add_header('Content-Disposition', 'attachment; filename="' + nom + '"')
-		msg.attach(part)
+    Args:
+        to: a String, the email address to send the email to
+        server: a String, the mail server to send from
+        subj: a String, the subject line of the message
+        body: a String, the body of the message
+        attachments: a listof_pathto_File, the attachements to include
+    """
+    msg = MIMEMultipart()
+    msg['Subject'] = subj
+    # me == the sender's email address
+    # family = the list of all recipients' email addresses
+    msg['From'] = 'AutopsyTest'
+    msg['To'] = to
+    msg.preamble = 'This is a test'
+    container = MIMEText(body, 'plain')
+    msg.attach(container)
+    Build_email(msg, attachments)
+    s = smtplib.SMTP(server)
+    try:
+        print('Sending Email')
+        s.sendmail(msg['From'], msg['To'], msg.as_string())
+    except Exception as e:
+        print(str(e))
+    s.quit()
+
+def Build_email(msg, attachments):
+    for file in attachments:
+        part = MIMEBase('application', "octet-stream")
+        atach = open(file, "rb")
+        attch = atach.read()
+        noml = file.split("\\")
+        nom = noml[len(noml)-1]
+        part.set_payload(attch)
+        encoders.encode_base64(part)
+        part.add_header('Content-Disposition', 'attachment; filename="' + nom + '"')
+        msg.attach(part)
 
diff --git a/test/script/regression.py b/test/script/regression.py
index 7d26202139..2bf9f4a42c 100644
--- a/test/script/regression.py
+++ b/test/script/regression.py
@@ -132,7 +132,6 @@ class TestRunner(object):
         Executes the AutopsyIngest for each image and dispatches the results based on
         the mode (rebuild or testing)
         """
-        global parsed
         global failedbool
         global html
 
@@ -162,12 +161,11 @@ class TestRunner(object):
         Reports.write_html_foot()
         if (len(logres)>0):
             failedbool = True
-            passFail = False
+            print(logres)
             for lm in logres:
                 for ln in lm:
                     Errors.add_email_msg(ln)
         if failedbool:
-            passFail = False
             msg = "The test output didn't match the gold standard.\n"
             msg += "autopsy test failed.\n"
             Errors.add_email_msg(msg)
@@ -176,13 +174,11 @@ class TestRunner(object):
             html.close()
         else:
             Errors.add_email_msg("Autopsy test passed.\n")
-            passFail = True
 
         # @@@ This fails here if we didn't parse an XML file
-        try:
-            Emailer.send_email(parsed, Errors.email_body, Errors.email_attachs, passFail)
-        except NameError:
-            Errors.print_error("Could not send e-mail because of no XML file --maybe");
+        if test_config.email_enabled:
+            Emailer.send_email(test_config.mail_to, test_config.mail_server,
+            test_config.mail_subject, Errors.email_body, Errors.email_attachs)
 
     def _run_autopsy_ingest(test_data):
         """Run Autopsy ingest for the image in the given TestData.
@@ -588,10 +584,10 @@ class TestConfiguration(object):
         self.global_csv = ""
         self.html_log = ""
         # Ant info:
-        self.known_bad_path = ""
-        self.keyword_path = ""
-        self.nsrl_path = ""
-        self.build_path = ""
+        self.known_bad_path = make_path(self.input_dir, "notablehashes.txt-md5.idx")
+        self.keyword_path = make_path(self.input_dir, "notablekeywords.xml")
+        self.nsrl_path = make_path(self.input_dir, "nsrl.txt-md5.idx")
+        self.build_path = make_path("..", "build.xml")
         # test_config info
         self.autopsy_version = ""
         self.ingest_messages = 0
@@ -600,6 +596,11 @@ class TestConfiguration(object):
         # Infinite Testing info
         timer = 0
         self.images = []
+        # Email info
+        self.email_enabled = False
+        self.mail_server = ""
+        self.mail_to = ""
+        self.mail_subject = ""
         # Set the timeout to something huge
         # The entire tester should not timeout before this number in ms
         # However it only seems to take about half this time
@@ -607,11 +608,13 @@ class TestConfiguration(object):
         self.timeout = 24 * 60 * 60 * 1000 * 1000
         self.ant = []
 
-        # Initialize Attributes
+        if not self.args.single:
+            self._load_config_file(self.args.config_file)
+        else:
+            self.images.append(self.args.single_file)
         self._init_logs()
-        self._init_imgs()
-        self._init_build_info()
-
+        #self._init_imgs()
+        #self._init_build_info()
 
     def ant_to_string(self):
         string = ""
@@ -619,46 +622,39 @@ class TestConfiguration(object):
             string += (arg + " ")
         return string
 
-    def reset(self):
-        # Set the timeout to something huge
-        # The entire tester should not timeout before this number in ms
-        # However it only seems to take about half this time
-        # And it's very buggy, so we're being careful
-        self.timeout = 24 * 60 * 60 * 1000 * 1000
-        self.ant = []
+    def _load_config_file(self, config_file):
+        """Updates this TestConfiguration's attributes from the config file.
 
-    def _init_imgs(self):
-        """Initialize the list of images to run test on."""
-        #Identify tests to run and populate test_config with list
-        # If user wants to do a single file and a list (contradictory?)
-        if self.args.single and self.args.list:
-            msg = "Cannot run both from config file and on a single file."
+        Initializes this TestConfiguration by iterating through the XML config file
+        command-line argument. Populates self.images and optional email configuration
+
+        Args:
+            config_file: ConfigFile - the configuration file to load
+        """
+        try:
+            count = 0
+            parsed_config = parse(config_file)
+            logres = []
+            counts = {}
+            if parsed_config.getElementsByTagName("indir"):
+                self.input_dir = parsed.getElementsByTagName("indir")[0].getAttribute("value").encode().decode("utf_8")
+            if parsed_config.getElementsByTagName("global_csv"):
+                self.global_csv = parsed.getElementsByTagName("global_csv")[0].getAttribute("value").encode().decode("utf_8")
+                self.global_csv = make_local_path(self.global_csv)
+            if parsed_config.getElementsByTagName("golddir"):
+                self.gold = parsed.getElementsByTagName("golddir")[0].getAttribute("value").encode().decode("utf_8")
+                self.img_gold = make_path(self.gold, 'tmp')
+
+            self._init_imgs(parsed_config)
+            self._init_build_info(parsed_config)
+            self._init_email_info(parsed_config)
+
+        except Exception as e:
+            msg = "There was an error running with the configuration file.\n"
+            msg += "\t" + str(e)
             Errors.add_email_msg(msg)
-            return
-        # If working from a configuration file
-        if self.args.list:
-           if not file_exists(self.args.config_file):
-               msg = "Configuration file does not exist at:" + self.args.config_file
-               Errors.add_email_msg(msg)
-               return
-           self._load_config_file(self.args.config_file)
-        # Else if working on a single file
-        elif self.args.single:
-           if not file_exists(self.args.single_file):
-               msg = "Image file does not exist at: " + self.args.single_file
-               Errors.add_email_msg(msg)
-               return
-           test_config.images.append(self.args.single_file)
-
-        # If user has not selected a single file, and does not want to ignore
-        #  the input directory, continue on to parsing ../input
-        if (not self.args.single) and (not self.args.ignore) and (not self.args.list):
-           self.args.config_file = "config.xml"
-           if not file_exists(self.args.config_file):
-               msg = "Configuration file does not exist at: " + self.args.config_file
-               Errors.add_email_msg(msg)
-               return
-           self._load_config_file(self.args.config_file)
+            logging.critical(traceback.format_exc())
+            print(traceback.format_exc())
 
     def _init_logs(self):
         """Setup output folder, logs, and reporting infrastructure."""
@@ -671,78 +667,56 @@ class TestConfiguration(object):
         log_name = self.output_dir + "\\regression.log"
         logging.basicConfig(filename=log_name, level=logging.DEBUG)
 
-    def _init_build_info(self):
+    def _init_build_info(self, parsed_config):
         """Initializes paths that point to information necessary to run the AutopsyIngest."""
-        global parsed
-        if(self.args.list):
-            build_elements = parsed.getElementsByTagName("build")
-            if(len(build_elements) <= 0):
-                build_path = make_path("..", "build.xml")
+        build_elements = parsed_config.getElementsByTagName("build")
+        if build_elements:
+            build_element = build_elements[0]
+            build_path = build_element.getAttribute("value").encode().decode("utf_8")
+            self.build_path = build_path
+
+    def _init_imgs(self, parsed_config):
+        """Initialize the list of images to run test on."""
+        for element in parsed_config.getElementsByTagName("image"):
+            value = element.getAttribute("value").encode().decode("utf_8")
+            print ("Image in Config File: " + value)
+            if file_exists(value):
+                self.images.append(value)
             else:
-                build_element = build_elements[0]
-                build_path = build_element.getAttribute("value").encode().decode("utf_8")
-                if(build_path == None):
-                    build_path = make_path("..", "build.xml")
-        else:
-            build_path = make_path("..", "build.xml")
-        self.build_path = build_path
-        self.known_bad_path = make_path(self.input_dir, "notablehashes.txt-md5.idx")
-        self.keyword_path = make_path(self.input_dir, "notablekeywords.xml")
-        self.nsrl_path = make_path(self.input_dir, "nsrl.txt-md5.idx")
+                msg = "File: " + value + " doesn't exist"
+                Errors.print_error(msg)
+                Errors.add_email_msg(msg)
+        image_count = len(self.images)
 
-    def _load_config_file(self, config_file):
-        """Updates this TestConfiguration's attributes from the config file.
+        # Sanity check to see if there are obvious gold images that we are not testing
+        gold_count = 0
+        for file in os.listdir(self.gold):
+            if not(file == 'tmp'):
+                gold_count+=1
 
-        Initializes this TestConfiguration by iterating through the XML config file
-        command-line argument. Populates self.images and optional email configuration
+        if (image_count > gold_count):
+            print("******Alert: There are more input images than gold standards, some images will not be properly tested.\n")
+        elif (image_count < gold_count):
+            print("******Alert: There are more gold standards than input images, this will not check all gold Standards.\n")
 
-        Args:
-            config_file: ConfigFile - the configuration file to load
-        """
-        try:
-            global parsed
-            count = 0
-            parsed = parse(config_file)
-            logres = []
-            counts = {}
-            if parsed.getElementsByTagName("indir"):
-                self.input_dir = parsed.getElementsByTagName("indir")[0].getAttribute("value").encode().decode("utf_8")
-            if parsed.getElementsByTagName("global_csv"):
-                self.global_csv = parsed.getElementsByTagName("global_csv")[0].getAttribute("value").encode().decode("utf_8")
-                self.global_csv = make_local_path(self.global_csv)
-            if parsed.getElementsByTagName("golddir"):
-                self.gold = parsed.getElementsByTagName("golddir")[0].getAttribute("value").encode().decode("utf_8")
-                self.img_gold = make_path(self.gold, 'tmp')
+    def _init_email_info(self, parsed_config):
+        """Initializes email information dictionary"""
+        email_elements = parsed_config.getElementsByTagName("email")
+        if email_elements:
+            mail_to = email_elements[0]
+            self.mail_to = mail_to.getAttribute("value").encode().decode("utf_8")
+        mail_server_elements = parsed_config.getElementsByTagName("mail_server")
+        if mail_server_elements:
+            mail_from = mail_server_elements[0]
+            self.mail_server = mail_from.getAttribute("value").encode().decode("utf_8")
+        subject_elements = parsed_config.getElementsByTagName("subject")
+        if subject_elements:
+            subject = subject_elements[0]
+            self.mail_subject = subject.getAttribute("value").encode().decode("utf_8")
+        if self.mail_server and self.mail_to:
+            self.email_enabled = True
 
-            # Generate the top navbar of the HTML for easy access to all images
-            for element in parsed.getElementsByTagName("image"):
-                value = element.getAttribute("value").encode().decode("utf_8")
-                print ("Image in Config File: " + value)
-                if file_exists(value):
-                    self.images.append(value)
-                else:
-                    msg = "File: " + value + " doesn't exist"
-                    Errors.print_error(msg)
-                    Errors.add_email_msg(msg)
-            image_count = len(self.images)
 
-            # Sanity check to see if there are obvious gold images that we are not testing
-            gold_count = 0
-            for file in os.listdir(self.gold):
-                if not(file == 'tmp'):
-                    gold_count+=1
-
-            if (image_count > gold_count):
-                print("******Alert: There are more input images than gold standards, some images will not be properly tested.\n")
-            elif (image_count < gold_count):
-                print("******Alert: There are more gold standards than input images, this will not check all gold Standards.\n")
-
-        except Exception as e:
-            msg = "There was an error running with the configuration file.\n"
-            msg += "\t" + str(e)
-            Errors.add_email_msg(msg)
-            logging.critical(traceback.format_exc())
-            print(traceback.format_exc())
 
 class TskDbDiff(object):
     """Represents the differences between the gold and output databases.
@@ -2065,6 +2039,34 @@ class Args(object):
                 print(usage())
                 return False
         # Return the args were sucessfully parsed
+        return self._sanity_check()
+
+    def _sanity_check(self):
+        """Check to make sure there are no conflicting arguments and the
+        specified files exist.
+
+        Returns:
+            False if there are conflicting arguments or a specified file does
+            not exist, True otherwise
+        """
+        if self.single and self.list:
+            print("Cannot run both from config file and on a single file.")
+            return False
+        if self.list:
+           if not file_exists(self.config_file):
+               print("Configuration file does not exist at:",
+               self.config_file)
+               return False
+        elif self.single:
+           if not file_exists(self.single_file):
+               msg = "Image file does not exist at: " + self.single_file
+               return False
+        if (not self.single) and (not self.ignore) and (not self.list):
+           self.config_file = "config.xml"
+           if not file_exists(self.config_file):
+               msg = "Configuration file does not exist at: " + self.config_file
+               return False
+
         return True
 
 ####

From 9f2015e4ce63ab08ae541542ce40263fdc763ec3 Mon Sep 17 00:00:00 2001
From: Jeff Wallace <jwallace@basistech.com>
Date: Tue, 16 Jul 2013 13:34:23 -0400
Subject: [PATCH 11/13] Removed global variable failedbool, updated overall
 pass/fail output message

---
 test/script/regression.py | 29 +++++++++++------------------
 1 file changed, 11 insertions(+), 18 deletions(-)

diff --git a/test/script/regression.py b/test/script/regression.py
index 2bf9f4a42c..4a9e86ac20 100644
--- a/test/script/regression.py
+++ b/test/script/regression.py
@@ -101,9 +101,7 @@ Day = 0
 #----------------------#
 def main():
     # Global variables
-    global failedbool
     global test_config
-    failedbool = False
     args = Args()
     parse_result = args.parse()
     test_config = TestConfiguration(args)
@@ -132,7 +130,6 @@ class TestRunner(object):
         Executes the AutopsyIngest for each image and dispatches the results based on
         the mode (rebuild or testing)
         """
-        global failedbool
         global html
 
         test_data_list = [ TestData(image, test_config) for image in test_config.images ]
@@ -143,8 +140,7 @@ class TestRunner(object):
         for test_data in test_data_list:
             Errors.clear_print_logs()
             Errors.set_testing_phase(test_data.image)
-            if not (test_config.args.rebuild or
-                os.path.exists(test_data.gold_archive)):
+            if not (test_config.args.rebuild or os.path.exists(test_data.gold_archive)):
                 msg = "Gold standard doesn't exist, skipping image:"
                 Errors.print_error(msg)
                 Errors.print_error(test_data.gold_archive)
@@ -159,23 +155,25 @@ class TestRunner(object):
             test_data.printerror = Errors.printerror
 
         Reports.write_html_foot()
+        # TODO: move this elsewhere
         if (len(logres)>0):
-            failedbool = True
-            print(logres)
             for lm in logres:
                 for ln in lm:
                     Errors.add_email_msg(ln)
-        if failedbool:
-            msg = "The test output didn't match the gold standard.\n"
-            msg += "autopsy test failed.\n"
+
+        # TODO: possibly worth putting this in a sub method
+        if all([ test_data.overall_passed for test_data in test_data_list ]):
+            Errors.add_email_msg("All images passed.\n")
+        else:
+            msg = "The following images failed:\n"
+            for test_data in test_data_list:
+                if not test_data.overall_passed:
+                    msg += "\t" + test_data.image + "\n"
             Errors.add_email_msg(msg)
             html = open(test_config.html_log)
             Errors.add_email_attachment(html.name)
             html.close()
-        else:
-            Errors.add_email_msg("Autopsy test passed.\n")
 
-        # @@@ This fails here if we didn't parse an XML file
         if test_config.email_enabled:
             Emailer.send_email(test_config.mail_to, test_config.mail_server,
             test_config.mail_subject, Errors.email_body, Errors.email_attachs)
@@ -957,7 +955,6 @@ class TskDbDiff(object):
             sorted_data_file: a pathto_File, the sorted dump file to write to
         """
         autopsy_cur2 = autopsy_con.cursor()
-        global failedbool
         # Get the list of all artifacts
         # @@@ Could add a SORT by parent_path in here since that is how we are going to later sort it.
         autopsy_cur2.execute("SELECT tsk_files.parent_path, tsk_files.name, blackboard_artifact_types.display_name, blackboard_artifacts.artifact_id FROM blackboard_artifact_types INNER JOIN blackboard_artifacts ON blackboard_artifact_types.artifact_type_id = blackboard_artifacts.artifact_type_id INNER JOIN tsk_files ON tsk_files.obj_id = blackboard_artifacts.obj_id")
@@ -1010,7 +1007,6 @@ class TskDbDiff(object):
                             msg = "There were too many values for attribute type: " + attr[1] + " for artifact with id #" + str(rw[3]) + ".\n"
                             Errors.add_email_msg(msg)
                             Errors.print_error(msg)
-                            failedbool = True
                             if(not appnd):
                                 Errors.add_email_attachment(db_file)
                                 appnd = True
@@ -1018,7 +1014,6 @@ class TskDbDiff(object):
                             msg ="There were inconsistent sources for artifact with id #" + str(rw[3]) + ".\n"
                             Errors.add_email_msg(msg)
                             Errors.print_error(msg)
-                            failedbool = True
                             if(not appnd):
                                 Errors.add_email_attachment(db_file)
                                 appnd = True
@@ -1182,13 +1177,11 @@ class TestResultsDiffer(object):
             diff_file = codecs.open(diff_path, "wb", "utf_8")
             dffcmdlst = ["diff", output_file, gold_file]
             subprocess.call(dffcmdlst, stdout = diff_file)
-            global failedbool
             Errors.add_email_attachment(diff_path)
             msg = "There was a difference in "
             msg += os.path.basename(output_file) + ".\n"
             Errors.add_email_msg(msg)
             Errors.print_error(msg)
-            failedbool = True
             return False
         else:
             return True

From 65471d726a757a72cdfb897b94ed234518d34310 Mon Sep 17 00:00:00 2001
From: Jeff Wallace <jwallace@basistech.com>
Date: Tue, 16 Jul 2013 14:20:14 -0400
Subject: [PATCH 12/13] Removed global variable test_config, updated
 appropriate references

---
 test/script/regression.py | 186 ++++++++++++++++++++------------------
 1 file changed, 98 insertions(+), 88 deletions(-)

diff --git a/test/script/regression.py b/test/script/regression.py
index 4a9e86ac20..417a207b00 100644
--- a/test/script/regression.py
+++ b/test/script/regression.py
@@ -101,7 +101,6 @@ Day = 0
 #----------------------#
 def main():
     # Global variables
-    global test_config
     args = Args()
     parse_result = args.parse()
     test_config = TestConfiguration(args)
@@ -119,22 +118,20 @@ def main():
             theproc = subprocess.Popen(antin, shell = True, stdout=subprocess.PIPE)
             theproc.communicate()
     # Otherwise test away!
-    TestRunner.run_tests()
+    TestRunner.run_tests(test_config)
 
 
 class TestRunner(object):
 
-    def run_tests():
+    def run_tests(test_config):
         """Run the tests specified by the main TestConfiguration.
 
         Executes the AutopsyIngest for each image and dispatches the results based on
         the mode (rebuild or testing)
         """
-        global html
-
         test_data_list = [ TestData(image, test_config) for image in test_config.images ]
 
-        Reports.html_add_images(test_config.images)
+        Reports.html_add_images(test_config.html_log, test_config.images)
 
         logres =[]
         for test_data in test_data_list:
@@ -154,7 +151,7 @@ class TestRunner(object):
             test_data.printout = Errors.printout
             test_data.printerror = Errors.printerror
 
-        Reports.write_html_foot()
+        Reports.write_html_foot(test_config.html_log)
         # TODO: move this elsewhere
         if (len(logres)>0):
             for lm in logres:
@@ -228,9 +225,7 @@ class TestRunner(object):
         test_data.errors_diff_passed and test_data.sorted_data_passed and
         test_data.db_dump_passed and test_data.db_diff_results.passed)
 
-        # @@@ COnsider if we want to do this for a rebuild.
-        # Make the CSV log and the html log viewer
-        Reports.generate_reports(test_config.csv, test_data)
+        Reports.generate_reports(test_data)
         if(not test_data.overall_passed):
             Errors.add_email_attachment(test_data.common_log_path)
         return logres
@@ -252,7 +247,7 @@ class TestRunner(object):
         Args:
             test_data: the TestData
         """
-        if not test_config.args.keep:
+        if not test_data.main_config.args.keep:
             if clear_dir(test_data.solr_index):
                 print_report([], "DELETE SOLR INDEX", "Solr index deleted.")
         else:
@@ -264,9 +259,10 @@ class TestRunner(object):
         Args:
             test_data: the TestData
         """
-        if test_config.args.exception:
-            exceptions = search_logs(test_config.args.exception_string, test_data)
-            okay = "No warnings or exceptions found containing text '" + test_config.args.exception_string + "'."
+        if test_data.main_config.args.exception:
+            exceptions = search_logs(test_data.main_config.args.exception_string, test_data)
+            okay = ("No warnings or exceptions found containing text '" +
+            test_data.main_config.args.exception_string + "'.")
             print_report(exceptions, "EXCEPTION", okay)
 
     def rebuild(test_data):
@@ -274,6 +270,7 @@ class TestRunner(object):
 
         Copies the test-generated database and html report files into the gold directory.
         """
+        test_config = test_data.main_config
         # Errors to print
         errors = []
         # Delete the current gold standards
@@ -339,38 +336,38 @@ class TestRunner(object):
         Args:
             test_data: the TestData
         """
+        test_config = test_data.main_config
         # Set up the directories
-        test_config_path = os.path.join(test_config.output_dir, test_data.image_name)
-        if dir_exists(test_config_path):
-            shutil.rmtree(test_config_path)
-        os.makedirs(test_config_path)
-        test_config.ant = ["ant"]
-        test_config.ant.append("-v")
-        test_config.ant.append("-f")
+        if dir_exists(test_data.output_path):
+            shutil.rmtree(test_data.output_path)
+        os.makedirs(test_data.output_path)
+        test_data.ant = ["ant"]
+        test_data.ant.append("-v")
+        test_data.ant.append("-f")
     #   case.ant.append(case.build_path)
-        test_config.ant.append(os.path.join("..","..","Testing","build.xml"))
-        test_config.ant.append("regression-test")
-        test_config.ant.append("-l")
-        test_config.ant.append(test_data.antlog_dir)
-        test_config.ant.append("-Dimg_path=" + test_data.image_file)
-        test_config.ant.append("-Dknown_bad_path=" + test_config.known_bad_path)
-        test_config.ant.append("-Dkeyword_path=" + test_config.keyword_path)
-        test_config.ant.append("-Dnsrl_path=" + test_config.nsrl_path)
-        test_config.ant.append("-Dgold_path=" + test_config.gold)
-        test_config.ant.append("-Dout_path=" +
+        test_data.ant.append(os.path.join("..","..","Testing","build.xml"))
+        test_data.ant.append("regression-test")
+        test_data.ant.append("-l")
+        test_data.ant.append(test_data.antlog_dir)
+        test_data.ant.append("-Dimg_path=" + test_data.image_file)
+        test_data.ant.append("-Dknown_bad_path=" + test_config.known_bad_path)
+        test_data.ant.append("-Dkeyword_path=" + test_config.keyword_path)
+        test_data.ant.append("-Dnsrl_path=" + test_config.nsrl_path)
+        test_data.ant.append("-Dgold_path=" + test_config.gold)
+        test_data.ant.append("-Dout_path=" +
         make_local_path(test_data.output_path))
-        test_config.ant.append("-Dignore_unalloc=" + "%s" % test_config.args.unallocated)
-        test_config.ant.append("-Dtest.timeout=" + str(test_config.timeout))
+        test_data.ant.append("-Dignore_unalloc=" + "%s" % test_config.args.unallocated)
+        test_data.ant.append("-Dtest.timeout=" + str(test_config.timeout))
 
         Errors.print_out("Ingesting Image:\n" + test_data.image_file + "\n")
-        Errors.print_out("CMD: " + " ".join(test_config.ant))
+        Errors.print_out("CMD: " + " ".join(test_data.ant))
         Errors.print_out("Starting test...\n")
-        antoutpth = make_local_path(test_config.output_dir, "antRunOutput.txt")
+        antoutpth = make_local_path(test_data.main_config.output_dir, "antRunOutput.txt")
         antout = open(antoutpth, "a")
         if SYS is OS.CYGWIN:
-            subprocess.call(test_config.ant, stdout=subprocess.PIPE)
+            subprocess.call(test_data.ant, stdout=subprocess.PIPE)
         elif SYS is OS.WIN:
-            theproc = subprocess.Popen(test_config.ant, shell = True, stdout=subprocess.PIPE)
+            theproc = subprocess.Popen(test_data.ant, shell = True, stdout=subprocess.PIPE)
             theproc.communicate()
         antout.close()
 
@@ -383,6 +380,7 @@ class TestData(object):
 
     Attributes:
         main_config: the global TestConfiguration
+        ant: a listof_String, the ant command for this TestData
         image_file: a pathto_Image, the image for this TestData
         image: a String, the image file's name
         image_name: a String, the image file's name with a trailing (0)
@@ -411,6 +409,10 @@ class TestData(object):
         artifact_fail: a Nat, the number of artifact failures
         heap_space: a String representation of TODO
         service_times: a String representation of TODO
+        autopsy_version: a String, the version of autopsy that was run
+        ingest_messages: a Nat, the number of ingest messages
+        indexed_files: a Nat, the number of files indexed during the ingest
+        indexed_chunks: a Nat, the number of chunks indexed during the ingest
         printerror: a listof_String, the error messages printed during this TestData's test
         printout: a listof_String, the messages pritned during this TestData's test
     """
@@ -424,6 +426,7 @@ class TestData(object):
         """
         # Configuration Data
         self.main_config = main_config
+        self.ant = []
         self.image_file = str(image)
         # TODO: This 0 should be be refactored out, but it will require rebuilding and changing of outputs.
         self.image = get_image_name(self.image_file)
@@ -451,6 +454,7 @@ class TestData(object):
         self.sorted_data_passed = False
         self.db_dump_passed = False
         self.overall_passed = False
+        # Ingest info
         self.total_test_time = ""
         self.start_date = ""
         self.end_date = ""
@@ -459,11 +463,20 @@ class TestData(object):
         self.artifact_fail = 0
         self.heap_space = ""
         self.service_times = ""
-
+        self.autopsy_version = ""
+        self.ingest_messages = 0
+        self.indexed_files = 0
+        self.indexed_chunks = 0
         # Error tracking
         self.printerror = []
         self.printout = []
 
+    def ant_to_string(self):
+        string = ""
+        for arg in self.ant:
+            string += (arg + " ")
+        return string
+
     def get_db_path(self, db_type):
         """Get the path to the database file that corresponds to the given DBType.
 
@@ -586,11 +599,6 @@ class TestConfiguration(object):
         self.keyword_path = make_path(self.input_dir, "notablekeywords.xml")
         self.nsrl_path = make_path(self.input_dir, "nsrl.txt-md5.idx")
         self.build_path = make_path("..", "build.xml")
-        # test_config info
-        self.autopsy_version = ""
-        self.ingest_messages = 0
-        self.indexed_files = 0
-        self.indexed_chunks = 0
         # Infinite Testing info
         timer = 0
         self.images = []
@@ -604,7 +612,6 @@ class TestConfiguration(object):
         # However it only seems to take about half this time
         # And it's very buggy, so we're being careful
         self.timeout = 24 * 60 * 60 * 1000 * 1000
-        self.ant = []
 
         if not self.args.single:
             self._load_config_file(self.args.config_file)
@@ -614,11 +621,6 @@ class TestConfiguration(object):
         #self._init_imgs()
         #self._init_build_info()
 
-    def ant_to_string(self):
-        string = ""
-        for arg in self.ant:
-            string += (arg + " ")
-        return string
 
     def _load_config_file(self, config_file):
         """Updates this TestConfiguration's attributes from the config file.
@@ -1268,28 +1270,27 @@ class TestResultsDiffer(object):
 
 
 class Reports(object):
-    def generate_reports(csv_path, test_data):
+    def generate_reports(test_data):
         """Generate the reports for a single test
 
         Args:
-            csv_path: a pathto_File, the csv file
             test_data: the TestData
         """
         Reports._generate_html(test_data)
-        if test_config.global_csv:
-            Reports._generate_csv(test_config.global_csv, test_data)
+        if test_data.main_config.global_csv:
+            Reports._generate_csv(test_data.main_config.global_csv, test_data)
         else:
-            Reports._generate_csv(csv_path, test_data)
+            Reports._generate_csv(test_data.main_config.csv, test_data)
 
     def _generate_html(test_data):
         """Generate the HTML log file."""
         # If the file doesn't exist yet, this is the first test_config to run for
         # this test, so we need to make the start of the html log
-        if not file_exists(test_config.html_log):
+        html_log = test_data.main_config.html_log
+        if not file_exists(html_log):
             Reports.write_html_head()
         try:
-            global html
-            html = open(test_config.html_log, "a")
+            html = open(html_log, "a")
             # The image title
             title = "<h1><a name='" + test_data.image_name + "'>" + test_data.image_name + " \
                         <span>tested on <strong>" + socket.gethostname() + "</strong></span></a></h1>\
@@ -1336,9 +1337,9 @@ class Reports(object):
             info += "<tr><td>Image Name:</td>"
             info += "<td>" + test_data.image_name + "</td></tr>"
             info += "<tr><td>test_config Output Directory:</td>"
-            info += "<td>" + test_config.output_dir + "</td></tr>"
+            info += "<td>" + test_data.main_config.output_dir + "</td></tr>"
             info += "<tr><td>Autopsy Version:</td>"
-            info += "<td>" + test_config.autopsy_version + "</td></tr>"
+            info += "<td>" + test_data.autopsy_version + "</td></tr>"
             info += "<tr><td>Heap Space:</td>"
             info += "<td>" + test_data.heap_space + "</td></tr>"
             info += "<tr><td>Test Start Date:</td>"
@@ -1364,11 +1365,11 @@ class Reports(object):
             info += "<tr><td>TskDataExceptions:</td>"
             info += "<td>" + str(len(search_log_set("autopsy", "TskDataException", test_data))) + "</td></tr>"
             info += "<tr><td>Ingest Messages Count:</td>"
-            info += "<td>" + str(test_config.ingest_messages) + "</td></tr>"
+            info += "<td>" + str(test_data.ingest_messages) + "</td></tr>"
             info += "<tr><td>Indexed Files Count:</td>"
-            info += "<td>" + str(test_config.indexed_files) + "</td></tr>"
+            info += "<td>" + str(test_data.indexed_files) + "</td></tr>"
             info += "<tr><td>Indexed File Chunks Count:</td>"
-            info += "<td>" + str(test_config.indexed_chunks) + "</td></tr>"
+            info += "<td>" + str(test_data.indexed_chunks) + "</td></tr>"
             info += "<tr><td>Out Of Disk Space:\
                              <p style='font-size: 11px;'>(will skew other test results)</p></td>"
             info += "<td>" + str(len(search_log_set("autopsy", "Stopping ingest due to low disk space on disk", test_data))) + "</td></tr>"
@@ -1400,14 +1401,18 @@ class Reports(object):
             html.close()
         except Exception as e:
             Errors.print_error("Error: Unknown fatal error when creating HTML log at:")
-            Errors.print_error(test_config.html_log)
+            Errors.print_error(html_log)
             Errors.print_error(str(e) + "\n")
             logging.critical(traceback.format_exc())
 
-    def write_html_head():
-        """Write the top of the HTML log file."""
-        print(test_config.html_log)
-        html = open(str(test_config.html_log), "a")
+    def write_html_head(html_log):
+        """Write the top of the HTML log file.
+
+        Args:
+            html_log: a pathto_File, the global HTML log
+        """
+        print(html_log)
+        html = open(str(html_log), "a")
         head = "<html>\
                 <head>\
                 <title>AutopsyTesttest_config Output</title>\
@@ -1431,24 +1436,29 @@ class Reports(object):
         html.write(head)
         html.close()
 
-    def write_html_foot():
-        """Write the bottom of the HTML log file."""
-        html = open(test_config.html_log, "a")
+    def write_html_foot(html_log):
+        """Write the bottom of the HTML log file.
+
+        Args:
+            html_log: a pathto_File, the global HTML log
+        """
+        html = open(html_log, "a")
         head = "</body></html>"
         html.write(head)
         html.close()
 
-    def html_add_images(full_image_names):
+    def html_add_images(html_log, full_image_names):
         """Add all the image names to the HTML log.
 
         Args:
             full_image_names: a listof_String, each representing an image name
+            html_log: a pathto_File, the global HTML log
         """
         # If the file doesn't exist yet, this is the first test_config to run for
         # this test, so we need to make the start of the html log
-        if not file_exists(test_config.html_log):
-            Reports.write_html_head()
-        html = open(test_config.html_log, "a")
+        if not file_exists(html_log):
+            Reports.write_html_head(html_log)
+        html = open(html_log, "a")
         links = []
         for full_name in full_image_names:
             name = get_image_name(full_name)
@@ -1470,9 +1480,9 @@ class Reports(object):
             vars = []
             vars.append( test_data.image_file )
             vars.append( test_data.image_name )
-            vars.append( test_config.output_dir )
+            vars.append( test_data.main_config.output_dir )
             vars.append( socket.gethostname() )
-            vars.append( test_config.autopsy_version )
+            vars.append( test_data.autopsy_version )
             vars.append( test_data.heap_space )
             vars.append( test_data.start_date )
             vars.append( test_data.end_date )
@@ -1485,9 +1495,9 @@ class Reports(object):
             vars.append( str(Reports._get_num_memory_errors("solr", test_data)) )
             vars.append( str(len(search_log_set("autopsy", "TskCoreException", test_data))) )
             vars.append( str(len(search_log_set("autopsy", "TskDataException", test_data))) )
-            vars.append( str(test_config.ingest_messages) )
-            vars.append( str(test_config.indexed_files) )
-            vars.append( str(test_config.indexed_chunks) )
+            vars.append( str(test_data.ingest_messages) )
+            vars.append( str(test_data.indexed_files) )
+            vars.append( str(test_data.indexed_chunks) )
             vars.append( str(len(search_log_set("autopsy", "Stopping ingest due to low disk space on disk", test_data))) )
             vars.append( str(test_data.db_diff_results.output_objs) )
             vars.append( str(test_data.db_diff_results.output_artifacts) )
@@ -1497,7 +1507,7 @@ class Reports(object):
             vars.append( test_data.db_diff_results.get_attribute_comparison() )
             vars.append( make_local_path("gold", test_data.image_name, "standard.html") )
             vars.append( str(test_data.html_report_passed) )
-            vars.append( test_config.ant_to_string() )
+            vars.append( test_data.ant_to_string() )
             # Join it together with a ", "
             output = "|".join(vars)
             output += "\n"
@@ -1564,13 +1574,13 @@ class Logs(object):
     def generate_log_data(test_data):
         Logs._generate_common_log(test_data)
         try:
-            Logs._fill_test_config_data(test_data)
+            Logs._fill_ingest_data(test_data)
         except Exception as e:
             Errors.print_error("Error: Unknown fatal error when filling test_config data.")
             Errors.print_error(str(e) + "\n")
             logging.critical(traceback.format_exc())
         # If running in verbose mode (-v)
-        if test_config.args.verbose:
+        if test_data.main_config.args.verbose:
             errors = Logs._report_all_errors()
             okay = "No warnings or errors in any log files."
             print_report(errors, "VERBOSE", okay)
@@ -1584,7 +1594,7 @@ class Logs(object):
             common_log.write("--------------------------------------------------\n")
             common_log.write(test_data.image_name + "\n")
             common_log.write("--------------------------------------------------\n")
-            rep_path = make_local_path(test_config.output_dir)
+            rep_path = make_local_path(test_data.main_config.output_dir)
             rep_path = rep_path.replace("\\\\", "\\")
             for file in os.listdir(logs_path):
                 log = codecs.open(make_path(logs_path, file), "r", "utf_8")
@@ -1610,7 +1620,7 @@ class Logs(object):
             Errors.print_error(traceback.format_exc())
             logging.critical(traceback.format_exc())
 
-    def _fill_test_config_data(test_data):
+    def _fill_ingest_data(test_data):
         """Fill the global test config's variables that require the log files."""
         try:
             # Open autopsy.log.0
@@ -1639,7 +1649,7 @@ class Logs(object):
             # Set Autopsy version, heap space, ingest time, and service times
 
             version_line = search_logs("INFO: Application name: Autopsy, version:", test_data)[0]
-            test_config.autopsy_version = get_word_at(version_line, 5).rstrip(",")
+            test_data.autopsy_version = get_word_at(version_line, 5).rstrip(",")
 
             test_data.heap_space = search_logs("Heap memory usage:", test_data)[0].rstrip().split(": ")[1]
 
@@ -1647,13 +1657,13 @@ class Logs(object):
             test_data.total_ingest_time = get_word_at(ingest_line, 6).rstrip()
 
             message_line = search_log_set("autopsy", "Ingest messages count:", test_data)[0]
-            test_config.ingest_messages = int(message_line.rstrip().split(": ")[2])
+            test_data.ingest_messages = int(message_line.rstrip().split(": ")[2])
 
             files_line = search_log_set("autopsy", "Indexed files count:", test_data)[0]
-            test_config.indexed_files = int(files_line.rstrip().split(": ")[2])
+            test_data.indexed_files = int(files_line.rstrip().split(": ")[2])
 
             chunks_line = search_log_set("autopsy", "Indexed file chunks count:", test_data)[0]
-            test_config.indexed_chunks = int(chunks_line.rstrip().split(": ")[2])
+            test_data.indexed_chunks = int(chunks_line.rstrip().split(": ")[2])
         except Exception as e:
             Errors.print_error("Error: Unable to find the required information to fill test_config data.")
             Errors.print_error(str(e) + "\n")

From f180665333fae941dd7b5cbb1765d7f36537a6e2 Mon Sep 17 00:00:00 2001
From: Jeff Wallace <jwallace@basistech.com>
Date: Tue, 16 Jul 2013 15:18:03 -0400
Subject: [PATCH 13/13] Updated documentation of functions and classes.

---
 test/script/regression.py | 124 ++++++++++++++++++++++++++------------
 1 file changed, 85 insertions(+), 39 deletions(-)

diff --git a/test/script/regression.py b/test/script/regression.py
index 417a207b00..93b68457f6 100644
--- a/test/script/regression.py
+++ b/test/script/regression.py
@@ -57,13 +57,6 @@ from regression_utils import *
 # Variable, function, and class names are written in Python conventions:
 # this_is_a_variable    this_is_a_function()    ThisIsAClass
 #
-# All variables that are needed throughout the script have been initialized
-# in a global class.
-# - Command line arguments are in Args (named args)
-# - Global Test Configuration is in TestConfiguration(named test_config)
-# - Queried information from the databases is in TskDbDiff (named database)
-# Feel free to add additional global classes or add to the existing ones,
-# but do not overwrite any existing variables as they are used frequently.
 #
 
 
@@ -100,7 +93,7 @@ Day = 0
 #        Main          #
 #----------------------#
 def main():
-    # Global variables
+    """Parse the command-line arguments, create the configuration, and run the tests."""
     args = Args()
     parse_result = args.parse()
     test_config = TestConfiguration(args)
@@ -122,6 +115,7 @@ def main():
 
 
 class TestRunner(object):
+    """A collection of functions to run the regression tests."""
 
     def run_tests(test_config):
         """Run the tests specified by the main TestConfiguration.
@@ -676,7 +670,7 @@ class TestConfiguration(object):
             self.build_path = build_path
 
     def _init_imgs(self, parsed_config):
-        """Initialize the list of images to run test on."""
+        """Initialize the list of images to run tests on."""
         for element in parsed_config.getElementsByTagName("image"):
             value = element.getAttribute("value").encode().decode("utf_8")
             print ("Image in Config File: " + value)
@@ -742,7 +736,8 @@ class TskDbDiff(object):
         """Constructor for TskDbDiff.
 
         Args:
-            test_data: TestData - the test data to compare
+            output_db_path: a pathto_File, the output database
+            gold_db_path: a pathto_File, the gold database
         """
         self.gold_artifacts = []
         self.autopsy_artifacts = []
@@ -881,9 +876,6 @@ class TskDbDiff(object):
         Args:
             autopsy_cur: SQLCursor - the cursor for the output database
             gold_cur:    SQLCursor - the cursor for the gold database
-
-        Returns:
-
         """
         try:
             # Objects
@@ -1139,7 +1131,7 @@ class TestResultsDiffer(object):
             # Compare html output
             gold_report_path = test_data.get_html_report_path(DBType.GOLD)
             output_report_path = test_data.get_html_report_path(DBType.OUTPUT)
-            passed = TestResultsDiffer._html_report_diff(test_data, gold_report_path,
+            passed = TestResultsDiffer._html_report_diff(gold_report_path,
             output_report_path)
             test_data.html_report_passed = passed
 
@@ -1151,10 +1143,6 @@ class TestResultsDiffer(object):
             Errors.print_error(str(e) + "\n")
             print(traceback.format_exc())
 
-
-    # TODO: _compare_text could be made more generic with how it forms the paths (i.e. not add ".txt" in the method) and probably merged with
-    # compare_errors since they both do basic comparison of text files
-
     def _compare_text(output_file, gold_file, process=None):
         """Compare two text files.
 
@@ -1188,12 +1176,10 @@ class TestResultsDiffer(object):
         else:
             return True
 
-    # TODO: get rid of test_data by changing the error reporting
-    def _html_report_diff(test_data, gold_report_path, output_report_path):
+    def _html_report_diff(gold_report_path, output_report_path):
         """Compare the output and gold html reports.
 
         Args:
-            test_data: the TestData of the test being performed.
             gold_report_path: a pathto_Dir, the gold HTML report directory
             output_report_path: a pathto_Dir, the output HTML report directory
 
@@ -1571,7 +1557,13 @@ class Reports(object):
                 len(search_log_set(type, "OutOfMemoryException", test_data)))
 
 class Logs(object):
+
     def generate_log_data(test_data):
+        """Find and handle relevent data from the Autopsy logs.
+
+        Args:
+            test_data: the TestData whose logs to examine
+        """
         Logs._generate_common_log(test_data)
         try:
             Logs._fill_ingest_data(test_data)
@@ -1584,9 +1576,14 @@ class Logs(object):
             errors = Logs._report_all_errors()
             okay = "No warnings or errors in any log files."
             print_report(errors, "VERBOSE", okay)
-    # Generate the "common log": a log of all exceptions and warnings
-    # from each log file generated by Autopsy
+
     def _generate_common_log(test_data):
+        """Generate the common log, the log of all exceptions and warnings from
+        each log file generated by Autopsy.
+
+        Args:
+            test_data: the TestData to generate a log for
+        """
         try:
             logs_path = test_data.logs_dir
             common_log = codecs.open(test_data.common_log_path, "w", "utf_8")
@@ -1621,23 +1618,26 @@ class Logs(object):
             logging.critical(traceback.format_exc())
 
     def _fill_ingest_data(test_data):
-        """Fill the global test config's variables that require the log files."""
+        """Fill the TestDatas variables that require the log files.
+
+        Args:
+            test_data: the TestData to modify
+        """
         try:
             # Open autopsy.log.0
             log_path = make_path(test_data.logs_dir, "autopsy.log.0")
             log = open(log_path)
 
-            # Set the test_config starting time based off the first line of autopsy.log.0
+            # Set the TestData start time based off the first line of autopsy.log.0
             # *** If logging time format ever changes this will break ***
             test_data.start_date = log.readline().split(" org.")[0]
 
-            # Set the test_config ending time based off the "create" time (when the file was copied)
+            # Set the test_data ending time based off the "create" time (when the file was copied)
             test_data.end_date = time.ctime(os.path.getmtime(log_path))
         except Exception as e:
             Errors.print_error("Error: Unable to open autopsy.log.0.")
             Errors.print_error(str(e) + "\n")
             logging.warning(traceback.format_exc())
-        # Set the test_config total test time
         # Start date must look like: "Jul 16, 2012 12:57:53 PM"
         # End date must look like: "Mon Jul 16 13:02:42 2012"
         # *** If logging time format ever changes this will break ***
@@ -1743,6 +1743,8 @@ def print_report(errors, name, okay):
 def get_exceptions(test_data):
     """Get a list of the exceptions in the autopsy logs.
 
+    Args:
+        test_data: the TestData to use to find the exceptions.
     Returns:
         a listof_String, the exceptions found in the logs.
     """
@@ -1763,6 +1765,9 @@ def get_exceptions(test_data):
 def get_warnings(test_data):
     """Get a list of the warnings listed in the common log.
 
+    Args:
+        test_data: the TestData to use to find the warnings
+
     Returns:
         listof_String, the warnings found.
     """
@@ -1775,6 +1780,11 @@ def get_warnings(test_data):
     return warnings
 
 def copy_logs(test_data):
+    """Copy the Autopsy generated logs to output directory.
+
+    Args:
+        test_data: the TestData whose logs will be copied
+    """
     try:
         log_dir = os.path.join("..", "..", "Testing","build","test","qa-functional","work","userdir0","var","log")
         shutil.copytree(log_dir, test_data.logs_dir)
@@ -1812,8 +1822,9 @@ class FileNotFoundException(Exception):
         self.strerror = "FileNotFoundException: " + file
 
     def print_error(self):
-        printerror(test_data,"Error: File could not be found at:")
-        printerror(test_data,self.file + "\n")
+        Errors.print_error("Error: File could not be found at:")
+        Errors.print_error(self.file + "\n")
+
     def error(self):
         error = "Error: File could not be found at:\n" + self.file + "\n"
         return error
@@ -1830,6 +1841,7 @@ class DirNotFoundException(Exception):
     def print_error(self):
         Errors.print_error("Error: Directory could not be found at:")
         Errors.print_error(self.dir + "\n")
+
     def error(self):
         error = "Error: Directory could not be found at:\n" + self.dir + "\n"
         return error
@@ -1981,7 +1993,7 @@ class Args(object):
         self.fr = False
 
     def parse(self):
-        global nxtproc
+        """Get the command line arguments and parse them."""
         nxtproc = []
         nxtproc.append("python3")
         nxtproc.append(sys.argv.pop(0))
@@ -1990,11 +2002,11 @@ class Args(object):
             nxtproc.append(arg)
             if(arg == "-f"):
                 #try: @@@ Commented out until a more specific except statement is added
-                    arg = sys.argv.pop(0)
-                    print("Running on a single file:")
-                    print(path_fix(arg) + "\n")
-                    self.single = True
-                    self.single_file = path_fix(arg)
+                arg = sys.argv.pop(0)
+                print("Running on a single file:")
+                print(path_fix(arg) + "\n")
+                self.single = True
+                self.single_file = path_fix(arg)
                 #except:
                 #   print("Error: No single file given.\n")
             #       return False
@@ -2145,7 +2157,11 @@ def search_log_set(type, string, test_data):
 
 
 def clear_dir(dir):
-    """Clears all files from a directory and remakes it."""
+    """Clears all files from a directory and remakes it.
+
+    Args:
+        dir: a pathto_Dir, the directory to clear
+    """
     try:
         if dir_exists(dir):
             shutil.rmtree(dir)
@@ -2158,6 +2174,11 @@ def clear_dir(dir):
         return False;
 
 def del_dir(dir):
+    """Delete the given directory.
+
+    Args:
+        dir: a pathto_Dir, the directory to delete
+    """
     try:
         if dir_exists(dir):
             shutil.rmtree(dir)
@@ -2168,7 +2189,12 @@ def del_dir(dir):
         return False;
 
 def copy_file(ffrom, to):
-    """Copies a given file from "ffrom" to "to"."""
+    """Copies a given file from "ffrom" to "to".
+
+    Args:
+        ffrom: a pathto_File, the origin path
+        to: a pathto_File, the destination path
+    """
     try :
         shutil.copy(ffrom, to)
     except Exception as e:
@@ -2176,7 +2202,12 @@ def copy_file(ffrom, to):
         print(traceback.format_exc())
 
 def copy_dir(ffrom, to):
-    """Copies a directory file from "ffrom" to "to"."""
+    """Copies a directory file from "ffrom" to "to".
+
+    Args:
+        ffrom: a pathto_Dir, the origin path
+        to: a pathto_Dir, the destination path
+    """
     try :
         if not os.path.isdir(ffrom):
             raise FileNotFoundException(ffrom)
@@ -2185,7 +2216,15 @@ def copy_dir(ffrom, to):
         raise FileNotFoundException(to)
 
 def get_file_in_dir(dir, ext):
-    """Returns the first file in the given directory with the given extension."""
+    """Returns the first file in the given directory with the given extension.
+
+    Args:
+        dir: a pathto_Dir, the directory to search
+        ext: a String, the extension to search for
+
+    Returns:
+        pathto_File, the file that was found
+    """
     try:
         for file in os.listdir(dir):
             if file.endswith(ext):
@@ -2196,6 +2235,13 @@ def get_file_in_dir(dir, ext):
         raise DirNotFoundException(dir)
 
 def find_file_in_dir(dir, name, ext):
+    """Find the file with the given name in the given directory.
+
+    Args:
+        dir: a pathto_Dir, the directory to search
+        name: a String, the basename of the file to search for
+        ext: a String, the extension of the file to search for
+    """
     try:
         for file in os.listdir(dir):
             if file.startswith(name):