resulttool: Improvements to allow integration to the autobuilder

This is a combined patch of the various tweaks and improvements I made to resulttool: * Avoid subprocess.run() as its a python 3.6 feature and we have autobuilder workers with 3.5. * Avoid python keywords as variable names * Simplify dict accesses using .get() * Rename resultsutils -> resultutils to match the resultstool -> resulttool rename * Formalised the handling of "file_name" to "TESTSERIES" which the code will now add into the json configuration data if its not present, based on the directory name. * When we don't have failed test cases, print something saying so instead of an empty table * Tweak the table headers in the report to be more readable (reference "Test Series" instead if file_id and ID instead of results_id) * Improve/simplify the max string length handling * Merge the counts and percentage data into one table in the report since printing two reports of the same data confuses the user * Removed the confusing header in the regression report * Show matches, then regressions, then unmatched runs in the regression report, also remove chatting unneeded output * Try harder to "pair" up matching configurations to reduce noise in the regressions report * Abstracted the "mapping" table concept used to pairing in the regression code to general code in resultutils * Created multiple mappings for results analysis, results storage and 'flattening' results data in a merge * Simplify the merge command to take a source and a destination, letting the destination be a directory or a file, removing the need for an output directory parameter * Add the 'IMAGE_PKGTYPE' and 'DISTRO' config options to the regression mappings * Have the store command place the testresults files in a layout from the mapping, making commits into the git repo for results storage more useful for simple comparison purposes * Set the oe-git-archive tag format appropriately for oeqa results storage (and simplify the commit messages closer to their defaults) * Fix oe-git-archive to use the commit/branch data from the results file * Cleaned up the command option help to match other changes * Follow the model of git branch/tag processing used by oe-build-perf-report and use that to read the data using git show to avoid branch change * Add ptest summary to the report command * Update the tests to match the above changes (From OE-Core rev: ff2c029b568f70aa9960dde04ddd207829812ea0) Signed-off-by: Richard Purdie <richard.purdie@linuxfoundation.org>
author: Richard Purdie <richard.purdie@linuxfoundation.org> 2019-02-16 18:13:00 +0000
committer: Richard Purdie <richard.purdie@linuxfoundation.org> 2019-02-21 12:34:00 +0000
commit: 47eb3d00e9d6a66aee1283dab29af8117a006d6d (patch)
tree: 9d574720d23da3edeab5648f05fb5d2ee95c9cd2 /scripts/lib/resulttool/regression.py
parent: beed7523b667affea71d37d88d2f5c19c935d159 (diff)
download: poky-47eb3d00e9d6a66aee1283dab29af8117a006d6d.tar.gz
1 files changed, 156 insertions, 172 deletions
diff --git a/scripts/lib/resulttool/regression.py b/scripts/lib/resulttool/regression.py
index bee3fb011a..ff77332fa9 100644
--- a/scripts/lib/resulttool/regression.py
+++ b/scripts/lib/resulttool/regression.py
@@ -1,6 +1,7 @@
-# test result tool - regression analysis
+# resulttool - regression analysis
 #
 # Copyright (c) 2019, Intel Corporation.
+# Copyright (c) 2019, Linux Foundation
 #
 # This program is free software; you can redistribute it and/or modify it
 # under the terms and conditions of the GNU General Public License,
@@ -11,171 +12,170 @@
 # FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License for
 # more details.
 #
-from resulttool.resultsutils import load_json_file, get_dict_value, pop_dict_element
+import resulttool.resultutils as resultutils
 import json
-class ResultsRegressionSelector(object):
+from oeqa.utils.git import GitRepo
+import oeqa.utils.gitarchive as gitarchive
-    def get_results_unique_configurations(self, logger, results):
-        unique_configurations_map = {"oeselftest": ['TEST_TYPE', 'HOST_DISTRO', 'MACHINE'],
+def compare_result(logger, base_name, target_name, base_result, target_result):
-                                     "runtime": ['TEST_TYPE', 'IMAGE_BASENAME', 'MACHINE'],
+    base_result = base_result.get('result')
-                                     "sdk": ['TEST_TYPE', 'IMAGE_BASENAME', 'MACHINE', 'SDKMACHINE'],
+    target_result = target_result.get('result')
-                                     "sdkext": ['TEST_TYPE', 'IMAGE_BASENAME', 'MACHINE', 'SDKMACHINE']}
+    result = {}
-        results_unique_configs = {}
+    if base_result and target_result:
-        for k in results:
+        for k in base_result:
-            result = results[k]
+            base_testcase = base_result[k]
-            result_configs = get_dict_value(logger, result, 'configuration')
+            base_status = base_testcase.get('status')
-            result_test_type = get_dict_value(logger, result_configs, 'TEST_TYPE')
+            if base_status:
-            unique_configuration_keys = get_dict_value(logger, unique_configurations_map, result_test_type)
+                target_testcase = target_result.get(k, {})
-            result_unique_config = {}
+                target_status = target_testcase.get('status')
-            for ck in unique_configuration_keys:
+                if base_status != target_status:
-                config_value = get_dict_value(logger, result_configs, ck)
+                    result[k] = {'base': base_status, 'target': target_status}
-                if config_value:
+            else:
-                    result_unique_config[ck] = config_value
+                logger.error('Failed to retrieved base test case status: %s' % k)
-            results_unique_configs[k] = result_unique_config
+    if result:
-        return results_unique_configs
+        resultstring = "Regression: %s\n            %s\n" % (base_name, target_name)
+        for k in result:
-    def get_regression_base_target_pair(self, logger, base_results, target_results):
+            resultstring += '    %s: %s -> %s\n' % (k, result[k]['base'], result[k]['target'])
-        base_configs = self.get_results_unique_configurations(logger, base_results)
-        logger.debug('Retrieved base configuration: config=%s' % base_configs)
-        target_configs = self.get_results_unique_configurations(logger, target_results)
-        logger.debug('Retrieved target configuration: config=%s' % target_configs)
-        regression_pair = {}
-        for bk in base_configs:
-            base_config = base_configs[bk]
-            for tk in target_configs:
-                target_config = target_configs[tk]
-                if base_config == target_config:
-                    if bk in regression_pair:
-                        regression_pair[bk].append(tk)
-                    else:
-                        regression_pair[bk] = [tk]
-        return regression_pair
-    def run_regression_with_regression_pairing(self, logger, regression_pair, base_results, target_results):
-        regression = ResultsRegression()
-        for base in regression_pair:
-            for target in regression_pair[base]:
-                print('Getting regression for base=%s target=%s' % (base, target))
-                regression.run(logger, base_results[base], target_results[target])
-class ResultsRegression(object):
-    def print_regression_result(self, result):
-        if result:
-            print('============================Start Regression============================')
-            print('Only print regression if base status not equal target')
-            print('<test case> : <base status> -> <target status>')
-            print('========================================================================')
-            for k in result:
-                print(k, ':', result[k]['base'], '->', result[k]['target'])
-            print('==============================End Regression==============================')
-    def get_regression_result(self, logger, base_result, target_result):
-        base_result = get_dict_value(logger, base_result, 'result')
-        target_result = get_dict_value(logger, target_result, 'result')
-        result = {}
-        if base_result and target_result:
-            logger.debug('Getting regression result')
-            for k in base_result:
-                base_testcase = base_result[k]
-                base_status = get_dict_value(logger, base_testcase, 'status')
-                if base_status:
-                    target_testcase = get_dict_value(logger, target_result, k)
-                    target_status = get_dict_value(logger, target_testcase, 'status')
-                    if base_status != target_status:
-                        result[k] = {'base': base_status, 'target': target_status}
-                else:
-                    logger.error('Failed to retrieved base test case status: %s' % k)
-        return result
-    def run(self, logger, base_result, target_result):
-        if base_result and target_result:
-            result = self.get_regression_result(logger, base_result, target_result)
-            logger.debug('Retrieved regression result =%s' % result)
-            self.print_regression_result(result)
-        else:
-            logger.error('Input data objects must not be empty (base_result=%s, target_result=%s)' %
-                         (base_result, target_result))
-def get_results_from_directory(logger, source_dir):
-    from resulttool.merge import ResultsMerge
-    from resulttool.resultsutils import get_directory_files
-    result_files = get_directory_files(source_dir, ['.git'], 'testresults.json')
-    base_results = {}
-    for file in result_files:
-        merge = ResultsMerge()
-        results = merge.get_test_results(logger, file, '')
-        base_results = merge.merge_results(base_results, results)
-    return base_results
-def remove_testcases_to_optimize_regression_runtime(logger, results):
-    test_case_removal = ['ptestresult.rawlogs', 'ptestresult.sections']
-    for r in test_case_removal:
-        for k in results:
-            result = get_dict_value(logger, results[k], 'result')
-            pop_dict_element(logger, result, r)
-def regression_file(args, logger):
-    base_results = load_json_file(args.base_result_file)
-    print('Successfully loaded base test results from: %s' % args.base_result_file)
-    target_results = load_json_file(args.target_result_file)
-    print('Successfully loaded target test results from: %s' % args.target_result_file)
-    remove_testcases_to_optimize_regression_runtime(logger, base_results)
-    remove_testcases_to_optimize_regression_runtime(logger, target_results)
-    if args.base_result_id and args.target_result_id:
-        base_result = get_dict_value(logger, base_results, base_result_id)
-        print('Getting base test result with result_id=%s' % base_result_id)
-        target_result = get_dict_value(logger, target_results, target_result_id)
-        print('Getting target test result with result_id=%s' % target_result_id)
-        regression = ResultsRegression()
-        regression.run(logger, base_result, target_result)
    else:
-        regression = ResultsRegressionSelector()
+        resultstring = "Match: %s\n       %s" % (base_name, target_name)
-        regression_pair = regression.get_regression_base_target_pair(logger, base_results, target_results)
+    return result, resultstring
-        logger.debug('Retrieved regression pair=%s' % regression_pair)
-        regression.run_regression_with_regression_pairing(logger, regression_pair, base_results, target_results)
+def get_results(logger, source):
-    return 0
+    return resultutils.load_resultsdata(source, configmap=resultutils.regression_map)
+def regression(args, logger):
+    base_results = get_results(logger, args.base_result)
+    target_results = get_results(logger, args.target_result)
+    regression_common(args, logger, base_results, target_results)
+def regression_common(args, logger, base_results, target_results):
+    if args.base_result_id:
+        base_results = resultutils.filter_resultsdata(base_results, args.base_result_id)
+    if args.target_result_id:
+        target_results = resultutils.filter_resultsdata(target_results, args.target_result_id)
+    matches = []
+    regressions = []
+    notfound = []
+    for a in base_results:
+        if a in target_results:
+            base = list(base_results[a].keys())
+            target = list(target_results[a].keys())
+            # We may have multiple base/targets which are for different configurations. Start by 
+            # removing any pairs which match
+            for c in base.copy():
+                for b in target.copy():
+                    res, resstr = compare_result(logger, c, b, base_results[a][c], target_results[a][b])
+                    if not res:
+                        matches.append(resstr)
+                        base.remove(c)
+                        target.remove(b)
+                        break
+            # Should only now see regressions, we may not be able to match multiple pairs directly
+            for c in base:
+                for b in target:
+                    res, resstr = compare_result(logger, c, b, base_results[a][c], target_results[a][b])
+                    if res:
+                        regressions.append(resstr)
+        else:
+            notfound.append("%s not found in target" % a)
+    print("\n".join(matches))
+    print("\n".join(regressions))
+    print("\n".join(notfound))
-def regression_directory(args, logger):
-    base_results = get_results_from_directory(logger, args.base_result_directory)
-    target_results = get_results_from_directory(logger, args.target_result_directory)
-    remove_testcases_to_optimize_regression_runtime(logger, base_results)
-    remove_testcases_to_optimize_regression_runtime(logger, target_results)
-    regression = ResultsRegressionSelector()
-    regression_pair = regression.get_regression_base_target_pair(logger, base_results, target_results)
-    logger.debug('Retrieved regression pair=%s' % regression_pair)
-    regression.run_regression_with_regression_pairing(logger, regression_pair, base_results, target_results)
    return 0
 def regression_git(args, logger):
-    from resulttool.resultsutils import checkout_git_dir
    base_results = {}
    target_results = {}
-    if checkout_git_dir(args.source_dir, args.base_git_branch):
-        base_results = get_results_from_directory(logger, args.source_dir)
+    tag_name = "{branch}/{commit_number}-g{commit}/{tag_number}"
-    if checkout_git_dir(args.source_dir, args.target_git_branch):
+    repo = GitRepo(args.repo)
-        target_results = get_results_from_directory(logger, args.source_dir)
-    if base_results and target_results:
+    revs = gitarchive.get_test_revs(logger, repo, tag_name, branch=args.branch)
-        remove_testcases_to_optimize_regression_runtime(logger, base_results)
-        remove_testcases_to_optimize_regression_runtime(logger, target_results)
+    if args.branch2:
-        regression = ResultsRegressionSelector()
+        revs2 = gitarchive.get_test_revs(logger, repo, tag_name, branch=args.branch2)
-        regression_pair = regression.get_regression_base_target_pair(logger, base_results, target_results)
+        if not len(revs2):
-        logger.debug('Retrieved regression pair=%s' % regression_pair)
+            logger.error("No revisions found to compare against")
-        regression.run_regression_with_regression_pairing(logger, regression_pair, base_results, target_results)
+            return 1
+        if not len(revs):
+            logger.error("No revision to report on found")
+            return 1
+    else:
+        if len(revs) < 2:
+            logger.error("Only %d tester revisions found, unable to generate report" % len(revs))
+            return 1
+    # Pick revisions
+    if args.commit:
+        if args.commit_number:
+            logger.warning("Ignoring --commit-number as --commit was specified")
+        index1 = gitarchive.rev_find(revs, 'commit', args.commit)
+    elif args.commit_number:
+        index1 = gitarchive.rev_find(revs, 'commit_number', args.commit_number)
+    else:
+        index1 = len(revs) - 1
+    if args.branch2:
+        revs2.append(revs[index1])
+        index1 = len(revs2) - 1
+        revs = revs2
+    if args.commit2:
+        if args.commit_number2:
+            logger.warning("Ignoring --commit-number2 as --commit2 was specified")
+        index2 = gitarchive.rev_find(revs, 'commit', args.commit2)
+    elif args.commit_number2:
+        index2 = gitarchive.rev_find(revs, 'commit_number', args.commit_number2)
+    else:
+        if index1 > 0:
+            index2 = index1 - 1
+            # Find the closest matching commit number for comparision
+            # In future we could check the commit is a common ancestor and
+            # continue back if not but this good enough for now
+            while index2 > 0 and revs[index2].commit_number > revs[index1].commit_number:
+                index2 = index2 - 1
+        else:
+            logger.error("Unable to determine the other commit, use "
+                      "--commit2 or --commit-number2 to specify it")
+            return 1
+    logger.info("Comparing:\n%s\nto\n%s\n" % (revs[index1], revs[index2]))
+    base_results = resultutils.git_get_result(repo, revs[index1][2])
+    target_results = resultutils.git_get_result(repo, revs[index2][2])
+    regression_common(args, logger, base_results, target_results)
    return 0
 def register_commands(subparsers):
    """Register subcommands from this plugin"""
-    parser_build = subparsers.add_parser('regression-file', help='regression file analysis',
+    parser_build = subparsers.add_parser('regression', help='regression file/directory analysis',
+                                         description='regression analysis comparing the base set of results to the target results',
+                                         group='analysis')
+    parser_build.set_defaults(func=regression)
+    parser_build.add_argument('base_result',
+                              help='base result file/directory for the comparison')
+    parser_build.add_argument('target_result',
+                              help='target result file/directory to compare with')
+    parser_build.add_argument('-b', '--base-result-id', default='',
+                              help='(optional) filter the base results to this result ID')
+    parser_build.add_argument('-t', '--target-result-id', default='',
+                              help='(optional) filter the target results to this result ID')
+    parser_build = subparsers.add_parser('regression-git', help='regression git analysis',
                                         description='regression analysis comparing base result set to target '
                                                     'result set',
                                         group='analysis')
-    parser_build.set_defaults(func=regression_file)
+    parser_build.set_defaults(func=regression_git)
-    parser_build.add_argument('base_result_file',
+    parser_build.add_argument('repo',
-                              help='base result file provide the base result set')
+                              help='the git repository containing the data')
-    parser_build.add_argument('target_result_file',
-                              help='target result file provide the target result set for comparison with base result')
    parser_build.add_argument('-b', '--base-result-id', default='',
                              help='(optional) default select regression based on configurations unless base result '
                                   'id was provided')
@@ -183,26 +183,10 @@ def register_commands(subparsers):
                              help='(optional) default select regression based on configurations unless target result '
                                   'id was provided')
-    parser_build = subparsers.add_parser('regression-dir', help='regression directory analysis',
+    parser_build.add_argument('--branch', '-B', default='master', help="Branch to find commit in")
-                                         description='regression analysis comparing base result set to target '
+    parser_build.add_argument('--branch2', help="Branch to find comparision revisions in")
-                                                     'result set',
+    parser_build.add_argument('--commit', help="Revision to search for")
-                                         group='analysis')
+    parser_build.add_argument('--commit-number', help="Revision number to search for, redundant if --commit is specified")
-    parser_build.set_defaults(func=regression_directory)
+    parser_build.add_argument('--commit2', help="Revision to compare with")
-    parser_build.add_argument('base_result_directory',
+    parser_build.add_argument('--commit-number2', help="Revision number to compare with, redundant if --commit2 is specified")
-                              help='base result directory provide the files for base result set')
-    parser_build.add_argument('target_result_directory',
-                              help='target result file provide the files for target result set for comparison with '
-                                   'base result')
-    parser_build = subparsers.add_parser('regression-git', help='regression git analysis',
-                                         description='regression analysis comparing base result set to target '
-                                                     'result set',
-                                         group='analysis')
-    parser_build.set_defaults(func=regression_git)
-    parser_build.add_argument('source_dir',
-                              help='source directory that contain the git repository with test result files')
-    parser_build.add_argument('base_git_branch',
-                              help='base git branch that provide the files for base result set')
-    parser_build.add_argument('target_git_branch',
-                              help='target git branch that provide the files for target result set for comparison with '
-                                   'base result')
author	Richard Purdie <richard.purdie@linuxfoundation.org>	2019-02-16 18:13:00 +0000
committer	Richard Purdie <richard.purdie@linuxfoundation.org>	2019-02-21 12:34:00 +0000
commit	47eb3d00e9d6a66aee1283dab29af8117a006d6d (patch)
tree	9d574720d23da3edeab5648f05fb5d2ee95c9cd2 /scripts/lib/resulttool/regression.py
parent	beed7523b667affea71d37d88d2f5c19c935d159 (diff)
download	poky-47eb3d00e9d6a66aee1283dab29af8117a006d6d.tar.gz

diff --git a/scripts/lib/resulttool/regression.py b/scripts/lib/resulttool/regression.py index bee3fb011a..ff77332fa9 100644 --- a/scripts/lib/resulttool/regression.py +++ b/scripts/lib/resulttool/regression.py
@@ -1,6 +1,7 @@
1	# test result tool - regression analysis	1	# resulttool - regression analysis
2	#	2	#
3	# Copyright (c) 2019, Intel Corporation.	3	# Copyright (c) 2019, Intel Corporation.
		4	# Copyright (c) 2019, Linux Foundation
4	#	5	#
5	# This program is free software; you can redistribute it and/or modify it	6	# This program is free software; you can redistribute it and/or modify it
6	# under the terms and conditions of the GNU General Public License,	7	# under the terms and conditions of the GNU General Public License,
@@ -11,171 +12,170 @@
11	# FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for	12	# FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for
12	# more details.	13	# more details.
13	#	14	#
14	from resulttool.resultsutils import load_json_file, get_dict_value, pop_dict_element	15	import resulttool.resultutils as resultutils
15	import json	16	import json
16		17
17	class ResultsRegressionSelector(object):	18	from oeqa.utils.git import GitRepo
18		19	import oeqa.utils.gitarchive as gitarchive
19	def get_results_unique_configurations(self, logger, results):	20
20	unique_configurations_map = {"oeselftest": ['TEST_TYPE', 'HOST_DISTRO', 'MACHINE'],	21	def compare_result(logger, base_name, target_name, base_result, target_result):
21	"runtime": ['TEST_TYPE', 'IMAGE_BASENAME', 'MACHINE'],	22	base_result = base_result.get('result')
22	"sdk": ['TEST_TYPE', 'IMAGE_BASENAME', 'MACHINE', 'SDKMACHINE'],	23	target_result = target_result.get('result')
23	"sdkext": ['TEST_TYPE', 'IMAGE_BASENAME', 'MACHINE', 'SDKMACHINE']}	24	result = {}
24	results_unique_configs = {}	25	if base_result and target_result:
25	for k in results:	26	for k in base_result:
26	result = results[k]	27	base_testcase = base_result[k]
27	result_configs = get_dict_value(logger, result, 'configuration')	28	base_status = base_testcase.get('status')
28	result_test_type = get_dict_value(logger, result_configs, 'TEST_TYPE')	29	if base_status:
29	unique_configuration_keys = get_dict_value(logger, unique_configurations_map, result_test_type)	30	target_testcase = target_result.get(k, {})
30	result_unique_config = {}	31	target_status = target_testcase.get('status')
31	for ck in unique_configuration_keys:	32	if base_status != target_status:
32	config_value = get_dict_value(logger, result_configs, ck)	33	result[k] = {'base': base_status, 'target': target_status}
33	if config_value:	34	else:
34	result_unique_config[ck] = config_value	35	logger.error('Failed to retrieved base test case status: %s' % k)
35	results_unique_configs[k] = result_unique_config	36	if result:
36	return results_unique_configs	37	resultstring = "Regression: %s\n %s\n" % (base_name, target_name)
37		38	for k in result:
38	def get_regression_base_target_pair(self, logger, base_results, target_results):	39	resultstring += ' %s: %s -> %s\n' % (k, result[k]['base'], result[k]['target'])
39	base_configs = self.get_results_unique_configurations(logger, base_results)
40	logger.debug('Retrieved base configuration: config=%s' % base_configs)
41	target_configs = self.get_results_unique_configurations(logger, target_results)
42	logger.debug('Retrieved target configuration: config=%s' % target_configs)
43	regression_pair = {}
44	for bk in base_configs:
45	base_config = base_configs[bk]
46	for tk in target_configs:
47	target_config = target_configs[tk]
48	if base_config == target_config:
49	if bk in regression_pair:
50	regression_pair[bk].append(tk)
51	else:
52	regression_pair[bk] = [tk]
53	return regression_pair
54
55	def run_regression_with_regression_pairing(self, logger, regression_pair, base_results, target_results):
56	regression = ResultsRegression()
57	for base in regression_pair:
58	for target in regression_pair[base]:
59	print('Getting regression for base=%s target=%s' % (base, target))
60	regression.run(logger, base_results[base], target_results[target])
61
62	class ResultsRegression(object):
63
64	def print_regression_result(self, result):
65	if result:
66	print('============================Start Regression============================')
67	print('Only print regression if base status not equal target')
68	print('<test case> : <base status> -> <target status>')
69	print('========================================================================')
70	for k in result:
71	print(k, ':', result[k]['base'], '->', result[k]['target'])
72	print('==============================End Regression==============================')
73
74	def get_regression_result(self, logger, base_result, target_result):
75	base_result = get_dict_value(logger, base_result, 'result')
76	target_result = get_dict_value(logger, target_result, 'result')
77	result = {}
78	if base_result and target_result:
79	logger.debug('Getting regression result')
80	for k in base_result:
81	base_testcase = base_result[k]
82	base_status = get_dict_value(logger, base_testcase, 'status')
83	if base_status:
84	target_testcase = get_dict_value(logger, target_result, k)
85	target_status = get_dict_value(logger, target_testcase, 'status')
86	if base_status != target_status:
87	result[k] = {'base': base_status, 'target': target_status}
88	else:
89	logger.error('Failed to retrieved base test case status: %s' % k)
90	return result
91
92	def run(self, logger, base_result, target_result):
93	if base_result and target_result:
94	result = self.get_regression_result(logger, base_result, target_result)
95	logger.debug('Retrieved regression result =%s' % result)
96	self.print_regression_result(result)
97	else:
98	logger.error('Input data objects must not be empty (base_result=%s, target_result=%s)' %
99	(base_result, target_result))
100
101	def get_results_from_directory(logger, source_dir):
102	from resulttool.merge import ResultsMerge
103	from resulttool.resultsutils import get_directory_files
104	result_files = get_directory_files(source_dir, ['.git'], 'testresults.json')
105	base_results = {}
106	for file in result_files:
107	merge = ResultsMerge()
108	results = merge.get_test_results(logger, file, '')
109	base_results = merge.merge_results(base_results, results)
110	return base_results
111
112	def remove_testcases_to_optimize_regression_runtime(logger, results):
113	test_case_removal = ['ptestresult.rawlogs', 'ptestresult.sections']
114	for r in test_case_removal:
115	for k in results:
116	result = get_dict_value(logger, results[k], 'result')
117	pop_dict_element(logger, result, r)
118
119	def regression_file(args, logger):
120	base_results = load_json_file(args.base_result_file)
121	print('Successfully loaded base test results from: %s' % args.base_result_file)
122	target_results = load_json_file(args.target_result_file)
123	print('Successfully loaded target test results from: %s' % args.target_result_file)
124	remove_testcases_to_optimize_regression_runtime(logger, base_results)
125	remove_testcases_to_optimize_regression_runtime(logger, target_results)
126	if args.base_result_id and args.target_result_id:
127	base_result = get_dict_value(logger, base_results, base_result_id)
128	print('Getting base test result with result_id=%s' % base_result_id)
129	target_result = get_dict_value(logger, target_results, target_result_id)
130	print('Getting target test result with result_id=%s' % target_result_id)
131	regression = ResultsRegression()
132	regression.run(logger, base_result, target_result)
133	else:	40	else:
134	regression = ResultsRegressionSelector()	41	resultstring = "Match: %s\n %s" % (base_name, target_name)
135	regression_pair = regression.get_regression_base_target_pair(logger, base_results, target_results)	42	return result, resultstring
136	logger.debug('Retrieved regression pair=%s' % regression_pair)	43
137	regression.run_regression_with_regression_pairing(logger, regression_pair, base_results, target_results)	44	def get_results(logger, source):
138	return 0	45	return resultutils.load_resultsdata(source, configmap=resultutils.regression_map)
		46
		47	def regression(args, logger):
		48	base_results = get_results(logger, args.base_result)
		49	target_results = get_results(logger, args.target_result)
		50
		51	regression_common(args, logger, base_results, target_results)
		52
		53	def regression_common(args, logger, base_results, target_results):
		54	if args.base_result_id:
		55	base_results = resultutils.filter_resultsdata(base_results, args.base_result_id)
		56	if args.target_result_id:
		57	target_results = resultutils.filter_resultsdata(target_results, args.target_result_id)
		58
		59	matches = []
		60	regressions = []
		61	notfound = []
		62
		63	for a in base_results:
		64	if a in target_results:
		65	base = list(base_results[a].keys())
		66	target = list(target_results[a].keys())
		67	# We may have multiple base/targets which are for different configurations. Start by
		68	# removing any pairs which match
		69	for c in base.copy():
		70	for b in target.copy():
		71	res, resstr = compare_result(logger, c, b, base_results[a][c], target_results[a][b])
		72	if not res:
		73	matches.append(resstr)
		74	base.remove(c)
		75	target.remove(b)
		76	break
		77	# Should only now see regressions, we may not be able to match multiple pairs directly
		78	for c in base:
		79	for b in target:
		80	res, resstr = compare_result(logger, c, b, base_results[a][c], target_results[a][b])
		81	if res:
		82	regressions.append(resstr)
		83	else:
		84	notfound.append("%s not found in target" % a)
		85	print("\n".join(matches))
		86	print("\n".join(regressions))
		87	print("\n".join(notfound))
139		88
140	def regression_directory(args, logger):
141	base_results = get_results_from_directory(logger, args.base_result_directory)
142	target_results = get_results_from_directory(logger, args.target_result_directory)
143	remove_testcases_to_optimize_regression_runtime(logger, base_results)
144	remove_testcases_to_optimize_regression_runtime(logger, target_results)
145	regression = ResultsRegressionSelector()
146	regression_pair = regression.get_regression_base_target_pair(logger, base_results, target_results)
147	logger.debug('Retrieved regression pair=%s' % regression_pair)
148	regression.run_regression_with_regression_pairing(logger, regression_pair, base_results, target_results)
149	return 0	89	return 0
150		90
151	def regression_git(args, logger):	91	def regression_git(args, logger):
152	from resulttool.resultsutils import checkout_git_dir
153	base_results = {}	92	base_results = {}
154	target_results = {}	93	target_results = {}
155	if checkout_git_dir(args.source_dir, args.base_git_branch):	94
156	base_results = get_results_from_directory(logger, args.source_dir)	95	tag_name = "{branch}/{commit_number}-g{commit}/{tag_number}"
157	if checkout_git_dir(args.source_dir, args.target_git_branch):	96	repo = GitRepo(args.repo)
158	target_results = get_results_from_directory(logger, args.source_dir)	97
159	if base_results and target_results:	98	revs = gitarchive.get_test_revs(logger, repo, tag_name, branch=args.branch)
160	remove_testcases_to_optimize_regression_runtime(logger, base_results)	99
161	remove_testcases_to_optimize_regression_runtime(logger, target_results)	100	if args.branch2:
162	regression = ResultsRegressionSelector()	101	revs2 = gitarchive.get_test_revs(logger, repo, tag_name, branch=args.branch2)
163	regression_pair = regression.get_regression_base_target_pair(logger, base_results, target_results)	102	if not len(revs2):
164	logger.debug('Retrieved regression pair=%s' % regression_pair)	103	logger.error("No revisions found to compare against")
165	regression.run_regression_with_regression_pairing(logger, regression_pair, base_results, target_results)	104	return 1
		105	if not len(revs):
		106	logger.error("No revision to report on found")
		107	return 1
		108	else:
		109	if len(revs) < 2:
		110	logger.error("Only %d tester revisions found, unable to generate report" % len(revs))
		111	return 1
		112
		113	# Pick revisions
		114	if args.commit:
		115	if args.commit_number:
		116	logger.warning("Ignoring --commit-number as --commit was specified")
		117	index1 = gitarchive.rev_find(revs, 'commit', args.commit)
		118	elif args.commit_number:
		119	index1 = gitarchive.rev_find(revs, 'commit_number', args.commit_number)
		120	else:
		121	index1 = len(revs) - 1
		122
		123	if args.branch2:
		124	revs2.append(revs[index1])
		125	index1 = len(revs2) - 1
		126	revs = revs2
		127
		128	if args.commit2:
		129	if args.commit_number2:
		130	logger.warning("Ignoring --commit-number2 as --commit2 was specified")
		131	index2 = gitarchive.rev_find(revs, 'commit', args.commit2)
		132	elif args.commit_number2:
		133	index2 = gitarchive.rev_find(revs, 'commit_number', args.commit_number2)
		134	else:
		135	if index1 > 0:
		136	index2 = index1 - 1
		137	# Find the closest matching commit number for comparision
		138	# In future we could check the commit is a common ancestor and
		139	# continue back if not but this good enough for now
		140	while index2 > 0 and revs[index2].commit_number > revs[index1].commit_number:
		141	index2 = index2 - 1
		142	else:
		143	logger.error("Unable to determine the other commit, use "
		144	"--commit2 or --commit-number2 to specify it")
		145	return 1
		146
		147	logger.info("Comparing:\n%s\nto\n%s\n" % (revs[index1], revs[index2]))
		148
		149	base_results = resultutils.git_get_result(repo, revs[index1][2])
		150	target_results = resultutils.git_get_result(repo, revs[index2][2])
		151
		152	regression_common(args, logger, base_results, target_results)
		153
166	return 0	154	return 0
167		155
168	def register_commands(subparsers):	156	def register_commands(subparsers):
169	"""Register subcommands from this plugin"""	157	"""Register subcommands from this plugin"""
170	parser_build = subparsers.add_parser('regression-file', help='regression file analysis',	158
		159	parser_build = subparsers.add_parser('regression', help='regression file/directory analysis',
		160	description='regression analysis comparing the base set of results to the target results',
		161	group='analysis')
		162	parser_build.set_defaults(func=regression)
		163	parser_build.add_argument('base_result',
		164	help='base result file/directory for the comparison')
		165	parser_build.add_argument('target_result',
		166	help='target result file/directory to compare with')
		167	parser_build.add_argument('-b', '--base-result-id', default='',
		168	help='(optional) filter the base results to this result ID')
		169	parser_build.add_argument('-t', '--target-result-id', default='',
		170	help='(optional) filter the target results to this result ID')
		171
		172	parser_build = subparsers.add_parser('regression-git', help='regression git analysis',
171	description='regression analysis comparing base result set to target '	173	description='regression analysis comparing base result set to target '
172	'result set',	174	'result set',
173	group='analysis')	175	group='analysis')
174	parser_build.set_defaults(func=regression_file)	176	parser_build.set_defaults(func=regression_git)
175	parser_build.add_argument('base_result_file',	177	parser_build.add_argument('repo',
176	help='base result file provide the base result set')	178	help='the git repository containing the data')
177	parser_build.add_argument('target_result_file',
178	help='target result file provide the target result set for comparison with base result')
179	parser_build.add_argument('-b', '--base-result-id', default='',	179	parser_build.add_argument('-b', '--base-result-id', default='',
180	help='(optional) default select regression based on configurations unless base result '	180	help='(optional) default select regression based on configurations unless base result '
181	'id was provided')	181	'id was provided')
@@ -183,26 +183,10 @@ def register_commands(subparsers):
183	help='(optional) default select regression based on configurations unless target result '	183	help='(optional) default select regression based on configurations unless target result '
184	'id was provided')	184	'id was provided')
185		185
186	parser_build = subparsers.add_parser('regression-dir', help='regression directory analysis',	186	parser_build.add_argument('--branch', '-B', default='master', help="Branch to find commit in")
187	description='regression analysis comparing base result set to target '	187	parser_build.add_argument('--branch2', help="Branch to find comparision revisions in")
188	'result set',	188	parser_build.add_argument('--commit', help="Revision to search for")
189	group='analysis')	189	parser_build.add_argument('--commit-number', help="Revision number to search for, redundant if --commit is specified")
190	parser_build.set_defaults(func=regression_directory)	190	parser_build.add_argument('--commit2', help="Revision to compare with")
191	parser_build.add_argument('base_result_directory',	191	parser_build.add_argument('--commit-number2', help="Revision number to compare with, redundant if --commit2 is specified")
192	help='base result directory provide the files for base result set')
193	parser_build.add_argument('target_result_directory',
194	help='target result file provide the files for target result set for comparison with '
195	'base result')
196		192
197	parser_build = subparsers.add_parser('regression-git', help='regression git analysis',
198	description='regression analysis comparing base result set to target '
199	'result set',
200	group='analysis')
201	parser_build.set_defaults(func=regression_git)
202	parser_build.add_argument('source_dir',
203	help='source directory that contain the git repository with test result files')
204	parser_build.add_argument('base_git_branch',
205	help='base git branch that provide the files for base result set')
206	parser_build.add_argument('target_git_branch',
207	help='target git branch that provide the files for target result set for comparison with '
208	'base result')