diff options
author | Vratko Polak <vrpolak@cisco.com> | 2018-08-10 10:20:30 +0200 |
---|---|---|
committer | Vratko Polak <vrpolak@cisco.com> | 2018-08-30 16:48:56 +0200 |
commit | 7db6faf25da39820d321222f7f8fcb191585add9 (patch) | |
tree | 15f7a9ac56a48d820cc5aca337cffc2caaaf1e3f /resources/tools/scripts/compare_perpatch.py | |
parent | e105ab722bbc6c98bf76a863539c971be506859a (diff) |
CSIT-1135: Scripts for VPP per-patch testing
+ Scripts do not rely on (other) bootstraps.
+ Perf verify bootstrap is also the new style script now.
+ Scripts are divided into functions for better re-use.
+ Functions are sourced from small number of large "library" files.
- Still using jumpavg from PyPI.
- Perpatch has specific simplified parsing (instead of the PAL one).
- Bash style document is in a separate Change.
Change-Id: If88fa528ce155ea86b614e3d77c0550b91bbdf11
Signed-off-by: Vratko Polak <vrpolak@cisco.com>
Diffstat (limited to 'resources/tools/scripts/compare_perpatch.py')
-rw-r--r-- | resources/tools/scripts/compare_perpatch.py | 85 |
1 files changed, 85 insertions, 0 deletions
# Copyright (c) 2018 Cisco and/or its affiliates.
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at:
#
#     http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.

"""Script for determining whether per-patch perf test votes -1.

This script assumes there exist two text files with processed BMRR results,
located at hardcoded relative paths, having several lines
of json-parseable lists of float values, corresponding to testcase results.
This script then uses jumpavg library to determine whether there was
a regression, progression or no change for each testcase.
If number of tests does not match, or there was a regression,
this script votes -1 (by exiting with code 1), otherwise it votes +1 (exit 0).
"""

import json
import sys

# Hardcoded locations (relative to the current working directory)
# of the processed results for the parent build and the patched build.
PARENT_RESULTS_PATH = "csit_parent/results.txt"
NEW_RESULTS_PATH = "csit_new/results.txt"


def hack(value_list):
    """Return middle two quartiles, hoping to reduce influence of outliers.

    A quarter of the values (rounded down) is dropped from each end
    of the sorted input. Inputs with fewer than four values are returned
    whole (sorted), as there is no full quarter to drop.
    The input list is not modified.

    :param value_list: List to pick subset from.
    :type value_list: list of float
    :returns: New sorted list containing middle values.
    :rtype: list of float
    """
    ordered = sorted(value_list)
    # Floor division keeps the index an integer on both Python 2 and 3.
    quarter = len(ordered) // 4
    # An explicit end index is needed: with quarter == 0 the shorter
    # spelling ordered[quarter:-quarter] is ordered[0:0], an empty list.
    return ordered[quarter:len(ordered) - quarter]


def _read_lines(path):
    """Return all lines of the text file at the given path.

    :param path: Path of the file to read.
    :type path: str
    :returns: Lines of the file, line endings included.
    :rtype: list of str
    """
    with open(path) as results_file:
        return results_file.readlines()


def _relative_difference(parent_avg, new_avg):
    """Return the change from parent to new, relative to the larger average.

    The value is used for debug output only. If the larger average is zero,
    the ratio is undefined, so 0.0 is returned instead of raising.

    :param parent_avg: Average computed for the parent build.
    :param new_avg: Average computed for the new build.
    :type parent_avg: float
    :type new_avg: float
    :returns: Difference divided by the larger of the two averages.
    :rtype: float
    """
    common_max = max(parent_avg, new_avg)
    if not common_max:
        return 0.0
    # float() avoids Python 2 integer division if both values are integers.
    return float(new_avg - parent_avg) / common_max


def main():
    """Compare parent and new results, print verdicts, return the vote.

    :returns: 1 if number of tests does not match or a regression
        was detected, 0 otherwise.
    :rtype: int
    """
    # Imported here (not at module level) so that the helpers above stay
    # importable, e.g. for unit tests, where jumpavg is not installed.
    from jumpavg.BitCountingMetadataFactory import BitCountingMetadataFactory
    from jumpavg.BitCountingClassifier import BitCountingClassifier

    parent_lines = _read_lines(PARENT_RESULTS_PATH)
    new_lines = _read_lines(NEW_RESULTS_PATH)
    if len(parent_lines) != len(new_lines):
        print("Number of passed tests does not match!")
        return 1
    classifier = BitCountingClassifier()
    exit_code = 0
    # Lines are paired by position, each line holds results of one test.
    for index, (parent_line, new_line) in enumerate(
            zip(parent_lines, new_lines)):
        parent_values = hack(json.loads(parent_line))
        new_values = hack(json.loads(new_line))
        parent_max = BitCountingMetadataFactory.find_max_value(parent_values)
        new_max = BitCountingMetadataFactory.find_max_value(new_values)
        # Both stats are created from factories sharing the same max value.
        cmax = max(parent_max, new_max)
        factory = BitCountingMetadataFactory(cmax)
        parent_stats = factory.from_data(parent_values)
        # NOTE(review): the parent average is passed as the second factory
        # argument; its exact meaning is defined by jumpavg - confirm there.
        factory = BitCountingMetadataFactory(cmax, parent_stats.avg)
        new_stats = factory.from_data(new_values)
        print("DEBUG parent: {p}".format(p=parent_stats))
        print("DEBUG new: {n}".format(n=new_stats))
        difference = _relative_difference(parent_stats.avg, new_stats.avg)
        print("DEBUG difference: {d}%".format(d=100 * difference))
        classified_list = classifier.classify([parent_stats, new_stats])
        # Fewer than two items in the result is reported as "no anomaly".
        if len(classified_list) < 2:
            print("Test index {index}: normal (no anomaly)".format(
                index=index))
            continue
        anomaly = classified_list[1].metadata.classification
        if anomaly == "regression":
            print("Test index {index}: anomaly regression".format(
                index=index))
            # Remember the failure, but keep reporting remaining tests.
            exit_code = 1
            continue
        print("Test index {index}: anomaly {anomaly}".format(
            index=index, anomaly=anomaly))
    print("DEBUG exit code {code}".format(code=exit_code))
    return exit_code


if __name__ == "__main__":
    sys.exit(main())