aboutsummaryrefslogtreecommitdiffstats
path: root/resources/tools/scripts/compare_perpatch.py
diff options
context:
space:
mode:
authorVratko Polak <vrpolak@cisco.com>2018-08-10 10:20:30 +0200
committerVratko Polak <vrpolak@cisco.com>2018-08-30 16:48:56 +0200
commit7db6faf25da39820d321222f7f8fcb191585add9 (patch)
tree15f7a9ac56a48d820cc5aca337cffc2caaaf1e3f /resources/tools/scripts/compare_perpatch.py
parente105ab722bbc6c98bf76a863539c971be506859a (diff)
CSIT-1135: Scripts for VPP per-patch testing
+ Scripts do not rely on (other) bootstraps. + Perf verify bootstrap is also the new style script now. + Scripts are divided to functions for better re-use. + Functions are sourced from small number of large "library" files. - Still using jumpavg from PyPI. - Perpatch has specific simplified parsing (instead of the PAL one). - Bash style document is in a separate Change. Change-Id: If88fa528ce155ea86b614e3d77c0550b91bbdf11 Signed-off-by: Vratko Polak <vrpolak@cisco.com>
Diffstat (limited to 'resources/tools/scripts/compare_perpatch.py')
-rw-r--r--resources/tools/scripts/compare_perpatch.py85
1 files changed, 85 insertions, 0 deletions
diff --git a/resources/tools/scripts/compare_perpatch.py b/resources/tools/scripts/compare_perpatch.py
new file mode 100644
index 0000000000..cc9ffd8992
--- /dev/null
+++ b/resources/tools/scripts/compare_perpatch.py
@@ -0,0 +1,85 @@
+# Copyright (c) 2018 Cisco and/or its affiliates.
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at:
+#
+# http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+"""Script for determining whether per-patch perf test votes -1.
+
+This script assumes there exist two text files with processed BMRR results,
+located at hardcoded relative paths, having several lines
+of json-parseable lists of float values, corresponding to testcase results.
+This script then uses jumpavg library to determine whether there was
+a regression, progression or no change for each testcase.
+If number of tests does not match, or there was a regression,
+this script votes -1 (by exiting with code 1), otherwise it votes +1 (exit 0).
+"""
+
+import json
+import sys
+
+from jumpavg.BitCountingMetadataFactory import BitCountingMetadataFactory
+from jumpavg.BitCountingClassifier import BitCountingClassifier
+
+
def hack(value_list):
    """Return middle two quartiles, hoping to reduce influence of outliers.

    The values are sorted, then the lowest and the highest quarter
    (each rounded down to a whole number of items) are dropped.
    Inputs with fewer than four items have nothing to trim,
    so all their values are returned, in sorted order.

    :param value_list: List to pick subset from.
    :type value_list: list of float
    :returns: New list containing middle values.
    :rtype: list of float
    """
    tmp = sorted(value_list)
    # Floor division keeps the index an integer on both Python 2 and 3.
    quarter = len(tmp) // 4
    # Use an explicit end index: "tmp[quarter:-quarter]" degenerates
    # to "tmp[0:0]" (an empty list) whenever quarter is zero.
    ret = tmp[quarter:len(tmp) - quarter]
    return ret
+
# Load the processed BMRR results of both builds.
# Each line is expected to hold one JSON list of floats (one testcase).
with open("csit_parent/results.txt") as parent_file:
    parent_lines = parent_file.readlines()
with open("csit_new/results.txt") as new_file:
    new_lines = new_file.readlines()
# Lines are paired by position, so differing counts cannot be compared.
if len(parent_lines) != len(new_lines):
    # Single-argument print(...) behaves the same on Python 2 and Python 3.
    print("Number of passed tests does not match!")
    sys.exit(1)
classifier = BitCountingClassifier()
num_tests = len(parent_lines)
exit_code = 0
line_pairs = zip(parent_lines, new_lines)
for index, (parent_line, new_line) in enumerate(line_pairs):
    parent_values = hack(json.loads(parent_line))
    new_values = hack(json.loads(new_line))
    # Both factories are constructed with the same maximum,
    # taken over the parent and the new samples together.
    parent_max = BitCountingMetadataFactory.find_max_value(parent_values)
    new_max = BitCountingMetadataFactory.find_max_value(new_values)
    cmax = max(parent_max, new_max)
    factory = BitCountingMetadataFactory(cmax)
    parent_stats = factory.from_data(parent_values)
    # The factory for the new samples additionally gets the parent average.
    factory = BitCountingMetadataFactory(cmax, parent_stats.avg)
    new_stats = factory.from_data(new_values)
    print("DEBUG parent: {p}".format(p=parent_stats))
    print("DEBUG new: {n}".format(n=new_stats))
    common_max = max(parent_stats.avg, new_stats.avg)
    # Relative difference; guard the case of both averages being zero,
    # which would otherwise abort the script with ZeroDivisionError.
    if common_max:
        difference = (new_stats.avg - parent_stats.avg) / common_max
    else:
        difference = 0.0
    print("DEBUG difference: {d}%".format(d=100 * difference))
    classified_list = classifier.classify([parent_stats, new_stats])
    # A result with fewer than two items is reported as "no anomaly".
    if len(classified_list) < 2:
        print("Test index {index}: normal (no anomaly)".format(
            index=index))
        continue
    anomaly = classified_list[1].metadata.classification
    # Only a regression turns the vote into -1; keep checking other tests.
    if anomaly == "regression":
        exit_code = 1
    print("Test index {index}: anomaly {anomaly}".format(
        index=index, anomaly=anomaly))
print("DEBUG exit code {code}".format(code=exit_code))
sys.exit(exit_code)