HBASE-15651 Script to report flaky tests. (Apekshit)

Change-Id: I5cd5c23985b8c3f928d7ab44e57606b0a5478f15

Signed-off-by: stack <stack@apache.org>
This commit is contained in:
Apekshit 2016-04-13 23:02:17 -07:00 committed by stack
parent 4c0587134a
commit 57e1dbc8a6
1 changed file with 146 additions and 0 deletions

dev-support/report-flakies.py Executable file

@@ -0,0 +1,146 @@
#!/usr/bin/env python
##
# Licensed to the Apache Software Foundation (ASF) under one
# or more contributor license agreements. See the NOTICE file
# distributed with this work for additional information
# regarding copyright ownership. The ASF licenses this file
# to you under the Apache License, Version 2.0 (the
# "License"); you may not use this file except in compliance
# with the License. You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
# This script uses the Jenkins REST API to collect test results of the given builds and generates
# flakiness data about unit tests.
# Print help: ./report-flakies.py -h
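# Example invocation (hypothetical job URL, shown only for illustration):
#   ./report-flakies.py --max-builds=5 --mvn "https://builds.example.org/job/HBase-Flaky-Tests"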
import argparse
import logging
import re
import requests
parser = argparse.ArgumentParser()
parser.add_argument("--max-builds", type=int, metavar="n",
help="Number of builds to analyze for each job (if available in jenkins). Default: all "
+ "available builds.")
parser.add_argument("--mvn", action="store_true",
help="Writes two strings for including/excluding these flaky tests using maven flags. These "
+ "strings are written to files so they can be saved as artifacts and easily imported in "
+ "other projects.")
parser.add_argument("-v", "--verbose", help="Prints more logs.", action="store_true")
parser.add_argument(
    "urls", help="Space separated list of urls (single/multi-configuration project) to analyze")
args = parser.parse_args()
logging.basicConfig()
logger = logging.getLogger("org.apache.hadoop.hbase.report-flakies")
if args.verbose:
    logger.setLevel(logging.INFO)
# Given the url of an executed build, fetches its test report and returns a dictionary mapping
# test name to its pass/skip/fail status.
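# The returned dict maps the shortened test name to a Jenkins status string, roughly like this
# (illustrative example): {"client.TestAdmin#testFoo": "PASSED", "master.TestMaster#testBar": "REGRESSION"}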
def get_build_results(build_url):
    logger.info("Getting test results for %s", build_url)
    url = build_url + "testReport/api/json?tree=suites[cases[className,name,status]]"
    response = requests.get(url)
    if response.status_code == 404:
        logger.info("No test results for %s", build_url)
        return {}
    json_response = response.json()
    tests = {}
    for test_cases in json_response["suites"]:
        for test in test_cases["cases"]:
            # Truncate initial "org.apache.hadoop.hbase." from all tests.
            test_name = (test["className"] + "#" + test["name"])[24:]
            tests[test_name] = test["status"]
    return tests

# If a url points to a multi-configuration (matrix) project (i.e. its JSON has the key
# 'activeConfigurations'), collect the urls of its individual jobs.
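# A matrix job's JSON typically lists each configuration as a dict; only its 'url' field is used
# below, e.g. (illustrative): {"activeConfigurations": [{"name": "...", "url": "https://..."}]}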
jobs_list = []
for url in args.urls.split():
    json_response = requests.get(url + "/api/json").json()
    if "activeConfigurations" in json_response:
        for config in json_response["activeConfigurations"]:
            jobs_list.append(config["url"])
    elif "builds" in json_response:
        jobs_list.append(url)
    else:
        raise Exception("Bad url ({0}).".format(url))

global_bad_tests = set()
# Iterates over each job, gets its test results and prints flaky tests.
for job_url in jobs_list:
    logger.info("Analyzing job: %s", job_url)
    build_id_to_results = {}
    builds = requests.get(job_url + "/api/json").json()["builds"]
    num_builds = 0
    build_ids = []
    build_ids_without_result = []
    for build in builds:
        build_id = build["number"]
        build_ids.append(build_id)
        build_result = get_build_results(build["url"])
        if len(build_result) > 0:
            build_id_to_results[build_id] = build_result
        else:
            build_ids_without_result.append(build_id)
        num_builds += 1
        if num_builds == args.max_builds:
            break

    # Collect list of bad tests.
    bad_tests = set()
    for build in build_id_to_results:
        for test in build_id_to_results[build]:
            if build_id_to_results[build][test] == "REGRESSION":
                bad_tests.add(test)
                global_bad_tests.add(test)

    # Get total and failed build counts for each bad test.
    build_counts = {key: {'total': 0, 'failed': 0} for key in bad_tests}
    for build in build_id_to_results:
        build_results = build_id_to_results[build]
        for bad_test in bad_tests:
            if bad_test in build_results:
                if build_results[bad_test] != "SKIPPED":  # Ignore the test if it's skipped.
                    build_counts[bad_test]['total'] += 1
                    if build_results[bad_test] == "REGRESSION":
                        build_counts[bad_test]['failed'] += 1

    if len(bad_tests) > 0:
        print "Job: {}".format(job_url)
        print "{:>100} {:6} {:10} {}".format("Test Name", "Failed", "Total Runs", "Flakiness")
        for bad_test in bad_tests:
            fail = build_counts[bad_test]['failed']
            total = build_counts[bad_test]['total']
            print "{:>100} {:6} {:10} {:2.0f}%".format(bad_test, fail, total, fail * 100.0 / total)
    else:
        print "No flaky tests found."
    if len(build_ids) == len(build_ids_without_result):
        print "None of the analyzed builds have test results."
    print "Builds analyzed: " + str(build_ids)
    print "Builds with no results: " + str(build_ids_without_result)
    print ""
if args.mvn:
    includes = ""
    excludes = ""
    for test in global_bad_tests:
        test = re.sub(r".*\.", "", test)  # Remove package name prefix.
        test = re.sub(r"#.*", "", test)   # Remove individual unittest's name.
        includes += test + ","
        excludes += "**/" + test + ".java,"
    with open("./includes", "w") as inc_file:
        inc_file.write(includes)
    with open("./excludes", "w") as exc_file:
        exc_file.write(excludes)
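# The generated files can then be fed to Maven Surefire, e.g. (illustrative; exact flags depend on
# the project's surefire configuration): mvn test -Dtest="$(cat includes)" to run only the flaky
# tests, or point surefire's excludesFile at the generated 'excludes' file to skip them.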