Add project stats check tool
Validate on Zuul builds and Gerrit. This is needed for project stats check. Please check etherpad for more detail discussion or output example [1]. Run project_stats_check.py with no arguments will run on all projects defined in `reference/projects.yaml`. If you wish to run for specific project or branch. Run like: `project_stats_check.py -p heat,sahara -b master,stable/xena` [1] https://etherpad.opendev.org/p/health_check Change-Id: I84c3a4898a74c26746fd66d046a80b8936a608e9
This commit is contained in:
parent
cc9e9ac6d5
commit
14e078a7a3
319
tools/project_stats_check.py
Executable file
319
tools/project_stats_check.py
Executable file
@ -0,0 +1,319 @@
|
||||
#!/usr/bin/env python3
|
||||
# Licensed under the Apache License, Version 2.0 (the "License"); you may
|
||||
# not use this file except in compliance with the License. You may obtain
|
||||
# a copy of the License at
|
||||
#
|
||||
# http://www.apache.org/licenses/LICENSE-2.0
|
||||
#
|
||||
# Unless required by applicable law or agreed to in writing, software
|
||||
# distributed under the License is distributed on an "AS IS" BASIS, WITHOUT
|
||||
# WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. See the
|
||||
# License for the specific language governing permissions and limitations
|
||||
# under the License.
|
||||
|
||||
import argparse
|
||||
import sys
|
||||
from urllib import request
|
||||
import yaml
|
||||
|
||||
|
||||
TOP_X_OWNER = 10
|
||||
# Zuul builds fetch size per query
|
||||
BUILDSET_FETCH_SIZE = 500
|
||||
|
||||
|
||||
class BaseQuery:
|
||||
def __init__(self, base_url, query_separator='&', verbose=False):
|
||||
self.verbose = verbose
|
||||
self.query_separator = query_separator
|
||||
if base_url.endswith('/'):
|
||||
self.base_url = base_url
|
||||
else:
|
||||
self.base_url = base_url + '/'
|
||||
|
||||
def query(self, api, conditions=None):
|
||||
url = self.base_url + api
|
||||
if conditions:
|
||||
url += '?' + (self.query_separator.join(conditions))
|
||||
if self.verbose:
|
||||
print("Request on url %s" % url)
|
||||
result = request.urlopen(url)
|
||||
result = yaml.safe_load(result.read())
|
||||
if self.verbose:
|
||||
print(result)
|
||||
return result
|
||||
|
||||
|
||||
class Zuul(BaseQuery):
|
||||
def get_project_buildsets(self, repos, fetch_size, branch='master', tenant='openstack'):
|
||||
# project={repos}&pipeline=gate&limit=500&branch=master
|
||||
|
||||
conditions = ['pipeline=gate',
|
||||
'limit='+str(fetch_size),
|
||||
'branch=' + branch]
|
||||
for repo in repos:
|
||||
# count all repos in one set
|
||||
conditions.append('project=' + repo)
|
||||
return self.query(api='api/tenant/%s/buildsets' % tenant, conditions=conditions)
|
||||
|
||||
def fetch_repo_buildset_success_rate(self, buildsets):
|
||||
success = {}
|
||||
not_success = {}
|
||||
for buildset in buildsets:
|
||||
if type(buildset) != dict:
|
||||
if self.verbose:
|
||||
print("Buildset %s is not a dict. Skipping." % buildset)
|
||||
continue
|
||||
project = buildset['project']
|
||||
result = buildset['result']
|
||||
if result == 'SUCCESS':
|
||||
if project in success:
|
||||
success[project] += 1
|
||||
else:
|
||||
success[project] = 1
|
||||
else:
|
||||
if project in not_success:
|
||||
not_success[project] += 1
|
||||
else:
|
||||
not_success[project] = 1
|
||||
success_rates = {}
|
||||
all_projects = set(success).union(set(not_success))
|
||||
for project in all_projects:
|
||||
success_rates[project] = format(
|
||||
success.get(project, 0)/(
|
||||
success.get(project, 0) + not_success.get(project, 0)
|
||||
)*100, '.0f') + '%'
|
||||
return success_rates
|
||||
|
||||
|
||||
class Gerrit(BaseQuery):
|
||||
def query(self, api, conditions=None):
|
||||
url = self.base_url + api
|
||||
if conditions:
|
||||
# Set no-limit=1 to fetch larger amount of patches
|
||||
url += '?no-limit=1&q=' + (self.query_separator.join(conditions))
|
||||
if self.verbose:
|
||||
print("Request on url %s" % url)
|
||||
result = request.urlopen(url)
|
||||
if self.verbose:
|
||||
print(result)
|
||||
|
||||
# The first line contains random chars like `'b\')]}\\\'`
|
||||
# Consider it as a bug and directly access second line from result
|
||||
result = yaml.safe_load(result.readlines()[1])
|
||||
if self.verbose:
|
||||
print(result)
|
||||
return result
|
||||
|
||||
def get_project_query_list(self, repos):
|
||||
projects = []
|
||||
repoSize = len(repos)
|
||||
for i in range(repoSize):
|
||||
repo = repos[i]
|
||||
if i == 0:
|
||||
projects += ['(project:' + repo, 'OR']
|
||||
elif i == repoSize - 1:
|
||||
projects.append('project:' + repo + ')')
|
||||
else:
|
||||
projects += ['project:' + repo, 'OR']
|
||||
return projects
|
||||
|
||||
def get_total_valid(self, repos, within, branch='master'):
|
||||
# q=(status:open+OR+status:merged)+project:{repo}+
|
||||
# NOT+label:Workflow<=-1+label:Verified>=1+NOT+age:{within}day
|
||||
|
||||
conditions = ['(status:open', 'OR', 'status:merged)',
|
||||
'NOT', 'label:Workflow<=-1',
|
||||
'label:Verified>=1',
|
||||
'branch:' + branch,
|
||||
'NOT', 'age:' + str(within) + 'day']
|
||||
conditions += self.get_project_query_list(repos)
|
||||
return self.query(api='changes/', conditions=conditions)
|
||||
|
||||
def get_total_not_review(self, repos, within, branch='master'):
|
||||
# q=status:open+project:{repos}+label:Code-Review=0+
|
||||
# NOT+label:Workflow<=-1+label:Verified>=1+NOT+age:{within}day
|
||||
|
||||
conditions = ['status:open',
|
||||
'NOT', 'label:Workflow<=-1',
|
||||
'label:Verified>=1',
|
||||
'label:Code-Review=0',
|
||||
'branch:' + branch,
|
||||
'NOT', 'age:' + str(within) + 'day']
|
||||
conditions += self.get_project_query_list(repos)
|
||||
return self.query(api='changes/', conditions=conditions)
|
||||
|
||||
def get_total_merged(self, repos, within, branch='master'):
|
||||
# q=status:merged+project:{repos}+NOT+age:{within}day
|
||||
|
||||
conditions = ['status:merged',
|
||||
'branch:' + branch,
|
||||
'NOT', 'age:' + str(within) + 'day']
|
||||
conditions += self.get_project_query_list(repos)
|
||||
return self.query(api='changes/', conditions=conditions)
|
||||
|
||||
def count_owners(self, patches, limit=-1):
|
||||
owners = {}
|
||||
patchCount = len(patches)
|
||||
for p in patches:
|
||||
owner = p.get('owner', {}).get('_account_id', 0)
|
||||
if owner in owners:
|
||||
owners[owner] += 1
|
||||
else:
|
||||
owners[owner] = 1
|
||||
sorted_owners = sorted(
|
||||
owners.items(), reverse=True, key=lambda item: item[1])
|
||||
results = {}
|
||||
for owner, count in sorted_owners:
|
||||
owner = self.get_account_name(owner)
|
||||
if limit != -1 and len(results) >= limit:
|
||||
break
|
||||
results[owner] = format(
|
||||
(count / patchCount) * 100, '.2f') + '%'
|
||||
return results
|
||||
|
||||
def get_account_name(self, account_id):
|
||||
# Profile will looks like: {"_account_id":22816,
|
||||
# "name":"OpenStack Release Bot",
|
||||
# "email":"infra-root@openstack.org","username":"release"}
|
||||
profile = self.query(api=('accounts/%s' % account_id))
|
||||
return profile.get('name', account_id)
|
||||
|
||||
|
||||
def validate_gerrit_data(repos, count_days, branch, verbose):
|
||||
gerrit = Gerrit(
|
||||
base_url='https://review.opendev.org/', query_separator='+',
|
||||
verbose=verbose)
|
||||
print(" Validating Gerrit...")
|
||||
total_valid_patches = gerrit.get_total_valid(
|
||||
repos, within=count_days, branch=branch)
|
||||
|
||||
if not total_valid_patches:
|
||||
print(" * There are no any patches proposed within "
|
||||
"%s days" % count_days)
|
||||
return
|
||||
|
||||
not_reviewed_patches = gerrit.get_total_not_review(
|
||||
repos, within=count_days, branch=branch)
|
||||
merged_patches = gerrit.get_total_merged(
|
||||
repos, within=count_days, branch=branch)
|
||||
unreview_rate = (
|
||||
len(not_reviewed_patches)/len(total_valid_patches))*100//1
|
||||
merged_rate = (
|
||||
len(merged_patches)/len(total_valid_patches))*100//1
|
||||
owners_rates = gerrit.count_owners(
|
||||
patches=total_valid_patches, limit=10)
|
||||
|
||||
print(" *", "There are",
|
||||
"%s ready for" % len(total_valid_patches),
|
||||
"review patches generated within %s days" % count_days)
|
||||
print(" *", "There are",
|
||||
"%s not reviewed" % len(not_reviewed_patches),
|
||||
"patches generated within %s days" % count_days)
|
||||
print(" *", "There are %s merged" % len(merged_patches),
|
||||
"patches generated within %s days" % count_days)
|
||||
print(" *", "Unreviewed patch rate for",
|
||||
"patches generated within",
|
||||
"%s days is %s" % (count_days, unreview_rate), '%')
|
||||
print(" *", "Merged patch rate for patches generated within",
|
||||
"%s days is %s" % (count_days, merged_rate), '%')
|
||||
print(" * ", "Here's top %s owner for patches" % TOP_X_OWNER,
|
||||
"generated within",
|
||||
"%s days (Name/Account_ID: Percentage):" % count_days)
|
||||
for owner, rate in owners_rates.items():
|
||||
print(' - ', owner, ': ', rate)
|
||||
|
||||
|
||||
def validate_zuul_data(repos, branch, verbose):
|
||||
zuul = Zuul(base_url="https://zuul.opendev.org/", verbose=verbose)
|
||||
print(" Validate Zuul...")
|
||||
print(" Set buildsets fetch size to",
|
||||
"%s" % BUILDSET_FETCH_SIZE)
|
||||
gate_builds = zuul.get_project_buildsets(
|
||||
repos, fetch_size=BUILDSET_FETCH_SIZE, branch=branch)
|
||||
repo_success_rates = zuul.fetch_repo_buildset_success_rate(
|
||||
gate_builds)
|
||||
for repo, rate in repo_success_rates.items():
|
||||
print(" * Repo: %s gate job builds success" % repo,
|
||||
"rate: %s" % rate)
|
||||
|
||||
|
||||
def main():
|
||||
parser = argparse.ArgumentParser()
|
||||
parser.add_argument(
|
||||
'-f', '--file',
|
||||
default='./reference/projects.yaml',
|
||||
help='projects.yaml file path (%(default)s)',
|
||||
)
|
||||
parser.add_argument(
|
||||
'-p', '--projects',
|
||||
help='projects to analyze. Separate with comma',
|
||||
)
|
||||
parser.add_argument(
|
||||
'-d', '--days',
|
||||
default='180',
|
||||
help='Days to count gerrit patches generated since (%(default)s)',
|
||||
)
|
||||
parser.add_argument(
|
||||
'-b', '--branch',
|
||||
default='master',
|
||||
help='Branch to analyze on projects (%(default)s)',
|
||||
)
|
||||
parser.add_argument(
|
||||
'-z', '--skip-zuul',
|
||||
action='store_true',
|
||||
help='Skip Zuul analysis (%(default)s)',
|
||||
)
|
||||
parser.add_argument(
|
||||
'-g', '--skip-gerrit',
|
||||
action='store_true',
|
||||
help='Skip Gerrit analysis (%(default)s)',
|
||||
)
|
||||
parser.add_argument(
|
||||
'-v', '--verbose',
|
||||
action='store_true',
|
||||
help='Show debug information',
|
||||
)
|
||||
args = parser.parse_args()
|
||||
with open(args.file, 'r', encoding='utf-8') as f:
|
||||
projects = yaml.safe_load(f.read())
|
||||
|
||||
project_scope = args.projects.split(',') if (
|
||||
args.projects is not None) else list(projects.keys())
|
||||
count_days = args.days
|
||||
|
||||
def get_repos(project):
|
||||
'''Get repositories in project'''
|
||||
repos = []
|
||||
defn = projects.get(project, {})
|
||||
deliverables = defn.get('deliverables', {})
|
||||
for key, deliverable in deliverables.items():
|
||||
repos += deliverable.get('repos', '')
|
||||
return repos
|
||||
|
||||
all_branch = args.branch.split(',')
|
||||
for branch in all_branch:
|
||||
if not (branch.startswith('master') or branch.startswith('stable/')):
|
||||
print('Invalid branch %s' % branch)
|
||||
sys.exit(1)
|
||||
for project in project_scope:
|
||||
print('*' * 50)
|
||||
if project not in projects:
|
||||
print('Invalid project %s' % project)
|
||||
continue
|
||||
print("Start Project %s analysis..." % project)
|
||||
repos = get_repos(project)
|
||||
print(" Includes repositories: %s" % repos)
|
||||
for branch in all_branch:
|
||||
print(" Start analysis branch %s..." % branch)
|
||||
if not args.skip_gerrit:
|
||||
validate_gerrit_data(repos, count_days, branch, args.verbose)
|
||||
|
||||
if not args.skip_zuul:
|
||||
validate_zuul_data(repos, branch, args.verbose)
|
||||
|
||||
print('*'*50)
|
||||
|
||||
|
||||
if __name__ == '__main__':
|
||||
main()
|
Loading…
x
Reference in New Issue
Block a user