blob: 9f4eebca3789fe51fdf9e4571c2e5cff06c45410 [file] [log] [blame]
# Copyright 2014 The Chromium Authors. All rights reserved.
# Use of this source code is governed by a BSD-style license that can be
# found in the LICENSE file.
from datetime import datetime
from itertools import chain
import logging
import webapp2
from model.record import Record
from shared.config import (
from shared.parsing import parse_rietveld_timestamp
from shared import utils
class PatchSummary(webapp2.RequestHandler):
def get(self, issue, patch): # pylint: disable=W0221
now = utils.to_unix_timestamp(datetime.utcnow())
codereview_hostname = utils.guess_legacy_codereview_hostname(issue)
return summarize_patch(codereview_hostname, issue, patch, now)
class PatchSummaryV2(webapp2.RequestHandler):
def get(self, codereview_hostname, issue, patch): # pylint: disable=W0221
now = utils.to_unix_timestamp(datetime.utcnow())
return summarize_patch(codereview_hostname, issue, patch, now)
def summarize_patch(codereview_hostname, issue, patch, now):
attempts = [
summarize_attempt(raw_attempt, now)
for raw_attempt in get_raw_attempts(codereview_hostname, issue, patch)
return {
'success': any(attempt['success'] for attempt in attempts),
'begin': maybe_min(attempt['begin'] for attempt in attempts),
'end': maybe_max(attempt['end'] for attempt in attempts),
'durations': {
field: sum(attempt['durations'][field] for attempt in attempts)
for field in blank_durations_summary()
'job_counts': {
state: sum(len(attempt['jobs'][state]) for attempt in attempts)
for state in JOB_STATE.itervalues()
'flaky_jobs': get_flaky_jobs(attempts),
'attempt_count': len(attempts),
'attempt_fail_count': sum(
for attempt in attempts
if attempt['success'] == False),
'attempts': attempts,
def get_raw_attempts(codereview_hostname, issue, patch):
"""Returns a generator for raw attempts."""
# Do not filter by TAG_CODEREVIEW_HOSTNAME here, because it is not set for old
# issues.
query = Record.query().order(Record.timestamp).filter(
Record.tags == TAG_ISSUE % issue,
Record.tags == TAG_PATCHSET % patch)
raw_attempt = None
count = 0
for record in query:
if not record.matches_codereview_hostname(codereview_hostname):
if raw_attempt is None and TAG_START in record.tags:
raw_attempt = []
if raw_attempt is not None: # pragma: no branch
if TAG_STOP in record.tags:
count += 1
logging.debug('attempt %d has %d records', count, len(raw_attempt))
yield raw_attempt
raw_attempt = None
if raw_attempt: # pragma: no cover
# In cq_stats and Dremel we ignore attempts that do not have patch_stop
# event. However, it may be not a good decision here as this app is
# user-facing and we don't want users to be confused why their last attempt
# is now shown until attempt is actually complete (or if for some reason
# patch_stop message was lost).
count += 1
logging.debug('attempt %d has %d records', count, len(raw_attempt))
yield raw_attempt
def summarize_attempt(raw_attempt, now):
assert len(raw_attempt) > 0
start_timestamp = utils.to_unix_timestamp(raw_attempt[0].timestamp)
summary = blank_attempt_summary()
job_tracker = AttemptJobTracker(start_timestamp)
durations = summary['durations']
last_patch_action = None
last_patch_timestamp = None
verifier_start_timestamp = None
for record in raw_attempt:
action = record.fields.get('action')
# patch_ready_to_commit signals are noisy and not useful.
if action == 'patch_ready_to_commit':
verifier = record.fields.get('verifier')
timestamp = utils.to_unix_timestamp(record.timestamp)
if last_patch_action:
patch_state_duration = timestamp - last_patch_timestamp
# Verifier job updates.
if verifier == TRYJOBVERIFIER:
if action == 'verifier_start':
verifier_start_timestamp = timestamp
elif action == 'verifier_jobs_update':
elif (action in ('verifier_pass', 'verifier_fail') and
verifier_start_timestamp is not None):
durations['running_all_jobs'] = timestamp - verifier_start_timestamp
verifier_start_timestamp = None
# Patch state updates.
if action and action.startswith('patch_'):
if last_patch_action == 'patch_throttled':
durations['blocked_on_throttled_tree'] += patch_state_duration
if last_patch_action == 'patch_tree_closed':
durations['blocked_on_closed_tree'] += patch_state_duration
if action == 'patch_committed':
summary['success'] = True
if last_patch_action == 'patch_committing': # pragma: no branch
durations['committing'] += patch_state_duration
if action == 'patch_failed':
summary['success'] = False
summary['fail_reason'] = record.fields.get('reason')
if action == 'patch_stop':
summary['end'] = timestamp
if action and action.startswith('patch_'):
last_patch_action = action
last_patch_timestamp = timestamp
# Finalize attempt durations.
summary['begin'] = start_timestamp
if summary['end'] != None: # pragma: no branch
durations['total'] = summary['end'] - summary['begin']
last_timestamp = summary['end'] or now
if last_patch_action: # pragma: no branch
patch_state_duration = last_timestamp - last_patch_timestamp
if last_patch_action == 'patch_tree_closed': # pragma: no cover
durations['blocked_on_closed_tree'] += patch_state_duration
if last_patch_action == 'patch_throttled': # pragma: no cover
durations['blocked_on_throttled_tree'] += patch_state_duration
if last_patch_action == 'patch_committing': # pragma: no cover
durations['committing'] += patch_state_duration
if verifier_start_timestamp: # pragma: no cover
durations['running_all_jobs'] = last_timestamp - verifier_start_timestamp
# Finalize jobs and job durations.
summary['jobs'] = job_tracker.summarize_jobs(
summary['success'] != None, last_timestamp)
return summary
class AttemptJobTracker(object):
def __init__(self, cutoff_timestamp):
self.cutoff_timestamp = cutoff_timestamp = {}
def update_jobs(self, record):
job_states = record.fields.get('jobs', {})
for cq_job_state, jobs in job_states.iteritems():
job_state = JOB_STATE.get(cq_job_state)
if not job_state: # pragma: no cover
logging.warning('Unknown job state: %s', cq_job_state)
for job_info in jobs:
build_number = job_info.get('buildnumber')
if not build_number: # pragma: no cover
# Early exit: CQ is now scheduling with buildbucket,
# which means first events won't have a buildnumber, just build_id.
master = job_info.get('master')
builder = job_info.get('builder'), {})[master].setdefault(builder, {})
job_info = job_info or {}
timestamp = parse_rietveld_timestamp(
job_info.get('created_ts') or job_info.get('timestamp'))
# Ignore jobs from past attempts.
if (not timestamp or # pragma: no branch
timestamp < self.cutoff_timestamp):
job =[master][builder].setdefault(build_number, {})
if len(job) == 0:
'begin': timestamp,
'master': master,
'builder': builder,
'slave': job_info.get('slave'),
'build_number': build_number,
if job_state != 'running':
job['end'] = timestamp
job['duration'] = timestamp - job['begin']
job['state'] = job_state
job['retry'] = any(
same_builder(job, test_job) and
job['build_number'] != test_job['build_number'] and
test_job['begin'] < job['begin']
for test_job in[master][builder].itervalues())
# The build URL is sometimes missing so ensure we set it
# if it was not already set.
job['url'] = job['url'] or job_info.get('url')
def summarize_jobs(self, attempt_ended, last_timestamp):
summaries = {state: [] for state in JOB_STATE.itervalues()}
for builds in
for jobs in builds.itervalues():
for job in jobs.itervalues():
if job['end'] == None: # pragma: no cover
if attempt_ended:
job['end'] = last_timestamp
job['duration'] = last_timestamp - job['begin']
for jobs in summaries.itervalues():
jobs.sort(key=lambda x: x['begin'], reverse=True)
return summaries
def blank_attempt_summary():
return {
'success': None,
'fail_reason': None,
'begin': None,
'end': None,
'durations': blank_durations_summary(),
'jobs': {state: [] for state in JOB_STATE.itervalues()},
def blank_durations_summary():
return {
'running_all_jobs': 0,
'blocked_on_closed_tree': 0,
'blocked_on_throttled_tree': 0,
'committing': 0,
'total': 0,
def blank_job_summary():
return {
'state': None,
'retry': False,
'begin': None,
'end': None,
'duration': 0,
'master': None,
'builder': None,
'slave': None,
'build_number': None,
'url': None,
def get_flaky_jobs(attempts):
flaky_jobs = []
passed_jobs = set()
for attempt in attempts:
for job in attempt['jobs']['passed']:
for attempt in attempts:
for job in attempt['jobs']['failed']:
if job_builder_id(job) in passed_jobs: # pragma: no branch
return flaky_jobs
def job_builder_id(job):
return (job['master'], job['builder'])
def same_builder(job_a, job_b):
return job_builder_id(job_a) == job_builder_id(job_b)
def maybe_min(iterable):
return min(iterable)
except ValueError: # pragma: no cover
return None
def maybe_max(iterable):
return max(iterable)
except ValueError: # pragma: no cover
return None