1# Copyright 2016 The Chromium OS Authors. All rights reserved.
2# Use of this source code is governed by a BSD-style license that can be
3# found in the LICENSE file.
4
5"""Services relating to generating a suite timeline and report."""
6
7from __future__ import print_function
8
9import common
10import datetime
11import json
12
13from autotest_lib.client.common_lib import time_utils
14from autotest_lib.server import frontend
15from autotest_lib.server.lib import status_history
16from chromite.lib import cros_logging as logging
17
18
19HostJobHistory = status_history.HostJobHistory
20
21# TODO: Handle other statuses like infra failures.
22TKO_STATUS_MAP = {
23    'ERROR': 'fail',
24    'FAIL': 'fail',
25    'GOOD': 'pass',
26    'PASS': 'pass',
27    'ABORT': 'aborted',
28    'Failed': 'fail',
29    'Completed': 'pass',
30    'Aborted': 'aborted',
31}
32
33
34# Default suite timeout in seconds
35DEFAULT_SUITE_TIMEOUT = 90 * 60
36
37
38def to_epoch_time_int(value):
39    """Convert the given value to epoch time int.
40
41    @returns: epoch time in integer."""
42    return int(time_utils.to_epoch_time(value))
43
44
45def parse_tko_status_string(status_string):
46    """Parse a status string from TKO or the HQE databases.
47
48    @param status_string: A status string from TKO or HQE databases.
49
50    @return A status string suitable for inclusion within Cloud Datastore.
51    """
52    return TKO_STATUS_MAP.get(status_string, 'unknown:' + status_string)
53
54
55def make_entry(entry_id, name, status, start_time,
56               finish_time=None, parent=None):
57    """Generate an event log entry to be stored in Cloud Datastore.
58
59    @param entry_id: A (Kind, id) tuple representing the key.
60    @param name: A string identifying the event
61    @param status: A string identifying the status of the event.
62    @param start_time: A unix timestamp of the start of the event.
63    @param finish_time: A unix timestamp of the finish of the event.
64    @param parent: A (Kind, id) tuple representing the parent key.
65
66    @return A dictionary representing the entry suitable for dumping via JSON.
67    """
68    entry = {
69        'id': entry_id,
70        'name': name,
71        'status': status,
72        'start_time': start_time,
73    }
74    if finish_time is not None:
75        entry['finish_time'] = finish_time
76    if parent is not None:
77        entry['parent'] = parent
78    return entry
79
80
81def find_start_finish_times(statuses):
82    """Determines the start and finish times for a list of statuses.
83
84    @param statuses: A list of job test statuses.
85
86    @return (start_tme, finish_time) tuple of seconds past epoch.  If either
87            cannot be determined, None for that time.
88    """
89    starts = {to_epoch_time_int(s.test_started_time)
90              for s in statuses if s.test_started_time != 'None'}
91    finishes = {to_epoch_time_int(s.test_finished_time)
92                for s in statuses if s.test_finished_time != 'None'}
93    start_time = min(starts) if starts else None
94    finish_time = max(finishes) if finishes else None
95    return start_time, finish_time
96
97
98def make_job_entry(tko, job, parent=None, suite_job=False, job_entries=None):
99    """Generate a Suite or HWTest event log entry.
100
101    @param tko: TKO database handle.
102    @param job: A frontend.Job to generate an entry for.
103    @param parent: A (Kind, id) tuple representing the parent key.
104    @param suite_job: A boolean indicating wheret this represents a suite job.
105    @param job_entries: A dictionary mapping job id to earlier job entries.
106
107    @return A dictionary representing the entry suitable for dumping via JSON.
108    """
109    statuses = tko.get_job_test_statuses_from_db(job.id)
110    status = 'pass'
111    dut = None
112    for s in statuses:
113        parsed_status = parse_tko_status_string(s.status)
114        # TODO: Improve this generation of status.
115        if parsed_status != 'pass':
116            status = parsed_status
117        if s.hostname:
118            dut = s.hostname
119        if s.test_started_time == 'None' or s.test_finished_time == 'None':
120            logging.warn('TKO entry for %d missing time: %s' % (job.id, str(s)))
121    start_time, finish_time = find_start_finish_times(statuses)
122    entry = make_entry(('Suite' if suite_job else 'HWTest', int(job.id)),
123                       job.name.split('/')[-1], status, start_time,
124                       finish_time=finish_time, parent=parent)
125
126    entry['job_id'] = int(job.id)
127    if dut:
128        entry['dut'] = dut
129    if job.shard:
130        entry['shard'] = job.shard
131    # Determine the try of this job by looking back through what the
132    # original job id is.
133    if 'retry_original_job_id' in job.keyvals:
134        original_job_id = int(job.keyvals['retry_original_job_id'])
135        original_job = job_entries.get(original_job_id, None)
136        if original_job:
137            entry['try'] = original_job['try'] + 1
138        else:
139            entry['try'] = 0
140    else:
141        entry['try'] = 1
142    entry['gs_url'] = status_history.get_job_gs_url(job)
143    return entry
144
145
146def make_hqe_entry(hostname, hqe, hqe_statuses, parent=None):
147    """Generate a HQE event log entry.
148
149    @param hostname: A string of the hostname.
150    @param hqe: A host history to generate an event for.
151    @param hqe_statuses: A dictionary mapping HQE ids to job status.
152    @param parent: A (Kind, id) tuple representing the parent key.
153
154    @return A dictionary representing the entry suitable for dumping via JSON.
155    """
156    entry = make_entry(
157        ('HQE', int(hqe.id)), hostname,
158        hqe_statuses.get(hqe.id, parse_tko_status_string(hqe.job_status)),
159        hqe.start_time, finish_time=hqe.end_time, parent=parent)
160
161    entry['task_name'] = hqe.name.split('/')[-1]
162    entry['in_suite'] = hqe.id in hqe_statuses
163    entry['job_url'] = hqe.job_url
164    entry['gs_url'] = hqe.gs_url
165    if hqe.job_id is not None:
166        entry['job_id'] = hqe.job_id
167    entry['is_special'] = hqe.is_special
168    return entry
169
170
171def generate_suite_report(suite_job_id, afe=None, tko=None,
172                          reset_finish_time=False):
173    """Generate a list of events corresonding to a single suite job.
174
175    @param suite_job_id: The AFE id of the suite job.
176    @param afe: AFE database handle.
177    @param tko: TKO database handle.
178    @reset_finish_time: Boolean indicating whether to reset the suite finish
179                        to now.
180
181    @return A list of entries suitable for dumping via JSON.
182    """
183    if afe is None:
184        afe = frontend.AFE()
185    if tko is None:
186        tko = frontend.TKO()
187
188    # Retrieve the main suite job.
189    suite_job = afe.get_jobs(id=suite_job_id)[0]
190
191    suite_entry = make_job_entry(tko, suite_job, suite_job=True)
192    entries = [suite_entry]
193
194    # Retrieve the child jobs and cache all their statuses
195    logging.debug('Fetching child jobs...')
196    child_jobs = afe.get_jobs(parent_job_id=suite_job_id)
197    logging.debug('... fetched %s child jobs.' % len(child_jobs))
198    job_statuses = {}
199    job_entries = {}
200    for j in child_jobs:
201        job_entry = make_job_entry(tko, j, suite_entry['id'],
202                                   job_entries=job_entries)
203        entries.append(job_entry)
204        job_statuses[j.id] = job_entry['status']
205        job_entries[j.id] = job_entry
206
207    # Retrieve the HQEs from all the child jobs, record statuses from
208    # job statuses.
209    child_job_ids = {j.id for j in child_jobs}
210    logging.debug('Fetching HQEs...')
211    hqes = afe.get_host_queue_entries(job_id__in=list(child_job_ids))
212    logging.debug('... fetched %s HQEs.' % len(hqes))
213    hqe_statuses = {h.id: job_statuses.get(h.job.id, None) for h in hqes}
214
215    # Generate list of hosts.
216    hostnames = {h.host.hostname for h in hqes if h.host}
217    logging.debug('%s distinct hosts participated in the suite.' %
218                  len(hostnames))
219
220    suite_start_time = suite_entry.get('start_time')
221    suite_finish_time = suite_entry.get('finish_time')
222    # Retrieve histories for the time of the suite for all associated hosts.
223    # TODO: Include all hosts in the pool.
224    if suite_start_time and suite_finish_time:
225
226        if reset_finish_time:
227            suite_timeout_time = suite_start_time + DEFAULT_SUITE_TIMEOUT
228            current_time = to_epoch_time_int(datetime.datetime.now())
229            suite_finish_time = min(current_time, suite_timeout_time)
230
231        histories = [HostJobHistory.get_host_history(afe, hostname,
232                                                     suite_start_time,
233                                                     suite_finish_time)
234                     for hostname in sorted(hostnames)]
235
236        for history in histories:
237            entries.extend(make_hqe_entry(history.hostname, h, hqe_statuses,
238                                          suite_entry['id']) for h in history)
239
240    return entries
241
242def dump_entries_as_json(entries, output_file):
243    """Dump event log entries as json to a file.
244
245    @param entries: A list of event log entries to dump.
246    @param output_file: The file to write to.
247    """
248    # Write the entries out as JSON.
249    logging.debug('Dumping %d entries' % len(entries))
250    for e in entries:
251        json.dump(e, output_file, sort_keys=True)
252        output_file.write('\n')
253