Matthew Hart | fb6fd36 | 2020-03-04 21:03:59 +0000 | [diff] [blame] | 1 | #!/usr/bin/env python3 |
| 2 | |
| 3 | from __future__ import print_function |
| 4 | |
| 5 | __copyright__ = """ |
| 6 | /* |
Xinyu Zhang | 78c146a | 2022-09-05 19:06:40 +0800 | [diff] [blame] | 7 | * Copyright (c) 2020-2022, Arm Limited. All rights reserved. |
Matthew Hart | fb6fd36 | 2020-03-04 21:03:59 +0000 | [diff] [blame] | 8 | * |
| 9 | * SPDX-License-Identifier: BSD-3-Clause |
| 10 | * |
| 11 | */ |
| 12 | """ |
| 13 | |
| 14 | """ |
| 15 | Script for waiting for LAVA jobs and parsing the results |
| 16 | """ |
| 17 | |
| 18 | import os |
Matthew Hart | fb6fd36 | 2020-03-04 21:03:59 +0000 | [diff] [blame] | 19 | import time |
| 20 | import yaml |
| 21 | import argparse |
Xinyu Zhang | c8a670c | 2021-05-18 20:20:53 +0800 | [diff] [blame] | 22 | import shutil |
Paul Sokolovsky | a95abd9 | 2022-12-27 13:48:11 +0300 | [diff] [blame] | 23 | import logging |
Matthew Hart | fb6fd36 | 2020-03-04 21:03:59 +0000 | [diff] [blame] | 24 | from jinja2 import Environment, FileSystemLoader |
Matthew Hart | fb6fd36 | 2020-03-04 21:03:59 +0000 | [diff] [blame] | 25 | from lava_helper import test_lava_dispatch_credentials |
Xinyu Zhang | c918b6e | 2022-10-08 17:13:17 +0800 | [diff] [blame] | 26 | from lava_submit_jobs import submit_lava_jobs |
Paul Sokolovsky | 2512ec5 | 2022-03-04 00:15:39 +0300 | [diff] [blame] | 27 | import codecov_helper |
| 28 | |
Matthew Hart | fb6fd36 | 2020-03-04 21:03:59 +0000 | [diff] [blame] | 29 | |
# Logger shared by every function in this script. It only produces output once
# logging is configured, which the __main__ guard does via basicConfig().
_log = logging.getLogger("lavaci")
| 31 | |
| 32 | |
def wait_for_jobs(user_args):
    """
    Wait for the LAVA jobs listed in ``user_args.job_ids``.

    The comma separated ID string is converted to integers (empty fields are
    ignored), the jobs are waited for, and every job that did not finish
    cleanly is resubmitted and waited for once more.

    Returns the mapping of finished jobs, with the finished resubmitted jobs
    merged into it.
    """
    job_ids = []
    for field in user_args.job_ids.split(","):
        if field != '':
            job_ids.append(int(field))

    lava = test_lava_dispatch_credentials(user_args)
    finished_jobs = get_finished_jobs(job_ids, user_args, lava)

    retried_ids = resubmit_failed_jobs(finished_jobs, user_args)
    if not retried_ids:
        return finished_jobs

    _log.info("Waiting for resubmitted jobs: %s", retried_ids)
    finished_retries = get_finished_jobs(retried_ids, user_args, lava)
    finished_jobs.update(finished_retries)
    return finished_jobs
| 44 | |
def process_finished_jobs(finished_jobs, user_args):
    """
    Produce every report for the finished jobs.

    The reporting steps run in a fixed order: test_report() stores
    info['result'] on each job, and job_links() reads that key afterwards.
    """
    report_steps = (
        print_lava_urls,
        test_report,
        job_links,
        codecov_helper.coverage_reports,
    )
    for step in report_steps:
        step(finished_jobs, user_args)
Xinyu Zhang | f2b7cbf | 2021-05-18 20:17:34 +0800 | [diff] [blame] | 50 | |
def get_finished_jobs(job_list, user_args, lava):
    """
    Wait for the given LAVA jobs and return those that finished.

    Jobs from ``job_list`` that are missing from the result of
    ``lava.block_wait_for_jobs()`` are cancelled. When
    ``user_args.artifacts_path`` is set, each finished job gets a 'job_dir'
    entry (``<artifacts_path>/<job id>_<description>``) and its artifacts are
    downloaded into that directory.

    Parameters:
        job_list: list of integer LAVA job IDs to wait for.
        user_args: parsed command line arguments; ``dispatch_timeout`` and
            ``artifacts_path`` are read here.
        lava: LAVA connection object providing ``block_wait_for_jobs()`` and
            ``cancel_job()``.

    Returns the mapping of finished jobs (job ID -> info dict). The mapping is
    always returned, even if fetch_artifacts() hands back nothing.
    """
    _log.info("Waiting for %d LAVA jobs", len(job_list))
    # NOTE(review): the trailing 5 is presumably the polling interval in
    # seconds - confirm against lava_helper.
    finished_jobs = lava.block_wait_for_jobs(job_list, user_args.dispatch_timeout, 5)

    for job in job_list:
        if job not in finished_jobs:
            _log.info("Cancelling unfinished job %d", job)
            lava.cancel_job(job)

    if user_args.artifacts_path:
        # The info dicts are updated in place, so no write-back is needed.
        for job, info in finished_jobs.items():
            info['job_dir'] = os.path.join(
                user_args.artifacts_path,
                "{}_{}".format(str(job), info['description'])
            )
        # Never let a None result replace the finished jobs mapping.
        fetched_jobs = fetch_artifacts(finished_jobs, user_args, lava)
        if fetched_jobs is not None:
            finished_jobs = fetched_jobs
    return finished_jobs
Matthew Hart | fb6fd36 | 2020-03-04 21:03:59 +0000 | [diff] [blame] | 64 | |
def resubmit_failed_jobs(jobs, user_args):
    """
    Resubmit every job that did not end as health "Complete" / state "Finished".

    For each such job its definition.yaml is moved into the local
    'failed_jobs' directory, its artifact directory is deleted and the job is
    removed from ``jobs`` (the mapping is modified in place). Afterwards the
    definitions in 'failed_jobs' are submitted through submit_lava_jobs().

    Parameters:
        jobs: mapping of job ID -> info dict; each info needs 'health',
            'state' and, for failed jobs, 'job_dir'.
        user_args: parsed command line arguments, passed to submit_lava_jobs().

    Returns the list of integer IDs of the newly submitted jobs, or an empty
    list when ``jobs`` is empty or None.
    """
    if not jobs:
        return []
    time.sleep(2)  # be friendly to LAVA

    resubmit_dir = 'failed_jobs'
    os.makedirs(resubmit_dir, exist_ok=True)

    failed_ids = []
    for job_id, info in jobs.items():
        if info['health'] == "Complete" and info['state'] == "Finished":
            continue
        _log.warning(
            "Will resubmit job %d because of its state: %s, health: %s",
            job_id, info["state"], info["health"]
        )
        job_dir = info['job_dir']
        # shutil.move() also works when the artifacts directory lives on a
        # different filesystem than the working directory; os.rename() fails
        # there.
        shutil.move(
            os.path.join(job_dir, 'definition.yaml'),
            os.path.join(resubmit_dir, '{}_definition.yaml'.format(job_id))
        )
        shutil.rmtree(job_dir)
        failed_ids.append(job_id)

    # Removal is deferred because the mapping cannot change size while it is
    # being iterated above.
    for job_id in failed_ids:
        jobs.pop(job_id)

    resubmitted_jobs = submit_lava_jobs(user_args, job_dir=resubmit_dir)
    return [int(x) for x in resubmitted_jobs if x != '']
| 87 | |
def fetch_artifacts(jobs, user_args, lava):
    """
    Download definition, log, config and results of every job.

    For each job the files definition.yaml, target_log.txt, config.tar.bz2 and
    results.yaml are written into the job's 'job_dir', the 'metadata' section
    of the job definition is stored on the job info, and trace data is
    extracted from the target log via codecov_helper.

    Parameters:
        jobs: mapping of job ID -> info dict; each info needs 'job_dir'.
        user_args: parsed command line arguments; ``artifacts_path`` is read.
        lava: LAVA connection object providing the ``get_job_*()`` calls.

    Returns ``jobs`` (the same mapping, updated in place). It is returned
    unchanged when ``user_args.artifacts_path`` is not set.
    """
    if not user_args.artifacts_path:
        # Callers assign the result back, so always hand them the mapping.
        return jobs
    for job_id, info in jobs.items():
        job_dir = info['job_dir']
        t = time.time()
        _log.info("Fetching artifacts for job %d to %s", job_id, job_dir)
        os.makedirs(job_dir, exist_ok=True)
        def_path = os.path.join(job_dir, 'definition.yaml')
        target_log = os.path.join(job_dir, 'target_log.txt')
        config = os.path.join(job_dir, 'config.tar.bz2')
        results_file = os.path.join(job_dir, 'results.yaml')
        definition = lava.get_job_definition(job_id, def_path)
        info['metadata'] = definition.get('metadata', [])
        time.sleep(0.2)  # be friendly to LAVA
        lava.get_job_log(job_id, target_log)
        time.sleep(0.2)
        lava.get_job_config(job_id, config)
        time.sleep(0.2)
        lava.get_job_results(job_id, results_file)
        _log.info("Fetched artifacts in %ds", time.time() - t)
        codecov_helper.extract_trace_data(target_log, job_dir)
    return jobs
| 111 | |
| 112 | |
def lava_id_to_url(id, user_args):
    """ Return the scheduler page URL of job `id` under user_args.lava_url """
    base_url = user_args.lava_url
    return "{base}/scheduler/job/{job}".format(base=base_url, job=id)
| 115 | |
def job_links(jobs, user_args):
    """
    Print a plain text summary with the links of every job.

    For each job the build name, test result, device type, build job URL,
    LAVA job URL and the URL of the archived target log (based on the
    BUILD_URL environment variable) are listed. Each job info needs the keys
    'metadata', 'result' and 'job_dir'.
    """
    lines = []
    for job, info in jobs.items():
        metadata = info['metadata']
        lines.append("\nLAVA Test Config:\n")
        lines.append("Config Name: {}\n".format(metadata['build_name']))
        lines.append("Test Result: {}\n".format(info['result']))
        lines.append("Device Type: {}\n".format(metadata['device_type']))
        lines.append("Build link: {}\n".format(metadata['build_job_url']))
        lines.append("LAVA link: {}\n".format(lava_id_to_url(job, user_args)))
        lines.append("TFM LOG: {}artifact/{}/target_log.txt\n".format(os.getenv("BUILD_URL"), info['job_dir']))
    print("".join(lines))
| 127 | |
def remove_lava_dupes(results):
    """
    Drop non-passing 'lava' suite results that also have a passing entry.

    A result is removed when its 'result' is not 'pass', its 'suite' is
    "lava" and some entry with the same 'name' has 'result' == 'pass'.

    The list is filtered in one pass instead of removing items while
    iterating over it, which skipped entries and could raise ValueError when
    several passing entries shared a name.

    Returns ``results`` itself, modified in place.
    """
    passed_names = {entry['name'] for entry in results if entry['result'] == 'pass'}
    results[:] = [
        entry for entry in results
        if not (
            entry['result'] != 'pass'
            and entry['suite'] == "lava"
            and entry['name'] in passed_names
        )
    ]
    return results
| 137 | |
def test_report(jobs, user_args):
    """
    Evaluate the results of every job and render the summary reports.

    Each job info gets 'result' set to 'SUCCESS' or 'FAILURE'. A job fails
    when its health is not 'Complete', when its results.yaml is missing or
    empty, or when one of its reported results is 'fail'. Reported results
    are those outside the 'lava' suite plus the 'lava-test-monitor' entry.
    Jobs with readable results also get 'lava_url' and 'artifacts_dir' set
    and are passed to render_jinja().
    """
    # parsing of test results is WIP
    failed_jobs = []  # collected for bookkeeping only; not returned
    report_entries = []
    for job, info in jobs.items():
        info['result'] = 'SUCCESS'
        if info['health'] != 'Complete':
            info['result'] = 'FAILURE'
            failed_jobs.append(job)
            continue

        results_file = os.path.join(info['job_dir'], 'results.yaml')
        has_results = os.path.exists(results_file) and os.path.getsize(results_file) != 0
        if not has_results:
            info['result'] = 'FAILURE'
            failed_jobs.append(job)
            continue

        with open(results_file, "r") as results_stream:
            raw_results = results_stream.read()
        results = yaml.safe_load(raw_results)

        reported = []
        for entry in results:
            if entry['suite'] != 'lava' or entry['name'] == 'lava-test-monitor':
                reported.append(entry)

        info['lava_url'] = lava_id_to_url(job, user_args)
        info['artifacts_dir'] = info['job_dir']
        report_entries.append({job: [info, reported]})

        for entry in reported:
            if entry['result'] == 'fail':
                info['result'] = 'FAILURE'
                if job not in failed_jobs:
                    failed_jobs.append(job)
        time.sleep(0.5)  # be friendly to LAVA

    render_jinja({'jobs': report_entries})
| 168 | |
def render_jinja(data):
    """
    Render ``data`` into test_summary.html and test_summary.csv.

    The templates test_summary.jinja2 and test_summary_csv.jinja2 are loaded
    from the "jinja2_templates" directory next to this script. Both are
    rendered before either output file is written to the current directory.
    """
    script_dir = os.path.abspath(os.path.dirname(__file__))
    templates_dir = os.path.join(script_dir, "jinja2_templates")
    env = Environment(loader=FileSystemLoader(searchpath=templates_dir))

    html_report = env.get_template("test_summary.jinja2").render(data)
    csv_report = env.get_template("test_summary_csv.jinja2").render(data)

    outputs = (
        ('test_summary.html', html_report),
        ('test_summary.csv', csv_report),
    )
    for file_name, content in outputs:
        with open(file_name, "w") as out_file:
            out_file.write(content)
| 179 | |
def print_lava_urls(jobs, user_args):
    """
    Report the LAVA URLs of all jobs through info_print().

    The message is passed to info_print() without a ``silent`` argument, so
    whether it is shown depends on that function's default.
    """
    urls = []
    for job_id in jobs:
        urls.append(lava_id_to_url(job_id, user_args))
    message = "LAVA jobs triggered for this build: {}".format(urls)
    info_print(message)
Matthew Hart | fb6fd36 | 2020-03-04 21:03:59 +0000 | [diff] [blame] | 183 | |
| 184 | |
def info_print(line, silent=True):
    """ Print `line` with an "INFO: " prefix unless `silent` is true (the default) """
    if silent:
        return
    message = "INFO: {}".format(line)
    print(message)
Matthew Hart | fb6fd36 | 2020-03-04 21:03:59 +0000 | [diff] [blame] | 188 | |
Paul Sokolovsky | de25e1f | 2023-01-02 14:29:21 +0300 | [diff] [blame^] | 189 | |
# WARNING: Setting this to >1 is a last resort, temporary stop-gap measure,
# which will overload LAVA and jeopardize stability of the entire TF CI.
# main() uses this as the total number of attempts at wait_for_jobs(); with
# the value 1 the first exception is re-raised and nothing is retried.
INEFFICIENT_RETRIES = 1
| 193 | |
| 194 | |
def main(user_args):
    """
    Main logic

    Waits for the LAVA jobs, making up to INEFFICIENT_RETRIES attempts when
    waiting raises an exception, then processes the finished jobs. The
    exception of the last attempt is re-raised to the caller.
    """
    # Always make at least one attempt, so that finished_jobs is bound even if
    # INEFFICIENT_RETRIES is set to zero or a negative value.
    attempts = max(1, INEFFICIENT_RETRIES)
    for try_time in range(attempts):
        try:
            finished_jobs = wait_for_jobs(user_args)
        except Exception:
            if try_time >= attempts - 1:
                # Out of attempts: a bare raise keeps the original traceback.
                raise
            _log.exception("Exception in wait_for_jobs")
            _log.info("Will try to get LAVA jobs again, this was try: %d", try_time)
        else:
            break
    process_finished_jobs(finished_jobs, user_args)
Matthew Hart | fb6fd36 | 2020-03-04 21:03:59 +0000 | [diff] [blame] | 208 | |
def get_cmd_args():
    """ Parse command line arguments """

    parser = argparse.ArgumentParser(description="Lava Wait Jobs")
    cmdargs = parser.add_argument_group("Lava Wait Jobs")

    # Configuration control: one (flag, keyword arguments) row per option,
    # registered in the order in which they appear in --help.
    option_table = (
        ("--lava-url", {
            "dest": "lava_url", "action": "store",
            "help": "LAVA lab URL (without RPC2)",
        }),
        ("--job-ids", {
            "dest": "job_ids", "action": "store", "required": True,
            "help": "Comma separated list of job IDS",
        }),
        ("--lava-token", {
            "dest": "lava_token", "action": "store",
            "help": "LAVA auth token",
        }),
        ("--lava-user", {
            "dest": "lava_user", "action": "store",
            "help": "LAVA username",
        }),
        ("--use-env", {
            "dest": "token_from_env", "action": "store_true", "default": False,
            "help": "Use LAVA auth info from environment",
        }),
        ("--lava-timeout", {
            "dest": "dispatch_timeout", "action": "store", "type": int, "default": 3600,
            "help": "Time in seconds to wait for all jobs",
        }),
        ("--artifacts-path", {
            "dest": "artifacts_path", "action": "store",
            "help": "Download LAVA artifacts to this directory",
        }),
    )
    for flag, spec in option_table:
        cmdargs.add_argument(flag, **spec)
    return parser.parse_args()
| 239 | |
| 240 | |
if __name__ == "__main__":
    # Configure logging at INFO level before any work starts, so the
    # _log.info() progress messages are emitted when run as a script.
    logging.basicConfig(level=logging.INFO)
    main(get_cmd_args())