Matthew Hart | fb6fd36 | 2020-03-04 21:03:59 +0000 | [diff] [blame] | 1 | #!/usr/bin/env python3 |
| 2 | |
| 3 | from __future__ import print_function |
| 4 | |
| 5 | __copyright__ = """ |
| 6 | /* |
Xinyu Zhang | af63f90 | 2023-01-05 15:09:28 +0800 | [diff] [blame] | 7 | * Copyright (c) 2020-2023, Arm Limited. All rights reserved. |
Matthew Hart | fb6fd36 | 2020-03-04 21:03:59 +0000 | [diff] [blame] | 8 | * |
| 9 | * SPDX-License-Identifier: BSD-3-Clause |
| 10 | * |
| 11 | */ |
| 12 | """ |
| 13 | |
| 14 | """ |
| 15 | Script for waiting for LAVA jobs and parsing the results |
| 16 | """ |
| 17 | |
| 18 | import os |
Matthew Hart | fb6fd36 | 2020-03-04 21:03:59 +0000 | [diff] [blame] | 19 | import time |
| 20 | import yaml |
| 21 | import argparse |
Xinyu Zhang | c8a670c | 2021-05-18 20:20:53 +0800 | [diff] [blame] | 22 | import shutil |
Paul Sokolovsky | a95abd9 | 2022-12-27 13:48:11 +0300 | [diff] [blame] | 23 | import logging |
Paul Sokolovsky | 7fd1bc5 | 2023-01-11 20:14:37 +0300 | [diff] [blame^] | 24 | from xmlrpc.client import ProtocolError |
Matthew Hart | fb6fd36 | 2020-03-04 21:03:59 +0000 | [diff] [blame] | 25 | from jinja2 import Environment, FileSystemLoader |
Matthew Hart | fb6fd36 | 2020-03-04 21:03:59 +0000 | [diff] [blame] | 26 | from lava_helper import test_lava_dispatch_credentials |
Xinyu Zhang | c918b6e | 2022-10-08 17:13:17 +0800 | [diff] [blame] | 27 | from lava_submit_jobs import submit_lava_jobs |
Paul Sokolovsky | 2512ec5 | 2022-03-04 00:15:39 +0300 | [diff] [blame] | 28 | import codecov_helper |
| 29 | |
Matthew Hart | fb6fd36 | 2020-03-04 21:03:59 +0000 | [diff] [blame] | 30 | |
Paul Sokolovsky | a95abd9 | 2022-12-27 13:48:11 +0300 | [diff] [blame] | 31 | _log = logging.getLogger("lavaci") |
| 32 | |
| 33 | |
def wait_for_jobs(user_args):
    """Wait for the requested LAVA jobs, then for any resubmitted ones.

    ``user_args.job_ids`` is a comma-separated string; empty fields are
    ignored and the remaining ones are converted to integers. After the first
    wait, the job IDs returned by resubmit_failed_jobs() are waited for as
    well and their entries are merged into the result.

    Returns the mapping of finished jobs produced by get_finished_jobs().
    """
    requested_ids = [
        int(field) for field in user_args.job_ids.split(",") if field != ''
    ]
    lava = test_lava_dispatch_credentials(user_args)
    finished_jobs = get_finished_jobs(requested_ids, user_args, lava)
    resubmit_jobs = resubmit_failed_jobs(finished_jobs, user_args)
    if not resubmit_jobs:
        return finished_jobs

    _log.info("Waiting for resubmitted jobs: %s", resubmit_jobs)
    finished_jobs.update(get_finished_jobs(resubmit_jobs, user_args, lava))
    return finished_jobs
| 45 | |
def process_finished_jobs(finished_jobs, user_args):
    """Run every reporting step over the finished jobs, in a fixed order.

    The order matters: test_report() stores the ``info['result']`` value
    that job_links() prints afterwards.
    """
    reporting_steps = (
        print_lava_urls,
        test_report,
        job_links,
        codecov_helper.coverage_reports,
    )
    for step in reporting_steps:
        step(finished_jobs, user_args)
Xinyu Zhang | f2b7cbf | 2021-05-18 20:17:34 +0800 | [diff] [blame] | 51 | |
def get_finished_jobs(job_list, user_args, lava):
    """Block until the given jobs finish and cancel the ones that did not.

    job_list  -- list of LAVA job IDs to wait for
    user_args -- parsed arguments; dispatch_timeout and artifacts_path are read
    lava      -- LAVA helper object used to wait for and to cancel jobs

    When user_args.artifacts_path is set, every finished job gets a
    'job_dir' entry (``<artifacts_path>/<job id>_<description>``) and its
    artifacts are downloaded through fetch_artifacts().

    Returns the mapping of finished jobs.
    """
    _log.info("Waiting for %d LAVA jobs", len(job_list))
    finished_jobs = lava.block_wait_for_jobs(job_list, user_args.dispatch_timeout, 5)

    # Whatever is missing from the result did not finish in time: cancel it.
    for pending in job_list:
        if pending in finished_jobs:
            continue
        _log.info("Cancelling unfinished job %d", pending)
        lava.cancel_job(pending)

    artifacts_root = user_args.artifacts_path
    if artifacts_root:
        for job, info in finished_jobs.items():
            dir_name = "{}_{}".format(str(job), info['description'])
            info['job_dir'] = os.path.join(artifacts_root, dir_name)
        finished_jobs = fetch_artifacts(finished_jobs, user_args, lava)
    return finished_jobs
Matthew Hart | fb6fd36 | 2020-03-04 21:03:59 +0000 | [diff] [blame] | 65 | |
def resubmit_failed_jobs(jobs, user_args):
    """Resubmit every job that did not end up Finished with health Complete.

    For each such job the downloaded definition.yaml is moved to
    failed_jobs/<job_id>_definition.yaml, the job's artifact directory is
    deleted and the job is removed from ``jobs`` (which is modified in
    place). The 'failed_jobs' directory is then handed to submit_lava_jobs().

    Returns the IDs reported by submit_lava_jobs() as a list of integers, or
    an empty list when ``jobs`` is empty.
    """
    if not jobs:
        return []
    time.sleep(2)  # be friendly to LAVA
    os.makedirs('failed_jobs', exist_ok=True)

    to_resubmit = []
    for job_id, info in jobs.items():
        if info['health'] == "Complete" and info['state'] == "Finished":
            continue
        _log.warning(
            "Will resubmit job %d because of its state: %s, health: %s",
            job_id, info["state"], info["health"]
        )
        job_dir = info['job_dir']
        # Keep only the definition; the rest of the artifacts is discarded.
        os.rename(
            os.path.join(job_dir, 'definition.yaml'),
            'failed_jobs/{}_definition.yaml'.format(job_id),
        )
        shutil.rmtree(job_dir)
        to_resubmit.append(job_id)

    # Removal happens after the loop: the dict must not change while iterated.
    for stale_id in to_resubmit:
        del jobs[stale_id]

    new_ids = submit_lava_jobs(user_args, job_dir='failed_jobs')
    return [int(new_id) for new_id in new_ids if new_id != '']
| 88 | |
def fetch_artifacts(jobs, user_args, lava):
    """Download definition, log, config and results of every job in ``jobs``.

    jobs      -- mapping of job ID to info dict; every info needs 'job_dir'
    user_args -- parsed arguments; only artifacts_path is read
    lava      -- LAVA helper object providing the get_job_* download calls

    The files of a job are stored in its 'job_dir' as definition.yaml,
    target_log.txt, config.tar.bz2 and results.yaml, and the 'metadata' entry
    of the job definition is copied into the job's info dict. A download
    round that fails with ProtocolError or IOError is retried after a pause,
    for up to three attempts in total; the error of the last attempt is
    re-raised. After a successful download the target log is passed to
    codecov_helper.extract_trace_data().

    Returns ``jobs``; when user_args.artifacts_path is unset nothing is
    downloaded and ``jobs`` is returned untouched.
    """
    if not user_args.artifacts_path:
        # Return the mapping rather than None so that a caller assigning the
        # result back never loses its jobs.
        return jobs
    for job_id, info in jobs.items():
        job_dir = info['job_dir']
        t = time.time()
        _log.info("Fetching artifacts for job %d to %s", job_id, job_dir)

        # Target paths do not change between attempts.
        def_path = os.path.join(job_dir, 'definition.yaml')
        target_log = os.path.join(job_dir, 'target_log.txt')
        config = os.path.join(job_dir, 'config.tar.bz2')
        results_file = os.path.join(job_dir, 'results.yaml')

        for retry in range(3, 0, -1):
            try:
                os.makedirs(job_dir, exist_ok=True)
                definition = lava.get_job_definition(job_id, def_path)
                info['metadata'] = definition.get('metadata', [])
                time.sleep(0.2)  # be friendly to LAVA
                lava.get_job_log(job_id, target_log)
                time.sleep(0.2)
                lava.get_job_config(job_id, config)
                time.sleep(0.2)
                lava.get_job_results(job_id, results_file)
                break
            except (ProtocolError, IOError) as e:
                if retry == 1:
                    # Out of attempts: let the caller see the error.
                    raise
                _log.warning("fetch_artifacts: Error %r occurred, retrying", e)
                time.sleep(2)

        _log.info("Fetched artifacts in %ds", time.time() - t)
        codecov_helper.extract_trace_data(target_log, job_dir)
    return jobs
| 123 | |
| 124 | |
def lava_id_to_url(id, user_args):
    """Return the LAVA scheduler page URL of job ``id``.

    The URL is ``<user_args.lava_url>/scheduler/job/<id>``; the base URL is
    used exactly as given.
    """
    url_template = "{}/scheduler/job/{}"
    return url_template.format(user_args.lava_url, id)
| 127 | |
def job_links(jobs, user_args):
    """Print a summary with result and links for every job.

    For each job the build name, test result, device type, build job URL,
    LAVA job URL and the location of target_log.txt (relative to the
    BUILD_URL environment variable) are listed. Everything is emitted with a
    single print() call.
    """
    report = []
    for job, info in jobs.items():
        metadata = info['metadata']
        report.extend([
            "\nLAVA Test Config:\n",
            "Config Name: {}\n".format(metadata['build_name']),
            "Test Result: {}\n".format(info['result']),
            "Device Type: {}\n".format(metadata['device_type']),
            "Build link: {}\n".format(metadata['build_job_url']),
            "LAVA link: {}\n".format(lava_id_to_url(job, user_args)),
            "TFM LOG: {}artifact/{}/target_log.txt\n".format(os.getenv("BUILD_URL"), info['job_dir']),
        ])
    print("".join(report))
| 139 | |
def remove_lava_dupes(results):
    """Drop non-passing 'lava' suite entries that have a passing namesake.

    results -- list of result dicts with 'name', 'suite' and 'result' keys

    An entry is removed when its 'result' is not 'pass', its 'suite' is
    "lava" and some entry in the list (of any suite) with the same 'name' has
    the result 'pass'. All other entries keep their relative order.

    The list is filtered in place and the same list object is returned.
    """
    # Collect the passing names first and filter in one go: removing entries
    # while looping over the list would skip the element following each
    # removal, and one entry could be removed once per passing namesake.
    passed_names = {entry['name'] for entry in results if entry['result'] == 'pass'}
    results[:] = [
        entry for entry in results
        if not (
            entry['result'] != 'pass'
            and entry['suite'] == "lava"
            and entry['name'] in passed_names
        )
    ]
    return results
| 149 | |
def test_report(jobs, user_args):
    """Evaluate the results of every job and render the summary reports.

    Each job's info dict gets a 'result' of 'SUCCESS' or 'FAILURE'. A job
    fails when its health is not 'Complete', when its results.yaml is missing
    or empty, or when one of its considered results is 'fail'. Results of the
    'lava' suite are ignored, except the one named 'lava-test-monitor'.

    Jobs whose results could be read also get 'lava_url' and 'artifacts_dir'
    entries and are passed on to render_jinja().
    """
    # parsing of test results is WIP
    fail_j = []
    jinja_data = []
    for job, info in jobs.items():
        # A job is only worth parsing if it completed and left usable results.
        usable = info['health'] == 'Complete'
        if usable:
            results_file = os.path.join(info['job_dir'], 'results.yaml')
            usable = os.path.exists(results_file) and os.path.getsize(results_file) != 0
        info['result'] = 'SUCCESS' if usable else 'FAILURE'
        if not usable:
            fail_j.append(job)
            continue

        with open(results_file, "r") as results_fh:
            results = yaml.safe_load(results_fh.read())
        non_lava_results = [
            entry for entry in results
            if not (entry['suite'] == 'lava' and entry['name'] != 'lava-test-monitor')
        ]
        info['lava_url'] = lava_id_to_url(job, user_args)
        info['artifacts_dir'] = info['job_dir']
        jinja_data.append({job: [info, non_lava_results]})

        failed_entries = [entry for entry in non_lava_results if entry['result'] == 'fail']
        if failed_entries:
            info['result'] = 'FAILURE'
            if job not in fail_j:
                fail_j.append(job)
        time.sleep(0.5)  # be friendly to LAVA
    render_jinja({'jobs': jinja_data})
| 180 | |
def render_jinja(data):
    """Render the HTML and CSV test summaries into the current directory.

    The templates test_summary.jinja2 and test_summary_csv.jinja2 are loaded
    from the jinja2_templates directory next to this script and rendered with
    ``data``; the output goes to test_summary.html and test_summary.csv. Both
    templates are rendered before either file is written.
    """
    script_dir = os.path.abspath(os.path.dirname(__file__))
    template_env = Environment(
        loader=FileSystemLoader(searchpath=os.path.join(script_dir, "jinja2_templates"))
    )
    rendered = [
        (out_name, template_env.get_template(template_name).render(data))
        for template_name, out_name in (
            ("test_summary.jinja2", 'test_summary.html'),
            ("test_summary_csv.jinja2", 'test_summary.csv'),
        )
    ]
    for out_name, text in rendered:
        with open(out_name, "w") as out_file:
            out_file.write(text)
| 191 | |
def print_lava_urls(jobs, user_args):
    """Report the LAVA URLs of all jobs through info_print().

    info_print() is called with its default arguments, so whether anything
    is actually printed depends on its ``silent`` default.
    """
    urls = []
    for job_id in jobs:
        urls.append(lava_id_to_url(job_id, user_args))
    info_print("LAVA jobs triggered for this build: {}".format(urls))
Matthew Hart | fb6fd36 | 2020-03-04 21:03:59 +0000 | [diff] [blame] | 195 | |
| 196 | |
def info_print(line, silent=True):
    """Print ``line`` with an "INFO: " prefix unless ``silent`` is true.

    ``silent`` defaults to True, so a plain info_print(line) prints nothing.
    """
    if silent:
        return
    print("INFO: {}".format(line))
Matthew Hart | fb6fd36 | 2020-03-04 21:03:59 +0000 | [diff] [blame] | 200 | |
Paul Sokolovsky | de25e1f | 2023-01-02 14:29:21 +0300 | [diff] [blame] | 201 | |
| 202 | # WARNING: Setting this to >1 is a last resort, temporary stop-gap measure, |
| 203 | # which will overload LAVA and jeopardize stability of the entire TF CI. |
| 204 | INEFFICIENT_RETRIES = 1 |
| 205 | |
| 206 | |
def main(user_args):
    """Wait for the LAVA jobs, produce the reports and check for missing jobs.

    wait_for_jobs() is attempted up to INEFFICIENT_RETRIES times; a failed
    attempt is logged and retried, and the exception of the last attempt is
    re-raised. The finished jobs are then passed to process_finished_jobs().

    Raises Exception when no job ID was given in user_args.job_ids, or when
    fewer jobs finished than job IDs were given.
    """
    for try_time in range(INEFFICIENT_RETRIES):
        try:
            finished_jobs = wait_for_jobs(user_args)
            break
        except Exception:
            if try_time >= INEFFICIENT_RETRIES - 1:
                # Last attempt: re-raise with the original traceback intact.
                raise
            _log.exception("Exception in wait_for_jobs")
            _log.info("Will try to get LAVA jobs again, this was try: %d", try_time)
    process_finished_jobs(finished_jobs, user_args)

    # Count the requested jobs the same way wait_for_jobs() parses them, so
    # that empty fields (e.g. a trailing comma) are not mistaken for jobs
    # that went missing.
    requested_ids = [x for x in user_args.job_ids.split(",") if x != '']
    if not requested_ids:
        # An empty job list has always been an error; keep it one.
        raise Exception("No LAVA job IDs were given.")
    if len(finished_jobs) < len(requested_ids):
        raise Exception("Some LAVA jobs cancelled.")
Matthew Hart | fb6fd36 | 2020-03-04 21:03:59 +0000 | [diff] [blame] | 222 | |
def get_cmd_args():
    """Parse the command line and return the resulting argparse namespace.

    Only --job-ids is mandatory. --lava-timeout is an integer defaulting to
    3600 and --use-env is a flag defaulting to False; every other option is a
    plain string that defaults to None.
    """
    parser = argparse.ArgumentParser(description="Lava Wait Jobs")
    option_group = parser.add_argument_group("Lava Wait Jobs")

    # One row per option: the flag and the keyword arguments of add_argument().
    option_table = (
        ("--lava-url", dict(
            dest="lava_url", action="store",
            help="LAVA lab URL (without RPC2)")),
        ("--job-ids", dict(
            dest="job_ids", action="store", required=True,
            help="Comma separated list of job IDS")),
        ("--lava-token", dict(
            dest="lava_token", action="store",
            help="LAVA auth token")),
        ("--lava-user", dict(
            dest="lava_user", action="store",
            help="LAVA username")),
        ("--use-env", dict(
            dest="token_from_env", action="store_true", default=False,
            help="Use LAVA auth info from environment")),
        ("--lava-timeout", dict(
            dest="dispatch_timeout", action="store", type=int, default=3600,
            help="Time in seconds to wait for all jobs")),
        ("--artifacts-path", dict(
            dest="artifacts_path", action="store",
            help="Download LAVA artifacts to this directory")),
    )
    for flag, settings in option_table:
        option_group.add_argument(flag, **settings)
    return parser.parse_args()
| 253 | |
| 254 | |
if __name__ == "__main__":
    # Script entry point: enable INFO-level logging, then parse the command
    # line and run the main logic with it.
    logging.basicConfig(level=logging.INFO)
    cli_args = get_cmd_args()
    main(cli_args)