Minos Galanakis | f4ca6ac | 2017-12-11 02:39:21 +0100 | [diff] [blame] | 1 | #!/usr/bin/env python3 |
| 2 | |
| 3 | """ lava_rpc_connector.py: |
| 4 | |
| 5 | class that extends xmlrpc in order to add LAVA specific functionality. |
| 6 | Used in managing communication with the back-end. """ |
| 7 | |
| 8 | from __future__ import print_function |
| 9 | |
| 10 | __copyright__ = """ |
| 11 | /* |
Xinyu Zhang | 82dab28 | 2022-10-09 16:33:19 +0800 | [diff] [blame] | 12 | * Copyright (c) 2018-2022, Arm Limited. All rights reserved. |
Minos Galanakis | f4ca6ac | 2017-12-11 02:39:21 +0100 | [diff] [blame] | 13 | * |
| 14 | * SPDX-License-Identifier: BSD-3-Clause |
| 15 | * |
| 16 | */ |
| 17 | """ |
Karl Zhang | 08681e6 | 2020-10-30 13:56:03 +0800 | [diff] [blame] | 18 | |
| 19 | __author__ = "tf-m@lists.trustedfirmware.org" |
Minos Galanakis | f4ca6ac | 2017-12-11 02:39:21 +0100 | [diff] [blame] | 20 | __project__ = "Trusted Firmware-M Open CI" |
Xinyu Zhang | 06286a9 | 2021-07-22 14:00:51 +0800 | [diff] [blame] | 21 | __version__ = "1.4.0" |
Minos Galanakis | f4ca6ac | 2017-12-11 02:39:21 +0100 | [diff] [blame] | 22 | |
| 23 | import xmlrpc.client |
| 24 | import time |
Matthew Hart | fb6fd36 | 2020-03-04 21:03:59 +0000 | [diff] [blame] | 25 | import yaml |
Matthew Hart | 4a4f120 | 2020-06-12 15:52:46 +0100 | [diff] [blame] | 26 | import requests |
| 27 | import shutil |
Paul Sokolovsky | b06bf6f | 2022-12-27 13:46:24 +0300 | [diff] [blame] | 28 | import logging |
| 29 | |
| 30 | |
| 31 | _log = logging.getLogger("lavaci") |
| 32 | |
Minos Galanakis | f4ca6ac | 2017-12-11 02:39:21 +0100 | [diff] [blame] | 33 | |
class LAVA_RPC_connector(xmlrpc.client.ServerProxy, object):
    """ XML-RPC server proxy extended with LAVA specific helpers.

    Remote calls such as ``self.scheduler.jobs.show(...)`` are dispatched by
    the ServerProxy base class; the methods below wrap them and add a few
    plain HTTP downloads (results, logs, device configuration). """

    # Job states after which a job is no longer waited for.
    _DONE_STATES = ("Canceling", "Finished")

    def __init__(self,
                 username,
                 token,
                 hostname,
                 rest_prefix="RPC2",
                 https=False):
        """ Build the authenticated RPC endpoint and the derived URLs.

        username/token -- credentials embedded in the RPC URL and reused
                          for the HTTP downloads
        hostname       -- server name, optionally prefixed with a scheme
                          ("http://..." / "https://..."); an explicit scheme
                          takes precedence over the https flag
        rest_prefix    -- path of the RPC endpoint on the server
        https          -- select https when hostname carries no scheme """

        # If user provides hostname with http/s prefix, honour it. Split only
        # on the first separator so a later "://" cannot break the unpacking.
        if "://" in hostname:
            scheme, hostname = hostname.split("://", 1)
        else:
            scheme = "https" if https else "http"

        server_addr = "%s://%s:%s@%s/%s" % (scheme,
                                            username,
                                            token,
                                            hostname,
                                            rest_prefix)
        self.server_url = "%s://%s" % (scheme, hostname)

        self.server_job_prefix = "%s/scheduler/job/%%s" % self.server_url
        self.server_api = "%s/api/v0.2/" % self.server_url
        self.server_results_prefix = "%s/results/%%s" % self.server_url
        self.token = token
        self.username = username
        super(LAVA_RPC_connector, self).__init__(server_addr)

    def _rpc_cmd_raw(self, cmd, params=None):
        """ Run a remote command and return the result. There is no
        constraint check on the syntax of the command.

        cmd    -- dotted method name, e.g. "system.listMethods"
        params -- source text of the argument list, pasted between the
                  parentheses of the call (omitted when falsy) """

        # NOTE(security): the call is assembled as a string and passed to
        # eval(), so both arguments are executed as Python code. Never feed
        # this method with data that comes from an untrusted source.
        call_src = "self.%s(%s)" % (cmd, params if params else "")
        return eval(call_src)

    def ls_cmd(self):
        """ Print the commands supported by the server, one per line """

        print("\n".join(self.system.listMethods()))

    def fetch_file(self, url, out_file):
        """ Download url into out_file and return out_file.

        The credentials are sent as the 'user' and 'token' query parameters.
        An HTTP error status raises through raise_for_status(). """

        auth_params = {
            'user': self.username,
            'token': self.token
        }
        with requests.get(url, stream=True, params=auth_params) as r:
            r.raise_for_status()
            # The raw stream is not decoded by default; without this a
            # gzip/deflate encoded response would be stored still compressed.
            r.raw.decode_content = True
            with open(out_file, 'wb') as f:
                shutil.copyfileobj(r.raw, f)
        return out_file

    def get_job_results(self, job_id, yaml_out_file):
        """ Download the YAML results of job_id into yaml_out_file and
        return the output file name """

        results_url = "{}/yaml".format(self.server_results_prefix % job_id)
        return self.fetch_file(results_url, yaml_out_file)

    def get_job_definition(self, job_id, yaml_out_file=None):
        """ Return the parsed definition of job_id. When yaml_out_file is
        given the definition text is also written to that file """

        job_def = self.scheduler.jobs.definition(job_id)
        if yaml_out_file:
            with open(yaml_out_file, "w") as F:
                F.write(str(job_def))
        return yaml.safe_load(job_def)

    def get_job_log(self, job_id, target_out_file):
        """ Download the log of job_id and write the messages of the
        "target" and "feedback" levels to target_out_file, one per line """

        auth_headers = {"Authorization": "Token %s" % self.token}
        log_url = "{server_url}/jobs/{job_id}/logs/".format(
            server_url=self.server_api, job_id=job_id
        )
        with requests.get(log_url, stream=True, headers=auth_headers) as r:
            r.raise_for_status()
            log_list = yaml.load(r.content, Loader=yaml.SafeLoader)
            with open(target_out_file, "w") as target_out:
                for entry in log_list:
                    if entry["lvl"] not in ("target", "feedback"):
                        continue
                    text = "{}\n".format(entry["msg"])
                    try:
                        target_out.write(text)
                    except UnicodeEncodeError:
                        # The output encoding cannot represent the message:
                        # fall back to ASCII with replacement characters.
                        target_out.write(
                            text.encode("ascii", errors="replace")
                            .decode("ascii")
                        )

    def get_job_config(self, job_id, config_out_file):
        """ Download the configuration page of job_id to config_out_file """

        config_url = "{}/configuration".format(self.server_job_prefix % job_id)
        self.fetch_file(config_url, config_out_file)

    def get_job_info(self, job_id, yaml_out_file=None):
        """ Return the job information reported by the scheduler. When
        yaml_out_file is given its string form is also written there """

        job_info = self.scheduler.jobs.show(job_id)
        if yaml_out_file:
            with open(yaml_out_file, "w") as F:
                F.write(str(job_info))
        return job_info

    def get_error_reason(self, job_id):
        """ Return the error type recorded for job_id in the 'lava' test
        suite results.

        Returns '' when the 'job' entry carries no error type, None when
        there is no 'job' entry and "Unknown" when the results cannot be
        retrieved or parsed. """

        try:
            lava_res = self.results.get_testsuite_results_yaml(job_id, 'lava')
            results = yaml.safe_load(lava_res)
            for test in results:
                if test['name'] == 'job':
                    return test.get('metadata', {}).get('error_type', '')
        except Exception:
            # Best effort: a missing reason must not fail the caller.
            return "Unknown"
        return None

    def get_job_state(self, job_id):
        """ Return the state string of job_id as reported by the scheduler """

        return self.scheduler.job_state(job_id)["job_state"]

    def cancel_job(self, job_id):
        """ Cancel job with id=job_id. Returns the scheduler's answer """

        return self.scheduler.jobs.cancel(job_id)

    def validate_job_yaml(self, job_definition, print_err=False):
        """ Validate a job definition syntax. Returns True if the server
        considers the syntax valid.

        job_definition -- path of the YAML file to validate
        print_err      -- print the failure (I/O or server side) if True """

        try:
            with open(job_definition) as F:
                input_yaml = F.read()
            self.scheduler.validate_yaml(input_yaml)
            return True
        except Exception as E:
            if print_err:
                print(E)
            return False

    def device_type_from_def(self, job_data):
        """ Return the 'device_type' entry of a YAML job definition text """

        def_yaml = yaml.safe_load(job_data)
        return def_yaml['device_type']

    def has_device_type(self, job_data):
        """ Return True if the server lists at least one device of the type
        requested by job_data whose health is 'Good' or 'Unknown' """

        d_type = self.device_type_from_def(job_data)
        return any(
            device['type'] == d_type
            and device['health'] in ('Good', 'Unknown')
            for device in self.scheduler.devices.list()
        )

    def submit_job(self, job_definition):
        """ Will submit a yaml definition pointed by job_definition after
        validating it against the remote backend. Returns resulting job id,
        and server url for job, or (None, None) on any failure """

        try:
            if not self.validate_job_yaml(job_definition):
                _log.error("Server rejected job's syntax")
                raise Exception("Invalid job")
            with open(job_definition, "r") as F:
                job_data = F.read()
        except Exception as e:
            print("Cannot submit invalid job. Check %s's content" %
                  job_definition)
            print(e)
            return None, None

        try:
            if not self.has_device_type(job_data):
                raise Exception("No devices online with required device_type")
            job_id = self.scheduler.submit_job(job_data)
            job_url = self.server_job_prefix % job_id
            return job_id, job_url
        except Exception as e:
            # The message needs a placeholder for the extra argument,
            # otherwise the logging module fails to format the record.
            _log.exception("Exception submitting job to LAVA: %s", e)
            return None, None

    def resubmit_job(self, job_id):
        """ Re-submit job with provided id. Returns resulting job id,
        and server url for job """

        job_id = self.scheduler.resubmit_job(job_id)
        job_url = self.server_job_prefix % job_id
        return job_id, job_url

    def block_wait_for_job(self, job_id, timeout, poll_freq=1):
        """ Will block code execution and wait for the job to finish.
        Returns the job health once the job is done or, if timeout seconds
        elapse first, the health reported at that moment """

        start_t = int(time.time())
        while True:
            if int(time.time()) - start_t >= timeout:
                print("Breaking because of timeout")
                break
            # Stop as soon as the job is neither queued nor running
            if self.get_job_state(job_id) in self._DONE_STATES:
                break
            time.sleep(poll_freq)
        return self.scheduler.job_health(job_id)["job_health"]

    def block_wait_for_jobs(self, job_ids, timeout, poll_freq=10):
        """ Wait for multiple LAVA job ids to finish.

        Returns a dict mapping each finished job id to its job information,
        extended with an 'error_reason' entry. Jobs still running when
        timeout seconds have elapsed are left out of the result. """

        start_t = int(time.time())
        finished_jobs = {}
        # Drop repeated ids (keeping the order): a duplicate would make the
        # "everything finished" condition unreachable before the timeout.
        wanted = list(dict.fromkeys(job_ids))
        while len(finished_jobs) < len(wanted):
            if int(time.time()) - start_t >= timeout:
                print("Breaking because of timeout")
                break
            for job_id in wanted:
                if job_id in finished_jobs:
                    continue
                # Check if the job is not running
                try:
                    cur_status = self.get_job_info(job_id)
                except (xmlrpc.client.ProtocolError, OSError) as e:
                    # There can be transient HTTP errors, e.g. "502 Proxy
                    # Error" or socket timeout.
                    # Just continue with the next job, the faulted one will
                    # be re-checked on next iteration.
                    _log.warning("block_wait_for_jobs: %r occurred, ignore and continue", e)
                    time.sleep(2)
                    continue
                # If in queue or running wait
                if cur_status['state'] in self._DONE_STATES:
                    cur_status['error_reason'] = self.get_error_reason(job_id)
                    finished_jobs[job_id] = cur_status
                    _log.info(
                        "Job %s finished in %ds with state: %s, health: %s. Remaining: %d",
                        job_id, time.time() - start_t,
                        cur_status['state'],
                        cur_status['health'],
                        len(wanted) - len(finished_jobs)
                    )
            # Only pause between polling rounds while something is pending
            if len(finished_jobs) < len(wanted):
                time.sleep(poll_freq)
        return finished_jobs

    def test_credentials(self):
        """ Attempt to query the back-end and verify that the user provided
        authentication is valid """

        try:
            self.system.listMethods()
            return True
        except Exception as e:
            print(e)
            print("Credential validation failed")
            return False
| 289 | |
| 290 | |
# Script entry point: intentionally a no-op, running this file does nothing.
if __name__ == "__main__":
    pass