Blame - tests/scripts/analyze_outcomes.py - mirror/mbed-tls

2020-06-25 18:36:28 +0200

[diff] [blame]

1

#!/usr/bin/env python3

2

3

"""Analyze the test outcomes from a full CI run.

4

5

This script can also run on outcomes from a partial run, but the results are

6

less likely to be useful.

"""

import argparse

import sys

import traceback

Przemek Stekiel

85c54ea

2022-11-17 11:50:23 +0100

[diff] [blame]

12

import re

Gilles Peskine

2020-06-25 18:36:28 +0200

[diff] [blame]

13

Gilles Peskine

2020-06-25 18:37:43 +0200

[diff] [blame]

14

import check_test_cases

15

Gilles Peskine

2020-06-25 18:36:28 +0200

[diff] [blame]

16

class Results:
    """Collect the diagnostics produced while analyzing outcomes.

    Each reported error or warning is written to standard error and
    tallied in ``error_count`` or ``warning_count`` respectively.
    """

    def __init__(self):
        self.error_count = 0
        self.warning_count = 0

    @staticmethod
    def log(fmt, *args, **kwargs):
        """Write one formatted line to standard error.

        ``fmt`` is a ``str.format`` template; ``args`` and ``kwargs`` are
        its positional and keyword substitutions.
        """
        template = fmt + '\n'
        sys.stderr.write(template.format(*args, **kwargs))

    def error(self, fmt, *args, **kwargs):
        """Log a message prefixed with 'Error: ' and count it as an error."""
        prefixed = 'Error: ' + fmt
        self.log(prefixed, *args, **kwargs)
        self.error_count = self.error_count + 1

    def warning(self, fmt, *args, **kwargs):
        """Log a message prefixed with 'Warning: ' and count it as a warning."""
        prefixed = 'Warning: ' + fmt
        self.log(prefixed, *args, **kwargs)
        self.warning_count = self.warning_count + 1

34

35

class TestCaseOutcomes:
    """Record how a single test case fared in every configuration that ran it."""
    # pylint: disable=too-few-public-methods

    def __init__(self):
        # Both lists hold "witnesses": one entry per run in which the test
        # case passed (successes) or failed (failures). Witnesses are only
        # counted for now. Their format is chosen by read_outcome_file:
        # the platform and the configuration joined by ';'.
        self.successes = []
        self.failures = []

    def hits(self):
        """Return how many times the test case was actually run.

        Passes and failures both count; skipped runs do not.
        """
        witness_lists = (self.successes, self.failures)
        return sum(len(witnesses) for witnesses in witness_lists)

53

Gilles Peskine

2020-06-25 18:37:43 +0200

[diff] [blame]

54

def analyze_coverage(results, outcomes):
    """Report every available test case that was never executed.

    ``results`` receives one warning per unexecuted test case.
    ``outcomes`` is the outcome collection to look the test cases up in.
    """
    for test_case in check_test_cases.collect_available_test_cases():
        if test_case in outcomes and outcomes[test_case].hits() != 0:
            continue
        # Make this a warning, not an error, as long as we haven't
        # fixed this branch to have full coverage of test cases.
        results.warning('Test case not executed: {}', test_case)

63

Valerio Setti

2023-01-18 17:28:36 +0100

[diff] [blame^]

64

def analyze_driver_vs_reference(outcomes, component_ref, component_driver,
                                ignored_suites, ignored_test=None):
    """Check that all tests executed in the reference component are also
    executed in the corresponding driver component.

    Skip:
    - full test suites provided in the ignored_suites list
    - only some specific tests inside a test suite, for which the
      corresponding description string is provided in ignored_test

    outcomes is the outcome collection (keys mapped to objects exposing
    hits() and a successes list). ignored_test maps a full test suite name
    to a collection of test descriptions to skip; None (the default) means
    that no individual test is ignored.

    Print the key of each test that passed in the reference component but
    not in the driver component. Return True if there is no such test,
    False otherwise.
    """
    # The default used to be passed straight to an `in` test, which raises
    # TypeError on None. Treat "not provided" as "nothing to ignore".
    if ignored_test is None:
        ignored_test = {}

    available = check_test_cases.collect_available_test_cases()
    result = True

    for key in available:
        # A key is "<full test suite name>;<test description>".
        key_fields = key.split(';')
        full_test_suite = key_fields[0]
        test_string = key_fields[1]
        # Main part of the test suite name, without the ".variant" suffix.
        test_suite = full_test_suite.split('.')[0]

        # Skip ignored test suites
        if test_suite in ignored_suites:
            continue
        # Continue if test was not executed by any component
        if key not in outcomes or outcomes[key].hits() == 0:
            continue
        # Skip individually ignored tests
        if test_string in ignored_test.get(full_test_suite, ()):
            continue

        # Search for tests that run in reference component and not in driver component
        # NOTE(review): components are matched as substrings of the witness
        # string, so a component name contained in another one would also
        # match -- confirm this is intended.
        successes = outcomes[key].successes
        driver_test_passed = any(component_driver in entry for entry in successes)
        reference_test_passed = any(component_ref in entry for entry in successes)
        if reference_test_passed and not driver_test_passed:
            print(key)
            result = False
    return result

Gilles Peskine

2020-06-25 18:36:28 +0200

[diff] [blame]

103

def analyze_outcomes(outcomes):
    """Run every analysis on the given outcome collection.

    Return the Results object that accumulated the diagnostics.
    """
    report = Results()
    analyze_coverage(report, outcomes)
    return report

108

109

def read_outcome_file(outcome_file):
    """Parse an outcome file and return an outcome collection.

    An outcome collection is a dictionary mapping keys to TestCaseOutcomes
    objects. Each key is the test suite name and the test case description,
    separated by a semicolon.
    """
    collection = {}
    with open(outcome_file, 'r', encoding='utf-8') as stream:
        for record in stream:
            platform, config, suite, case, result, _cause = record.split(';')
            key = suite + ';' + case
            setup = platform + ';' + config
            # Every test case seen in the file gets an entry, even when this
            # record is neither a pass nor a failure.
            if key in collection:
                case_outcomes = collection[key]
            else:
                case_outcomes = collection[key] = TestCaseOutcomes()
            if result == 'PASS':
                case_outcomes.successes.append(setup)
            elif result == 'FAIL':
                case_outcomes.failures.append(setup)
    return collection

129

Przemek Stekiel

2022-10-26 16:11:26 +0200

[diff] [blame]

130

def do_analyze_coverage(outcome_file, args):
    """Run the coverage analysis on an outcome file.

    ``args`` is accepted for uniformity with the other tasks and ignored.
    Return True if the analysis reported no error, False otherwise.
    """
    del args # unused
    collection = read_outcome_file(outcome_file)
    print("\n*** Analyze coverage ***\n")
    report = analyze_outcomes(collection)
    return not report.error_count

Przemek Stekiel

2022-10-21 13:42:08 +0200

[diff] [blame]

137

Przemek Stekiel

2022-10-26 16:11:26 +0200

[diff] [blame]

138

def do_analyze_driver_vs_reference(outcome_file, args):
    """Run the driver vs reference analysis on an outcome file.

    ``args`` provides 'component_ref', 'component_driver', 'ignored_suites'
    (suite names without the 'test_suite_' prefix) and 'ignored_tests'.
    Return the result of analyze_driver_vs_reference.
    """
    suites_to_skip = ['test_suite_' + name for name in args['ignored_suites']]

    collection = read_outcome_file(outcome_file)
    banner = "\n*** Analyze driver {} vs reference {} ***\n"
    print(banner.format(args['component_driver'], args['component_ref']))
    return analyze_driver_vs_reference(
        collection,
        args['component_ref'],
        args['component_driver'],
        suites_to_skip,
        args['ignored_tests'],
    )

Gilles Peskine

2020-06-25 18:36:28 +0200

[diff] [blame]

148

Przemek Stekiel

6856f4c

2022-11-09 10:50:29 +0100

[diff] [blame]

149

# Table of the available tasks. Each entry names the function that performs
# the task ('test_function') and the extra arguments passed to it ('args').
TASKS = {
    'analyze_coverage': {
        'test_function': do_analyze_coverage,
        'args': {},
    },
    # How to use analyze_driver_vs_reference_xxx locally:
    # 1. tests/scripts/all.sh --outcome-file "$PWD/out.csv" <component_ref> <component_driver>
    # 2. tests/scripts/analyze_outcomes.py out.csv analyze_driver_vs_reference_xxx
    'analyze_driver_vs_reference_hash': {
        'test_function': do_analyze_driver_vs_reference,
        'args': {
            'component_ref': 'test_psa_crypto_config_reference_hash_use_psa',
            'component_driver': 'test_psa_crypto_config_accel_hash_use_psa',
            'ignored_suites': [
                # the software implementations that are being excluded
                'shax',
                'mdx',
                # the legacy abstraction layer that's being excluded
                'md',
            ],
            'ignored_tests': {},
        },
    },
    'analyze_driver_vs_reference_ecdsa': {
        'test_function': do_analyze_driver_vs_reference,
        'args': {
            'component_ref': 'test_psa_crypto_config_reference_ecdsa_use_psa',
            'component_driver': 'test_psa_crypto_config_accel_ecdsa_use_psa',
            'ignored_suites': [
                # the software implementation that's excluded
                'ecdsa',
                # the following lines should not be needed,
                # they will be removed by upcoming work
                'random', # #6856
                'pk', # #6857
                'x509parse', # #6858
                'x509write', # #6858
                'debug', # #6860
                'ssl', # #6860
            ],
            'ignored_tests': {},
        },
    },
}

Przemek Stekiel

2022-10-26 16:11:26 +0200

[diff] [blame]

192

Gilles Peskine

2020-06-25 18:36:28 +0200

[diff] [blame]

193

def main():

194

try:

195

parser = argparse.ArgumentParser(description=__doc__)

Przemek Stekiel

58bbc23

2022-10-24 08:10:10 +0200

[diff] [blame]

196

parser.add_argument('outcomes', metavar='OUTCOMES.CSV',

Gilles Peskine

2020-06-25 18:36:28 +0200

[diff] [blame]

197

help='Outcome file to analyze')

Przemek Stekiel

542d932

2022-11-17 09:43:34 +0100

[diff] [blame]

198

parser.add_argument('task', default='all', nargs='?',

Przemek Stekiel

2022-11-09 13:54:49 +0100

[diff] [blame]

199

help='Analysis to be done. By default, run all tasks. '

200

'With one or more TASK, run only those. '

201

'TASK can be the name of a single task or '

Przemek Stekiel

85c54ea

2022-11-17 11:50:23 +0100

[diff] [blame]

202

'comma/space-separated list of tasks. ')

Przemek Stekiel

2022-11-09 13:54:49 +0100

[diff] [blame]

203

parser.add_argument('--list', action='store_true',

204

help='List all available tasks and exit.')

Gilles Peskine

2020-06-25 18:36:28 +0200

[diff] [blame]

205

options = parser.parse_args()

Przemek Stekiel

2022-10-21 13:42:08 +0200

[diff] [blame]

206

Przemek Stekiel

2022-11-09 13:54:49 +0100

[diff] [blame]

if options.list:

for task in TASKS:

print(task)

sys.exit(0)

Przemek Stekiel

2022-10-26 16:11:26 +0200

[diff] [blame]

212

result = True

Przemek Stekiel

2022-10-21 13:42:08 +0200

[diff] [blame]

213

Przemek Stekiel

2022-10-26 16:11:26 +0200

[diff] [blame]

214

if options.task == 'all':

Przemek Stekiel

d3068af

2022-11-14 16:15:19 +0100

[diff] [blame]

215

tasks = TASKS.keys()

Przemek Stekiel

2022-11-09 13:54:49 +0100

[diff] [blame]

216

else:

Przemek Stekiel

85c54ea

2022-11-17 11:50:23 +0100

[diff] [blame]

217

tasks = re.split(r'[, ]+', options.task)

Przemek Stekiel

2022-11-09 13:54:49 +0100

[diff] [blame]

218

Przemek Stekiel

d3068af

2022-11-14 16:15:19 +0100

[diff] [blame]

219

for task in tasks:

220

if task not in TASKS:

221

print('Error: invalid task: {}'.format(task))

222

sys.exit(1)

Przemek Stekiel

2022-11-09 13:54:49 +0100

[diff] [blame]

223

224

for task in TASKS:

225

if task in tasks:

Przemek Stekiel

2022-10-26 16:11:26 +0200

[diff] [blame]

226

if not TASKS[task]['test_function'](options.outcomes, TASKS[task]['args']):

227

result = False

Przemek Stekiel

2022-10-21 13:42:08 +0200

[diff] [blame]

228

Przemek Stekiel

c86dedf

2022-10-24 09:16:04 +0200

[diff] [blame]

229

if result is False:

Gilles Peskine

2020-06-25 18:36:28 +0200

[diff] [blame]

230

sys.exit(1)

Przemek Stekiel

2022-10-21 13:42:08 +0200

[diff] [blame]

231

print("SUCCESS :-)")

Gilles Peskine