Blame - tests/scripts/analyze_outcomes.py - mirror/mbed-tls

2020-06-25 18:36:28 +0200

[diff] [blame]

1

#!/usr/bin/env python3

2

3

"""Analyze the test outcomes from a full CI run.

4

5

This script can also run on outcomes from a partial run, but the results are

6

less likely to be useful.

"""

import argparse

import sys

import traceback

Przemek Stekiel

85c54ea

2022-11-17 11:50:23 +0100

[diff] [blame]

12

import re

Gilles Peskine

2020-06-25 18:36:28 +0200

[diff] [blame]

13

Gilles Peskine

2020-06-25 18:37:43 +0200

[diff] [blame]

14

import check_test_cases

15

Gilles Peskine

2020-06-25 18:36:28 +0200

[diff] [blame]

16

class Results:
    """Report analysis findings and keep a tally of them.

    Each error or warning is written to standard error as one line and
    counted in ``error_count`` or ``warning_count`` respectively.
    """

    def __init__(self):
        # Number of calls made so far to warning() and error().
        self.warning_count = 0
        self.error_count = 0

    @staticmethod
    def log(fmt, *args, **kwargs):
        """Write one formatted line to standard error.

        ``fmt`` is a ``str.format`` template; ``args`` and ``kwargs`` supply
        its substitution values. A newline is appended to the template
        before formatting.
        """
        template = fmt + '\n'
        sys.stderr.write(template.format(*args, **kwargs))

    def error(self, fmt, *args, **kwargs):
        """Log a message prefixed with 'Error: ' and count one more error."""
        prefixed = 'Error: ' + fmt
        self.log(prefixed, *args, **kwargs)
        # Count only after logging, so a formatting failure is not tallied.
        self.error_count = self.error_count + 1

    def warning(self, fmt, *args, **kwargs):
        """Log a message prefixed with 'Warning: ' and count one more warning."""
        prefixed = 'Warning: ' + fmt
        self.log(prefixed, *args, **kwargs)
        # Count only after logging, so a formatting failure is not tallied.
        self.warning_count = self.warning_count + 1

34

35

class TestCaseOutcomes:
    """Record how a single test case fared in every configuration."""
    # pylint: disable=too-few-public-methods

    def __init__(self):
        # Both lists hold "witnesses": one entry for each run in which the
        # test case failed (failures) or passed (successes). The witness
        # format is decided by the read_outcome_file function: the platform
        # and the configuration joined by ';'. For now, witnesses are only
        # ever counted.
        self.failures = []
        self.successes = []

    def hits(self):
        """Return how many times the test case was actually executed.

        Passes and failures are both counted; skips are not.
        """
        passed = len(self.successes)
        failed = len(self.failures)
        return passed + failed

53

Gilles Peskine

2020-06-25 18:37:43 +0200

[diff] [blame]

54

def analyze_coverage(results, outcomes):
    """Warn about every available test case that was never executed.

    ``outcomes`` maps test case keys to TestCaseOutcomes objects. A test case
    counts as executed if it has at least one recorded pass or failure.
    Findings are reported through ``results``.
    """
    for test_case in check_test_cases.collect_available_test_cases():
        if test_case in outcomes and outcomes[test_case].hits() != 0:
            continue
        # Reported as a warning rather than an error for as long as this
        # branch has not been fixed to have full coverage of test cases.
        results.warning('Test case not executed: {}', test_case)

63

Przemek Stekiel

733c76e

2022-11-14 08:33:21 +0100

[diff] [blame]

64

def analyze_driver_vs_reference(outcomes, component_ref, component_driver, ignored_tests):
    """Compare the test coverage of a driver component with its reference.

    Print one line for each available test case that has a recorded pass
    whose setup contains ``component_ref`` but no recorded pass whose setup
    contains ``component_driver``. Test cases whose suite is listed in
    ``ignored_tests`` are not examined.

    Return True if no such test case was found, False otherwise.
    """
    available = check_test_cases.collect_available_test_cases()
    all_covered = True

    for key in available:
        # The suite name is the part of the key before the first ';'.
        # Only its main part, up to the first '.', is matched against
        # the ignore list.
        full_suite_name = key.split(';')[0]
        main_suite_name = full_suite_name.split('.')[0]
        if main_suite_name in ignored_tests:
            continue
        # Nothing to compare for a test case that no component executed.
        if key not in outcomes or outcomes[key].hits() == 0:
            continue
        # Look for a pass in each of the two components.
        passing_setups = outcomes[key].successes
        passed_in_driver = any(component_driver in setup
                               for setup in passing_setups)
        passed_in_reference = any(component_ref in setup
                                  for setup in passing_setups)
        if passed_in_reference and not passed_in_driver:
            print('{}: driver: skipped/failed; reference: passed'.format(key))
            all_covered = False

    return all_covered

Gilles Peskine

2020-06-25 18:36:28 +0200

[diff] [blame]

95

def analyze_outcomes(outcomes):
    """Apply every analysis to an outcome collection.

    Return the Results object holding the error and warning counts.
    """
    report = Results()
    analyze_coverage(report, outcomes)
    return report

100

101

def read_outcome_file(outcome_file):
    """Load an outcome file into an outcome collection.

    An outcome collection is a dictionary that maps keys to TestCaseOutcomes
    objects. Each key is a test suite name and a test case description,
    joined by a semicolon.

    Every line of the file must consist of exactly six ';'-separated fields:
    platform, configuration, suite, case, result and cause. A line with the
    result 'PASS' or 'FAIL' adds a witness to the matching list of its test
    case; any other result only makes sure the test case has an entry.
    """
    collection = {}
    with open(outcome_file, 'r', encoding='utf-8') as input_file:
        for line in input_file:
            fields = line.split(';')
            (platform, config, suite, case, result, _cause) = fields
            key = ';'.join((suite, case))
            # A witness identifies the setup the test case ran in.
            setup = ';'.join((platform, config))
            try:
                case_outcomes = collection[key]
            except KeyError:
                case_outcomes = collection[key] = TestCaseOutcomes()
            if result == 'PASS':
                case_outcomes.successes.append(setup)
            elif result == 'FAIL':
                case_outcomes.failures.append(setup)
    return collection

121

Przemek Stekiel

2022-10-26 16:11:26 +0200

[diff] [blame]

122

def do_analyze_coverage(outcome_file, args):
    """Run the coverage analysis task on an outcome file.

    ``args`` is ignored. Return True if the analysis reported no errors,
    False otherwise; warnings do not affect the result.
    """
    del args # unused
    results = analyze_outcomes(read_outcome_file(outcome_file))
    no_errors = results.error_count == 0
    return no_errors

Przemek Stekiel

2022-10-21 13:42:08 +0200

[diff] [blame]

128

Przemek Stekiel

2022-10-26 16:11:26 +0200

[diff] [blame]

129

def do_analyze_driver_vs_reference(outcome_file, args):
    """Run the driver vs reference analysis task on an outcome file.

    ``args`` must provide 'component_ref', 'component_driver' and
    'ignored_suites'. The ignored suites are given without their
    'test_suite_' prefix, which is added here.

    Return the result of analyze_driver_vs_reference.
    """
    ignored_tests = ['test_suite_' + suite for suite in args['ignored_suites']]

    outcomes = read_outcome_file(outcome_file)
    reference = args['component_ref']
    driver = args['component_driver']
    return analyze_driver_vs_reference(outcomes, reference, driver,
                                       ignored_tests)

Gilles Peskine

2020-06-25 18:36:28 +0200

[diff] [blame]

136

Przemek Stekiel

2022-11-09 10:50:29 +0100

[diff] [blame]

137

# Analysis tasks, by name. Each entry provides:
# - 'test_function': the function that can handle the task;
# - 'args': the additional arguments for that function, if it requires any.
TASKS = {
    'analyze_coverage': {
        'test_function': do_analyze_coverage,
        'args': {},
    },
    'analyze_driver_vs_reference_hash': {
        'test_function': do_analyze_driver_vs_reference,
        'args': {
            'component_ref': 'test_psa_crypto_config_reference_hash_use_psa',
            'component_driver': 'test_psa_crypto_config_accel_hash_use_psa',
            'ignored_suites': [
                # the software implementations that are being excluded
                'shax', 'mdx',
                # the legacy abstraction layer that's being excluded
                'md',
            ],
        },
    },
}

Przemek Stekiel

2022-10-26 16:11:26 +0200

[diff] [blame]

151

Gilles Peskine

2020-06-25 18:36:28 +0200

[diff] [blame]

152

def main():

153

try:

154

parser = argparse.ArgumentParser(description=__doc__)

Przemek Stekiel

58bbc23

2022-10-24 08:10:10 +0200

[diff] [blame]

155

parser.add_argument('outcomes', metavar='OUTCOMES.CSV',

Gilles Peskine

2020-06-25 18:36:28 +0200

[diff] [blame]

156

help='Outcome file to analyze')

Przemek Stekiel

542d932

2022-11-17 09:43:34 +0100

[diff] [blame]

157

parser.add_argument('task', default='all', nargs='?',

Przemek Stekiel

2022-11-09 13:54:49 +0100

[diff] [blame]

158

help='Analysis to be done. By default, run all tasks. '

159

'With one or more TASK, run only those. '

160

'TASK can be the name of a single task or '

Przemek Stekiel

85c54ea

2022-11-17 11:50:23 +0100

[diff] [blame]

161

'comma/space-separated list of tasks. ')

Przemek Stekiel

2022-11-09 13:54:49 +0100

[diff] [blame]

162

parser.add_argument('--list', action='store_true',

163

help='List all available tasks and exit.')

Gilles Peskine

2020-06-25 18:36:28 +0200

[diff] [blame]

164

options = parser.parse_args()

Przemek Stekiel

2022-10-21 13:42:08 +0200

[diff] [blame]

165

Przemek Stekiel

2022-11-09 13:54:49 +0100

[diff] [blame]

if options.list:

for task in TASKS:

print(task)

sys.exit(0)

Przemek Stekiel

2022-10-26 16:11:26 +0200

[diff] [blame]

171

result = True

Przemek Stekiel

2022-10-21 13:42:08 +0200

[diff] [blame]

172

Przemek Stekiel

2022-10-26 16:11:26 +0200

[diff] [blame]

173

if options.task == 'all':

Przemek Stekiel

d3068af

2022-11-14 16:15:19 +0100

[diff] [blame]

174

tasks = TASKS.keys()

Przemek Stekiel

2022-11-09 13:54:49 +0100

[diff] [blame]

175

else:

Przemek Stekiel

85c54ea

2022-11-17 11:50:23 +0100

[diff] [blame]

176

tasks = re.split(r'[, ]+', options.task)

Przemek Stekiel

2022-11-09 13:54:49 +0100

[diff] [blame]

177

Przemek Stekiel

d3068af

2022-11-14 16:15:19 +0100

[diff] [blame]

178

for task in tasks:

179

if task not in TASKS:

180

print('Error: invalid task: {}'.format(task))

181

sys.exit(1)

Przemek Stekiel

2022-11-09 13:54:49 +0100

[diff] [blame]

182

183

for task in TASKS:

184

if task in tasks:

Przemek Stekiel

2022-10-26 16:11:26 +0200

[diff] [blame]

185

if not TASKS[task]['test_function'](options.outcomes, TASKS[task]['args']):

186

result = False

Przemek Stekiel

2022-10-21 13:42:08 +0200

[diff] [blame]

187

Przemek Stekiel

2022-10-24 09:16:04 +0200

[diff] [blame]

188

if result is False:

Gilles Peskine

2020-06-25 18:36:28 +0200

[diff] [blame]

189

sys.exit(1)

Przemek Stekiel

2022-10-21 13:42:08 +0200

[diff] [blame]

190

print("SUCCESS :-)")

Gilles Peskine