Blame - tests/scripts/analyze_outcomes.py - mirror/mbed-tls

2020-06-25 18:36:28 +0200

[diff] [blame]

1

#!/usr/bin/env python3

2

3

"""Analyze the test outcomes from a full CI run.

4

5

This script can also run on outcomes from a partial run, but the results are

6

less likely to be useful.

"""

import argparse

import sys

import traceback

Tomás González

2023-08-23 16:43:26 +0100

[diff] [blame]

12

import re

Gilles Peskine

2020-06-25 18:36:28 +0200

[diff] [blame]

13

Gilles Peskine

2020-06-25 18:37:43 +0200

[diff] [blame]

14

import check_test_cases

15

Gilles Peskine

2020-06-25 18:36:28 +0200

[diff] [blame]

16

class Results:
    """Collect the findings of an analysis and report them on stderr."""

    def __init__(self):
        # Running tallies of the messages emitted via warning() and error().
        self.warning_count = 0
        self.error_count = 0

    @staticmethod
    def log(fmt, *args, **kwargs):
        """Write one formatted line to standard error.

        ``fmt`` is a ``str.format`` template; ``args`` and ``kwargs`` are
        its positional and keyword fields. A newline is appended.
        """
        line_template = fmt + '\n'
        sys.stderr.write(line_template.format(*args, **kwargs))

    def error(self, fmt, *args, **kwargs):
        """Log a message prefixed with ``Error: `` and count it as an error."""
        self.log('Error: ' + fmt, *args, **kwargs)
        self.error_count += 1

    def warning(self, fmt, *args, **kwargs):
        """Log a message prefixed with ``Warning: `` and count it as a warning."""
        self.log('Warning: ' + fmt, *args, **kwargs)
        self.warning_count += 1

34

35

class TestCaseOutcomes:
    """Record how a single test case fared across many configurations."""
    # pylint: disable=too-few-public-methods

    def __init__(self):
        # Each list holds one "witness" per run in which the test case
        # passed (successes) or failed (failures). Witnesses are only
        # counted for now. Their format is chosen by read_outcome_file:
        # the platform and the configuration joined by ';'.
        self.successes = []
        self.failures = []

    def hits(self):
        """Return how many times the test case was actually run.

        Both passes and failures count as runs; skips do not.
        """
        passed = len(self.successes)
        failed = len(self.failures)
        return passed + failed

53

Tomás González

2023-08-11 15:22:04 +0100

[diff] [blame]

54

def analyze_coverage(results, outcomes, allow_list, full_coverage):
    """Check that every available test case is executed at least once.

    A test case that was never run and is not in ``allow_list`` is reported,
    and so is a test case in ``allow_list`` that was run after all.
    Findings are reported through ``results.error`` when ``full_coverage``
    is true and through ``results.warning`` otherwise.
    """
    available = check_test_cases.collect_available_test_cases()
    # The severity is the same for every finding, so pick the reporter once.
    report = results.error if full_coverage else results.warning
    for key in available:
        executed = key in outcomes and outcomes[key].hits() != 0
        allowed = key in allow_list
        if not executed and not allowed:
            report('Test case not executed: {}', key)
        elif executed and allowed:
            # This test case should be removed from the allow list.
            report('Allow listed test case was executed: {}', key)

Gilles Peskine

2020-06-25 18:37:43 +0200

[diff] [blame]

70

Tomás González

2023-08-11 15:22:04 +0100

[diff] [blame]

71

def analyze_outcomes(outcomes, args):
    """Run every analysis on an outcome collection and return the Results.

    ``args`` is a dictionary that must contain the 'allow_list' and
    'full_coverage' entries, which are forwarded to analyze_coverage.
    """
    results = Results()
    allow_list = args['allow_list']
    full_coverage = args['full_coverage']
    analyze_coverage(results, outcomes, allow_list, full_coverage)
    return results

77

78

def read_outcome_file(outcome_file):
    """Parse an outcome file into an outcome collection.

    The collection is a dictionary of TestCaseOutcomes objects. Each key is
    a test suite name and a test case description joined by a semicolon.

    Every line must consist of exactly six semicolon-separated fields:
    platform, configuration, suite, case, result and cause. A 'PASS' or
    'FAIL' result adds the "platform;configuration" witness to the matching
    list. Any other result only ensures that the test case has an entry.
    """
    outcomes = {}
    with open(outcome_file, 'r', encoding='utf-8') as input_file:
        for line in input_file:
            fields = line.split(';')
            # Unpacking raises ValueError if the field count is not six.
            platform, config, suite, case, result, _cause = fields
            key = f'{suite};{case}'
            setup = f'{platform};{config}'
            record = outcomes.get(key)
            if record is None:
                record = outcomes[key] = TestCaseOutcomes()
            if result == 'PASS':
                record.successes.append(setup)
            elif result == 'FAIL':
                record.failures.append(setup)
    return outcomes

98

Tomás González

2023-08-23 16:43:26 +0100

[diff] [blame]

99

def do_analyze_coverage(outcome_file, args):
    """Run the coverage analysis task on an outcome file.

    Read ``outcome_file``, log a banner, then analyze the outcomes with
    ``args``. Return True if the analysis reported no errors, False
    otherwise; warnings do not affect the result.
    """
    outcomes = read_outcome_file(outcome_file)
    Results.log("\n*** Analyze coverage ***\n")
    error_count = analyze_outcomes(outcomes, args).error_count
    return error_count == 0

105

106

# Registry of the analysis tasks that can be requested on the command line.
# Each key is a task name. Its value is a dictionary with two entries:
# - 'test_function': the callable that performs the task; main() calls it
#   with the outcome file name and the task's 'args' dictionary, and treats
#   a false return value as a failure;
# - 'args': the task-specific arguments passed to 'test_function'.
TASKS = {
    'analyze_coverage': {
        'test_function': do_analyze_coverage,
        'args': {
            # Test cases that are expected never to be executed. A test case
            # listed here is not reported when it has no hits, but is
            # reported if it turns out to have been executed.
            'allow_list': [
                # Algorithm not supported yet
                'test_suite_psa_crypto_metadata;Asymmetric signature: pure EdDSA',
                # Algorithm not supported yet
                'test_suite_psa_crypto_metadata;Cipher: XTS',
                # compat.sh tests with OpenSSL, DTLS 1.2 and single-DES:
                # we have no version of OpenSSL on the CI that supports both
                # DTLS 1.2 and single-DES (1.0.2g is too recent for single-DES
                # and 1.0.1j is too old for DTLS 1.2).
                'compat;O->m dtls12,no DES-CBC-SHA',
                'compat;O->m dtls12,no EDH-RSA-DES-CBC-SHA',
                'compat;O->m dtls12,yes DES-CBC-SHA',
                'compat;O->m dtls12,yes EDH-RSA-DES-CBC-SHA',
                'compat;m->O dtls12,no TLS-DHE-RSA-WITH-DES-CBC-SHA',
                'compat;m->O dtls12,no TLS-RSA-WITH-DES-CBC-SHA',
                'compat;m->O dtls12,yes TLS-DHE-RSA-WITH-DES-CBC-SHA',
                'compat;m->O dtls12,yes TLS-RSA-WITH-DES-CBC-SHA',
            ],
            # Default only: main() overwrites this entry with the value of
            # the --require-full-coverage command line option.
            'full_coverage': False,
        }
    },
}

Gilles Peskine

2020-06-25 18:36:28 +0200

[diff] [blame]

def main():

try:

parser = argparse.ArgumentParser(description=__doc__)

137

parser.add_argument('outcomes', metavar='OUTCOMES.CSV',

138

help='Outcome file to analyze')

Tomás González

2023-08-23 16:43:26 +0100

[diff] [blame]

139

parser.add_argument('task', default='all', nargs='?',

140

help='Analysis to be done. By default, run all tasks. '

141

'With one or more TASK, run only those. '

142

'TASK can be the name of a single task or '

143

'comma/space-separated list of tasks. ')

144

parser.add_argument('--list', action='store_true',

145

help='List all available tasks and exit.')

Tomás González

2023-08-11 15:22:04 +0100

[diff] [blame]

146

parser.add_argument('--require-full-coverage', action='store_true',

147

dest='full_coverage', help="Require all available "

148

"test cases to be executed and issue an error "

149

"otherwise. This flag is ignored if 'task' is "

150

"neither 'all' nor 'analyze_coverage'")

Gilles Peskine

2020-06-25 18:36:28 +0200

[diff] [blame]

151

options = parser.parse_args()

Tomás González

2023-08-23 16:43:26 +0100

[diff] [blame]

if options.list:

for task in TASKS:

Results.log(task)

sys.exit(0)

result = True

if options.task == 'all':

161

tasks = TASKS.keys()

162

else:

163

tasks = re.split(r'[, ]+', options.task)

164

165

for task in tasks:

166

if task not in TASKS:

167

Results.log('Error: invalid task: {}'.format(task))

168

sys.exit(1)

169

Tomás González

2023-08-11 15:22:04 +0100

[diff] [blame]

170

TASKS['analyze_coverage']['args']['full_coverage'] = \

171

options.full_coverage

172

Tomás González

2023-08-23 16:43:26 +0100

[diff] [blame]

173

for task in TASKS:

174

if task in tasks:

175

if not TASKS[task]['test_function'](options.outcomes, TASKS[task]['args']):

176

result = False

177

178

if result is False:

Gilles Peskine

2020-06-25 18:36:28 +0200

[diff] [blame]

179

sys.exit(1)

Tomás González

2023-08-23 16:43:26 +0100

[diff] [blame]

180

Results.log("SUCCESS :-)")

Gilles Peskine