Milosz Wasilewski | 1043858 | 2020-12-03 11:36:21 +0000 | [diff] [blame] | 1 | #!/bin/bash |
| 2 | |
Leonardo Sandoval | 9f15980 | 2021-01-20 16:47:25 -0600 | [diff] [blame] | 3 | set -xe |
Milosz Wasilewski | 1043858 | 2020-12-03 11:36:21 +0000 | [diff] [blame] | 4 | |
# Wait for the LAVA job to finish.
# By default, time out at 5400 secs (1.5 hours) and poll every 60 seconds.
#
# Globals:   WORKSPACE (read) - directory that receives lava-progress.show
# Arguments: $1 - LAVA job id
#            $2 - timeout in seconds (default: 5400)
#            $3 - polling interval in seconds (default: 60)
# Outputs:   the job's "state" line on every poll, and the full
#            "lavacli jobs show" output once before returning
# Returns:   0 once the job state is "Finished", 1 on timeout
# Note:      xtrace is switched off while polling and is always switched
#            back on before returning.
wait_lava_job() {
    set +x
    local id=$1
    local timeout="${2:-5400}"
    local interval="${3:-60}"
    local progress="${WORKSPACE}/lava-progress.show"
    # Remaining seconds. Kept local so a global 't' is never clobbered.
    local t=$(( timeout ))

    while (( t > 0 )); do
        sleep "${interval}"
        # Show only the state line while polling; the complete output is kept
        # in ${progress}. '|| true' keeps a poll without a state line from
        # aborting the script when errexit is active.
        resilient_cmd lavacli jobs show "${id}" | tee "${progress}" | grep 'state *:' || true
        set +x
        if grep 'state.*: Finished' "${progress}"; then
            set -x
            cat "${progress}"
            # finished
            return 0
        fi
        # Plain assignment: '((t -= interval))' would return status 1 when the
        # result is 0, which trips errexit.
        t=$(( t - interval ))
    done

    set -x
    # The file does not exist if no poll was ever made (timeout <= 0).
    if [[ -f "${progress}" ]]; then
        cat "${progress}"
    fi
    echo "Timeout waiting for job to finish"
    # timeout
    return 1
}
| 33 | |
# Run the command passed as arguments; if it fails, retry it until it
# succeeds, making at most max_wait attempts in total with a pause of
# sleep_body seconds between attempts.
#
# Arguments: $@ - the command and its arguments
# Returns:   0 as soon as one attempt succeeds, 1 if every attempt failed
# Note:      xtrace is switched off while retrying and is always switched
#            back on before returning.
resilient_cmd() {
    set +x
    local max_wait=10
    local sleep_body=2
    local iter=0

    # Execute "$@" directly: each argument stays a separate word, so values
    # containing spaces or glob characters reach the command unchanged.
    until "$@"; do
        iter=$(( iter + 1 ))
        if (( iter >= max_wait )); then
            set -x
            return 1
        fi
        # Pause only when another attempt follows.
        sleep "${sleep_body}"
    done

    set -x
    return 0
}
| 59 | |
# Main flow: submit the LAVA job definition through the QA server (SQUAD),
# wait for the resulting LAVA job and turn its results into the exit status.
#
# Environment read: WORKSPACE, QA_SERVER, QA_SERVER_TEAM, QA_SERVER_PROJECT,
#   QA_SERVER_VERSION, QA_REPORTS_TOKEN, DEVICE_TYPE, LAVA_SERVER, LAVA_USER,
#   LAVA_TOKEN, GERRIT_CHANGE_NUMBER, GERRIT_PATCHSET_NUMBER.
# Files written under WORKSPACE: lava.log (on timeout), lava-raw.log,
#   lava.results.
# Nothing is submitted when QA_SERVER_VERSION is empty.
ls -l "${WORKSPACE:-.}"

if [ -n "${QA_SERVER_VERSION}" ]; then
    if [ -n "${GERRIT_CHANGE_NUMBER}" ] && [ -n "${GERRIT_PATCHSET_NUMBER}" ]; then
        # Tracing is off so that QA_REPORTS_TOKEN does not end up in the log.
        set +x
        curl \
            --fail \
            --retry 4 \
            -X POST \
            --header "Auth-Token: ${QA_REPORTS_TOKEN}" \
            "${QA_SERVER}/api/createbuild/${QA_SERVER_TEAM}/${QA_SERVER_PROJECT}/${QA_SERVER_VERSION}"
        set -x
    fi

    # Capture curl's status explicitly: with errexit active a bare failing
    # assignment would end the script before the status could be inspected.
    set +x
    submit_rc=0
    TESTJOB_ID=$(curl \
        --fail \
        --retry 4 \
        -X POST \
        --header "Auth-Token: ${QA_REPORTS_TOKEN}" \
        --form "backend=${LAVA_SERVER}" \
        --form definition=@artefacts-lava/job.yaml \
        "${QA_SERVER}/api/submitjob/${QA_SERVER_TEAM}/${QA_SERVER_PROJECT}/${QA_SERVER_VERSION}/${DEVICE_TYPE}") || submit_rc=$?
    set -x

    # SQUAD will send 400, curl error code 22, on bad test definition
    if [ "${submit_rc}" -eq 22 ]; then
        echo "Bad test definition!!"
        exit 1
    elif [ "${submit_rc}" -ne 0 ]; then
        echo "Job submission failed (curl exit code ${submit_rc})" >&2
        exit "${submit_rc}"
    fi

    if [ -n "${TESTJOB_ID}" ]; then
        echo "TEST JOB URL: ${QA_SERVER}/testjob/${TESTJOB_ID} TEST JOB ID: ${TESTJOB_ID}"

        # The below loop with a sleep is intentional: LAVA could be under heavy load so previous job creation can
        # take 'some' time to get the right numeric LAVA JOB ID
        renumber='^[0-9]+$'
        LAVAJOB_ID="null"
        iter=0
        max_tries=120 # run retries for an hour
        while ! [[ ${LAVAJOB_ID} =~ ${renumber} ]]; do
            if [ "${iter}" -eq "${max_tries}" ]; then
                LAVAJOB_ID=''
                break
            fi
            sleep 30
            # The URL is quoted: it contains '?', which is a glob character.
            LAVAJOB_ID=$(curl --fail --retry 4 "${QA_SERVER}/api/testjobs/${TESTJOB_ID}/?fields=job_id")

            # Get the job_id value (whatever it is)
            LAVAJOB_ID=$(printf '%s\n' "${LAVAJOB_ID}" | jq '.job_id')
            LAVAJOB_ID="${LAVAJOB_ID//\"/}"

            iter=$(( iter + 1 ))
        done

        # check that rest query at least get non-empty value
        if [ -n "${LAVAJOB_ID}" ]; then

            echo "LAVA URL: https://${LAVA_SERVER}/scheduler/job/${LAVAJOB_ID} LAVA JOB ID: ${LAVAJOB_ID}"

            # Tracing is off so that LAVA_TOKEN does not end up in the log.
            set +x
            resilient_cmd lavacli identities add --username "${LAVA_USER}" --token "${LAVA_TOKEN}" --uri "https://${LAVA_SERVER}/RPC2" default
            set -x

            # if timeout on waiting for LAVA to complete, create an 'artificial' lava.log
            # indicating the job ID
            if ! wait_lava_job "${LAVAJOB_ID}"; then
                echo "Stopped monitoring LAVA JOB ${LAVAJOB_ID}, likely stuck or timeout too short?" | tee "${WORKSPACE}/lava.log"
                exit 1
            else
                # Retrieve the test job plain log which is a yaml format file from LAVA
                resilient_cmd lavacli jobs logs --raw "${LAVAJOB_ID}" > "${WORKSPACE}/lava-raw.log"

                # Fetch and store LAVA job result (1 failure, 0 success)
                resilient_cmd lavacli results "${LAVAJOB_ID}" | tee "${WORKSPACE}/lava.results"
                # The pipeline's own status is tee's; check the fetch itself so
                # that missing results are never reported as a pass.
                results_rc=${PIPESTATUS[0]}
                if [ "${results_rc}" -ne 0 ]; then
                    echo "Could not retrieve results of LAVA job ${LAVAJOB_ID}" >&2
                    exit 1
                fi
                if grep -q '\[fail\]' "${WORKSPACE}/lava.results"; then
                    exit 1
                else
                    exit 0
                fi
            fi
        else
            echo "LAVA Job ID could not be obtained"
            exit 1
        fi
    fi
fi