#!/bin/bash
#
# Submit artefacts-lava/job.yaml to LAVA (directly with lavacli, or through
# SQUAD when USE_SQUAD is non-zero and QA_SERVER_VERSION is set), wait for
# the job to finish, store its raw log and results under ${WORKSPACE}, and
# exit non-zero when the job could not be run or any result is "[fail]".
#
# Environment read by this script:
#   WORKSPACE, LAVA_USER, LAVA_TOKEN, LAVA_SERVER
#   SQUAD path only: QA_SERVER, QA_SERVER_TEAM, QA_SERVER_PROJECT,
#   QA_SERVER_VERSION, QA_REPORTS_TOKEN, DEVICE_TYPE,
#   GERRIT_CHANGE_NUMBER, GERRIT_PATCHSET_NUMBER

# -x: trace every command; -e: abort on the first unhandled failure.
set -xe

# 0 = submit directly to LAVA; non-zero = submit through SQUAD.
USE_SQUAD=0

# Wait for the LAVA job to finish.
# By default, timeout at 5400 secs (1.5 hours) and monitor every 60 seconds.
#
# Globals:   WORKSPACE (read) - directory that receives lava-progress.show
# Arguments: $1 - LAVA job id
#            $2 - timeout in seconds (default 5400)
#            $3 - polling interval in seconds (default 60)
# Outputs:   the job's "state" line on every poll, then the last
#            `lavacli jobs show` output once finished or timed out
# Returns:   0 when the job state is Finished, 1 on timeout
# Note:      xtrace is switched off while polling and is always switched
#            back on before returning.
wait_lava_job() {
    set +x
    local id=$1
    local timeout="${2:-5400}"
    local interval="${3:-60}"
    local progress="${WORKSPACE}/lava-progress.show"
    # Remaining budget in seconds. Only the sleep interval is charged against
    # it; time spent inside the lavacli query itself is not counted.
    local t=$timeout

    while (( t > 0 )); do
        sleep "${interval}"
        # The grep only echoes progress; a missing state line must not be
        # treated as an error when errexit is active, hence `|| true`.
        resilient_cmd lavacli jobs show "${id}" | tee "${progress}" | grep 'state *:' || true
        # Defensive: resilient_cmd re-enables xtrace before it returns.
        set +x
        if grep 'state.*: Finished' "${progress}"; then
            set -x
            cat "${progress}"
            # finished
            return 0
        fi
        # Plain assignment instead of `((t -= interval))`: the arithmetic
        # command returns status 1 when the result is 0, which would abort
        # the script under `set -e` right when the timeout is reached.
        t=$(( t - interval ))
    done
    set -x
    # The file is absent if the loop never ran (timeout <= 0).
    if [ -f "${progress}" ]; then
        cat "${progress}"
    fi
    echo "Timeout waiting for job to finish"
    # timeout
    return 1
}

# Run the command given as parameters; if it fails, retry it with an
# exponentially growing pause (2s, 4s, ... capped at 60s) until it succeeds
# or it has failed 10 times in total.
#
# Arguments: $@ - command and its arguments, executed as "$@"
# Outputs:   whatever the command prints; warnings/errors go to stderr
# Returns:   0 as soon as one attempt succeeds, 1 after 10 failed attempts
# Note:      xtrace is switched off while retrying and is always switched
#            back on before returning.
resilient_cmd() {
    set +x
    local max_retries=10
    local sleep_body=2
    local max_sleep=60
    local iter=0

    while true; do
        if "$@"; then
            break
        fi

        # Count the failure first so that no time is wasted sleeping after
        # the final attempt.
        iter=$(( iter + 1 ))
        if [ "${iter}" -ge "${max_retries}" ]; then
            echo "ERROR: Command '$*' failed ${iter} times in row" 1>&2
            set -x
            return 1
        fi

        sleep "${sleep_body}"
        # Exponential backoff
        sleep_body=$(( sleep_body * 2 ))
        if [ "${sleep_body}" -ge "${max_sleep}" ]; then
            sleep_body=${max_sleep}
            # iter counts failed attempts; the first attempt is not a retry.
            echo "WARNING: Command '$*' still not successful on retry #$(( iter - 1 )), exp backoff already limited" 1>&2
        fi
    done
    set -x
    return 0
}

ls -l "${WORKSPACE}"

# Register the default lavacli identity. xtrace is suspended around the call
# so that the LAVA token is not echoed into the build log.
set +x
lavacli identities add --username "${LAVA_USER}" --token "${LAVA_TOKEN}" --uri "https://${LAVA_SERVER}/RPC2" default
set -x

# Submit the job and leave its numeric LAVA job id in LAVAJOB_ID (empty when
# no id could be obtained). Start from a known value so a stale LAVAJOB_ID
# inherited from the environment is never mistaken for a fresh submission.
LAVAJOB_ID=''

if [ "${USE_SQUAD:-0}" -ne 0 ] && [ -n "${QA_SERVER_VERSION}" ]; then
    # Submit via SQUAD

    # Keep the Auth-Token header out of the xtrace output.
    set +x
    if [ -n "${GERRIT_CHANGE_NUMBER}" ] && [ -n "${GERRIT_PATCHSET_NUMBER}" ]; then
        curl \
            --fail \
            --retry 4 \
            -X POST \
            --header "Auth-Token: ${QA_REPORTS_TOKEN}" \
            "${QA_SERVER}/api/createbuild/${QA_SERVER_TEAM}/${QA_SERVER_PROJECT}/${QA_SERVER_VERSION}"
    fi

    # Capture curl's status with `||`: under `set -e` a bare failing
    # assignment aborts the script before the status can be inspected.
    submit_rc=0
    TESTJOB_ID=$(curl \
        --fail \
        --retry 4 \
        -X POST \
        --header "Auth-Token: ${QA_REPORTS_TOKEN}" \
        --form "backend=${LAVA_SERVER}" \
        --form "definition=@artefacts-lava/job.yaml" \
        "${QA_SERVER}/api/submitjob/${QA_SERVER_TEAM}/${QA_SERVER_PROJECT}/${QA_SERVER_VERSION}/${DEVICE_TYPE}") || submit_rc=$?
    set -x

    # SQUAD will send 400, curl error code 22, on bad test definition
    if [ "${submit_rc}" -eq 22 ]; then
        echo "Bad test definition!!"
        exit 1
    elif [ "${submit_rc}" -ne 0 ]; then
        echo "SQUAD job submission failed (curl exit code ${submit_rc})"
        exit 1
    fi

    if [ -n "${TESTJOB_ID}" ]; then
        echo "TEST JOB URL: ${QA_SERVER}/testjob/${TESTJOB_ID} TEST JOB ID: ${TESTJOB_ID}"

        # The below loop with a sleep is intentional: LAVA could be under heavy load so previous job creation can
        # take 'some' time to get the right numeric LAVA JOB ID
        renumber='^[0-9]+$'
        LAVAJOB_ID="null"
        iter=0
        max_tries=120 # run retries for an hour
        while ! [[ ${LAVAJOB_ID} =~ ${renumber} ]]; do
            if [ "${iter}" -eq "${max_tries}" ]; then
                LAVAJOB_ID=''
                break
            fi
            sleep 30
            # A failed query is just another "not ready yet": swallow the
            # status so `set -e` does not defeat the retry loop.
            testjob_json=$(curl --fail --retry 4 "${QA_SERVER}/api/testjobs/${TESTJOB_ID}/?fields=job_id") || testjob_json=''

            # Get the job_id value (whatever it is); -r drops the JSON quotes
            LAVAJOB_ID=$(printf '%s' "${testjob_json}" | jq -r '.job_id') || LAVAJOB_ID=''

            iter=$(( iter + 1 ))
        done
    fi
else
    # Submit directly to LAVA. On failure keep going with an empty id so the
    # caller-visible "could not be obtained" diagnostics can still be printed.
    LAVAJOB_ID=$(resilient_cmd lavacli jobs submit artefacts-lava/job.yaml) || LAVAJOB_ID=''
fi

# Monitor the submitted job and turn its outcome into this script's exit
# status: 0 only when the job finished, its results were retrieved, and none
# of them is "[fail]".

# check that the submission step produced a non-empty job id
if [ -z "${LAVAJOB_ID}" ]; then
    echo "LAVA Job ID could not be obtained"
    exit 1
fi

echo "LAVA URL: https://${LAVA_SERVER}/scheduler/job/${LAVAJOB_ID} LAVA JOB ID: ${LAVAJOB_ID}"

# if timeout on waiting for LAVA to complete, create an 'artificial' lava.log indicating
# the job ID
if ! wait_lava_job "${LAVAJOB_ID}"; then
    echo "Stopped monitoring LAVA JOB ${LAVAJOB_ID}, likely stuck or timeout too short?" | tee "${WORKSPACE}/lava.log"
    exit 1
fi

# Retrieve the test job plain log which is a yaml format file from LAVA.
# The job id and destination are passed as positional parameters rather than
# spliced into the command string, so unusual characters in ${WORKSPACE}
# cannot change the command that sh runs. The redirection stays inside
# `sh -c` so every retry truncates the file.
resilient_cmd sh -c 'lavacli jobs logs --raw "$1" > "$2"' sh "${LAVAJOB_ID}" "${WORKSPACE}/lava-raw.log" || exit 1

# Fetch and store LAVA job result (1 failure, 0 success).
# The fetch status is checked explicitly: with a `| tee` pipeline it would be
# discarded, and an empty results file (no "[fail]" line) would be reported
# as success.
if ! resilient_cmd lavacli results "${LAVAJOB_ID}" > "${WORKSPACE}/lava.results"; then
    echo "Could not retrieve results of LAVA JOB ${LAVAJOB_ID}"
    exit 1
fi
cat "${WORKSPACE}/lava.results"

if grep -q '\[fail\]' "${WORKSPACE}/lava.results"; then
    exit 1
fi
exit 0
Paul Sokolovsky74cd2e02023-05-12 23:40:55 +0300157