lava: handle reaching max number of retry for submit operation
[lttng-ci.git] / scripts / system-tests / lava2-submit.py
CommitLineData
21fec189 1#!/usr/bin/python3
878b4840
JR
2# Copyright (C) 2016 - Francis Deslauriers <francis.deslauriers@efficios.com>
3#
4# This program is free software: you can redistribute it and/or modify
5# it under the terms of the GNU General Public License as published by
6# the Free Software Foundation, either version 3 of the License, or
7# (at your option) any later version.
8#
9# This program is distributed in the hope that it will be useful,
10# but WITHOUT ANY WARRANTY; without even the implied warranty of
11# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
12# GNU General Public License for more details.
13#
14# You should have received a copy of the GNU General Public License
15# along with this program. If not, see <http://www.gnu.org/licenses/>.
16
17import argparse
878b4840
JR
18import json
19import os
20import random
9356eef7 21import re
878b4840
JR
22import sys
23import time
24import xmlrpc.client
6d3950a9
JR
25from urllib.parse import urljoin
26from urllib.request import urlretrieve
21fec189
JR
27import yaml
28from jinja2 import Environment, FileSystemLoader
878b4840 29
ef84c6ec
JR
# Account name placed in the XML-RPC endpoint URL built in main().
USERNAME = "lava-jenkins"
# Host of the LAVA master; used for the RPC endpoint and test case links.
HOSTNAME = "lava-master-02.internal.efficios.com"
# NOTE(review): not referenced by the code visible in this file -- confirm
# whether it is still needed.
OBJSTORE_URL = 'https://obj.internal.efficios.com/lava/results/'
878b4840 33
cf1271bb
JR
def parse_stable_version(stable_version_string):
    """
    Get the major and minor version numbers from an lttng version string
    containing 'stable-<major>.<minor>' (e.g. 'stable-2.11').

    Returns a (major, minor) tuple of ints. When the pattern is not found
    (e.g. for 'master'), (0, 0) is returned to make numeric comparisons by
    the callers easier.
    """
    # Raw string: '\d' must reach the regex engine untouched instead of being
    # treated as an (invalid) string escape. The dot is escaped so that only
    # a literal '.' separates the components, and '\d+' accepts minors with
    # any number of digits (e.g. 'stable-2.9' as well as 'stable-2.11').
    version_match = re.search(r'stable-(\d+)\.(\d+)', stable_version_string)

    if version_match is None:
        # Setting to zero to make the comparisons done by callers easier.
        return 0, 0

    major_version = int(version_match.group(1))
    minor_version = int(version_match.group(2))
    return major_version, minor_version
46
f5f36c68
FD
47
class TestType:
    """ Enum-like namespace listing the supported test types """

    # Numeric identifier of each test type.
    baremetal_tests = 1
    kvm_tests = 2

    # Maps the names accepted by the -t/--type argument to their identifier.
    values = dict(
        [
            ('baremetal-tests', baremetal_tests),
            ('kvm-tests', kvm_tests),
        ]
    )
57
f5f36c68
FD
58
class DeviceType:
    """ Enum-like namespace listing the supported device types """

    # Device type strings handed to the job template.
    x86 = 'x86'
    kvm = 'qemu'

    # Maps a short device name to its device type string.
    values = {
        'kvm': kvm,
        'x86': x86,
    }
65
4cb5cc4f 66
878b4840
JR
def get_job_bundle_content(server, job):
    """
    Fetch the results bundle of a job and return its 'content' field decoded
    from JSON.

    An XML-RPC fault raised while fetching the bundle is reported on stdout
    and then re-raised to the caller.
    """
    job_id = str(job)
    try:
        job_status = server.scheduler.job_status(job_id)
        results_bundle = server.dashboard.get(job_status['bundle_sha1'])
    except xmlrpc.client.Fault as fault:
        print('Error while fetching results bundle', fault.faultString)
        raise fault

    raw_content = results_bundle['content']
    return json.loads(raw_content)
76
f5f36c68 77
def check_job_all_test_cases_state_count(server, job):
    """
    Fetch the YAML results of a job and count its test cases by outcome.

    Every test case whose result is not 'pass' is reported on stdout with a
    URL built from HOSTNAME and the 'url' field of the test case.

    Returns a (passed, failed) tuple.
    """
    print("Testcase result:")
    results_yaml = server.results.get_testjob_results_yaml(str(job))

    # NOTE(review): unsafe_load can instantiate arbitrary Python objects; this
    # is only acceptable as long as the LAVA server is trusted.
    outcome_count = {True: 0, False: 0}
    for entry in yaml.unsafe_load(results_yaml):
        has_passed = entry['result'] == 'pass'
        if not has_passed:
            failure_report = "\tFAILED {}\n\t\t See http://{}{}".format(
                entry['name'], HOSTNAME, entry['url']
            )
            print(failure_report)
        outcome_count[has_passed] += 1

    return (outcome_count[True], outcome_count[False])
100
f5f36c68 101
def print_test_output(server, job):
    """
    Fetch the logs of a job and print the stdout of the test suite.

    Only the log entries of level 'target' located between the
    '<LAVA_SIGNAL_STARTTC run-tests>' and '<LAVA_SIGNAL_ENDTC run-tests>'
    messages are printed, each one prefixed by its 'dt' field.
    """
    # The first element of the returned pair is not needed here.
    _, log = server.scheduler.jobs.logs(str(job))

    # Decode as UTF-8 and substitute undecodable bytes: a strict ASCII decode
    # raises UnicodeDecodeError as soon as the target emits a single
    # non-ASCII byte. Pure ASCII logs decode exactly as before.
    # NOTE(review): unsafe_load can instantiate arbitrary Python objects; this
    # is only acceptable as long as the LAVA server is trusted.
    logs = yaml.unsafe_load(log.data.decode('utf-8', errors='replace'))

    print_line = False
    for line in logs:
        if line['lvl'] != 'target':
            continue
        if line['msg'] == '<LAVA_SIGNAL_STARTTC run-tests>':
            print('---- TEST SUITE OUTPUT BEGIN ----')
            print_line = True
            continue
        if line['msg'] == '<LAVA_SIGNAL_ENDTC run-tests>':
            print('----- TEST SUITE OUTPUT END -----')
            print_line = False
            continue
        if print_line:
            print("{} {}".format(line['dt'], line['msg']))
878b4840 122
f5f36c68
FD
123
def get_vlttng_cmd(
    lttng_version, lttng_tools_url, lttng_tools_commit, lttng_ust_url=None, lttng_ust_commit=None
):
    """
    Return vlttng cmd to be used in the job template for setup.

    lttng_version: 'master' or a string understood by parse_stable_version().
    lttng_tools_url, lttng_tools_commit: source and checkout overrides of the
        lttng-tools project.
    lttng_ust_url, lttng_ust_commit: optional source and checkout overrides
        of the lttng-ust project. The lttng-ust profiles are added only when
        lttng_ust_commit is not None, in which case lttng_ust_url must be a
        string as well.
    """
    major_version, minor_version = parse_stable_version(lttng_version)

    # Compare (major, minor) as a tuple: testing each component on its own
    # would wrongly consider e.g. 3.0 older than 2.11.
    is_2_11_or_newer = lttng_version == 'master' or (
        (major_version, minor_version) >= (2, 11)
    )

    urcu_profile = 'urcu-master' if is_2_11_or_newer else 'urcu-stable-0.12'

    cmd_parts = [
        'vlttng --jobs=$(nproc) --profile ' + urcu_profile,
        ' --override projects.babeltrace.build-env.PYTHON=python3',
        ' --override projects.babeltrace.build-env.PYTHON_CONFIG=python3-config',
        ' --profile babeltrace-stable-1.5',
        ' --profile babeltrace-python',
        ' --profile lttng-tools-master',
        ' --override projects.lttng-tools.source=' + lttng_tools_url,
        ' --override projects.lttng-tools.checkout=' + lttng_tools_commit,
        ' --profile lttng-tools-no-man-pages',
    ]

    if lttng_ust_commit is not None:
        cmd_parts += [
            # The trailing space is kept so that the generated command is
            # unchanged.
            ' --profile lttng-ust-master ',
            ' --override projects.lttng-ust.source=' + lttng_ust_url,
            ' --override projects.lttng-ust.checkout=' + lttng_ust_commit,
            ' --profile lttng-ust-no-man-pages',
        ]

    if is_2_11_or_newer:
        cmd_parts.append(
            ' --override projects.lttng-tools.configure+=--enable-test-sdt-uprobe'
        )

    # Path given to vlttng as the last argument of the command.
    vlttng_path = '/tmp/virtenv'
    cmd_parts.append(' ' + vlttng_path)

    return ''.join(cmd_parts)
878b4840 174
f5f36c68 175
def _submit_job(server, job_definition, retry_limit):
    """
    Submit job_definition to the LAVA scheduler, retrying on protocol errors.

    Returns the job id given by the scheduler, or None when each of the
    retry_limit attempts ended with a protocol error.
    """
    for attempt in range(1, retry_limit + 1):
        try:
            # Returning from here guarantees that a submission succeeding on
            # the very last attempt is not mistaken for a failure.
            return server.scheduler.submit_job(job_definition)
        except xmlrpc.client.ProtocolError:
            if attempt == retry_limit:
                # No attempt left: no point in sleeping before giving up.
                break
            print(
                'Protocol error on submit, sleeping and retrying. Attempt #{}'.format(
                    attempt
                )
            )
            time.sleep(5)

    print(
        'Protocol error on submit, maximum number of retry reached ({})'.format(
            retry_limit
        )
    )
    return None


def _wait_for_job_end(server, jobid):
    """
    Check the state of the job every 30 seconds until it is no longer
    submitted, scheduled or running, and return its final state.
    """
    jobstatus = server.scheduler.job_state(jobid)['job_state']
    running = False
    while jobstatus in ('Submitted', 'Scheduling', 'Scheduled', 'Running'):
        if not running and jobstatus == 'Running':
            print('Job started running')
            running = True
        time.sleep(30)
        try:
            jobstatus = server.scheduler.job_state(jobid)['job_state']
        except xmlrpc.client.ProtocolError:
            # The previous state is kept, hence the loop polls again after
            # the next sleep.
            print('Protocol error, retrying')
    return jobstatus


def main():
    """
    Render the LAVA job from the command line arguments, submit it, wait for
    its completion and report the results of its test cases.

    With -d/--debug the rendered job is only printed, nothing is submitted.

    Returns 0 on success and -1 on failure: unknown test type, missing
    LAVA2_JENKINS_TOKEN, submission failure, job not ending in the 'Finished'
    state or at least one failed test case.
    """
    send_retry_limit = 10
    nfsrootfs = "https://obj.internal.efficios.com/lava/rootfs/rootfs_amd64_xenial_2018-12-05.tar.gz"
    parser = argparse.ArgumentParser(description='Launch baremetal test using Lava')
    parser.add_argument('-t', '--type', required=True)
    parser.add_argument('-lv', '--lttng-version', required=True)
    parser.add_argument('-j', '--jobname', required=True)
    parser.add_argument('-k', '--kernel', required=True)
    parser.add_argument('-lm', '--lmodule', required=True)
    parser.add_argument('-tu', '--tools-url', required=True)
    parser.add_argument('-tc', '--tools-commit', required=True)
    parser.add_argument('-id', '--build-id', required=True)
    parser.add_argument('-uu', '--ust-url', required=False)
    parser.add_argument('-uc', '--ust-commit', required=False)
    parser.add_argument('-d', '--debug', required=False, action='store_true')
    args = parser.parse_args()

    if args.type not in TestType.values:
        print('argument -t/--type {} unrecognized.'.format(args.type))
        print('Possible values are:')
        for k in TestType.values:
            print('\t {}'.format(k))
        return -1

    # The API token is only needed when the job is really submitted.
    lava_api_key = None
    if not args.debug:
        try:
            lava_api_key = os.environ['LAVA2_JENKINS_TOKEN']
        except KeyError as error:
            print(
                'LAVA2_JENKINS_TOKEN not found in the environment variable. Exiting...',
                error,
            )
            return -1

    # The job template is looked up next to this script.
    jinja_loader = FileSystemLoader(os.path.dirname(os.path.realpath(__file__)))
    jinja_env = Environment(loader=jinja_loader, trim_blocks=True, lstrip_blocks=True)
    jinja_template = jinja_env.get_template('template_lava_job.jinja2')

    test_type = TestType.values[args.type]

    # Test types are plain ints: compare them by value, not by identity.
    if test_type == TestType.baremetal_tests:
        device_type = DeviceType.x86
    else:
        device_type = DeviceType.kvm

    vlttng_path = '/tmp/virtenv'

    vlttng_cmd = get_vlttng_cmd(
        args.lttng_version, args.tools_url, args.tools_commit, args.ust_url, args.ust_commit
    )

    if args.lttng_version == "master":
        lttng_version_string = "master"
    elif args.lttng_version == "canary":
        lttng_version_string = "2.10"
    else:
        major, minor = parse_stable_version(args.lttng_version)
        lttng_version_string = str(major) + "." + str(minor)

    context = {
        'DeviceType': DeviceType,
        'TestType': TestType,
        'job_name': args.jobname,
        'test_type': test_type,
        'random_seed': random.randint(0, 1000000),
        'device_type': device_type,
        'vlttng_cmd': vlttng_cmd,
        'vlttng_path': vlttng_path,
        'lttng_version_string': lttng_version_string,
        'kernel_url': args.kernel,
        'nfsrootfs_url': nfsrootfs,
        'lttng_modules_url': args.lmodule,
        'jenkins_build_id': args.build_id,
        'kprobe_round_nb': 10,
    }

    render = jinja_template.render(context)

    print('Job to be submitted:')

    print(render)

    if args.debug:
        return 0

    server = xmlrpc.client.ServerProxy(
        'http://%s:%s@%s/RPC2' % (USERNAME, lava_api_key, HOSTNAME)
    )

    jobid = _submit_job(server, render, send_retry_limit)
    if jobid is None:
        # Early exit when the maximum number of retry is reached.
        return -1

    print('Lava jobid:{}'.format(jobid))
    print('Lava job URL: http://{}/scheduler/job/{}'.format(HOSTNAME, jobid))

    jobstatus = _wait_for_job_end(server, jobid)
    print('Job ended with {} status.'.format(jobstatus))

    if jobstatus != 'Finished':
        return -1

    if test_type in (TestType.kvm_tests, TestType.baremetal_tests):
        print_test_output(server, jobid)

    passed, failed = check_job_all_test_cases_state_count(server, jobid)
    print('With {} passed and {} failed Lava test cases.'.format(passed, failed))

    if failed != 0:
        return -1

    return 0
328
f5f36c68 329
878b4840
JR
if __name__ == "__main__":
    # The value returned by main() becomes the exit status of the process.
    exit_status = main()
    sys.exit(exit_status)
This page took 0.046969 seconds and 4 git commands to generate.