#!/usr/bin/env python
#-------------------------------------------------------------------------------------------------------
# Copyright (C) Microsoft. All rights reserved.
# Licensed under the MIT license. See LICENSE.txt file in the project root for full license information.
#-------------------------------------------------------------------------------------------------------

from __future__ import print_function
from datetime import datetime
from multiprocessing import Pool, Manager
from threading import Timer
import sys
import os
import subprocess as SP
import traceback
import argparse
import xml.etree.ElementTree as ET
import re
import time

# handle command line args
parser = argparse.ArgumentParser(
    description='ChakraCore *nix Test Script',
    formatter_class=argparse.RawDescriptionHelpFormatter,
    epilog='''\
Samples:

test all folders:
    runtests.py

test only Array:
    runtests.py Array

test a single file:
    runtests.py Basics/hello.js
''')

parser.add_argument('folders', metavar='folder', nargs='*',
                    help='folder subset to run tests')
parser.add_argument('-b', '--binary', metavar='bin', help='ch full path')
parser.add_argument('-d', '--debug', action='store_true',
                    help='use debug build')
parser.add_argument('-t', '--test', action='store_true', help='use test build')
parser.add_argument('--include-slow', action='store_true',
                    help='include slow tests')
parser.add_argument('--only-slow', action='store_true',
                    help='run only slow tests')
parser.add_argument('--nightly', action='store_true',
                    help='run as nightly tests')
parser.add_argument('--tag', nargs='*',
                    help='select tests with given tags')
parser.add_argument('--not-tag', nargs='*',
                    help='exclude tests with given tags')
parser.add_argument('--timeout', type=int, default=60,
                    help='test timeout (default 60 seconds)')
parser.add_argument('-l', '--logfile', metavar='logfile', default=None,
                    help='file to log results to')
parser.add_argument('--x86', action='store_true', help='use x86 build')
parser.add_argument('--x64', action='store_true', help='use x64 build')
args = parser.parse_args()

test_root = os.path.dirname(os.path.realpath(__file__))
repo_root = os.path.dirname(test_root)

# arch: x86, x64
arch = 'x86' if args.x86 else ('x64' if args.x64 else None)
if arch is None:
    arch = os.environ.get('_BuildArch', 'x86')
if sys.platform != 'win32':
    arch = 'x64'    # xplat: hard code arch == x64
arch_alias = 'amd64' if arch == 'x64' else None

# flavor: debug, test, release
type_flavor = {'chk': 'Debug', 'test': 'Test', 'fre': 'Release'}
flavor = 'Debug' if args.debug else ('Test' if args.test else None)
if flavor is None:
    print("ERROR: Test build target wasn't defined.")
    print("Try '-t' (test build) or '-d' (debug build).")
    sys.exit(1)
flavor_alias = 'chk' if flavor == 'Debug' else 'fre'

# binary: full ch path
binary = args.binary
if binary is None:
    if sys.platform == 'win32':
        binary = 'Build/VcBuild/bin/{}_{}/ch.exe'.format(arch, flavor)
    else:
        binary = 'BuildLinux/{0}/ch'.format(flavor)
    binary = os.path.join(repo_root, binary)
if not os.path.isfile(binary):
    print('{} not found. Did you run ./build.sh already?'.format(binary))
    sys.exit(1)

# global tags/not_tags
tags = set(args.tag or [])
not_tags = set(args.not_tag or []).union(['fail', 'exclude_' + arch])

if arch_alias:
    not_tags.add('exclude_' + arch_alias)
if flavor_alias:
    not_tags.add('exclude_' + flavor_alias)
if args.only_slow:
    tags.add('Slow')
elif not args.include_slow:
    not_tags.add('Slow')
not_tags.add('exclude_nightly' if args.nightly else 'nightly')

# xplat: temp hard coded to exclude unsupported tests
if sys.platform != 'win32':
    not_tags.add('exclude_xplat')
    not_tags.add('Intl')
    not_tags.add('require_backend')
    not_tags.add('require_debugger')
if sys.platform == 'darwin':
    not_tags.add('exclude_mac')
not_compile_flags = set(['-simdjs']) \
    if sys.platform != 'win32' else None

# use tags/not_tags/not_compile_flags as case-insensitive
def lower_set(s):
    return set([x.lower() for x in s] if s else [])

tags = lower_set(tags)
not_tags = lower_set(not_tags)
not_compile_flags = lower_set(not_compile_flags)

# split tags text into tags set
_empty_set = set()
def split_tags(text):
    return set(x.strip() for x in text.lower().split(',')) if text \
        else _empty_set

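# Example (illustrative): split_tags('Slow, exclude_x64') returns
# {'slow', 'exclude_x64'}; None or '' returns the shared _empty_set.
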
class LogFile(object):
    def __init__(self, log_file_path=None):
        self.file = None

        if log_file_path is None:
            # Set up the log file paths
            # Make sure the right directory exists and the log file doesn't
            log_file_name = "testrun.{0}{1}.log".format(arch, flavor)
            log_file_directory = os.path.join(repo_root, "test", "logs")

            if not os.path.exists(log_file_directory):
                os.mkdir(log_file_directory)

            self.log_file_path = os.path.join(log_file_directory, log_file_name)

            if os.path.exists(self.log_file_path):
                os.remove(self.log_file_path)
        else:
            self.log_file_path = log_file_path

        self.file = open(self.log_file_path, "w")

    def log(self, args):
        self.file.write(args)

    def __del__(self):
        if self.file is not None:
            self.file.close()

if __name__ == '__main__':
    log_file = LogFile(args.logfile)

def log_message(msg=""):
    log_file.log(msg + "\n")

def print_and_log(msg=""):
    print(msg)
    log_message(msg)

# remove carriage returns at end of line to avoid platform difference
def normalize_new_line(text):
    return re.sub(b'[\r]+\n', b'\n', text)

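# Example (illustrative): normalize_new_line(b'pass\r\n') == b'pass\n'
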
# A test simply contains a collection of test attributes.
# Misc attributes added by test run:
#   filename        full path of test file
#   elapsed_time    elapsed time when running the test
#
class Test(dict):
    __setattr__ = dict.__setitem__
    __delattr__ = dict.__delitem__

    # support dot syntax for normal attribute access
    def __getattr__(self, key):
        return super(Test, self).__getattr__(key) if key.startswith('__') \
            else self.get(key)

    # mark start of this test run, to compute elapsed_time
    def start(self):
        self.start_time = datetime.now()

    # mark end of this test run, compute elapsed_time
    def done(self):
        if not self.elapsed_time:
            self.elapsed_time = (datetime.now() - self.start_time)\
                                    .total_seconds()

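# Example (illustrative) of the dict/attribute duality:
#   t = Test(folder='Array', files='foo.js')
#   t.files    -> 'foo.js'  (attribute reads fall back to dict.get)
#   t.baseline -> None      (missing keys read as None instead of raising)
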
# records pass_count/fail_count
class PassFailCount(object):
    def __init__(self):
        self.pass_count = 0
        self.fail_count = 0

    def __str__(self):
        return 'passed {}, failed {}'.format(self.pass_count, self.fail_count)

    def total_count(self):
        return self.pass_count + self.fail_count

# records total and individual folder's pass_count/fail_count
class TestResult(PassFailCount):
    def __init__(self):
        super(self.__class__, self).__init__()
        self.folders = {}

    def _get_folder_result(self, folder):
        r = self.folders.get(folder)
        if not r:
            r = PassFailCount()
            self.folders[folder] = r
        return r

    def log(self, filename, fail=False):
        folder = os.path.basename(os.path.dirname(filename))
        r = self._get_folder_result(folder)
        if fail:
            r.fail_count += 1
            self.fail_count += 1
        else:
            r.pass_count += 1
            self.pass_count += 1

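# Example (illustrative): TestResult().log('/tests/Array/a.js') bumps both the
# overall pass_count and the per-folder count under folders['Array'].
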
# test variants:
#   interpreted: -maxInterpretCount:1 -maxSimpleJitRunCount:1 -bgjit-
#   dynapogo: -forceNative -off:simpleJit -bgJitDelay:0
class TestVariant(object):
    def __init__(self, name, compile_flags=[]):
        self.name = name
        self.compile_flags = \
            ['-WERExceptionSupport', '-ExtendedErrorStackForTestHost',
             '-BaselineMode'] + compile_flags
        self.tags = tags.copy()
        self.not_tags = not_tags.union(
            ['{}_{}'.format(x, name) for x in ('fails', 'exclude')])

        self.msg_queue = Manager().Queue()  # messages from multi processes
        self.test_result = TestResult()
        self._print_lines = []  # _print lines buffer
        self._last_len = 0

    # check if this test variant should run a given test
    def _should_test(self, test):
        tags = split_tags(test.get('tags'))
        if not tags.isdisjoint(self.not_tags):
            return False
        if self.tags and not self.tags.issubset(tags):
            return False
        if not_compile_flags:   # exclude unsupported compile-flags if any
            flags = test.get('compile-flags')
            if flags and \
                    not not_compile_flags.isdisjoint(flags.lower().split()):
                return False
        return True

    # print output from multi-process run, to be sent with result message
    def _print(self, line):
        self._print_lines.append(str(line))

    # queue a test result from multi-process runs
    def _log_result(self, test, fail):
        output = '\n'.join(self._print_lines)  # collect buffered _print output
        self._print_lines = []
        self.msg_queue.put((test.filename, fail, test.elapsed_time, output))

    # (on main process) process one queued message
    def _process_msg(self, msg):
        filename, fail, elapsed_time, output = msg
        self.test_result.log(filename, fail=fail)
        line = '[{}/{} {:4.2f}] {} -> {}'.format(
            self.test_result.total_count(),
            self.test_count,
            elapsed_time,
            'Failed' if fail else 'Passed',
            self._short_name(filename))
        # pad with spaces to erase leftovers of a longer previous line, then
        # overwrite the progress line in place ('\r') for passes and keep the
        # line ('\n') for failures
        padding = self._last_len - len(line)
        print(line + ' ' * padding, end='\n' if fail else '\r')
        log_message(line)
        self._last_len = len(line) if not fail else 0
        if len(output) > 0:
            print_and_log(output)

    # get a shorter test file path for display only
    def _short_name(self, filename):
        folder = os.path.basename(os.path.dirname(filename))
        return os.path.join(folder, os.path.basename(filename))

    # (on main process) wait and process one queued message
    def _process_one_msg(self):
        self._process_msg(self.msg_queue.get())

    # log a failed test with details
    def _show_failed(self, test, flags, exit_code, output,
                     expected_output=None, timedout=False):
        if timedout:
            self._print('ERROR: Test timed out!')
        self._print('{} {} {}'.format(binary, ' '.join(flags), test.filename))
        if expected_output is None or timedout:
            self._print("\nOutput:")
            self._print("----------------------------")
            self._print(output)
            self._print("----------------------------")
        else:
            lst_output = output.split(b'\n')
            lst_expected = expected_output.split(b'\n')
            ln = min(len(lst_output), len(lst_expected))
            for i in range(0, ln):
                if lst_output[i] != lst_expected[i]:
                    self._print("Output: (at line " + str(i) + ")")
                    self._print("----------------------------")
                    self._print(lst_output[i])
                    self._print("----------------------------")
                    self._print("Expected Output:")
                    self._print("----------------------------")
                    self._print(lst_expected[i])
                    self._print("----------------------------")
                    break

        self._print("exit code: {}".format(exit_code))
        self._log_result(test, fail=True)

    # temp: try to find the real file name on disk if there is a case mismatch
    def _check_file(self, folder, filename):
        path = os.path.join(folder, filename)
        if os.path.isfile(path):
            return path  # file exists on disk

        filename_lower = filename.lower()
        files = os.listdir(folder)
        for i in range(len(files)):
            if files[i].lower() == filename_lower:
                self._print('\nWARNING: {} should be {}\n'.format(
                    path, files[i]))
                return os.path.join(folder, files[i])

        # can't find the file, just return the path and let it error out
        return path

    # run one test under this variant
    def test_one(self, test):
        try:
            test.start()
            self._run_one_test(test)
        except Exception:
            test.done()
            self._print(traceback.format_exc())
            self._log_result(test, fail=True)

    # internally perform one test run
    def _run_one_test(self, test):
        folder = test.folder
        js_file = test.filename = self._check_file(folder, test.files)
        js_output = b''

        working_path = os.path.dirname(js_file)

        flags = test.get('compile-flags')
        flags = self.compile_flags + (flags.split() if flags else [])
        cmd = [binary] + flags + [os.path.basename(js_file)]

        test.start()
        proc = SP.Popen(cmd, stdout=SP.PIPE, stderr=SP.STDOUT, cwd=working_path)

        # kill the child process, and remember that we did so, if it runs
        # longer than the allowed timeout
        timeout_data = [proc, False]
        def timeout_func(timeout_data):
            timeout_data[0].kill()
            timeout_data[1] = True
        timeout = test.get('timeout', args.timeout)  # test override or default
        timer = Timer(timeout, timeout_func, [timeout_data])
        try:
            timer.start()
            js_output = normalize_new_line(proc.communicate()[0])
            exit_code = proc.wait()
        finally:
            timer.cancel()
        test.done()

        # shared _show_failed args
        fail_args = {'test': test, 'flags': flags,
                     'exit_code': exit_code, 'output': js_output}

        # check timed out
        if timeout_data[1]:
            return self._show_failed(timedout=True, **fail_args)

        # check ch failed
        if exit_code != 0:
            return self._show_failed(**fail_args)

        # check output
        if 'baseline' not in test:
            # output lines must be 'pass' or 'passed' or empty
            lines = (line.lower() for line in js_output.split(b'\n'))
            if any(line != b'' and line != b'pass' and line != b'passed'
                   for line in lines):
                return self._show_failed(**fail_args)
        else:
            baseline = test.get('baseline')
            if baseline:
                # perform baseline comparison
                baseline = self._check_file(working_path, baseline)
                with open(baseline, 'rb') as bs_file:
                    baseline_output = bs_file.read()

                # Cleanup carriage return
                # todo: remove carriage return at the end of the line
                #       or better fix ch to output same on all platforms
                expected_output = normalize_new_line(baseline_output)

                if expected_output != js_output:
                    return self._show_failed(
                        expected_output=expected_output, **fail_args)

        # passed
        self._log_result(test, fail=False)

    # run tests under this variant, using given multiprocessing Pool
    def run(self, tests, pool):
        print_and_log('\n############# Starting {} variant #############'
                      .format(self.name))
        if self.tags:
            print_and_log('  tags: {}'.format(self.tags))
        for x in self.not_tags:
            print_and_log('  exclude: {}'.format(x))
        print_and_log()

        # filter tests to run
        tests = [x for x in tests if self._should_test(x)]
        self.test_count = len(tests)

        # run tests in parallel: map_async dispatches the tests to the pool,
        # while the main process drains the result queue until every filtered
        # test has reported back
        result = pool.map_async(run_one, [(self, test) for test in tests])
        while self.test_result.total_count() != self.test_count:
            self._process_one_msg()

    # print test result summary
    def print_summary(self):
        print_and_log('\n######## Logs for {} variant ########'
                      .format(self.name))
        for folder, result in sorted(self.test_result.folders.items()):
            print_and_log('{}: {}'.format(folder, result))
        print_and_log("----------------------------")
        print_and_log('Total: {}'.format(self.test_result))

# global run one test function for multiprocessing, used by TestVariant
def run_one(data):
    try:
        variant, test = data
        variant.test_one(test)
    except Exception:
        print('ERROR: Unhandled exception!!!')
        traceback.print_exc()

# record folder/tags info from test_root/rlexedirs.xml
class FolderTags(object):
    def __init__(self):
        xmlpath = os.path.join(test_root, 'rlexedirs.xml')
        try:
            xml = ET.parse(xmlpath).getroot()
        except IOError:
            print_and_log('ERROR: failed to read {}'.format(xmlpath))
            exit(-1)

        self._folder_tags = {}
        for x in xml:
            d = x.find('default')
            key = d.find('files').text.lower()  # avoid case mismatch
            tags = d.find('tags')
            self._folder_tags[key] = \
                split_tags(tags.text) if tags is not None else _empty_set

    # check if should test a given folder
    def should_test(self, folder):
        key = os.path.basename(os.path.normpath(folder)).lower()
        ftags = self._folder_tags.get(key)
        # folder must be listed in rlexedirs.xml and not excluded by global not_tags
        return ftags is not None and ftags.isdisjoint(not_tags)

# load all tests in folder using rlexe.xml file
def load_tests(folder, file):
    try:
        xmlpath = os.path.join(folder, 'rlexe.xml')
        xml = ET.parse(xmlpath).getroot()
    except IOError:
        return []

    def test_override(condition, check_tag, check_value, test):
        target = condition.find(check_tag)
        if target is not None and target.text == check_value:
            for override in condition.find('override'):
                test[override.tag] = override.text

    def load_test(testXml):
        test = Test(folder=folder)
        for c in testXml.find('default'):
            if c.tag == 'timeout':                   # timeout seconds
                test[c.tag] = int(c.text)
            elif c.tag == 'tags' and c.tag in test:  # merge multiple <tags>
                test[c.tag] = test[c.tag] + ',' + c.text
            else:
                test[c.tag] = c.text

        condition = testXml.find('condition')
        if condition is not None:
            test_override(condition, 'target', arch_alias, test)

        return test

    tests = [load_test(x) for x in xml]
    if file is not None:
        tests = [x for x in tests if x.files == file]
        if len(tests) == 0 and is_jsfile(file):
            tests = [Test(folder=folder, files=file, baseline='')]
    return tests

def is_jsfile(path):
    return os.path.splitext(path)[1] == '.js'

def main():
    # By default run all tests
    if len(args.folders) == 0:
        files = (os.path.join(test_root, x) for x in os.listdir(test_root))
        args.folders = [f for f in sorted(files) if not os.path.isfile(f)]

    # Set the right timezone, the tests need Pacific Standard Time
    os.environ['TZ'] = 'US/Pacific'
    time.tzset()

    # load all tests
    tests = []
    folder_tags = FolderTags()
    for path in args.folders:
        if os.path.isfile(path):
            folder, file = os.path.dirname(path), os.path.basename(path)
        else:
            folder, file = path, None
        if folder_tags.should_test(folder):
            tests += load_tests(folder, file)

    # test variants
    variants = [
        TestVariant('interpreted', [
            '-maxInterpretCount:1', '-maxSimpleJitRunCount:1', '-bgjit-'])
    ]

    # run each variant
    # TODO: forcing the multiprocessing Pool to a single process until we have
    #       support for a 'sequential' tag
    pool = Pool(1)
    start_time = datetime.now()
    for variant in variants:
        variant.run(tests, pool)
    elapsed_time = datetime.now() - start_time

    # print summary
    for variant in variants:
        variant.print_summary()

    print()
    failed = any(variant.test_result.fail_count > 0 for variant in variants)
    print('[{}] {}'.format(
        str(elapsed_time), 'Success!' if not failed else 'Failed!'))
    return 1 if failed else 0

if __name__ == '__main__':
    sys.exit(main())

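# Typical invocation on Linux/macOS (see the argparse epilog above), assuming
# a Test-flavor build already exists from ./build.sh:
#   ./runtests.py -t                  # run all folders against the Test build
#   ./runtests.py -t Basics/hello.js  # run a single test file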