OILS / test / sh_spec.py
1#!/usr/bin/env python2
2from __future__ import print_function
3"""
4sh_spec.py -- Test framework to compare shells.
5
6Assertion help:
7 stdout: A single line of expected stdout. Newline is implicit.
8 stdout-json: JSON-encoded string. Use for the empty string (no newline),
9 for unicode chars, etc.
10
11 stderr: Ditto for stderr stream.
12 status: Expected shell return code. If not specified, the case must exit 0.
13
14Results:
15 PASS - we got the ideal, expected value
16 OK - we got a value that was not ideal, but expected
17 For OSH, this is usually behavior that was defined to be different
18 N-I - Not implemented (e.g. $''). Assertions are still checked (in case it
19 starts working)
20 BUG - we verified the value of a known bug
21 FAIL - we got an unexpected value. If the implementation can't be changed,
22 it should be converted to BUG or OK. Otherwise it should be made to
23 PASS.
24
25NOTE: The difference between OK and BUG is a matter of judgement. If the ideal
26behavior is a compile-time error (code 2), a runtime error is generally OK.
27
28If ALL shells agree on a broken behavior, they are all marked OK (but our
29implementation will be PASS). But if the behavior is NOT POSIX-compliant, then
30it is marked BUG.
31
32If one shell disagrees with others, that is generally a BUG.
33
34Example test case:
35
36#### hello and fail
37echo hello
38echo world
39exit 1
40## status: 1
41#
42# ignored comment
43#
44## STDOUT:
45hello
46world
47## END
48
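Another example, for illustration only (the shell name and expected values here
are hypothetical), showing a multi-line STDOUT block plus a per-shell override
with a qualifier:

#### some feature
some-command
## STDOUT:
expected output
## END
## N-I dash stdout-json: ""
## N-I dash status: 2
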
49"""
50
51import collections
52import cgi
53import cStringIO
54import errno
55import json
56import optparse
57import os
58import pprint
59import re
60import shutil
61import subprocess
62import sys
63
64from test import spec_lib
65from doctools import html_head
66
67log = spec_lib.log
68
69# Magic strings for other variants of OSH.
70
71# NOTE: osh_ALT is usually _bin/osh -- the release binary.
72# It would be better to rename these osh-cpython and osh-ovm. Have the concept
73# of a suffix?
74
75OSH_CPYTHON = ('osh', 'osh-dbg')
76OTHER_OSH = ('osh_ALT', )
77
78YSH_CPYTHON = ('ysh', 'ysh-dbg')
79OTHER_YSH = ('oil_ALT', )
80
81# For now, only count the Oils CPython failures. TODO: the spec-cpp job should
82# assert the osh-cpp and ysh-cpp deltas.
83OTHER_OILS = OTHER_OSH + OTHER_YSH + ('osh-cpp', 'ysh-cpp')
84
85
86class ParseError(Exception):
87 pass
88
89
90# EXAMPLES:
91## stdout: foo
92## stdout-json: ""
93#
94 # In other words, a line is either (name, value) or (qualifier, shells, name, value)
95
96KEY_VALUE_RE = re.compile(
97 r'''
98 [#][#] \s+
99 # optional prefix with qualifier and shells
100 (?: (OK|BUG|N-I) \s+ ([\w+/]+) \s+ )?
101 ([\w\-]+) # key
102 :
103 \s* (.*) # value
104''', re.VERBOSE)
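# For example, '## OK bash/mksh status: 2' yields the groups
# ('OK', 'bash/mksh', 'status', '2'), while '## stdout: foo' yields
# (None, None, 'stdout', 'foo').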
105
106END_MULTILINE_RE = re.compile(r'''
107 [#][#] \s+ END
108''', re.VERBOSE)
109
110# Line types
111TEST_CASE_BEGIN = 0 # Starts with ####
112KEY_VALUE = 1 # Metadata
113KEY_VALUE_MULTILINE = 2 # STDOUT STDERR
114END_MULTILINE = 3 # STDOUT STDERR
115PLAIN_LINE = 4 # Uncommented
116EOF = 5
117
118LEX_OUTER = 0 # Ignore blank lines, e.g. for separating cases
119LEX_RAW = 1 # Blank lines are significant
120
121
122class Tokenizer(object):
123 """Modal lexer!"""
124
125 def __init__(self, f):
126 self.f = f
127
128 self.cursor = None
129 self.line_num = 0
130
131 self.next()
132
133 def _ClassifyLine(self, line, lex_mode):
134 if not line: # empty
135 return self.line_num, EOF, ''
136
137 if lex_mode == LEX_OUTER and not line.strip():
138 return None
139
140 if line.startswith('####'):
141 desc = line[4:].strip()
142 return self.line_num, TEST_CASE_BEGIN, desc
143
144 m = KEY_VALUE_RE.match(line)
145 if m:
146 qualifier, shells, name, value = m.groups()
147 # HACK: Expected data should have the newline.
148 if name in ('stdout', 'stderr'):
149 value += '\n'
150
151 if name in ('STDOUT', 'STDERR'):
152 token_type = KEY_VALUE_MULTILINE
153 else:
154 token_type = KEY_VALUE
155 return self.line_num, token_type, (qualifier, shells, name, value)
156
157 m = END_MULTILINE_RE.match(line)
158 if m:
159 return self.line_num, END_MULTILINE, None
160
161 # If it starts with ##, it should be metadata. This finds some typos.
162 if line.lstrip().startswith('##'):
163 raise RuntimeError('Invalid ## line %r' % line)
164
165 if line.lstrip().startswith('#'): # Ignore comments
166 return None # try again
167
168 # Non-empty line that doesn't start with '#'
169 # NOTE: We need the original line to test the whitespace sensitive <<-.
170 # And we need rstrip because we add newlines back below.
171 return self.line_num, PLAIN_LINE, line
172
173 def next(self, lex_mode=LEX_OUTER):
174 """Raises StopIteration when exhausted."""
175 while True:
176 line = self.f.readline()
177 self.line_num += 1
178
179 tok = self._ClassifyLine(line, lex_mode)
180 if tok is not None:
181 break
182
183 self.cursor = tok
184 return self.cursor
185
186 def peek(self):
187 return self.cursor
188
189
190def AddMetadataToCase(case, qualifier, shells, name, value, line_num):
191 shells = shells.split('/') # bash/dash/mksh
192 for shell in shells:
193 if shell not in case:
194 case[shell] = {}
195
196 # Check for a duplicate specification
197 name_without_type = re.sub(r'-(json|repr)$', '', name)
198 if (name_without_type in case[shell] or
199 name_without_type + '-json' in case[shell] or
200 name_without_type + '-repr' in case[shell]):
201 raise ParseError('Line %d: duplicate spec %r for %r' %
202 (line_num, name, shell))
203
204 # Check for an inconsistent qualifier
205 if 'qualifier' in case[shell] and qualifier != case[shell]['qualifier']:
206 raise ParseError(
207 'Line %d: inconsistent qualifier %r is specified for %r, '
208 'but %r was previously specified. '
209 % (line_num, qualifier, shell, case[shell]['qualifier']))
210
211 case[shell][name] = value
212 case[shell]['qualifier'] = qualifier
213
214
215# Format of a test script.
216#
217 # -- Code is either literal lines, or a commented-out '## code:' value.
218# code = PLAIN_LINE*
219# | '## code:' VALUE
220#
221# -- Key value pairs can be single- or multi-line
222# key_value = '##' KEY ':' VALUE
223# | KEY_VALUE_MULTILINE PLAIN_LINE* END_MULTILINE
224#
225# -- Description, then key-value pairs surrounding code.
226# test_case = '####' DESC
227# key_value*
228# code
229# key_value*
230#
231 # -- There should be a blank line after each test case. Leading comments
232 # -- and code are OK.
233#
234# test_file =
235# key_value* -- file level metadata
236# (test_case '\n')*
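#
# -- For example, a case's code can be given entirely through the '## code:'
# -- key-value form instead of plain lines (ParseTestCase checks for this):
# --
# --   #### one-liner written as metadata
# --   ## code: echo hi
# --   ## stdout: hi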
237
238
239def ParseKeyValue(tokens, case):
240 """Parse commented-out metadata in a test case.
241
242 The metadata must be contiguous.
243
244 Args:
245 tokens: Tokenizer
246 case: dictionary to add to
247 """
248 while True:
249 line_num, kind, item = tokens.peek()
250
251 if kind == KEY_VALUE_MULTILINE:
252 qualifier, shells, name, empty_value = item
253 if empty_value:
254 raise ParseError(
255 'Line %d: got value %r for %r, but the value should be on the '
256 'following lines' % (line_num, empty_value, name))
257
258 value_lines = []
259 while True:
260 tokens.next(lex_mode=LEX_RAW) # empty lines aren't skipped
261 _, kind2, item2 = tokens.peek()
262 if kind2 != PLAIN_LINE:
263 break
264 value_lines.append(item2)
265
266 value = ''.join(value_lines)
267
268 name = name.lower() # STDOUT -> stdout
269 if qualifier:
270 AddMetadataToCase(case, qualifier, shells, name, value,
271 line_num)
272 else:
273 case[name] = value
274
275 # END token is optional.
276 if kind2 == END_MULTILINE:
277 tokens.next()
278
279 elif kind == KEY_VALUE:
280 qualifier, shells, name, value = item
281
282 if qualifier:
283 AddMetadataToCase(case, qualifier, shells, name, value,
284 line_num)
285 else:
286 case[name] = value
287
288 tokens.next()
289
290 else: # Unknown token type
291 break
292
293
294def ParseCodeLines(tokens, case):
295 """Parse uncommented code in a test case."""
296 _, kind, item = tokens.peek()
297 if kind != PLAIN_LINE:
298 raise ParseError('Expected a line of code (got %r, %r)' % (kind, item))
299 code_lines = []
300 while True:
301 _, kind, item = tokens.peek()
302 if kind != PLAIN_LINE:
303 case['code'] = ''.join(code_lines)
304 return
305 code_lines.append(item)
306 tokens.next(lex_mode=LEX_RAW)
307
308
309def ParseTestCase(tokens):
310 """Parse a single test case and return it.
311
312 If at EOF, return None.
313 """
314 line_num, kind, item = tokens.peek()
315 if kind == EOF:
316 return None
317
318 if kind != TEST_CASE_BEGIN:
319 raise RuntimeError("line %d: Expected TEST_CASE_BEGIN, got %r" %
320 (line_num, [kind, item]))
321
322 tokens.next()
323
324 case = {'desc': item, 'line_num': line_num}
325
326 ParseKeyValue(tokens, case)
327
328 # For broken code
329 if 'code' in case: # Got it through a key value pair
330 return case
331
332 ParseCodeLines(tokens, case)
333 ParseKeyValue(tokens, case)
334
335 return case
336
337
338_META_FIELDS = [
339 'our_shell',
340 'compare_shells',
341 'suite',
342 'tags',
343 'oils_failures_allowed',
344 'oils_cpp_failures_allowed',
345]
346
347
348def ParseTestFile(test_file, tokens):
349 """
350 test_file: Only for error message
351 """
352 file_metadata = {}
353 test_cases = []
354
355 try:
356 # Skip over the header. Setup code could go here, though we would have to
357 # execute it for every case.
358 while True:
359 line_num, kind, item = tokens.peek()
360 if kind != KEY_VALUE:
361 break
362
363 qualifier, shells, name, value = item
364 if qualifier is not None:
365 raise RuntimeError('Invalid qualifier in spec file metadata')
366 if shells is not None:
367 raise RuntimeError('Invalid shells in spec file metadata')
368
369 file_metadata[name] = value
370
371 tokens.next()
372
373 while True: # Loop over cases
374 test_case = ParseTestCase(tokens)
375 if test_case is None:
376 break
377 test_cases.append(test_case)
378
379 except StopIteration:
380 raise RuntimeError('Unexpected EOF parsing test cases')
381
382 for name in file_metadata:
383 if name not in _META_FIELDS:
384 raise RuntimeError('Invalid file metadata %r in %r' %
385 (name, test_file))
386
387 return file_metadata, test_cases
388
389
390def CreateStringAssertion(d, key, assertions, qualifier=False):
391 found = False
392
393 exp = d.get(key)
394 if exp is not None:
395 a = EqualAssertion(key, exp, qualifier=qualifier)
396 assertions.append(a)
397 found = True
398
399 exp_json = d.get(key + '-json')
400 if exp_json is not None:
401 exp = json.loads(exp_json, encoding='utf-8')
402 a = EqualAssertion(key, exp, qualifier=qualifier)
403 assertions.append(a)
404 found = True
405
406 # For testing invalid unicode
407 exp_repr = d.get(key + '-repr')
408 if exp_repr is not None:
409 exp = eval(exp_repr)
410 a = EqualAssertion(key, exp, qualifier=qualifier)
411 assertions.append(a)
412 found = True
413
414 return found
415
416
417def CreateIntAssertion(d, key, assertions, qualifier=False):
418 exp = d.get(key) # expected
419 if exp is not None:
420 # For now, turn it into int
421 a = EqualAssertion(key, int(exp), qualifier=qualifier)
422 assertions.append(a)
423 return True
424 return False
425
426
427def CreateAssertions(case, sh_label):
428 """Given a raw test case and a shell label, create EqualAssertion instances
429 to run."""
430 assertions = []
431
432 # Whether we found assertions
433 stdout = False
434 stderr = False
435 status = False
436
437 # So the assertions are exactly the same for osh and osh_ALT
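 # e.g. a '## N-I osh ...' annotation applies to osh, osh-dbg, osh_ALT, and
 # osh-cpp alike, since all of those labels start with 'osh'.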
438
439 if sh_label.startswith('osh'):
440 case_sh = 'osh'
441 elif sh_label.startswith('bash'):
442 case_sh = 'bash'
443 else:
444 case_sh = sh_label
445
446 if case_sh in case:
447 q = case[case_sh]['qualifier']
448 if CreateStringAssertion(case[case_sh],
449 'stdout',
450 assertions,
451 qualifier=q):
452 stdout = True
453 if CreateStringAssertion(case[case_sh],
454 'stderr',
455 assertions,
456 qualifier=q):
457 stderr = True
458 if CreateIntAssertion(case[case_sh], 'status', assertions,
459 qualifier=q):
460 status = True
461
462 if not stdout:
463 CreateStringAssertion(case, 'stdout', assertions)
464 if not stderr:
465 CreateStringAssertion(case, 'stderr', assertions)
466 if not status:
467 if 'status' in case:
468 CreateIntAssertion(case, 'status', assertions)
469 else:
470 # If the user didn't specify a 'status' assertion, assert that the exit
471 # code is 0.
472 a = EqualAssertion('status', 0)
473 assertions.append(a)
474
475 no_traceback = SubstringAssertion('stderr', 'Traceback (most recent')
476 assertions.append(no_traceback)
477
478 #print 'SHELL', shell
479 #pprint.pprint(case)
480 #print(assertions)
481 return assertions
482
483
484class Result(object):
485 """Result of an stdout/stderr/status assertion or of a (case, shell) cell.
486
487 Order is important: the result of a cell is the minimum of the results of
488 each assertion.
489 """
490 TIMEOUT = 0 # ONLY a cell result, not an assertion result
491 FAIL = 1
492 BUG = 2
493 NI = 3
494 OK = 4
495 PASS = 5
496
497 length = 6 # for loops
498
499
500def QualifierToResult(qualifier):
501 # type: (str) -> Result
502 if qualifier == 'BUG': # equal, but known bad
503 return Result.BUG
504 if qualifier == 'N-I': # equal, and known UNIMPLEMENTED
505 return Result.NI
506 if qualifier == 'OK': # equal, but ok (not ideal)
507 return Result.OK
508 return Result.PASS # ideal behavior
509
510
511class EqualAssertion(object):
512 """Check that two values are equal."""
513
514 def __init__(self, key, expected, qualifier=None):
515 self.key = key
516 self.expected = expected # expected value
517 self.qualifier = qualifier # 'OK', 'BUG', or 'N-I' if this was a special case
518
519 def __repr__(self):
520 return '<EqualAssertion %s == %r>' % (self.key, self.expected)
521
522 def Check(self, shell, record):
523 actual = record[self.key]
524 if actual != self.expected:
525 if len(str(self.expected)) < 40:
526 msg = '[%s %s] Expected %r, got %r' % (shell, self.key,
527 self.expected, actual)
528 else:
529 msg = '''
530[%s %s]
531Expected %r
532Got %r
533''' % (shell, self.key, self.expected, actual)
534
535 # TODO: Make this better and add a flag for it.
536 if 0:
537 import difflib
538 for line in difflib.unified_diff(self.expected,
539 actual,
540 fromfile='expected',
541 tofile='actual'):
542 print(repr(line))
543
544 return Result.FAIL, msg
545
546 return QualifierToResult(self.qualifier), ''
547
548
549class SubstringAssertion(object):
550 """Check that a string like stderr doesn't have a substring."""
551
552 def __init__(self, key, substring):
553 self.key = key
554 self.substring = substring
555
556 def __repr__(self):
557 return '<SubstringAssertion %s == %r>' % (self.key, self.substring)
558
559 def Check(self, shell, record):
560 actual = record[self.key]
561 if self.substring in actual:
562 msg = '[%s %s] Found %r' % (shell, self.key, self.substring)
563 return Result.FAIL, msg
564 return Result.PASS, ''
565
566
567class Stats(object):
568
569 def __init__(self, num_cases, sh_labels):
570 self.counters = collections.defaultdict(int)
571 c = self.counters
572 c['num_cases'] = num_cases
573 c['oils_num_passed'] = 0
574 c['oils_num_failed'] = 0
575 c['oils_cpp_num_failed'] = 0
576 # Number of osh_ALT results that differed from osh.
577 c['oils_ALT_delta'] = 0
578
579 self.by_shell = {}
580 for sh in sh_labels:
581 self.by_shell[sh] = collections.defaultdict(int)
582 self.nonzero_results = collections.defaultdict(int)
583
584 self.tsv_rows = []
585
586 def Inc(self, counter_name):
587 self.counters[counter_name] += 1
588
589 def Get(self, counter_name):
590 return self.counters[counter_name]
591
592 def Set(self, counter_name, val):
593 self.counters[counter_name] = val
594
595 def ReportCell(self, case_num, cell_result, sh_label):
596 self.tsv_rows.append(
597 (str(case_num), sh_label, TEXT_CELLS[cell_result]))
598
599 self.by_shell[sh_label][cell_result] += 1
600 self.nonzero_results[cell_result] += 1
601
602 c = self.counters
603 if cell_result == Result.TIMEOUT:
604 c['num_timeout'] += 1
605 elif cell_result == Result.FAIL:
606 # Special logic: don't count osh_ALT because its failures will be
607 # counted in the delta.
608 if sh_label not in OTHER_OILS:
609 c['num_failed'] += 1
610
611 if sh_label in OSH_CPYTHON + YSH_CPYTHON:
612 c['oils_num_failed'] += 1
613
614 if sh_label in ('osh-cpp', 'ysh-cpp'):
615 c['oils_cpp_num_failed'] += 1
616 elif cell_result == Result.BUG:
617 c['num_bug'] += 1
618 elif cell_result == Result.NI:
619 c['num_ni'] += 1
620 elif cell_result == Result.OK:
621 c['num_ok'] += 1
622 elif cell_result == Result.PASS:
623 c['num_passed'] += 1
624 if sh_label in OSH_CPYTHON + YSH_CPYTHON:
625 c['oils_num_passed'] += 1
626 else:
627 raise AssertionError()
628
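 # WriteTsv writes one long-format row per (case, shell) cell; for example
 # (the shell labels here are illustrative, result text comes from TEXT_CELLS):
 #
 #   case    shell   result
 #   3       bash    pass
 #   3       osh     FAIL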
629 def WriteTsv(self, f):
630 f.write('case\tshell\tresult\n')
631 for row in self.tsv_rows:
632 f.write('\t'.join(row))
633 f.write('\n')
634
635
636PIPE = subprocess.PIPE
637
638
639def RunCases(cases, case_predicate, shells, env, out, opts):
640 """Run a list of test 'cases' for all 'shells' and write output to
641 'out'."""
642 if opts.trace:
643 for _, sh in shells:
644 log('\tshell: %s', sh)
645 print('\twhich $SH: ', end='', file=sys.stderr)
646 subprocess.call(['which', sh])
647
648 #pprint.pprint(cases)
649
650 sh_labels = [sh_label for sh_label, _ in shells]
651
652 out.WriteHeader(sh_labels)
653 stats = Stats(len(cases), sh_labels)
654
655 # Make an environment for each shell. $SH is the path to the shell, so we
656 # can test flags, etc.
657 sh_env = []
658 for _, sh_path in shells:
659 e = dict(env)
660 e[opts.sh_env_var_name] = sh_path
661 sh_env.append(e)
662
663 # Determine which one (if any) is osh-cpython, for comparison against other
664 # shells.
665 osh_cpython_index = -1
666 for i, (sh_label, _) in enumerate(shells):
667 if sh_label in OSH_CPYTHON:
668 osh_cpython_index = i
669 break
670
671 timeout_dir = os.path.abspath('_tmp/spec/timeouts')
672 try:
673 shutil.rmtree(timeout_dir)
674 os.mkdir(timeout_dir)
675 except OSError:
676 pass
677
678 # Now run each case, and print a table.
679 for i, case in enumerate(cases):
680 line_num = case['line_num']
681 desc = case['desc']
682 code = case['code']
683
684 if opts.trace:
685 log('case %d: %s', i, desc)
686
687 if not case_predicate(i, case):
688 stats.Inc('num_skipped')
689 continue
690
691 if opts.do_print:
692 print('#### %s' % case['desc'])
693 print(case['code'])
694 print()
695 continue
696
697 stats.Inc('num_cases_run')
698
699 result_row = []
700
701 for shell_index, (sh_label, sh_path) in enumerate(shells):
702 timeout_file = os.path.join(timeout_dir, '%02d-%s' % (i, sh_label))
703 if opts.timeout:
704 if opts.timeout_bin:
705 # This is what smoosh itself uses. See smoosh/tests/shell_tests.sh
706 # QUIRK: interval can only be a whole number
707 argv = [
708 opts.timeout_bin,
709 '-t',
710 opts.timeout,
711 # Somehow I'm not able to get this timeout file working? I think
712 # it has a bug when using stdin. It waits for the background
713 # process too.
714
715 #'-i', '1',
716 #'-l', timeout_file
717 ]
718 else:
719 # This kills hanging tests properly, but somehow they fail with code
720 # -9?
721 #argv = ['timeout', '-s', 'KILL', opts.timeout]
722
723 # s suffix for seconds
724 argv = ['timeout', opts.timeout + 's']
725 else:
726 argv = []
727 argv.append(sh_path)
728
729 # dash doesn't support -o posix
730 if opts.posix and sh_label != 'dash':
731 argv.extend(['-o', 'posix'])
732
733 if opts.trace:
734 log('\targv: %s', ' '.join(argv))
735
736 case_env = sh_env[shell_index]
737
738 # Unique dir for every test case and shell
739 tmp_base = os.path.normpath(opts.tmp_env) # no . or ..
740 case_tmp_dir = os.path.join(tmp_base, '%02d-%s' % (i, sh_label))
741
742 try:
743 os.makedirs(case_tmp_dir)
744 except OSError as e:
745 if e.errno != errno.EEXIST:
746 raise
747
748 # Some tests assume _tmp exists
749 # TODO: get rid of this in the common case, to save inodes! I guess have
750 # an opt-in setting per FILE, like make_underscore_tmp: true.
751 try:
752 os.mkdir(os.path.join(case_tmp_dir, '_tmp'))
753 except OSError as e:
754 if e.errno != errno.EEXIST:
755 raise
756
757 case_env['TMP'] = case_tmp_dir
758
759 if opts.pyann_out_dir:
760 case_env = dict(case_env)
761 case_env['PYANN_OUT'] = os.path.join(opts.pyann_out_dir,
762 '%d.json' % i)
763
764 try:
765 p = subprocess.Popen(argv,
766 env=case_env,
767 cwd=case_tmp_dir,
768 stdin=PIPE,
769 stdout=PIPE,
770 stderr=PIPE)
771 except OSError as e:
772 print('Error running %r: %s' % (sh_path, e), file=sys.stderr)
773 sys.exit(1)
774
775 p.stdin.write(code)
776
777 actual = {}
778 actual['stdout'], actual['stderr'] = p.communicate()
779
780 actual['status'] = p.wait()
781
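 # GNU coreutils 'timeout' exits with status 124 when the command it runs
 # times out, which is what the check against 124 below relies on.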
782 if opts.timeout_bin and os.path.exists(timeout_file):
783 cell_result = Result.TIMEOUT
784 elif not opts.timeout_bin and actual['status'] == 124:
785 cell_result = Result.TIMEOUT
786 else:
787 messages = []
788 cell_result = Result.PASS
789
790 # TODO: Warn about cases with no assertions? Though the exit code is
791 # always tested.
792 assertions = CreateAssertions(case, sh_label)
793 for a in assertions:
794 result, msg = a.Check(sh_label, actual)
795 # The minimum one wins.
796 # If any failed, then the result is FAIL.
797 # If any are OK, but none are FAIL, the result is OK.
798 cell_result = min(cell_result, result)
799 if msg:
800 messages.append(msg)
801
802 if cell_result != Result.PASS or opts.details:
803 d = (i, sh_label, actual['stdout'], actual['stderr'],
804 messages)
805 out.AddDetails(d)
806
807 result_row.append(cell_result)
808
809 stats.ReportCell(i, cell_result, sh_label)
810
811 if sh_label in OTHER_OSH:
812 # This is only an error if we tried to run ANY OSH.
813 if osh_cpython_index == -1:
814 raise RuntimeError(
815 "Couldn't determine index of osh-cpython")
816
817 other_result = result_row[shell_index]
818 cpython_result = result_row[osh_cpython_index]
819 if other_result != cpython_result:
820 stats.Inc('oils_ALT_delta')
821
822 out.WriteRow(i, line_num, result_row, desc)
823
824 return stats
825
826
827# ANSI color constants
828_RESET = '\033[0;0m'
829_BOLD = '\033[1m'
830
831_RED = '\033[31m'
832_GREEN = '\033[32m'
833_YELLOW = '\033[33m'
834_PURPLE = '\033[35m'
835
836TEXT_CELLS = {
837 Result.TIMEOUT: 'TIME',
838 Result.FAIL: 'FAIL',
839 Result.BUG: 'BUG',
840 Result.NI: 'N-I',
841 Result.OK: 'ok',
842 Result.PASS: 'pass',
843}
844
845ANSI_COLORS = {
846 Result.TIMEOUT: _PURPLE,
847 Result.FAIL: _RED,
848 Result.BUG: _YELLOW,
849 Result.NI: _YELLOW,
850 Result.OK: _YELLOW,
851 Result.PASS: _GREEN,
852}
853
854
855def _AnsiCells():
856 lookup = {}
857 for i in xrange(Result.length):
858 lookup[i] = ''.join([ANSI_COLORS[i], _BOLD, TEXT_CELLS[i], _RESET])
859 return lookup
860
861
862ANSI_CELLS = _AnsiCells()
863
864HTML_CELLS = {
865 Result.TIMEOUT: '<td class="timeout">TIME',
866 Result.FAIL: '<td class="fail">FAIL',
867 Result.BUG: '<td class="bug">BUG',
868 Result.NI: '<td class="n-i">N-I',
869 Result.OK: '<td class="ok">ok',
870 Result.PASS: '<td class="pass">pass',
871}
872
873
874def _ValidUtf8String(s):
875 """Return an arbitrary string as a readable utf-8 string.
876
877 We output utf-8 to either HTML or the console. If we get invalid
878 utf-8 as stdout/stderr (which is very possible), then show the ASCII
879 repr().
880 """
881 try:
882 s.decode('utf-8')
883 return s # it decoded OK
884 except UnicodeDecodeError:
885 return repr(s) # ASCII representation
886
887
888class Output(object):
889
890 def __init__(self, f, verbose):
891 self.f = f
892 self.verbose = verbose
893 self.details = []
894
895 def BeginCases(self, test_file):
896 pass
897
898 def WriteHeader(self, sh_labels):
899 pass
900
901 def WriteRow(self, i, line_num, row, desc):
902 pass
903
904 def EndCases(self, sh_labels, stats):
905 pass
906
907 def AddDetails(self, entry):
908 self.details.append(entry)
909
910 # Helper function
911 def _WriteDetailsAsText(self, details):
912 for case_index, shell, stdout, stderr, messages in details:
913 print('case: %d' % case_index, file=self.f)
914 for m in messages:
915 print(m, file=self.f)
916
917 # Assume the terminal can show utf-8, but we don't want random binary.
918 print('%s stdout:' % shell, file=self.f)
919 print(_ValidUtf8String(stdout), file=self.f)
920
921 print('%s stderr:' % shell, file=self.f)
922 print(_ValidUtf8String(stderr), file=self.f)
923
924 print('', file=self.f)
925
926
927class TeeOutput(object):
928 """For multiple outputs in one run, e.g. HTML and TSV.
929
930 UNUSED
931 """
932
933 def __init__(self, outs):
934 self.outs = outs
935
936 def BeginCases(self, test_file):
937 for out in self.outs:
938 out.BeginCases(test_file)
939
940 def WriteHeader(self, sh_labels):
941 for out in self.outs:
942 out.WriteHeader(sh_labels)
943
944 def WriteRow(self, i, line_num, row, desc):
945 for out in self.outs:
946 out.WriteRow(i, line_num, row, desc)
947
948 def EndCases(self, sh_labels, stats):
949 for out in self.outs:
950 out.EndCases(sh_labels, stats)
951
952 def AddDetails(self, entry):
953 for out in self.outs:
954 out.AddDetails(entry)
955
956
957class TsvOutput(Output):
958 """Write a plain-text TSV file.
959
960 UNUSED since we are outputting LONG format with --tsv-output.
961 """
962
963 def WriteHeader(self, sh_labels):
964 self.f.write('case\tline\t') # case number and line number
965 for sh_label in sh_labels:
966 self.f.write(sh_label)
967 self.f.write('\t')
968 self.f.write('\n')
969
970 def WriteRow(self, i, line_num, row, desc):
971 self.f.write('%3d\t%3d\t' % (i, line_num))
972
973 for result in row:
974 c = TEXT_CELLS[result]
975 self.f.write(c)
976 self.f.write('\t')
977
978 # note: 'desc' could use TSV8, but just ignore it for now
979 #self.f.write(desc)
980 self.f.write('\n')
981
982
983class AnsiOutput(Output):
984
985 def BeginCases(self, test_file):
986 self.f.write('%s\n' % test_file)
987
988 def WriteHeader(self, sh_labels):
989 self.f.write(_BOLD)
990 self.f.write('case\tline\t') # case number and line number
991 for sh_label in sh_labels:
992 self.f.write(sh_label)
993 self.f.write('\t')
994 self.f.write(_RESET)
995 self.f.write('\n')
996
997 def WriteRow(self, i, line_num, row, desc):
998 self.f.write('%3d\t%3d\t' % (i, line_num))
999
1000 for result in row:
1001 c = ANSI_CELLS[result]
1002 self.f.write(c)
1003 self.f.write('\t')
1004
1005 self.f.write(desc)
1006 self.f.write('\n')
1007
1008 if self.verbose:
1009 self._WriteDetailsAsText(self.details)
1010 self.details = []
1011
1012 def _WriteShellSummary(self, sh_labels, stats):
1013 if len(stats.nonzero_results) <= 1: # Skip trivial summaries
1014 return
1015
1016 # Reiterate header
1017 self.f.write(_BOLD)
1018 self.f.write('\t\t')
1019 for sh_label in sh_labels:
1020 self.f.write(sh_label)
1021 self.f.write('\t')
1022 self.f.write(_RESET)
1023 self.f.write('\n')
1024
1025 # Write totals by cell.
1026 for result in sorted(stats.nonzero_results, reverse=True):
1027 self.f.write('\t%s' % ANSI_CELLS[result])
1028 for sh_label in sh_labels:
1029 self.f.write('\t%d' % stats.by_shell[sh_label][result])
1030 self.f.write('\n')
1031
1032 # The bottom row is all the same, but it helps readability.
1033 self.f.write('\ttotal')
1034 for sh_label in sh_labels:
1035 self.f.write('\t%d' % stats.counters['num_cases_run'])
1036 self.f.write('\n')
1037 self.f.write('\n')
1038
1039 def EndCases(self, sh_labels, stats):
1040 print()
1041 self._WriteShellSummary(sh_labels, stats)
1042
1043
1044class HtmlOutput(Output):
1045
1046 def __init__(self, f, verbose, spec_name, sh_labels, cases):
1047 Output.__init__(self, f, verbose)
1048 self.spec_name = spec_name
1049 self.sh_labels = sh_labels # saved from header
1050 self.cases = cases # for linking to code
1051 self.row_html = [] # buffered
1052
1053 def _SourceLink(self, line_num, desc):
1054 return '<a href="%s.test.html#L%d">%s</a>' % (self.spec_name, line_num,
1055 cgi.escape(desc))
1056
1057 def BeginCases(self, test_file):
1058 css_urls = ['../../../web/base.css', '../../../web/spec-tests.css']
1059 title = '%s: spec test case results' % self.spec_name
1060 html_head.Write(self.f, title, css_urls=css_urls)
1061
1062 self.f.write('''\
1063 <body class="width60">
1064 <p id="home-link">
1065 <a href=".">spec test index</a>
1066 /
1067 <a href="/">oilshell.org</a>
1068 </p>
1069 <h1>Results for %s</h1>
1070 <table>
1071 ''' % test_file)
1072
1073 def _WriteShellSummary(self, sh_labels, stats):
1074 # NOTE: This table has multiple <thead>, which seems OK.
1075 self.f.write('''
1076<thead>
1077 <tr class="table-header">
1078 ''')
1079
1080 columns = ['status'] + sh_labels + ['']
1081 for c in columns:
1082 self.f.write('<td>%s</td>' % c)
1083
1084 self.f.write('''
1085 </tr>
1086</thead>
1087''')
1088
1089 # Write totals by cell.
1090 for result in sorted(stats.nonzero_results, reverse=True):
1091 self.f.write('<tr>')
1092
1093 self.f.write(HTML_CELLS[result])
1094 self.f.write('</td> ')
1095
1096 for sh_label in sh_labels:
1097 self.f.write('<td>%d</td>' % stats.by_shell[sh_label][result])
1098
1099 self.f.write('<td></td>')
1100 self.f.write('</tr>\n')
1101
1102 # The bottom row is all the same, but it helps readability.
1103 self.f.write('<tr>')
1104 self.f.write('<td>total</td>')
1105 for sh_label in sh_labels:
1106 self.f.write('<td>%d</td>' % stats.counters['num_cases_run'])
1107 self.f.write('<td></td>')
1108 self.f.write('</tr>\n')
1109
1110 # Blank row for space.
1111 self.f.write('<tr>')
1112 for i in xrange(len(sh_labels) + 2):
1113 self.f.write('<td style="height: 2em"></td>')
1114 self.f.write('</tr>\n')
1115
1116 def WriteHeader(self, sh_labels):
1117 f = cStringIO.StringIO()
1118
1119 f.write('''
1120<thead>
1121 <tr class="table-header">
1122 ''')
1123
1124 columns = ['case'] + sh_labels
1125 for c in columns:
1126 f.write('<td>%s</td>' % c)
1127 f.write('<td class="case-desc">description</td>')
1128
1129 f.write('''
1130 </tr>
1131</thead>
1132''')
1133
1134 self.row_html.append(f.getvalue())
1135
1136 def WriteRow(self, i, line_num, row, desc):
1137 f = cStringIO.StringIO()
1138 f.write('<tr>')
1139 f.write('<td>%3d</td>' % i)
1140
1141 show_details = False
1142
1143 for result in row:
1144 c = HTML_CELLS[result]
1145 if result not in (Result.PASS, Result.TIMEOUT): # nothing to show
1146 show_details = True
1147
1148 f.write(c)
1149 f.write('</td>')
1150 f.write('\t')
1151
1152 f.write('<td class="case-desc">')
1153 f.write(self._SourceLink(line_num, desc))
1154 f.write('</td>')
1155 f.write('</tr>\n')
1156
1157 # Show row with details link.
1158 if show_details:
1159 f.write('<tr>')
1160 f.write('<td class="details-row"></td>') # for the number
1161
1162 for col_index, result in enumerate(row):
1163 f.write('<td class="details-row">')
1164 if result != Result.PASS:
1165 sh_label = self.sh_labels[col_index]
1166 f.write('<a href="#details-%s-%s">details</a>' %
1167 (i, sh_label))
1168 f.write('</td>')
1169
1170 f.write('<td class="details-row"></td>') # for the description
1171 f.write('</tr>\n')
1172
1173 self.row_html.append(f.getvalue()) # buffer it
1174
1175 def _WriteStats(self, stats):
1176 self.f.write('%(num_passed)d passed, %(num_ok)d OK, '
1177 '%(num_ni)d not implemented, %(num_bug)d BUG, '
1178 '%(num_failed)d failed, %(num_timeout)d timeouts, '
1179 '%(num_skipped)d cases skipped\n' % stats.counters)
1180
1181 def EndCases(self, sh_labels, stats):
1182 self._WriteShellSummary(sh_labels, stats)
1183
1184 # Write all the buffered rows
1185 for h in self.row_html:
1186 self.f.write(h)
1187
1188 self.f.write('</table>\n')
1189 self.f.write('<pre>')
1190 self._WriteStats(stats)
1191 if stats.Get('oils_num_failed'):
1192 self.f.write('%(oils_num_failed)d failed under osh\n' %
1193 stats.counters)
1194 self.f.write('</pre>')
1195
1196 if self.details:
1197 self._WriteDetails()
1198
1199 self.f.write('</body></html>')
1200
1201 def _WriteDetails(self):
1202 self.f.write("<h2>Details on runs that didn't PASS</h2>")
1203 self.f.write('<table id="details">')
1204
1205 for case_index, sh_label, stdout, stderr, messages in self.details:
1206 self.f.write('<tr>')
1207 self.f.write('<td><a name="details-%s-%s"></a><b>%s</b></td>' %
1208 (case_index, sh_label, sh_label))
1209
1210 self.f.write('<td>')
1211
1212 # Write description and link to the code
1213 case = self.cases[case_index]
1214 line_num = case['line_num']
1215 desc = case['desc']
1216 self.f.write('%d ' % case_index)
1217 self.f.write(self._SourceLink(line_num, desc))
1218 self.f.write('<br/><br/>\n')
1219
1220 for m in messages:
1221 self.f.write('<span class="assertion">%s</span><br/>\n' %
1222 cgi.escape(m))
1223 if messages:
1224 self.f.write('<br/>\n')
1225
1226 def _WriteRaw(s):
1227 self.f.write('<pre>')
1228
1229 # stdout might contain invalid utf-8; render it as valid utf-8
1230 valid_utf8 = _ValidUtf8String(s)
1231
1232 self.f.write(cgi.escape(valid_utf8))
1233 self.f.write('</pre>')
1234
1235 self.f.write('<i>stdout:</i> <br/>\n')
1236 _WriteRaw(stdout)
1237
1238 self.f.write('<i>stderr:</i> <br/>\n')
1239 _WriteRaw(stderr)
1240
1241 self.f.write('</td>')
1242 self.f.write('</tr>')
1243
1244 self.f.write('</table>')
1245
1246
1247def MakeTestEnv(opts):
1248 if not opts.tmp_env:
1249 raise RuntimeError('--tmp-env required')
1250 if not opts.path_env:
1251 raise RuntimeError('--path-env required')
1252 env = {
1253 'PATH': opts.path_env,
1254 #'LANG': opts.lang_env,
1255 }
1256 for p in opts.env_pair:
1257 name, value = p.split('=', 1)
1258 env[name] = value
1259
1260 return env
1261
1262
1263def _DefaultSuite(spec_name):
1264 if spec_name.startswith('ysh-'):
1265 suite = 'ysh'
1266 elif spec_name.startswith('hay'): # hay.test.sh is ysh
1267 suite = 'ysh'
1268
1269 elif spec_name.startswith('tea-'):
1270 suite = 'tea'
1271 else:
1272 suite = 'osh'
1273
1274 return suite
1275
1276
1277def ParseTestList(test_files):
1278 for test_file in test_files:
1279 with open(test_file) as f:
1280 tokens = Tokenizer(f)
1281 try:
1282 file_metadata, cases = ParseTestFile(test_file, tokens)
1283 except RuntimeError as e:
1284 log('ERROR in %r', test_file)
1285 raise
1286 except ParseError as e:
1287 log('PARSE ERROR in %r', test_file)
1288 raise
1289
1290 tmp = os.path.basename(test_file)
1291 spec_name = tmp.split('.')[0] # foo.test.sh -> foo
1292
1293 suite = file_metadata.get('suite') or _DefaultSuite(spec_name)
1294
1295 tmp = file_metadata.get('tags')
1296 tags = tmp.split() if tmp else []
1297
1298 # Don't need compare_shells, etc. to decide what to run
1299
1300 row = {'spec_name': spec_name, 'suite': suite, 'tags': tags}
1301 #print(row)
1302 yield row
1303
1304
1305def main(argv):
1306 # First check if bash is polluting the environment. Tests rely on the
1307 # environment.
1308 v = os.getenv('RANDOM')
1309 if v is not None:
1310 raise AssertionError('got $RANDOM = %s' % v)
1311 v = os.getenv('PPID')
1312 if v is not None:
1313 raise AssertionError('got $PPID = %s' % v)
1314
1315 p = optparse.OptionParser('%s [options] TEST_FILE shell...' % sys.argv[0])
1316 spec_lib.DefineCommon(p)
1317 spec_lib.DefineShSpec(p)
1318 opts, argv = p.parse_args(argv)
1319
1320 # --print-tagged to figure out what to run
1321 if opts.print_tagged:
1322 to_find = opts.print_tagged
1323 for row in ParseTestList(argv[1:]):
1324 if to_find in row['tags']:
1325 print(row['spec_name'])
1326 return 0
1327
1328 # --print-table to figure out what to run
1329 if opts.print_table:
1330 for row in ParseTestList(argv[1:]):
1331 print('%(suite)s\t%(spec_name)s' % row)
1332 #print(row)
1333 return 0
1334
1335 #
1336 # Now deal with a single file
1337 #
1338
1339 try:
1340 test_file = argv[1]
1341 except IndexError:
1342 p.print_usage()
1343 return 1
1344
1345 with open(test_file) as f:
1346 tokens = Tokenizer(f)
1347 file_metadata, cases = ParseTestFile(test_file, tokens)
1348
1349 # List test cases and return
1350 if opts.do_list:
1351 for i, case in enumerate(cases):
1352 if opts.verbose: # print the raw dictionary for debugging
1353 print(pprint.pformat(case))
1354 else:
1355 print('%d\t%s' % (i, case['desc']))
1356 return 0
1357
1358 # for test/spec-cpp.sh
1359 if opts.print_spec_suite:
1360 tmp = os.path.basename(test_file)
1361 spec_name = tmp.split('.')[0] # foo.test.sh -> foo
1362
1363 suite = file_metadata.get('suite') or _DefaultSuite(spec_name)
1364 print(suite)
1365 return 0
1366
1367 if opts.verbose:
1368 for k, v in file_metadata.items():
1369 print('\t%-20s: %s' % (k, v), file=sys.stderr)
1370 print('', file=sys.stderr)
1371
1372 if opts.oils_bin_dir:
1373
1374 shells = []
1375
1376 if opts.compare_shells:
1377 comp = file_metadata.get('compare_shells')
1378 # Compare the shells listed in 'compare_shells' against the Python build
1379 shells.extend(comp.split() if comp else [])
1380
1381 # Always run with the Python version
1382 our_shell = file_metadata.get('our_shell', 'osh') # default is OSH
1383 if our_shell != '-':
1384 shells.append(os.path.join(opts.oils_bin_dir, our_shell))
1385
1386 # Legacy OVM/CPython build
1387 if opts.ovm_bin_dir:
1388 shells.append(os.path.join(opts.ovm_bin_dir, our_shell))
1389
1390 # New C++ build
1391 if opts.oils_cpp_bin_dir:
1392 shells.append(os.path.join(opts.oils_cpp_bin_dir, our_shell))
1393
1394 # When --oils-bin-dir is set, oils_failures_allowed comes from the file
1395 # metadata; it's no longer a flag.
1396 opts.oils_failures_allowed = \
1397 int(file_metadata.get('oils_failures_allowed', 0))
1398
1399 else:
1400 # TODO: remove this mode?
1401 shells = argv[2:]
1402
1403 shell_pairs = spec_lib.MakeShellPairs(shells)
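 # MakeShellPairs (defined in spec_lib) turns each shell argument into a
 # (label, path) pair; RunCases unpacks them as (sh_label, sh_path).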
1404
1405 if opts.range:
1406 begin, end = spec_lib.ParseRange(opts.range)
1407 case_predicate = spec_lib.RangePredicate(begin, end)
1408 elif opts.regex:
1409 desc_re = re.compile(opts.regex, re.IGNORECASE)
1410 case_predicate = spec_lib.RegexPredicate(desc_re)
1411 else:
1412 case_predicate = lambda i, case: True
1413
1414 out_f = sys.stderr if opts.do_print else sys.stdout
1415
1416 # Set up output style. Also see asdl/format.py
1417 if opts.format == 'ansi':
1418 out = AnsiOutput(out_f, opts.verbose)
1419
1420 elif opts.format == 'html':
1421 spec_name = os.path.basename(test_file)
1422 spec_name = spec_name.split('.')[0]
1423
1424 sh_labels = [label for label, _ in shell_pairs]
1425
1426 out = HtmlOutput(out_f, opts.verbose, spec_name, sh_labels, cases)
1427
1428 else:
1429 raise AssertionError()
1430
1431 out.BeginCases(os.path.basename(test_file))
1432
1433 env = MakeTestEnv(opts)
1434 stats = RunCases(cases, case_predicate, shell_pairs, env, out, opts)
1435
1436 out.EndCases([sh_label for sh_label, _ in shell_pairs], stats)
1437
1438 if opts.tsv_output:
1439 with open(opts.tsv_output, 'w') as f:
1440 stats.WriteTsv(f)
1441
1442 # TODO: Could --stats-{file,template} be a separate awk step on .tsv files?
1443 stats.Set('oils_failures_allowed', opts.oils_failures_allowed)
1444
1445 # If it's not set separately for C++, we default to the allowed number
1446 # above
1447 x = int(
1448 file_metadata.get('oils_cpp_failures_allowed',
1449 opts.oils_failures_allowed))
1450 stats.Set('oils_cpp_failures_allowed', x)
1451
1452 if opts.stats_file:
1453 with open(opts.stats_file, 'w') as f:
1454 f.write(opts.stats_template % stats.counters)
1455 f.write('\n') # bash 'read' requires a newline
1456
1457 # spec/smoke.test.sh -> smoke
1458 test_name = os.path.basename(test_file).split('.')[0]
1459
1460 return _SuccessOrFailure(test_name, stats)
1461
1462
1463def _SuccessOrFailure(test_name, stats):
1464 allowed = stats.Get('oils_failures_allowed')
1465 allowed_cpp = stats.Get('oils_cpp_failures_allowed')
1466
1467 all_count = stats.Get('num_failed')
1468 oils_count = stats.Get('oils_num_failed')
1469 oils_cpp_count = stats.Get('oils_cpp_num_failed')
1470
1471 errors = []
1472 if oils_count != allowed:
1473 errors.append('Got %d Oils failures, but %d are allowed' %
1474 (oils_count, allowed))
1475 else:
1476 if allowed != 0:
1477 log('%s: note: Got %d allowed Oils failures', test_name, allowed)
1478
1479 # TODO: remove special case for 0
1480 if oils_cpp_count != 0:
1481 if oils_cpp_count != allowed_cpp:
1482 errors.append('Got %d Oils C++ failures, but %d are allowed' %
1483 (oils_cpp_count, allowed_cpp))
1484 else:
1485 if allowed_cpp != 0:
1486 log('%s: note: Got %d allowed Oils C++ failures', test_name,
1487 allowed_cpp)
1488
1489 if all_count != allowed:
1490 errors.append('Got %d total failures, but %d are allowed' %
1491 (all_count, allowed))
1492
1493 if errors:
1494 for msg in errors:
1495 log('%s: FATAL: %s', test_name, msg)
1496 return 1
1497
1498 return 0
1499
1500
1501if __name__ == '__main__':
1502 try:
1503 sys.exit(main(sys.argv))
1504 except KeyboardInterrupt as e:
1505 print('%s: interrupted with Ctrl-C' % sys.argv[0], file=sys.stderr)
1506 sys.exit(1)
1507 except RuntimeError as e:
1508 print('FATAL: %s' % e, file=sys.stderr)
1509 sys.exit(1)