import os, glob, random
from cStringIO import StringIO
from test.test_support import (verbose, findfile, is_resource_enabled,
                               TestFailed)
from tokenize import (tokenize, generate_tokens, untokenize,
                      NUMBER, NAME, OP, STRING)

# Test roundtrip for `untokenize`.  `f` is a file path.  The source code in f
# is tokenized, converted back to source code via tokenize.untokenize(),
# and tokenized again from the latter.  The test fails if the second
# tokenization doesn't match the first.
def test_roundtrip(f):
    ## print 'Testing:', f
    fobj = open(f)
    try:
        fulltok = list(generate_tokens(fobj.readline))
    finally:
        fobj.close()

    t1 = [tok[:2] for tok in fulltok]
    newtext = untokenize(t1)
    readline = iter(newtext.splitlines(1)).next
    t2 = [tok[:2] for tok in generate_tokens(readline)]
    if t1 != t2:
        raise TestFailed("untokenize() roundtrip failed for %r" % f)
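
# Note: generate_tokens() yields 5-tuples (type, string, start, end, line);
# tok[:2] above keeps only (type, string).  untokenize() accepts these
# 2-tuples and regenerates equivalent source, though its spacing may differ
# from the original -- hence the comparison of token streams, not text.
# splitlines(1) keeps the line terminators, so the bound `readline` behaves
# like a file object's readline() for generate_tokens().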

# This is an example from the docs, set up as a doctest.
def decistmt(s):
    """Substitute Decimals for floats in a string of statements.

    >>> from decimal import Decimal
    >>> s = 'print +21.3e-5*-.1234/81.7'
    >>> decistmt(s)
    "print +Decimal ('21.3e-5')*-Decimal ('.1234')/Decimal ('81.7')"

    The format of the exponent is inherited from the platform C library.
    Known cases are "e-007" (Windows) and "e-07" (not Windows).  Since
    we're only showing 12 digits, and the 13th isn't close to 5, the
    rest of the output should be platform-independent.

    >>> exec(s) #doctest: +ELLIPSIS
    -3.21716034272e-0...7

    Output from calculations with Decimal should be identical across all
    platforms.

    >>> exec(decistmt(s))
    -3.217160342717258261933904529E-7
    """

    result = []
    g = generate_tokens(StringIO(s).readline)   # tokenize the string
    for toknum, tokval, _, _, _ in g:
        if toknum == NUMBER and '.' in tokval:  # replace NUMBER tokens
            result.extend([
                (NAME, 'Decimal'),
                (OP, '('),
                (STRING, repr(tokval)),
                (OP, ')')
            ])
        else:
            result.append((toknum, tokval))
    return untokenize(result)
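
# In the rewrite above, repr(tokval) turns each float literal's text into a
# quoted STRING token: for 21.3e-5 the NUMBER token '21.3e-5' becomes
# "'21.3e-5'", so the regenerated source reads Decimal ('21.3e-5').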

def test_main():
    if verbose:
        print 'starting...'

    # This displays the tokenization of tokenize_tests.txt to stdout, and
    # regrtest.py checks that this equals the expected output (in the
    # test/output/ directory).
    f = open(findfile('tokenize_tests' + os.extsep + 'txt'))
    tokenize(f.readline)
    f.close()

    # Now run test_roundtrip() over tokenize_tests.txt too, and over all
    # (if the "compiler" resource is enabled) or a small random sample (if
    # "compiler" is not enabled) of the test*.py files.
    f = findfile('tokenize_tests' + os.extsep + 'txt')
    test_roundtrip(f)

    testdir = os.path.dirname(f) or os.curdir
    testfiles = glob.glob(testdir + os.sep + 'test*.py')
    if not is_resource_enabled('compiler'):
        testfiles = random.sample(testfiles, 10)
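    # random.sample() picks 10 distinct files without replacement; the full
    # sweep over every test*.py file runs only when the "compiler" resource
    # is enabled.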

    for f in testfiles:
        test_roundtrip(f)

    # Test detection of IndentationError.
    sampleBadText = """\
def foo():
    bar
  baz
"""
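
    # `baz` dedents to column 2, which matches no open indentation level
    # (0 or 4), so tokenize raises IndentationError ("unindent does not
    # match any outer indentation level").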

    try:
        for tok in generate_tokens(StringIO(sampleBadText).readline):
            pass
    except IndentationError:
        pass
    else:
        raise TestFailed("Did not detect IndentationError")

    # Run the doctests in this module.
    from test import test_tokenize  # i.e., this module
    from test.test_support import run_doctest
    run_doctest(test_tokenize)

    if verbose:
        print 'finished'

if __name__ == "__main__":
    test_main()