]> git.proxmox.com Git - mirror_edk2.git/blob - AppPkg/Applications/Python/Python-2.7.2/Lib/test/test_tokenize.py
EmbeddedPkg: Extend NvVarStoreFormattedLib LIBRARY_CLASS
[mirror_edk2.git] / AppPkg / Applications / Python / Python-2.7.2 / Lib / test / test_tokenize.py
1 doctests = """
2 Tests for the tokenize module.
3
4 >>> import glob, random, sys
5
6 The tests can be really simple. Given a small fragment of source
7 code, print out a table with tokens. The ENDMARK is omitted for
8 brevity.
9
10 >>> dump_tokens("1 + 1")
11 NUMBER '1' (1, 0) (1, 1)
12 OP '+' (1, 2) (1, 3)
13 NUMBER '1' (1, 4) (1, 5)
14
15 >>> dump_tokens("if False:\\n"
16 ... " # NL\\n"
17 ... " True = False # NEWLINE\\n")
18 NAME 'if' (1, 0) (1, 2)
19 NAME 'False' (1, 3) (1, 8)
20 OP ':' (1, 8) (1, 9)
21 NEWLINE '\\n' (1, 9) (1, 10)
22 COMMENT '# NL' (2, 4) (2, 8)
23 NL '\\n' (2, 8) (2, 9)
24 INDENT ' ' (3, 0) (3, 4)
25 NAME 'True' (3, 4) (3, 8)
26 OP '=' (3, 9) (3, 10)
27 NAME 'False' (3, 11) (3, 16)
28 COMMENT '# NEWLINE' (3, 17) (3, 26)
29 NEWLINE '\\n' (3, 26) (3, 27)
30 DEDENT '' (4, 0) (4, 0)
31
32 >>> indent_error_file = \"""
33 ... def k(x):
34 ... x += 2
35 ... x += 5
36 ... \"""
37
38 >>> for tok in generate_tokens(StringIO(indent_error_file).readline): pass
39 Traceback (most recent call last):
40 ...
41 IndentationError: unindent does not match any outer indentation level
42
43 Test roundtrip for `untokenize`. `f` is an open file or a string. The source
44 code in f is tokenized, converted back to source code via tokenize.untokenize(),
45 and tokenized again from the latter. The test fails if the second tokenization
46 doesn't match the first.
47
48 >>> def roundtrip(f):
49 ... if isinstance(f, str): f = StringIO(f)
50 ... token_list = list(generate_tokens(f.readline))
51 ... f.close()
52 ... tokens1 = [tok[:2] for tok in token_list]
53 ... new_text = untokenize(tokens1)
54 ... readline = iter(new_text.splitlines(1)).next
55 ... tokens2 = [tok[:2] for tok in generate_tokens(readline)]
56 ... return tokens1 == tokens2
57 ...
58
59 There are some standard formatting practices that are easy to get right.
60
61 >>> roundtrip("if x == 1:\\n"
62 ... " print x\\n")
63 True
64
65 >>> roundtrip("# This is a comment\\n# This also")
66 True
67
68 Some people use different formatting conventions, which makes
69 untokenize a little trickier. Note that this test involves trailing
70 whitespace after the colon. Note that we use hex escapes to make the
71 two trailing blanks apparent in the expected output.
72
73 >>> roundtrip("if x == 1 : \\n"
74 ... " print x\\n")
75 True
76
77 >>> f = test_support.findfile("tokenize_tests" + os.extsep + "txt")
78 >>> roundtrip(open(f))
79 True
80
81 >>> roundtrip("if x == 1:\\n"
82 ... " # A comment by itself.\\n"
83 ... " print x # Comment here, too.\\n"
84 ... " # Another comment.\\n"
85 ... "after_if = True\\n")
86 True
87
88 >>> roundtrip("if (x # The comments need to go in the right place\\n"
89 ... " == 1):\\n"
90 ... " print 'x==1'\\n")
91 True
92
93 >>> roundtrip("class Test: # A comment here\\n"
94 ... " # A comment with weird indent\\n"
95 ... " after_com = 5\\n"
96 ... " def x(m): return m*5 # a one liner\\n"
97 ... " def y(m): # A whitespace after the colon\\n"
98 ... " return y*4 # 3-space indent\\n")
99 True
100
101 Some error-handling code
102
103 >>> roundtrip("try: import somemodule\\n"
104 ... "except ImportError: # comment\\n"
105 ... " print 'Can not import' # comment2\\n"
106 ... "else: print 'Loaded'\\n")
107 True
108
109 Balancing continuation
110
111 >>> roundtrip("a = (3,4, \\n"
112 ... "5,6)\\n"
113 ... "y = [3, 4,\\n"
114 ... "5]\\n"
115 ... "z = {'a': 5,\\n"
116 ... "'b':15, 'c':True}\\n"
117 ... "x = len(y) + 5 - a[\\n"
118 ... "3] - a[2]\\n"
119 ... "+ len(z) - z[\\n"
120 ... "'b']\\n")
121 True
122
123 Ordinary integers and binary operators
124
125 >>> dump_tokens("0xff <= 255")
126 NUMBER '0xff' (1, 0) (1, 4)
127 OP '<=' (1, 5) (1, 7)
128 NUMBER '255' (1, 8) (1, 11)
129 >>> dump_tokens("0b10 <= 255")
130 NUMBER '0b10' (1, 0) (1, 4)
131 OP '<=' (1, 5) (1, 7)
132 NUMBER '255' (1, 8) (1, 11)
133 >>> dump_tokens("0o123 <= 0123")
134 NUMBER '0o123' (1, 0) (1, 5)
135 OP '<=' (1, 6) (1, 8)
136 NUMBER '0123' (1, 9) (1, 13)
137 >>> dump_tokens("01234567 > ~0x15")
138 NUMBER '01234567' (1, 0) (1, 8)
139 OP '>' (1, 9) (1, 10)
140 OP '~' (1, 11) (1, 12)
141 NUMBER '0x15' (1, 12) (1, 16)
142 >>> dump_tokens("2134568 != 01231515")
143 NUMBER '2134568' (1, 0) (1, 7)
144 OP '!=' (1, 8) (1, 10)
145 NUMBER '01231515' (1, 11) (1, 19)
146 >>> dump_tokens("(-124561-1) & 0200000000")
147 OP '(' (1, 0) (1, 1)
148 OP '-' (1, 1) (1, 2)
149 NUMBER '124561' (1, 2) (1, 8)
150 OP '-' (1, 8) (1, 9)
151 NUMBER '1' (1, 9) (1, 10)
152 OP ')' (1, 10) (1, 11)
153 OP '&' (1, 12) (1, 13)
154 NUMBER '0200000000' (1, 14) (1, 24)
155 >>> dump_tokens("0xdeadbeef != -1")
156 NUMBER '0xdeadbeef' (1, 0) (1, 10)
157 OP '!=' (1, 11) (1, 13)
158 OP '-' (1, 14) (1, 15)
159 NUMBER '1' (1, 15) (1, 16)
160 >>> dump_tokens("0xdeadc0de & 012345")
161 NUMBER '0xdeadc0de' (1, 0) (1, 10)
162 OP '&' (1, 11) (1, 12)
163 NUMBER '012345' (1, 13) (1, 19)
164 >>> dump_tokens("0xFF & 0x15 | 1234")
165 NUMBER '0xFF' (1, 0) (1, 4)
166 OP '&' (1, 5) (1, 6)
167 NUMBER '0x15' (1, 7) (1, 11)
168 OP '|' (1, 12) (1, 13)
169 NUMBER '1234' (1, 14) (1, 18)
170
171 Long integers
172
173 >>> dump_tokens("x = 0L")
174 NAME 'x' (1, 0) (1, 1)
175 OP '=' (1, 2) (1, 3)
176 NUMBER '0L' (1, 4) (1, 6)
177 >>> dump_tokens("x = 0xfffffffffff")
178 NAME 'x' (1, 0) (1, 1)
179 OP '=' (1, 2) (1, 3)
180 NUMBER '0xffffffffff (1, 4) (1, 17)
181 >>> dump_tokens("x = 123141242151251616110l")
182 NAME 'x' (1, 0) (1, 1)
183 OP '=' (1, 2) (1, 3)
184 NUMBER '123141242151 (1, 4) (1, 26)
185 >>> dump_tokens("x = -15921590215012591L")
186 NAME 'x' (1, 0) (1, 1)
187 OP '=' (1, 2) (1, 3)
188 OP '-' (1, 4) (1, 5)
189 NUMBER '159215902150 (1, 5) (1, 23)
190
191 Floating point numbers
192
193 >>> dump_tokens("x = 3.14159")
194 NAME 'x' (1, 0) (1, 1)
195 OP '=' (1, 2) (1, 3)
196 NUMBER '3.14159' (1, 4) (1, 11)
197 >>> dump_tokens("x = 314159.")
198 NAME 'x' (1, 0) (1, 1)
199 OP '=' (1, 2) (1, 3)
200 NUMBER '314159.' (1, 4) (1, 11)
201 >>> dump_tokens("x = .314159")
202 NAME 'x' (1, 0) (1, 1)
203 OP '=' (1, 2) (1, 3)
204 NUMBER '.314159' (1, 4) (1, 11)
205 >>> dump_tokens("x = 3e14159")
206 NAME 'x' (1, 0) (1, 1)
207 OP '=' (1, 2) (1, 3)
208 NUMBER '3e14159' (1, 4) (1, 11)
209 >>> dump_tokens("x = 3E123")
210 NAME 'x' (1, 0) (1, 1)
211 OP '=' (1, 2) (1, 3)
212 NUMBER '3E123' (1, 4) (1, 9)
213 >>> dump_tokens("x+y = 3e-1230")
214 NAME 'x' (1, 0) (1, 1)
215 OP '+' (1, 1) (1, 2)
216 NAME 'y' (1, 2) (1, 3)
217 OP '=' (1, 4) (1, 5)
218 NUMBER '3e-1230' (1, 6) (1, 13)
219 >>> dump_tokens("x = 3.14e159")
220 NAME 'x' (1, 0) (1, 1)
221 OP '=' (1, 2) (1, 3)
222 NUMBER '3.14e159' (1, 4) (1, 12)
223
224 String literals
225
226 >>> dump_tokens("x = ''; y = \\\"\\\"")
227 NAME 'x' (1, 0) (1, 1)
228 OP '=' (1, 2) (1, 3)
229 STRING "''" (1, 4) (1, 6)
230 OP ';' (1, 6) (1, 7)
231 NAME 'y' (1, 8) (1, 9)
232 OP '=' (1, 10) (1, 11)
233 STRING '""' (1, 12) (1, 14)
234 >>> dump_tokens("x = '\\\"'; y = \\\"'\\\"")
235 NAME 'x' (1, 0) (1, 1)
236 OP '=' (1, 2) (1, 3)
237 STRING '\\'"\\'' (1, 4) (1, 7)
238 OP ';' (1, 7) (1, 8)
239 NAME 'y' (1, 9) (1, 10)
240 OP '=' (1, 11) (1, 12)
241 STRING '"\\'"' (1, 13) (1, 16)
242 >>> dump_tokens("x = \\\"doesn't \\\"shrink\\\", does it\\\"")
243 NAME 'x' (1, 0) (1, 1)
244 OP '=' (1, 2) (1, 3)
245 STRING '"doesn\\'t "' (1, 4) (1, 14)
246 NAME 'shrink' (1, 14) (1, 20)
247 STRING '", does it"' (1, 20) (1, 31)
248 >>> dump_tokens("x = u'abc' + U'ABC'")
249 NAME 'x' (1, 0) (1, 1)
250 OP '=' (1, 2) (1, 3)
251 STRING "u'abc'" (1, 4) (1, 10)
252 OP '+' (1, 11) (1, 12)
253 STRING "U'ABC'" (1, 13) (1, 19)
254 >>> dump_tokens('y = u"ABC" + U"ABC"')
255 NAME 'y' (1, 0) (1, 1)
256 OP '=' (1, 2) (1, 3)
257 STRING 'u"ABC"' (1, 4) (1, 10)
258 OP '+' (1, 11) (1, 12)
259 STRING 'U"ABC"' (1, 13) (1, 19)
260 >>> dump_tokens("x = ur'abc' + Ur'ABC' + uR'ABC' + UR'ABC'")
261 NAME 'x' (1, 0) (1, 1)
262 OP '=' (1, 2) (1, 3)
263 STRING "ur'abc'" (1, 4) (1, 11)
264 OP '+' (1, 12) (1, 13)
265 STRING "Ur'ABC'" (1, 14) (1, 21)
266 OP '+' (1, 22) (1, 23)
267 STRING "uR'ABC'" (1, 24) (1, 31)
268 OP '+' (1, 32) (1, 33)
269 STRING "UR'ABC'" (1, 34) (1, 41)
270 >>> dump_tokens('y = ur"abc" + Ur"ABC" + uR"ABC" + UR"ABC"')
271 NAME 'y' (1, 0) (1, 1)
272 OP '=' (1, 2) (1, 3)
273 STRING 'ur"abc"' (1, 4) (1, 11)
274 OP '+' (1, 12) (1, 13)
275 STRING 'Ur"ABC"' (1, 14) (1, 21)
276 OP '+' (1, 22) (1, 23)
277 STRING 'uR"ABC"' (1, 24) (1, 31)
278 OP '+' (1, 32) (1, 33)
279 STRING 'UR"ABC"' (1, 34) (1, 41)
280
281 Operators
282
283 >>> dump_tokens("def d22(a, b, c=2, d=2, *k): pass")
284 NAME 'def' (1, 0) (1, 3)
285 NAME 'd22' (1, 4) (1, 7)
286 OP '(' (1, 7) (1, 8)
287 NAME 'a' (1, 8) (1, 9)
288 OP ',' (1, 9) (1, 10)
289 NAME 'b' (1, 11) (1, 12)
290 OP ',' (1, 12) (1, 13)
291 NAME 'c' (1, 14) (1, 15)
292 OP '=' (1, 15) (1, 16)
293 NUMBER '2' (1, 16) (1, 17)
294 OP ',' (1, 17) (1, 18)
295 NAME 'd' (1, 19) (1, 20)
296 OP '=' (1, 20) (1, 21)
297 NUMBER '2' (1, 21) (1, 22)
298 OP ',' (1, 22) (1, 23)
299 OP '*' (1, 24) (1, 25)
300 NAME 'k' (1, 25) (1, 26)
301 OP ')' (1, 26) (1, 27)
302 OP ':' (1, 27) (1, 28)
303 NAME 'pass' (1, 29) (1, 33)
304 >>> dump_tokens("def d01v_(a=1, *k, **w): pass")
305 NAME 'def' (1, 0) (1, 3)
306 NAME 'd01v_' (1, 4) (1, 9)
307 OP '(' (1, 9) (1, 10)
308 NAME 'a' (1, 10) (1, 11)
309 OP '=' (1, 11) (1, 12)
310 NUMBER '1' (1, 12) (1, 13)
311 OP ',' (1, 13) (1, 14)
312 OP '*' (1, 15) (1, 16)
313 NAME 'k' (1, 16) (1, 17)
314 OP ',' (1, 17) (1, 18)
315 OP '**' (1, 19) (1, 21)
316 NAME 'w' (1, 21) (1, 22)
317 OP ')' (1, 22) (1, 23)
318 OP ':' (1, 23) (1, 24)
319 NAME 'pass' (1, 25) (1, 29)
320
321 Comparison
322
323 >>> dump_tokens("if 1 < 1 > 1 == 1 >= 5 <= 0x15 <= 0x12 != " +
324 ... "1 and 5 in 1 not in 1 is 1 or 5 is not 1: pass")
325 NAME 'if' (1, 0) (1, 2)
326 NUMBER '1' (1, 3) (1, 4)
327 OP '<' (1, 5) (1, 6)
328 NUMBER '1' (1, 7) (1, 8)
329 OP '>' (1, 9) (1, 10)
330 NUMBER '1' (1, 11) (1, 12)
331 OP '==' (1, 13) (1, 15)
332 NUMBER '1' (1, 16) (1, 17)
333 OP '>=' (1, 18) (1, 20)
334 NUMBER '5' (1, 21) (1, 22)
335 OP '<=' (1, 23) (1, 25)
336 NUMBER '0x15' (1, 26) (1, 30)
337 OP '<=' (1, 31) (1, 33)
338 NUMBER '0x12' (1, 34) (1, 38)
339 OP '!=' (1, 39) (1, 41)
340 NUMBER '1' (1, 42) (1, 43)
341 NAME 'and' (1, 44) (1, 47)
342 NUMBER '5' (1, 48) (1, 49)
343 NAME 'in' (1, 50) (1, 52)
344 NUMBER '1' (1, 53) (1, 54)
345 NAME 'not' (1, 55) (1, 58)
346 NAME 'in' (1, 59) (1, 61)
347 NUMBER '1' (1, 62) (1, 63)
348 NAME 'is' (1, 64) (1, 66)
349 NUMBER '1' (1, 67) (1, 68)
350 NAME 'or' (1, 69) (1, 71)
351 NUMBER '5' (1, 72) (1, 73)
352 NAME 'is' (1, 74) (1, 76)
353 NAME 'not' (1, 77) (1, 80)
354 NUMBER '1' (1, 81) (1, 82)
355 OP ':' (1, 82) (1, 83)
356 NAME 'pass' (1, 84) (1, 88)
357
358 Shift
359
360 >>> dump_tokens("x = 1 << 1 >> 5")
361 NAME 'x' (1, 0) (1, 1)
362 OP '=' (1, 2) (1, 3)
363 NUMBER '1' (1, 4) (1, 5)
364 OP '<<' (1, 6) (1, 8)
365 NUMBER '1' (1, 9) (1, 10)
366 OP '>>' (1, 11) (1, 13)
367 NUMBER '5' (1, 14) (1, 15)
368
369 Additive
370
371 >>> dump_tokens("x = 1 - y + 15 - 01 + 0x124 + z + a[5]")
372 NAME 'x' (1, 0) (1, 1)
373 OP '=' (1, 2) (1, 3)
374 NUMBER '1' (1, 4) (1, 5)
375 OP '-' (1, 6) (1, 7)
376 NAME 'y' (1, 8) (1, 9)
377 OP '+' (1, 10) (1, 11)
378 NUMBER '15' (1, 12) (1, 14)
379 OP '-' (1, 15) (1, 16)
380 NUMBER '01' (1, 17) (1, 19)
381 OP '+' (1, 20) (1, 21)
382 NUMBER '0x124' (1, 22) (1, 27)
383 OP '+' (1, 28) (1, 29)
384 NAME 'z' (1, 30) (1, 31)
385 OP '+' (1, 32) (1, 33)
386 NAME 'a' (1, 34) (1, 35)
387 OP '[' (1, 35) (1, 36)
388 NUMBER '5' (1, 36) (1, 37)
389 OP ']' (1, 37) (1, 38)
390
391 Multiplicative
392
393 >>> dump_tokens("x = 1//1*1/5*12%0x12")
394 NAME 'x' (1, 0) (1, 1)
395 OP '=' (1, 2) (1, 3)
396 NUMBER '1' (1, 4) (1, 5)
397 OP '//' (1, 5) (1, 7)
398 NUMBER '1' (1, 7) (1, 8)
399 OP '*' (1, 8) (1, 9)
400 NUMBER '1' (1, 9) (1, 10)
401 OP '/' (1, 10) (1, 11)
402 NUMBER '5' (1, 11) (1, 12)
403 OP '*' (1, 12) (1, 13)
404 NUMBER '12' (1, 13) (1, 15)
405 OP '%' (1, 15) (1, 16)
406 NUMBER '0x12' (1, 16) (1, 20)
407
408 Unary
409
410 >>> dump_tokens("~1 ^ 1 & 1 |1 ^ -1")
411 OP '~' (1, 0) (1, 1)
412 NUMBER '1' (1, 1) (1, 2)
413 OP '^' (1, 3) (1, 4)
414 NUMBER '1' (1, 5) (1, 6)
415 OP '&' (1, 7) (1, 8)
416 NUMBER '1' (1, 9) (1, 10)
417 OP '|' (1, 11) (1, 12)
418 NUMBER '1' (1, 12) (1, 13)
419 OP '^' (1, 14) (1, 15)
420 OP '-' (1, 16) (1, 17)
421 NUMBER '1' (1, 17) (1, 18)
422 >>> dump_tokens("-1*1/1+1*1//1 - ---1**1")
423 OP '-' (1, 0) (1, 1)
424 NUMBER '1' (1, 1) (1, 2)
425 OP '*' (1, 2) (1, 3)
426 NUMBER '1' (1, 3) (1, 4)
427 OP '/' (1, 4) (1, 5)
428 NUMBER '1' (1, 5) (1, 6)
429 OP '+' (1, 6) (1, 7)
430 NUMBER '1' (1, 7) (1, 8)
431 OP '*' (1, 8) (1, 9)
432 NUMBER '1' (1, 9) (1, 10)
433 OP '//' (1, 10) (1, 12)
434 NUMBER '1' (1, 12) (1, 13)
435 OP '-' (1, 14) (1, 15)
436 OP '-' (1, 16) (1, 17)
437 OP '-' (1, 17) (1, 18)
438 OP '-' (1, 18) (1, 19)
439 NUMBER '1' (1, 19) (1, 20)
440 OP '**' (1, 20) (1, 22)
441 NUMBER '1' (1, 22) (1, 23)
442
443 Selector
444
445 >>> dump_tokens("import sys, time\\nx = sys.modules['time'].time()")
446 NAME 'import' (1, 0) (1, 6)
447 NAME 'sys' (1, 7) (1, 10)
448 OP ',' (1, 10) (1, 11)
449 NAME 'time' (1, 12) (1, 16)
450 NEWLINE '\\n' (1, 16) (1, 17)
451 NAME 'x' (2, 0) (2, 1)
452 OP '=' (2, 2) (2, 3)
453 NAME 'sys' (2, 4) (2, 7)
454 OP '.' (2, 7) (2, 8)
455 NAME 'modules' (2, 8) (2, 15)
456 OP '[' (2, 15) (2, 16)
457 STRING "'time'" (2, 16) (2, 22)
458 OP ']' (2, 22) (2, 23)
459 OP '.' (2, 23) (2, 24)
460 NAME 'time' (2, 24) (2, 28)
461 OP '(' (2, 28) (2, 29)
462 OP ')' (2, 29) (2, 30)
463
464 Methods
465
466 >>> dump_tokens("@staticmethod\\ndef foo(x,y): pass")
467 OP '@' (1, 0) (1, 1)
468 NAME 'staticmethod (1, 1) (1, 13)
469 NEWLINE '\\n' (1, 13) (1, 14)
470 NAME 'def' (2, 0) (2, 3)
471 NAME 'foo' (2, 4) (2, 7)
472 OP '(' (2, 7) (2, 8)
473 NAME 'x' (2, 8) (2, 9)
474 OP ',' (2, 9) (2, 10)
475 NAME 'y' (2, 10) (2, 11)
476 OP ')' (2, 11) (2, 12)
477 OP ':' (2, 12) (2, 13)
478 NAME 'pass' (2, 14) (2, 18)
479
480 Backslash means line continuation, except for comments
481
482 >>> roundtrip("x=1+\\\\n"
483 ... "1\\n"
484 ... "# This is a comment\\\\n"
485 ... "# This also\\n")
486 True
487 >>> roundtrip("# Comment \\\\nx = 0")
488 True
489
490 Two string literals on the same line
491
492 >>> roundtrip("'' ''")
493 True
494
495 Test roundtrip on random python modules.
496 pass the '-ucpu' option to process the full directory.
497
498 >>>
499 >>> tempdir = os.path.dirname(f) or os.curdir
500 >>> testfiles = glob.glob(os.path.join(tempdir, "test*.py"))
501
502 >>> if not test_support.is_resource_enabled("cpu"):
503 ... testfiles = random.sample(testfiles, 10)
504 ...
505 >>> for testfile in testfiles:
506 ... if not roundtrip(open(testfile)):
507 ... print "Roundtrip failed for file %s" % testfile
508 ... break
509 ... else: True
510 True
511
512 Evil tabs
513 >>> dump_tokens("def f():\\n\\tif x\\n \\tpass")
514 NAME 'def' (1, 0) (1, 3)
515 NAME 'f' (1, 4) (1, 5)
516 OP '(' (1, 5) (1, 6)
517 OP ')' (1, 6) (1, 7)
518 OP ':' (1, 7) (1, 8)
519 NEWLINE '\\n' (1, 8) (1, 9)
520 INDENT '\\t' (2, 0) (2, 1)
521 NAME 'if' (2, 1) (2, 3)
522 NAME 'x' (2, 4) (2, 5)
523 NEWLINE '\\n' (2, 5) (2, 6)
524 INDENT ' \\t' (3, 0) (3, 9)
525 NAME 'pass' (3, 9) (3, 13)
526 DEDENT '' (4, 0) (4, 0)
527 DEDENT '' (4, 0) (4, 0)
528 """
529
530
531 from test import test_support
532 from tokenize import (untokenize, generate_tokens, NUMBER, NAME, OP,
533 STRING, ENDMARKER, tok_name)
534 from StringIO import StringIO
535 import os
536
def dump_tokens(s):
    """Print the tokens of the source string *s* as a fixed-width table.

    Each row shows the token type name (padded/truncated to 10 characters),
    the repr of the token text (padded/truncated to 13 characters), and the
    (row, col) start and end positions.

    The ENDMARKER is omitted.
    """
    readline = StringIO(s).readline
    for tok_type, tok_text, start, end, _line in generate_tokens(readline):
        if tok_type == ENDMARKER:
            break
        # Pass the values explicitly rather than through ``% locals()``: the
        # format string no longer depends on local variable names, and the
        # builtin ``type`` is not shadowed.
        print("%-10.10s %-13.13r %s %s"
              % (tok_name[tok_type], tok_text, start, end))
548
549 # This is an example from the docs, set up as a doctest.
def decistmt(s):
    """Substitute Decimals for floats in a string of statements.

    The source string *s* is tokenized; every NUMBER token whose text
    contains a '.' is replaced by the four tokens ``Decimal ( '<text>' )``,
    and all other tokens pass through unchanged.  The rewritten token
    stream is turned back into source text with untokenize() and returned.

    >>> from decimal import Decimal
    >>> s = 'print +21.3e-5*-.1234/81.7'
    >>> decistmt(s)
    "print +Decimal ('21.3e-5')*-Decimal ('.1234')/Decimal ('81.7')"

    The format of the exponent is inherited from the platform C library.
    Known cases are "e-007" (Windows) and "e-07" (not Windows).  Since
    we're only showing 12 digits, and the 13th isn't close to 5, the
    rest of the output should be platform-independent.

    >>> exec(s) #doctest: +ELLIPSIS
    -3.21716034272e-0...7

    Output from calculations with Decimal should be identical across all
    platforms.

    >>> exec(decistmt(s))
    -3.217160342717258261933904529E-7
    """
    result = []
    for token in generate_tokens(StringIO(s).readline):
        # Only the type and text matter; positions are discarded, so
        # untokenize() receives 2-tuples and chooses the spacing itself.
        toknum, tokval = token[:2]
        if toknum == NUMBER and '.' in tokval:
            # Rewrite the float literal as a call: Decimal('<literal>').
            result.extend([
                (NAME, 'Decimal'),
                (OP, '('),
                (STRING, repr(tokval)),
                (OP, ')'),
            ])
        else:
            result.append((toknum, tokval))
    return untokenize(result)
586
587
# doctest consults ``__test__`` for additional docstrings to run: the
# module-level ``doctests`` string and the docstring of ``decistmt``.
__test__ = {"doctests" : doctests, 'decistmt': decistmt}
589
590
def test_main():
    """Run the doctests of this module through test_support.run_doctest.

    The module is imported by its package name (``test.test_tokenize``) and
    handed to run_doctest; the second argument (True) is passed as that
    helper's verbosity argument.
    """
    from test import test_tokenize
    test_support.run_doctest(test_tokenize, True)
594
# Allow running this test file directly as a script.
if __name__ == "__main__":
    test_main()