import parser
import unittest
import sys
import operator
from test import support

#
#  First, we test that we can generate trees from valid source fragments,
#  and that these valid trees are indeed allowed by the tree-loading side
#  of the parser module.
#

class RoundtripLegalSyntaxTestCase(unittest.TestCase):
14

15 16 17 18
    def roundtrip(self, f, s):
        st1 = f(s)
        t = st1.totuple()
        try:
19
            st2 = parser.sequence2st(t)
20
        except parser.ParserError as why:
21
            self.fail("could not roundtrip %r: %s" % (s, why))
22 23 24 25 26 27 28

        self.assertEquals(t, st2.totuple(),
                          "could not re-generate syntax tree")

    def check_expr(self, s):
        self.roundtrip(parser.expr, s)

29 30 31 32 33 34 35
    def test_flags_passed(self):
        # The unicode literals flags has to be passed from the paser to AST
        # generation.
        suite = parser.suite("from __future__ import unicode_literals; x = ''")
        code = suite.compile()
        scope = {}
        exec(code, {}, scope)
36
        self.assertIsInstance(scope["x"], str)
37

38 39 40
    def check_suite(self, s):
        self.roundtrip(parser.suite, s)

41
    def test_yield_statement(self):
42
        self.check_suite("def f(): yield 1")
43 44 45 46 47 48 49 50
        self.check_suite("def f(): yield")
        self.check_suite("def f(): x += yield")
        self.check_suite("def f(): x = yield 1")
        self.check_suite("def f(): x = y = yield 1")
        self.check_suite("def f(): x = yield")
        self.check_suite("def f(): x = y = yield")
        self.check_suite("def f(): 1 + (yield)*2")
        self.check_suite("def f(): (yield 1)*2")
51 52 53
        self.check_suite("def f(): return; yield 1")
        self.check_suite("def f(): yield 1; return")
        self.check_suite("def f():\n"
54 55
                         "    for x in range(30):\n"
                         "        yield x\n")
56 57 58
        self.check_suite("def f():\n"
                         "    if (yield):\n"
                         "        yield x\n")
59

60 61 62 63 64
    def test_expressions(self):
        self.check_expr("foo(1)")
        self.check_expr("[1, 2, 3]")
        self.check_expr("[x**3 for x in range(20)]")
        self.check_expr("[x**3 for x in range(20) if x % 3]")
65 66 67 68
        self.check_expr("[x**3 for x in range(20) if x % 2 if x % 3]")
        self.check_expr("list(x**3 for x in range(20))")
        self.check_expr("list(x**3 for x in range(20) if x % 3)")
        self.check_expr("list(x**3 for x in range(20) if x % 2 if x % 3)")
69 70 71 72 73 74 75 76 77 78
        self.check_expr("foo(*args)")
        self.check_expr("foo(*args, **kw)")
        self.check_expr("foo(**kw)")
        self.check_expr("foo(key=value)")
        self.check_expr("foo(key=value, *args)")
        self.check_expr("foo(key=value, *args, **kw)")
        self.check_expr("foo(key=value, **kw)")
        self.check_expr("foo(a, b, c, *args)")
        self.check_expr("foo(a, b, c, *args, **kw)")
        self.check_expr("foo(a, b, c, **kw)")
79
        self.check_expr("foo(a, *args, keyword=23)")
80
        self.check_expr("foo + bar")
81 82 83 84
        self.check_expr("foo - bar")
        self.check_expr("foo * bar")
        self.check_expr("foo / bar")
        self.check_expr("foo // bar")
85 86 87 88 89 90 91 92 93 94 95 96
        self.check_expr("lambda: 0")
        self.check_expr("lambda x: 0")
        self.check_expr("lambda *y: 0")
        self.check_expr("lambda *y, **z: 0")
        self.check_expr("lambda **z: 0")
        self.check_expr("lambda x, y: 0")
        self.check_expr("lambda foo=bar: 0")
        self.check_expr("lambda foo=bar, spaz=nifty+spit: 0")
        self.check_expr("lambda foo=bar, **z: 0")
        self.check_expr("lambda foo=bar, blaz=blat+2, **z: 0")
        self.check_expr("lambda foo=bar, blaz=blat+2, *y, **z: 0")
        self.check_expr("lambda x, *y, **z: 0")
97 98
        self.check_expr("(x for x in range(10))")
        self.check_expr("foo(x for x in range(10))")
99 100 101 102 103 104 105 106 107 108 109 110 111 112

    def test_simple_expression(self):
        # expr_stmt
        self.check_suite("a")

    def test_simple_assignments(self):
        self.check_suite("a = b")
        self.check_suite("a = b = c = d = e")

    def test_simple_augmented_assignments(self):
        self.check_suite("a += b")
        self.check_suite("a -= b")
        self.check_suite("a *= b")
        self.check_suite("a /= b")
113
        self.check_suite("a //= b")
114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140
        self.check_suite("a %= b")
        self.check_suite("a &= b")
        self.check_suite("a |= b")
        self.check_suite("a ^= b")
        self.check_suite("a <<= b")
        self.check_suite("a >>= b")
        self.check_suite("a **= b")

    def test_function_defs(self):
        self.check_suite("def f(): pass")
        self.check_suite("def f(*args): pass")
        self.check_suite("def f(*args, **kw): pass")
        self.check_suite("def f(**kw): pass")
        self.check_suite("def f(foo=bar): pass")
        self.check_suite("def f(foo=bar, *args): pass")
        self.check_suite("def f(foo=bar, *args, **kw): pass")
        self.check_suite("def f(foo=bar, **kw): pass")

        self.check_suite("def f(a, b): pass")
        self.check_suite("def f(a, b, *args): pass")
        self.check_suite("def f(a, b, *args, **kw): pass")
        self.check_suite("def f(a, b, **kw): pass")
        self.check_suite("def f(a, b, foo=bar): pass")
        self.check_suite("def f(a, b, foo=bar, *args): pass")
        self.check_suite("def f(a, b, foo=bar, *args, **kw): pass")
        self.check_suite("def f(a, b, foo=bar, **kw): pass")

141 142 143 144 145 146 147 148
        self.check_suite("@staticmethod\n"
                         "def f(): pass")
        self.check_suite("@staticmethod\n"
                         "@funcattrs(x, y)\n"
                         "def f(): pass")
        self.check_suite("@funcattrs()\n"
                         "def f(): pass")

149 150
    def test_class_defs(self):
        self.check_suite("class foo():pass")
151
        self.check_suite("class foo(object):pass")
152 153 154 155 156 157 158
        self.check_suite("@class_decorator\n"
                         "class foo():pass")
        self.check_suite("@class_decorator(arg)\n"
                         "class foo():pass")
        self.check_suite("@decorator1\n"
                         "@decorator2\n"
                         "class foo():pass")
Tim Peters's avatar
Tim Peters committed
159

160 161 162
    def test_import_from_statement(self):
        self.check_suite("from sys.path import *")
        self.check_suite("from sys.path import dirname")
163 164
        self.check_suite("from sys.path import (dirname)")
        self.check_suite("from sys.path import (dirname,)")
165
        self.check_suite("from sys.path import dirname as my_dirname")
166 167
        self.check_suite("from sys.path import (dirname as my_dirname)")
        self.check_suite("from sys.path import (dirname as my_dirname,)")
168
        self.check_suite("from sys.path import dirname, basename")
169 170
        self.check_suite("from sys.path import (dirname, basename)")
        self.check_suite("from sys.path import (dirname, basename,)")
171 172
        self.check_suite(
            "from sys.path import dirname as my_dirname, basename")
173 174 175 176
        self.check_suite(
            "from sys.path import (dirname as my_dirname, basename)")
        self.check_suite(
            "from sys.path import (dirname as my_dirname, basename,)")
177 178
        self.check_suite(
            "from sys.path import dirname, basename as my_basename")
179 180 181 182
        self.check_suite(
            "from sys.path import (dirname, basename as my_basename)")
        self.check_suite(
            "from sys.path import (dirname, basename as my_basename,)")
183
        self.check_suite("from .bogus import x")
184 185 186 187 188 189 190

    def test_basic_import_statement(self):
        self.check_suite("import sys")
        self.check_suite("import sys as system")
        self.check_suite("import sys, math")
        self.check_suite("import sys as system, math")
        self.check_suite("import sys, math as my_math")
191

192 193 194
    def test_relative_imports(self):
        self.check_suite("from . import name")
        self.check_suite("from .. import name")
195 196 197 198
        # check all the way up to '....', since '...' is tokenized
        # differently from '.' (it's an ellipsis token).
        self.check_suite("from ... import name")
        self.check_suite("from .... import name")
199 200
        self.check_suite("from .pkg import name")
        self.check_suite("from ..pkg import name")
201 202
        self.check_suite("from ...pkg import name")
        self.check_suite("from ....pkg import name")
203

204 205 206 207 208 209 210
    def test_pep263(self):
        self.check_suite("# -*- coding: iso-8859-1 -*-\n"
                         "pass\n")

    def test_assert(self):
        self.check_suite("assert alo < ahi and blo < bhi\n")

Benjamin Peterson's avatar
Benjamin Peterson committed
211 212 213
    def test_with(self):
        self.check_suite("with open('x'): pass\n")
        self.check_suite("with open('x') as f: pass\n")
214
        self.check_suite("with open('x') as f, open('y') as g: pass\n")
Benjamin Peterson's avatar
Benjamin Peterson committed
215

216 217 218 219 220 221 222 223 224 225
    def test_try_stmt(self):
        self.check_suite("try: pass\nexcept: pass\n")
        self.check_suite("try: pass\nfinally: pass\n")
        self.check_suite("try: pass\nexcept A: pass\nfinally: pass\n")
        self.check_suite("try: pass\nexcept A: pass\nexcept: pass\n"
                         "finally: pass\n")
        self.check_suite("try: pass\nexcept: pass\nelse: pass\n")
        self.check_suite("try: pass\nexcept: pass\nelse: pass\n"
                         "finally: pass\n")

226 227 228
    def test_position(self):
        # An absolutely minimal test of position information.  Better
        # tests would be a big project.
229
        code = "def f(x):\n    return x + 1"
230 231 232 233 234 235 236 237 238 239 240 241 242 243 244 245 246 247 248 249 250 251 252 253 254 255 256 257
        st1 = parser.suite(code)
        st2 = st1.totuple(line_info=1, col_info=1)

        def walk(tree):
            node_type = tree[0]
            next = tree[1]
            if isinstance(next, tuple):
                for elt in tree[1:]:
                    for x in walk(elt):
                        yield x
            else:
                yield tree

        terminals = list(walk(st2))
        self.assertEqual([
            (1, 'def', 1, 0),
            (1, 'f', 1, 4),
            (7, '(', 1, 5),
            (1, 'x', 1, 6),
            (8, ')', 1, 7),
            (11, ':', 1, 8),
            (4, '', 1, 9),
            (5, '', 2, -1),
            (1, 'return', 2, 4),
            (1, 'x', 2, 11),
            (14, '+', 2, 13),
            (2, '1', 2, 15),
            (4, '', 2, 16),
258 259 260
            (6, '', 2, -1),
            (4, '', 2, -1),
            (0, '', 2, -1)],
261 262
                         terminals)

263 264 265 266 267 268
    def test_extended_unpacking(self):
        self.check_suite("*a = y")
        self.check_suite("x, *b, = m")
        self.check_suite("[*a, *b] = y")
        self.check_suite("for [*x, b] in x: pass")


#
#  Second, we take *invalid* trees and make sure we get ParserError
#  rejections for them.
#

class IllegalSyntaxTestCase(unittest.TestCase):
276

277 278
    def check_bad_tree(self, tree, label):
        try:
279
            parser.sequence2st(tree)
280 281 282 283 284 285 286 287 288
        except parser.ParserError:
            pass
        else:
            self.fail("did not detect invalid tree for %r" % label)

    def test_junk(self):
        # not even remotely valid:
        self.check_bad_tree((1, 2, 3), "<junk>")

289
    def test_illegal_yield_1(self):
290
        # Illegal yield statement: def f(): return 1; yield 1
291 292 293 294 295 296 297 298 299 300 301 302 303 304 305 306 307 308 309 310 311 312 313 314 315 316 317 318 319 320 321 322 323 324 325 326 327 328 329 330 331 332 333 334 335 336 337 338 339 340 341 342 343 344
        tree = \
        (257,
         (264,
          (285,
           (259,
            (1, 'def'),
            (1, 'f'),
            (260, (7, '('), (8, ')')),
            (11, ':'),
            (291,
             (4, ''),
             (5, ''),
             (264,
              (265,
               (266,
                (272,
                 (275,
                  (1, 'return'),
                  (313,
                   (292,
                    (293,
                     (294,
                      (295,
                       (297,
                        (298,
                         (299,
                          (300,
                           (301,
                            (302, (303, (304, (305, (2, '1')))))))))))))))))),
               (264,
                (265,
                 (266,
                  (272,
                   (276,
                    (1, 'yield'),
                    (313,
                     (292,
                      (293,
                       (294,
                        (295,
                         (297,
                          (298,
                           (299,
                            (300,
                             (301,
                              (302,
                               (303, (304, (305, (2, '1')))))))))))))))))),
                 (4, ''))),
               (6, ''))))),
           (4, ''),
           (0, ''))))
        self.check_bad_tree(tree, "def f():\n  return 1\n  yield 1")

    def test_illegal_yield_2(self):
345
        # Illegal return in generator: def f(): return 1; yield 1
346 347 348 349 350 351 352 353 354 355 356 357 358 359 360 361 362 363 364 365 366 367 368 369 370 371 372 373 374 375 376 377 378 379 380 381 382 383 384 385 386 387 388 389 390 391 392 393 394 395 396 397 398 399 400 401 402 403 404 405 406 407
        tree = \
        (257,
         (264,
          (265,
           (266,
            (278,
             (1, 'from'),
             (281, (1, '__future__')),
             (1, 'import'),
             (279, (1, 'generators')))),
           (4, ''))),
         (264,
          (285,
           (259,
            (1, 'def'),
            (1, 'f'),
            (260, (7, '('), (8, ')')),
            (11, ':'),
            (291,
             (4, ''),
             (5, ''),
             (264,
              (265,
               (266,
                (272,
                 (275,
                  (1, 'return'),
                  (313,
                   (292,
                    (293,
                     (294,
                      (295,
                       (297,
                        (298,
                         (299,
                          (300,
                           (301,
                            (302, (303, (304, (305, (2, '1')))))))))))))))))),
               (264,
                (265,
                 (266,
                  (272,
                   (276,
                    (1, 'yield'),
                    (313,
                     (292,
                      (293,
                       (294,
                        (295,
                         (297,
                          (298,
                           (299,
                            (300,
                             (301,
                              (302,
                               (303, (304, (305, (2, '1')))))))))))))))))),
                 (4, ''))),
               (6, ''))))),
           (4, ''),
           (0, ''))))
        self.check_bad_tree(tree, "def f():\n  return 1\n  yield 1")

408
    def test_a_comma_comma_c(self):
409
        # Illegal input: a,,c
410 411 412 413 414 415 416 417 418 419 420 421 422 423 424 425 426 427 428 429 430 431 432 433 434 435
        tree = \
        (258,
         (311,
          (290,
           (291,
            (292,
             (293,
              (295,
               (296,
                (297,
                 (298, (299, (300, (301, (302, (303, (1, 'a')))))))))))))),
          (12, ','),
          (12, ','),
          (290,
           (291,
            (292,
             (293,
              (295,
               (296,
                (297,
                 (298, (299, (300, (301, (302, (303, (1, 'c'))))))))))))))),
         (4, ''),
         (0, ''))
        self.check_bad_tree(tree, "a,,c")

    def test_illegal_operator(self):
436
        # Illegal input: a $= b
437 438 439 440 441 442 443 444 445 446 447 448 449 450 451 452 453 454 455 456 457 458 459 460 461 462 463 464 465 466 467
        tree = \
        (257,
         (264,
          (265,
           (266,
            (267,
             (312,
              (291,
               (292,
                (293,
                 (294,
                  (296,
                   (297,
                    (298,
                     (299,
                      (300, (301, (302, (303, (304, (1, 'a'))))))))))))))),
             (268, (37, '$=')),
             (312,
              (291,
               (292,
                (293,
                 (294,
                  (296,
                   (297,
                    (298,
                     (299,
                      (300, (301, (302, (303, (304, (1, 'b'))))))))))))))))),
           (4, ''))),
         (0, ''))
        self.check_bad_tree(tree, "a $= b")

468 469 470 471 472 473 474 475
    def test_malformed_global(self):
        #doesn't have global keyword in ast
        tree = (257,
                (264,
                 (265,
                  (266,
                   (282, (1, 'foo'))), (4, ''))),
                (4, ''),
Tim Peters's avatar
Tim Peters committed
476
                (0, ''))
477
        self.check_bad_tree(tree, "malformed global ast")
478

479
    def test_missing_import_source(self):
480
        # from import fred
481 482
        tree = \
            (257,
483 484 485 486 487 488
             (268,
              (269,
               (270,
                (282,
                 (284, (1, 'from'), (1, 'import'),
                  (287, (285, (1, 'fred')))))),
489 490
               (4, ''))),
             (4, ''), (0, ''))
491
        self.check_bad_tree(tree, "from import fred")
492

Jeremy Hylton's avatar
Jeremy Hylton committed
493 494 495 496 497 498 499 500 501 502 503 504 505 506

class CompileTestCase(unittest.TestCase):

    # These tests are very minimal. :-(

    def test_compile_expr(self):
        st = parser.expr('2 + 3')
        code = parser.compilest(st)
        self.assertEquals(eval(code), 5)

    def test_compile_suite(self):
        st = parser.suite('x = 2; y = x + 3')
        code = parser.compilest(st)
        globs = {}
507
        exec(code, globs)
Jeremy Hylton's avatar
Jeremy Hylton committed
508 509 510 511 512 513
        self.assertEquals(globs['y'], 5)

    def test_compile_error(self):
        st = parser.suite('1 = 3 + 4')
        self.assertRaises(SyntaxError, parser.compilest, st)

514
    def test_compile_badunicode(self):
515
        st = parser.suite('a = "\\U12345678"')
516
        self.assertRaises(SyntaxError, parser.compilest, st)
517
        st = parser.suite('a = "\\u1"')
518 519
        self.assertRaises(SyntaxError, parser.compilest, st)

520 521 522 523 524 525 526 527 528 529
    def test_issue_9011(self):
        # Issue 9011: compilation of an unary minus expression changed
        # the meaning of the ST, so that a second compilation produced
        # incorrect results.
        st = parser.expr('-3')
        code1 = parser.compilest(st)
        self.assertEqual(eval(code1), -3)
        code2 = parser.compilest(st)
        self.assertEqual(eval(code2), -3)

Christian Heimes's avatar
Christian Heimes committed
530
class ParserStackLimitTestCase(unittest.TestCase):
531
    """try to push the parser to/over its limits.
Christian Heimes's avatar
Christian Heimes committed
532 533 534 535 536 537 538 539 540 541 542 543 544
    see http://bugs.python.org/issue1881 for a discussion
    """
    def _nested_expression(self, level):
        return "["*level+"]"*level

    def test_deeply_nested_list(self):
        # XXX used to be 99 levels in 2.x
        e = self._nested_expression(93)
        st = parser.expr(e)
        st.compile()

    def test_trigger_memory_error(self):
        e = self._nested_expression(100)
Christian Heimes's avatar
Christian Heimes committed
545 546
        print("Expecting 's_push: parser stack overflow' in next line",
              file=sys.stderr)
547
        sys.stderr.flush()
Christian Heimes's avatar
Christian Heimes committed
548 549
        self.assertRaises(MemoryError, parser.expr, e)

550 551 552 553 554 555 556 557 558 559 560 561 562 563 564 565 566 567 568 569 570 571 572 573 574 575 576 577 578 579 580 581 582 583 584 585 586 587 588 589 590 591 592 593 594 595 596
class STObjectTestCase(unittest.TestCase):
    """Test operations on ST objects themselves"""

    def test_comparisons(self):
        # ST objects should support order and equality comparisons
        st1 = parser.expr('2 + 3')
        st2 = parser.suite('x = 2; y = x + 3')
        st3 = parser.expr('list(x**3 for x in range(20))')
        st1_copy = parser.expr('2 + 3')
        st2_copy = parser.suite('x = 2; y = x + 3')
        st3_copy = parser.expr('list(x**3 for x in range(20))')

        # exercise fast path for object identity
        self.assertEquals(st1 == st1, True)
        self.assertEquals(st2 == st2, True)
        self.assertEquals(st3 == st3, True)
        # slow path equality
        self.assertEqual(st1, st1_copy)
        self.assertEqual(st2, st2_copy)
        self.assertEqual(st3, st3_copy)
        self.assertEquals(st1 == st2, False)
        self.assertEquals(st1 == st3, False)
        self.assertEquals(st2 == st3, False)
        self.assertEquals(st1 != st1, False)
        self.assertEquals(st2 != st2, False)
        self.assertEquals(st3 != st3, False)
        self.assertEquals(st1 != st1_copy, False)
        self.assertEquals(st2 != st2_copy, False)
        self.assertEquals(st3 != st3_copy, False)
        self.assertEquals(st2 != st1, True)
        self.assertEquals(st1 != st3, True)
        self.assertEquals(st3 != st2, True)
        # we don't particularly care what the ordering is;  just that
        # it's usable and self-consistent
        self.assertEquals(st1 < st2, not (st2 <= st1))
        self.assertEquals(st1 < st3, not (st3 <= st1))
        self.assertEquals(st2 < st3, not (st3 <= st2))
        self.assertEquals(st1 < st2, st2 > st1)
        self.assertEquals(st1 < st3, st3 > st1)
        self.assertEquals(st2 < st3, st3 > st2)
        self.assertEquals(st1 <= st2, st2 >= st1)
        self.assertEquals(st3 <= st1, st1 >= st3)
        self.assertEquals(st2 <= st3, st3 >= st2)
        # transitivity
        bottom = min(st1, st2, st3)
        top = max(st1, st2, st3)
        mid = sorted([st1, st2, st3])[1]
597 598 599 600 601 602 603 604 605
        self.assertTrue(bottom < mid)
        self.assertTrue(bottom < top)
        self.assertTrue(mid < top)
        self.assertTrue(bottom <= mid)
        self.assertTrue(bottom <= top)
        self.assertTrue(mid <= top)
        self.assertTrue(bottom <= bottom)
        self.assertTrue(mid <= mid)
        self.assertTrue(top <= top)
606 607 608 609 610 611 612 613 614 615 616 617
        # interaction with other types
        self.assertEquals(st1 == 1588.602459, False)
        self.assertEquals('spanish armada' != st2, True)
        self.assertRaises(TypeError, operator.ge, st3, None)
        self.assertRaises(TypeError, operator.le, False, st1)
        self.assertRaises(TypeError, operator.lt, st1, 1815)
        self.assertRaises(TypeError, operator.gt, b'waterloo', st2)


    # XXX tests for pickling and unpickling of ST objects should go here


618
def test_main():
    """Run every test case class in this module through test.support."""
    support.run_unittest(
        RoundtripLegalSyntaxTestCase,
        IllegalSyntaxTestCase,
        CompileTestCase,
        ParserStackLimitTestCase,
        STObjectTestCase,
    )


# Run the whole suite when this file is executed directly as a script.
if __name__ == "__main__":
    test_main()