annotate python/testpyy.py @ 192:6cd6260789a1

Added more tests for parser generator
author Windel Bouwman
date Sun, 26 May 2013 23:19:27 +0200
parents 6b2bec5653f1
children b01429a5d695
rev   line source
184
fe2b72381a83 Added testset for pyy
Windel Bouwman
parents:
diff changeset
1 import unittest, pprint
192
6cd6260789a1 Added more tests for parser generator
Windel Bouwman
parents: 191
diff changeset
2 from pyyacc import Grammar, Item, EOF, ParserGenerationException
191
6b2bec5653f1 Added assembler testset
Windel Bouwman
parents: 185
diff changeset
3 from ppci import Token
184
fe2b72381a83 Added testset for pyy
Windel Bouwman
parents:
diff changeset
4
191
6b2bec5653f1 Added assembler testset
Windel Bouwman
parents: 185
diff changeset
5 def genTokens(lst):
6b2bec5653f1 Added assembler testset
Windel Bouwman
parents: 185
diff changeset
6 for t in lst:
6b2bec5653f1 Added assembler testset
Windel Bouwman
parents: 185
diff changeset
7 yield Token(t, t, 0)
184
fe2b72381a83 Added testset for pyy
Windel Bouwman
parents:
diff changeset
8
fe2b72381a83 Added testset for pyy
Windel Bouwman
parents:
diff changeset
9 class testLR(unittest.TestCase):
fe2b72381a83 Added testset for pyy
Windel Bouwman
parents:
diff changeset
10 def setUp(self):
fe2b72381a83 Added testset for pyy
Windel Bouwman
parents:
diff changeset
11 pass
fe2b72381a83 Added testset for pyy
Windel Bouwman
parents:
diff changeset
12
fe2b72381a83 Added testset for pyy
Windel Bouwman
parents:
diff changeset
13 def testSimpleGrammar(self):
fe2b72381a83 Added testset for pyy
Windel Bouwman
parents:
diff changeset
14 # 1. define a simple grammar:
fe2b72381a83 Added testset for pyy
Windel Bouwman
parents:
diff changeset
15 g = Grammar(['EOF', 'identifier', '(', ')', '+', '*'])
fe2b72381a83 Added testset for pyy
Windel Bouwman
parents:
diff changeset
16 g.add_production('input', ['expression'])
fe2b72381a83 Added testset for pyy
Windel Bouwman
parents:
diff changeset
17 g.add_production('expression', ['term'])
fe2b72381a83 Added testset for pyy
Windel Bouwman
parents:
diff changeset
18 g.add_production('expression', ['expression', '+', 'term'])
fe2b72381a83 Added testset for pyy
Windel Bouwman
parents:
diff changeset
19 g.add_production('term', ['factor'])
fe2b72381a83 Added testset for pyy
Windel Bouwman
parents:
diff changeset
20 g.add_production('term', ['term', '*', 'factor'])
fe2b72381a83 Added testset for pyy
Windel Bouwman
parents:
diff changeset
21 g.add_production('factor', ['(', 'expression', ')'])
fe2b72381a83 Added testset for pyy
Windel Bouwman
parents:
diff changeset
22 g.add_production('factor', ['identifier'])
fe2b72381a83 Added testset for pyy
Windel Bouwman
parents:
diff changeset
23 g.start_symbol = 'input'
fe2b72381a83 Added testset for pyy
Windel Bouwman
parents:
diff changeset
24 # 2. define input:
191
6b2bec5653f1 Added assembler testset
Windel Bouwman
parents: 185
diff changeset
25 tokens = genTokens(['identifier', '+', 'identifier', '+', 'identifier'])
184
fe2b72381a83 Added testset for pyy
Windel Bouwman
parents:
diff changeset
26 # 3. build parser:
fe2b72381a83 Added testset for pyy
Windel Bouwman
parents:
diff changeset
27 p = g.genParser()
fe2b72381a83 Added testset for pyy
Windel Bouwman
parents:
diff changeset
28 # 4. feed input:
fe2b72381a83 Added testset for pyy
Windel Bouwman
parents:
diff changeset
29 p.parse(tokens)
192
6cd6260789a1 Added more tests for parser generator
Windel Bouwman
parents: 191
diff changeset
30 def testReduceReduceConflict(self):
6cd6260789a1 Added more tests for parser generator
Windel Bouwman
parents: 191
diff changeset
31 """ Check if a reduce-reduce conflict is detected """
6cd6260789a1 Added more tests for parser generator
Windel Bouwman
parents: 191
diff changeset
32 # Define a grammar with an obvious reduce-reduce conflict:
6cd6260789a1 Added more tests for parser generator
Windel Bouwman
parents: 191
diff changeset
33 g = Grammar([EOF, 'id'])
6cd6260789a1 Added more tests for parser generator
Windel Bouwman
parents: 191
diff changeset
34 g.add_production('goal', ['a'])
6cd6260789a1 Added more tests for parser generator
Windel Bouwman
parents: 191
diff changeset
35 g.add_production('a', ['b'])
6cd6260789a1 Added more tests for parser generator
Windel Bouwman
parents: 191
diff changeset
36 g.add_production('a', ['c'])
6cd6260789a1 Added more tests for parser generator
Windel Bouwman
parents: 191
diff changeset
37 g.add_production('b', ['id'])
6cd6260789a1 Added more tests for parser generator
Windel Bouwman
parents: 191
diff changeset
38 g.add_production('c', ['id'])
6cd6260789a1 Added more tests for parser generator
Windel Bouwman
parents: 191
diff changeset
39 g.start_symbol = 'goal'
6cd6260789a1 Added more tests for parser generator
Windel Bouwman
parents: 191
diff changeset
40 with self.assertRaises(ParserGenerationException):
6cd6260789a1 Added more tests for parser generator
Windel Bouwman
parents: 191
diff changeset
41 p = g.genParser()
6cd6260789a1 Added more tests for parser generator
Windel Bouwman
parents: 191
diff changeset
42 def testShiftReduceConflict(self):
6cd6260789a1 Added more tests for parser generator
Windel Bouwman
parents: 191
diff changeset
43 g = Grammar([EOF, 'if', 'then', 'else'])
6cd6260789a1 Added more tests for parser generator
Windel Bouwman
parents: 191
diff changeset
44 g.add_production('if_stmt', ['if', 'then'])
6cd6260789a1 Added more tests for parser generator
Windel Bouwman
parents: 191
diff changeset
45 g.add_production('if_stmt', ['if', 'then', 'else'])
6cd6260789a1 Added more tests for parser generator
Windel Bouwman
parents: 191
diff changeset
46 g.add_production('stmt', ['if_stmt', 'else'])
6cd6260789a1 Added more tests for parser generator
Windel Bouwman
parents: 191
diff changeset
47 g.start_symbol = 'stmt'
6cd6260789a1 Added more tests for parser generator
Windel Bouwman
parents: 191
diff changeset
48 with self.assertRaises(ParserGenerationException):
6cd6260789a1 Added more tests for parser generator
Windel Bouwman
parents: 191
diff changeset
49 g.genParser()
6cd6260789a1 Added more tests for parser generator
Windel Bouwman
parents: 191
diff changeset
50 def testUndefinedTerminal(self):
6cd6260789a1 Added more tests for parser generator
Windel Bouwman
parents: 191
diff changeset
51 """ Test correct behavior when a terminal is undefined """
6cd6260789a1 Added more tests for parser generator
Windel Bouwman
parents: 191
diff changeset
52 g = Grammar([EOF, 'b'])
6cd6260789a1 Added more tests for parser generator
Windel Bouwman
parents: 191
diff changeset
53 g.add_production('goal', ['a'])
6cd6260789a1 Added more tests for parser generator
Windel Bouwman
parents: 191
diff changeset
54 g.add_production('a', ['b'])
6cd6260789a1 Added more tests for parser generator
Windel Bouwman
parents: 191
diff changeset
55 g.add_production('a', ['c'])
6cd6260789a1 Added more tests for parser generator
Windel Bouwman
parents: 191
diff changeset
56 g.start_symbol = 'goal'
6cd6260789a1 Added more tests for parser generator
Windel Bouwman
parents: 191
diff changeset
57 with self.assertRaises(ParserGenerationException):
6cd6260789a1 Added more tests for parser generator
Windel Bouwman
parents: 191
diff changeset
58 g.genParser()
6cd6260789a1 Added more tests for parser generator
Windel Bouwman
parents: 191
diff changeset
59 def testRedefineTerminal(self):
6cd6260789a1 Added more tests for parser generator
Windel Bouwman
parents: 191
diff changeset
60 """ Test correct behavior when a terminal is redefined """
6cd6260789a1 Added more tests for parser generator
Windel Bouwman
parents: 191
diff changeset
61 g = Grammar([EOF, 'b', 'c'])
6cd6260789a1 Added more tests for parser generator
Windel Bouwman
parents: 191
diff changeset
62 g.add_production('goal', ['a'])
6cd6260789a1 Added more tests for parser generator
Windel Bouwman
parents: 191
diff changeset
63 with self.assertRaises(ParserGenerationException):
6cd6260789a1 Added more tests for parser generator
Windel Bouwman
parents: 191
diff changeset
64 g.add_production('b', ['c']) # Not allowed
6cd6260789a1 Added more tests for parser generator
Windel Bouwman
parents: 191
diff changeset
65 g.add_production('a', ['c'])
6cd6260789a1 Added more tests for parser generator
Windel Bouwman
parents: 191
diff changeset
66 g.start_symbol = 'goal'
6cd6260789a1 Added more tests for parser generator
Windel Bouwman
parents: 191
diff changeset
67 g.genParser()
184
fe2b72381a83 Added testset for pyy
Windel Bouwman
parents:
diff changeset
68
185
51a6440d6398 Fixed LR(1) parser
Windel Bouwman
parents: 184
diff changeset
69 class testExpressionGrammar(unittest.TestCase):
51a6440d6398 Fixed LR(1) parser
Windel Bouwman
parents: 184
diff changeset
70 def setUp(self):
51a6440d6398 Fixed LR(1) parser
Windel Bouwman
parents: 184
diff changeset
71 g = Grammar(['EOF', 'identifier', '(', ')', '+', '*', 'num'])
51a6440d6398 Fixed LR(1) parser
Windel Bouwman
parents: 184
diff changeset
72 g.add_production('input', ['expression'])
51a6440d6398 Fixed LR(1) parser
Windel Bouwman
parents: 184
diff changeset
73 g.add_production('expression', ['term'])
51a6440d6398 Fixed LR(1) parser
Windel Bouwman
parents: 184
diff changeset
74 g.add_production('expression', ['expression', '+', 'term'])
51a6440d6398 Fixed LR(1) parser
Windel Bouwman
parents: 184
diff changeset
75 g.add_production('term', ['factor'])
51a6440d6398 Fixed LR(1) parser
Windel Bouwman
parents: 184
diff changeset
76 g.add_production('term', ['term', '*', 'factor'])
51a6440d6398 Fixed LR(1) parser
Windel Bouwman
parents: 184
diff changeset
77 g.add_production('factor', ['(', 'expression', ')'])
51a6440d6398 Fixed LR(1) parser
Windel Bouwman
parents: 184
diff changeset
78 g.add_production('factor', ['identifier'])
51a6440d6398 Fixed LR(1) parser
Windel Bouwman
parents: 184
diff changeset
79 g.add_production('factor', ['num'])
51a6440d6398 Fixed LR(1) parser
Windel Bouwman
parents: 184
diff changeset
80 g.start_symbol = 'input'
51a6440d6398 Fixed LR(1) parser
Windel Bouwman
parents: 184
diff changeset
81 self.g = g
51a6440d6398 Fixed LR(1) parser
Windel Bouwman
parents: 184
diff changeset
82
51a6440d6398 Fixed LR(1) parser
Windel Bouwman
parents: 184
diff changeset
83 def testFirstSimpleGrammar(self):
51a6440d6398 Fixed LR(1) parser
Windel Bouwman
parents: 184
diff changeset
84 # 1. define a simple grammar:
51a6440d6398 Fixed LR(1) parser
Windel Bouwman
parents: 184
diff changeset
85 first = self.g.calcFirstSets()
51a6440d6398 Fixed LR(1) parser
Windel Bouwman
parents: 184
diff changeset
86 self.assertEqual(first['input'], {'identifier', '(', 'num'})
51a6440d6398 Fixed LR(1) parser
Windel Bouwman
parents: 184
diff changeset
87 self.assertEqual(first['term'], {'identifier', '(', 'num'})
51a6440d6398 Fixed LR(1) parser
Windel Bouwman
parents: 184
diff changeset
88
51a6440d6398 Fixed LR(1) parser
Windel Bouwman
parents: 184
diff changeset
89 def testCanonical(self):
51a6440d6398 Fixed LR(1) parser
Windel Bouwman
parents: 184
diff changeset
90 s0 = self.g.initialItemSet()
51a6440d6398 Fixed LR(1) parser
Windel Bouwman
parents: 184
diff changeset
91 s, gt = self.g.genCanonicalSet(s0)
51a6440d6398 Fixed LR(1) parser
Windel Bouwman
parents: 184
diff changeset
92 # Must result in 12 sets:
51a6440d6398 Fixed LR(1) parser
Windel Bouwman
parents: 184
diff changeset
93 self.assertEqual(len(s), 24)
51a6440d6398 Fixed LR(1) parser
Windel Bouwman
parents: 184
diff changeset
94
184
fe2b72381a83 Added testset for pyy
Windel Bouwman
parents:
diff changeset
95 class testPG(unittest.TestCase):
fe2b72381a83 Added testset for pyy
Windel Bouwman
parents:
diff changeset
96 """ Tests several parts of the parser generator """
fe2b72381a83 Added testset for pyy
Windel Bouwman
parents:
diff changeset
97 def setUp(self):
fe2b72381a83 Added testset for pyy
Windel Bouwman
parents:
diff changeset
98 g = Grammar(['(', ')'])
fe2b72381a83 Added testset for pyy
Windel Bouwman
parents:
diff changeset
99 g.add_production('goal', ['list'])
fe2b72381a83 Added testset for pyy
Windel Bouwman
parents:
diff changeset
100 g.add_production('list', ['list', 'pair'])
fe2b72381a83 Added testset for pyy
Windel Bouwman
parents:
diff changeset
101 g.add_production('list', ['pair'])
fe2b72381a83 Added testset for pyy
Windel Bouwman
parents:
diff changeset
102 g.add_production('pair', ['(', 'pair', ')'])
fe2b72381a83 Added testset for pyy
Windel Bouwman
parents:
diff changeset
103 g.add_production('pair', ['(', ')'])
fe2b72381a83 Added testset for pyy
Windel Bouwman
parents:
diff changeset
104 g.start_symbol = 'goal'
fe2b72381a83 Added testset for pyy
Windel Bouwman
parents:
diff changeset
105 self.g = g
fe2b72381a83 Added testset for pyy
Windel Bouwman
parents:
diff changeset
106
fe2b72381a83 Added testset for pyy
Windel Bouwman
parents:
diff changeset
107 def testFirstSet(self):
fe2b72381a83 Added testset for pyy
Windel Bouwman
parents:
diff changeset
108 for a in ['(', ')', EOF, 'EPS']:
fe2b72381a83 Added testset for pyy
Windel Bouwman
parents:
diff changeset
109 self.assertEqual(self.g.first[a], {a})
fe2b72381a83 Added testset for pyy
Windel Bouwman
parents:
diff changeset
110 for nt in ['list', 'pair', 'goal']:
fe2b72381a83 Added testset for pyy
Windel Bouwman
parents:
diff changeset
111 self.assertEqual(self.g.first[nt], {'('})
fe2b72381a83 Added testset for pyy
Windel Bouwman
parents:
diff changeset
112
fe2b72381a83 Added testset for pyy
Windel Bouwman
parents:
diff changeset
113 def testInitItemSet(self):
fe2b72381a83 Added testset for pyy
Windel Bouwman
parents:
diff changeset
114 p0, p1, p2, p3, p4 = self.g.productions
fe2b72381a83 Added testset for pyy
Windel Bouwman
parents:
diff changeset
115 s0 = self.g.initialItemSet()
fe2b72381a83 Added testset for pyy
Windel Bouwman
parents:
diff changeset
116 self.assertEqual(len(s0), 9) # 9 with the goal rule included!
fe2b72381a83 Added testset for pyy
Windel Bouwman
parents:
diff changeset
117 self.assertIn(Item(p0, 0, EOF), s0)
fe2b72381a83 Added testset for pyy
Windel Bouwman
parents:
diff changeset
118 self.assertIn(Item(p1, 0, EOF), s0)
fe2b72381a83 Added testset for pyy
Windel Bouwman
parents:
diff changeset
119 self.assertIn(Item(p1, 0, '('), s0)
fe2b72381a83 Added testset for pyy
Windel Bouwman
parents:
diff changeset
120 self.assertIn(Item(p2, 0, EOF), s0)
fe2b72381a83 Added testset for pyy
Windel Bouwman
parents:
diff changeset
121 self.assertIn(Item(p2, 0, '('), s0)
fe2b72381a83 Added testset for pyy
Windel Bouwman
parents:
diff changeset
122 self.assertIn(Item(p3, 0, EOF), s0)
fe2b72381a83 Added testset for pyy
Windel Bouwman
parents:
diff changeset
123 self.assertIn(Item(p3, 0, '('), s0)
fe2b72381a83 Added testset for pyy
Windel Bouwman
parents:
diff changeset
124 self.assertIn(Item(p4, 0, EOF), s0)
fe2b72381a83 Added testset for pyy
Windel Bouwman
parents:
diff changeset
125 self.assertIn(Item(p4, 0, '('), s0)
fe2b72381a83 Added testset for pyy
Windel Bouwman
parents:
diff changeset
126
fe2b72381a83 Added testset for pyy
Windel Bouwman
parents:
diff changeset
127 def testCanonical(self):
fe2b72381a83 Added testset for pyy
Windel Bouwman
parents:
diff changeset
128 s0 = self.g.initialItemSet()
fe2b72381a83 Added testset for pyy
Windel Bouwman
parents:
diff changeset
129 s, gt = self.g.genCanonicalSet(s0)
fe2b72381a83 Added testset for pyy
Windel Bouwman
parents:
diff changeset
130 # Must result in 12 sets:
fe2b72381a83 Added testset for pyy
Windel Bouwman
parents:
diff changeset
131 self.assertEqual(len(s), 12)
fe2b72381a83 Added testset for pyy
Windel Bouwman
parents:
diff changeset
132
fe2b72381a83 Added testset for pyy
Windel Bouwman
parents:
diff changeset
133 def testClosure(self):
fe2b72381a83 Added testset for pyy
Windel Bouwman
parents:
diff changeset
134 p0, p1, p2, p3, p4 = self.g.productions
fe2b72381a83 Added testset for pyy
Windel Bouwman
parents:
diff changeset
135 s0 = set()
185
51a6440d6398 Fixed LR(1) parser
Windel Bouwman
parents: 184
diff changeset
136 s0.add(Item(p0, 0, EOF))
184
fe2b72381a83 Added testset for pyy
Windel Bouwman
parents:
diff changeset
137 self.assertEqual(len(s0), 1) # 1 rule
fe2b72381a83 Added testset for pyy
Windel Bouwman
parents:
diff changeset
138 self.assertIn(Item(p0, 0, EOF), s0)
fe2b72381a83 Added testset for pyy
Windel Bouwman
parents:
diff changeset
139
fe2b72381a83 Added testset for pyy
Windel Bouwman
parents:
diff changeset
140 # Invoke closure on set:
fe2b72381a83 Added testset for pyy
Windel Bouwman
parents:
diff changeset
141 s0 = self.g.closure(s0)
fe2b72381a83 Added testset for pyy
Windel Bouwman
parents:
diff changeset
142 self.assertIn(Item(p0, 0, EOF), s0)
fe2b72381a83 Added testset for pyy
Windel Bouwman
parents:
diff changeset
143 self.assertIn(Item(p1, 0, EOF), s0)
fe2b72381a83 Added testset for pyy
Windel Bouwman
parents:
diff changeset
144 self.assertIn(Item(p1, 0, '('), s0)
fe2b72381a83 Added testset for pyy
Windel Bouwman
parents:
diff changeset
145 self.assertIn(Item(p2, 0, EOF), s0)
fe2b72381a83 Added testset for pyy
Windel Bouwman
parents:
diff changeset
146 self.assertIn(Item(p2, 0, '('), s0)
fe2b72381a83 Added testset for pyy
Windel Bouwman
parents:
diff changeset
147 self.assertIn(Item(p3, 0, EOF), s0)
fe2b72381a83 Added testset for pyy
Windel Bouwman
parents:
diff changeset
148 self.assertIn(Item(p3, 0, '('), s0)
fe2b72381a83 Added testset for pyy
Windel Bouwman
parents:
diff changeset
149 self.assertIn(Item(p4, 0, EOF), s0)
fe2b72381a83 Added testset for pyy
Windel Bouwman
parents:
diff changeset
150 self.assertIn(Item(p4, 0, '('), s0)
fe2b72381a83 Added testset for pyy
Windel Bouwman
parents:
diff changeset
151
fe2b72381a83 Added testset for pyy
Windel Bouwman
parents:
diff changeset
152 def testParser(self):
191
6b2bec5653f1 Added assembler testset
Windel Bouwman
parents: 185
diff changeset
153 tokens = ['(', '(', ')', ')', '(', ')']
184
fe2b72381a83 Added testset for pyy
Windel Bouwman
parents:
diff changeset
154 # 3. build parser:
fe2b72381a83 Added testset for pyy
Windel Bouwman
parents:
diff changeset
155 p = self.g.genParser()
185
51a6440d6398 Fixed LR(1) parser
Windel Bouwman
parents: 184
diff changeset
156 self.assertEqual(len(p.goto_table), 5)
51a6440d6398 Fixed LR(1) parser
Windel Bouwman
parents: 184
diff changeset
157 self.assertEqual(len(p.action_table), 19)
51a6440d6398 Fixed LR(1) parser
Windel Bouwman
parents: 184
diff changeset
158
184
fe2b72381a83 Added testset for pyy
Windel Bouwman
parents:
diff changeset
159 # 4. feed input:
191
6b2bec5653f1 Added assembler testset
Windel Bouwman
parents: 185
diff changeset
160 p.parse(genTokens(tokens))
184
fe2b72381a83 Added testset for pyy
Windel Bouwman
parents:
diff changeset
161
fe2b72381a83 Added testset for pyy
Windel Bouwman
parents:
diff changeset
162 if __name__ == '__main__':
fe2b72381a83 Added testset for pyy
Windel Bouwman
parents:
diff changeset
163 unittest.main()
fe2b72381a83 Added testset for pyy
Windel Bouwman
parents:
diff changeset
164
fe2b72381a83 Added testset for pyy
Windel Bouwman
parents:
diff changeset
165