lcfOS: python/pyburg.py comparison

comparison python/pyburg.py @ 382:0c44e494ef58

Made lexer more generic

author	Windel Bouwman
date	Sun, 27 Apr 2014 12:24:21 +0200
parents	d2ddfe134c48
children	fb3c1f029b30

comparison

Legend: equal | deleted | inserted | replaced

-:6df89163e114
+:0c44e494ef58
 import os
 import io
 import types
 import argparse
 from ppci import Token
-from pyyacc import ParserException, EOF
+from pyyacc import ParserException
 import yacc
 import baselex
 from tree import Tree
 # Generate parser on the fly:
 spec_file = os.path.join(os.path.dirname(os.path.abspath(__file__)), 'burg.x')
 burg_parser = yacc.load_as_module(spec_file)
-class BurgLexer:
+class BurgLexer(baselex.BaseLexer):
-def feed(self, txt):
+def __init__(self):
 tok_spec = [
 ('id', r'[A-Za-z][A-Za-z\d_]*', lambda typ, val: (typ, val)),
 ('kw', r'%[A-Za-z][A-Za-z\d_]*', lambda typ, val: (val, val)),
 ('number', r'\d+', lambda typ, val: (typ, int(val))),
 ('STRING', r"'[^']*'", lambda typ, val: ('string', val[1:-1])),
 ('OTHER', r'[:;\|\(\),]', lambda typ, val: (val, val)),
 ('SKIP', r'[ ]', None)
 ]
+super().__init__(tok_spec)
+def tokenize(self, txt):
 lines = txt.split('\n')
 header_lines = []
+section = 0
-def tokenize():
+for line in lines:
-section = 0
+line = line.strip()
-for line in lines:
+if not line:
-line = line.strip()
+continue  # Skip empty lines
-if not line:
+elif line == '%%':
-continue  # Skip empty lines
+section += 1
-elif line == '%%':
+if section == 1:
-section += 1
+yield Token('header', header_lines)
-if section == 1:
+yield Token('%%', '%%')
-yield Token('header', header_lines)
+else:
-yield Token('%%', '%%')
+if section == 0:
+header_lines.append(line)
 else:
-if section == 0:
+# we could use yield from below, but python 3.2 does not work then:
-header_lines.append(line)
+for tk in super().tokenize(line):
-else:
+yield tk
-for tk in baselex.tokenize(tok_spec, line):
-yield tk
-yield Token(EOF, EOF)
-self.tokens = tokenize()
-self.token = self.tokens.__next__()
-def next_token(self):
-t = self.token
-if t.typ != EOF:
-self.token = self.tokens.__next__()
-return t
 class Rule:
 """ A rewrite rule. Specifies a tree that can be rewritten into a result
 at a specific cost """
 help='the parser specification')
 parser.add_argument('-o', '--output', type=argparse.FileType('w'), \
 default=sys.stdout)
 return parser
 def load_as_module(filename):
 """ Load a parser spec file, generate LR tables and create module """
 ob = io.StringIO()
 args = argparse.Namespace(source=open(filename), output=ob)
 main(args)

Mercurial > lcfOS

comparison python/pyburg.py @ 382:0c44e494ef58