lcfOS: python/c3/lexer.py comparison

comparison python/c3/lexer.py @ 287:1c7c1e619be8

File movage

author	Windel Bouwman
date	Thu, 21 Nov 2013 11:57:27 +0100
parents	05184b95fa16
children	a747a45dcd78

comparison

equal deleted inserted replaced

-:d9df72971cbf
+:1c7c1e619be8
 'else', 'if', 'while', 'return', \
 'function', 'var', 'type', 'const', \
 'struct', 'cast', \
 'import', 'module' ]
-def tokenize(s):
+def tokenize(input_file):
 """
 Tokenizer, generates an iterator that
 returns tokens!
+Input is a file like object.
 This GREAT example was taken from python re doc page!
 """
-tok_spec = [
+filename = input_file.name if hasattr(input_file, 'name') else ''
+s = input_file.read()
+tok_spec = [
 ('REAL', r'\d+\.\d+'),
 ('HEXNUMBER', r'0x[\da-fA-F]+'),
 ('NUMBER', r'\d+'),
 ('ID', r'[A-Za-z][A-Za-z\d_]*'),
 ('NEWLINE', r'\n'),
 ('LONGCOMMENTBEGIN', r'\/\*'),
 ('LONGCOMMENTEND', r'\*\/'),
 ('LEESTEKEN', r'==|->|<<|>>|[\.,=:;\-+*\[\]/\(\)]|>=|<=|<>|>|<|{|}|&|\^|\|'),
 ('STRING', r"'.*?'")
 ]
 tok_re = '|'.join('(?P<%s>%s)' % pair for pair in tok_spec)
 gettok = re.compile(tok_re).match
 line = 1
 pos = line_start = 0
 mo = gettok(s)
 incomment = False
 while mo is not None:
 typ = mo.lastgroup
 val = mo.group(typ)
 if typ == 'NEWLINE':
 line_start = pos
 line += 1
 typ = 'NUMBER'
 elif typ == 'REAL':
 val = float(val)
 elif typ == 'STRING':
 val = val[1:-1]
-loc = SourceLocation(line, mo.start()-line_start, mo.end() - mo.start())
+loc = SourceLocation(filename, line, mo.start() - line_start, mo.end() - mo.start())
 yield Token(typ, val, loc)
 pos = mo.end()
 mo = gettok(s, pos)
 if pos != len(s):
 col = pos - line_start
-loc = SourceLocation(line, col, 1)
+loc = SourceLocation(filename, line, col, 1)
 raise CompilerError('Unexpected character "{0}"'.format(s[pos]), loc)
-loc = SourceLocation(line, 0, 0)
+loc = SourceLocation(filename, line, 0, 0)
 yield Token('END', '', loc)

Mercurial > lcfOS

comparison python/c3/lexer.py @ 287:1c7c1e619be8