|
|
|
#!/usr/bin/python3 -tt
|
|
|
|
|
|
|
|
# Copyright 2012 Jussi Pakkanen
|
|
|
|
|
|
|
|
# Licensed under the Apache License, Version 2.0 (the "License");
|
|
|
|
# you may not use this file except in compliance with the License.
|
|
|
|
# You may obtain a copy of the License at
|
|
|
|
|
|
|
|
# http://www.apache.org/licenses/LICENSE-2.0
|
|
|
|
|
|
|
|
# Unless required by applicable law or agreed to in writing, software
|
|
|
|
# distributed under the License is distributed on an "AS IS" BASIS,
|
|
|
|
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
|
|
# See the License for the specific language governing permissions and
|
|
|
|
# limitations under the License.
|
|
|
|
|
|
|
|
import ply.lex as lex
|
|
|
|
import ply.yacc as yacc
|
|
|
|
|
|
|
|
# Names of every token kind this lexer declares. PLY looks up this
# module-level list when the lexer is built, and each name pairs with a
# ``t_<NAME>`` rule defined further down in the file.
tokens = [
    # Grouping delimiters.
    'LPAREN', 'RPAREN',
    'LBRACKET', 'RBRACKET',
    'LBRACE', 'RBRACE',
    # Identifiers and comments.
    'VARIABLE', 'COMMENT',
    # Punctuation.
    'EQUALS', 'COMMA', 'DOT',
    # Literals.
    'STRING',
    # Line endings.
    'EOL_CONTINUE', 'EOL',
]
|
|
|
|
|
|
|
|
# Simple token rules: each ``t_<NAME>`` string is the regular expression
# for the token called <NAME> in ``tokens``.
#
# The patterns are raw strings so that regex escapes such as ``\(`` reach
# the regex engine untouched; in a normal string literal they are invalid
# escape sequences and make recent Python versions emit a warning.
t_EQUALS = r'='
t_LPAREN = r'\('
t_RPAREN = r'\)'
t_LBRACKET = r'\['
t_RBRACKET = r'\]'
t_LBRACE = r'\{'
t_RBRACE = r'\}'
# An ASCII letter followed by any number of letters, digits or underscores.
t_VARIABLE = r'[a-zA-Z][_0-9a-zA-Z]*'
# From '#' up to, but not including, the end of the line. The '#' stays
# escaped because PLY compiles rules in verbose mode, where a bare '#'
# would start a regex comment.
t_COMMENT = r'\#[^\n]*'
t_COMMA = r','
t_DOT = r'\.'
# Single-quoted string; there is no escape mechanism for embedded quotes.
t_STRING = r"'[^']*'"

# Characters skipped between tokens. This is a plain character set, not a
# regex, so it must NOT be a raw string: it has to contain a real tab.
t_ignore = ' \t'
|
|
|
|
|
|
|
|
# Rule for a plain newline. The string that opens the function body is the
# rule's regular expression (PLY reads it from the docstring), so it must
# stay the first statement and must not be reworded.
def t_EOL(t):
    r'\n'
    owner = t.lexer
    # Keep the lexer's line counter in step with the input.
    owner.lineno = owner.lineno + 1
    # Hand the token back so that EOL shows up in the token stream.
    return t
|
|
|
|
|
|
|
|
# Rule for a line continuation: a backslash, optional spaces/tabs, then a
# newline. The string that opens the function body is the rule's regular
# expression and must stay the first statement, unchanged.
def t_EOL_CONTINUE(t):
    r'\\[ \t]*\n'
    owner = t.lexer
    # The continuation still consumes a physical line, so count it.
    owner.lineno = owner.lineno + 1
    # Deliberately no return value: PLY discards a token whose rule
    # returns None, so the continuation never reaches the token stream.
|
|
|
|
|
|
|
|
def t_error(t):
    """Report an unrecognised character and step over it.

    ``t.value`` holds the input that could not be matched; only its first
    character is reported, then the lexer is advanced by one character.
    """
    offending = t.value[0]
    print("Illegal character '%s'" % offending)
    t.lexer.skip(1)
|
|
|
|
|
|
|
|
def test_lexer():
    """Tokenise a small sample and print every token that comes out.

    The sample covers an assignment with a trailing comment, a list of
    strings, a call followed by a braced body, and a method call that is
    split over two lines with a backslash continuation.
    """
    sample = """hello = (something) # this = (that)
two = ['file1', 'file2']
function(h) { stuff }
obj.method(lll, \\
'string')
"""
    scanner = lex.lex()
    scanner.input(sample)
    # token() yields None once the input is exhausted, which ends the loop.
    for tok in iter(scanner.token, None):
        print(tok)
|
|
|
|
|
|
|
|
# When run as a script, tokenise the built-in sample and print the tokens.
if __name__ == '__main__':
    test_lexer()
|