blob: 1b620d1eaf894feb3e2dd038922f6df2f362e053 [file] [log] [blame]
import unittest
import textwrap
import antlr3
import antlr3.tree
import antlr3.debug
import testbase
import sys
import threading
import socket
import errno
import time
class Debugger(threading.Thread):
def __init__(self, port):
super(Debugger, self).__init__()
self.events = []
self.success = False
self.port = port
def run(self):
# create listening socket
s = None
tstart = time.time()
while time.time() - tstart < 10:
try:
s = socket.socket(socket.AF_INET, socket.SOCK_STREAM)
s.connect(('127.0.0.1', self.port))
break
except socket.error, exc:
if exc.args[0] != errno.ECONNREFUSED:
raise
time.sleep(0.1)
if s is None:
self.events.append(['nosocket'])
return
s.setblocking(1)
s.settimeout(10.0)
output = s.makefile('w', 0)
input = s.makefile('r', 0)
try:
# handshake
l = input.readline().strip()
assert l == 'ANTLR 2'
l = input.readline().strip()
assert l.startswith('grammar "')
output.write('ACK\n')
output.flush()
while True:
event = input.readline().strip()
self.events.append(event.split('\t'))
output.write('ACK\n')
output.flush()
if event == 'terminate':
self.success = True
break
except socket.timeout:
self.events.append(['timeout'])
except socket.error, exc:
self.events.append(['socketerror', exc.args])
s.close()
class T(testbase.ANTLRTest):
def execParser(self, grammar, grammarEntry, input, listener,
parser_args={}):
if listener is None:
port = 49100
debugger = Debugger(port)
debugger.start()
# TODO(pink): install alarm, so it doesn't hang forever in case of a bug
else:
port = None
try:
lexerCls, parserCls = self.compileInlineGrammar(
grammar, options='-debug')
cStream = antlr3.StringStream(input)
lexer = lexerCls(cStream)
tStream = antlr3.CommonTokenStream(lexer)
parser = parserCls(tStream, dbg=listener, port=port, **parser_args)
getattr(parser, grammarEntry)()
finally:
if listener is None:
debugger.join()
return debugger
def testBasicParser(self):
grammar = textwrap.dedent(
r'''
grammar T;
options {
language=Python;
}
a : ID EOF;
ID : 'a'..'z'+ ;
WS : (' '|'\n') {$channel=HIDDEN;} ;
''')
listener = antlr3.debug.RecordDebugEventListener()
self.execParser(
grammar, 'a',
input="a",
listener=listener)
# We only check that some LT events are present. How many is subject
# to change (at the time of writing there are two, which is one too
# many).
lt_events = [event for event in listener.events
if event.startswith("LT ")]
self.assertNotEqual(lt_events, [])
# For the rest, filter out LT events to get a reliable test.
expected = ["enterRule a",
"location 6:1",
"location 6:5",
"location 6:8",
"location 6:11",
"exitRule a"]
found = [event for event in listener.events
if not event.startswith("LT ")]
self.assertListEqual(found, expected)
def testSocketProxy(self):
grammar = textwrap.dedent(
r'''
grammar T;
options {
language=Python;
}
a : ID EOF;
ID : 'a'..'z'+ ;
WS : (' '|'\n') {$channel=HIDDEN;} ;
''')
debugger = self.execParser(
grammar, 'a',
input="a",
listener=None)
self.assertTrue(debugger.success)
expected = [['enterRule', 'T.g', 'a'],
['location', '6', '1'],
['enterAlt', '1'],
['location', '6', '5'],
['LT', '1', '0', '4', '0', '1', '0', '"a'],
['LT', '1', '0', '4', '0', '1', '0', '"a'],
['consumeToken', '0', '4', '0', '1', '0', '"a'],
['location', '6', '8'],
['LT', '1', '-1', '-1', '0', '1', '1', '"<EOF>'],
['LT', '1', '-1', '-1', '0', '1', '1', '"<EOF>'],
['consumeToken', '-1', '-1', '0', '1', '1', '"<EOF>'],
['location', '6', '11'],
['exitRule', 'T.g', 'a'],
['terminate']]
self.assertListEqual(debugger.events, expected)
def testRecognitionException(self):
grammar = textwrap.dedent(
r'''
grammar T;
options {
language=Python;
}
a : ID EOF;
ID : 'a'..'z'+ ;
WS : (' '|'\n') {$channel=HIDDEN;} ;
''')
debugger = self.execParser(
grammar, 'a',
input="a b",
listener=None)
self.assertTrue(debugger.success)
expected = [['enterRule', 'T.g', 'a'],
['location', '6', '1'],
['enterAlt', '1'],
['location', '6', '5'],
['LT', '1', '0', '4', '0', '1', '0', '"a'],
['LT', '1', '0', '4', '0', '1', '0', '"a'],
['consumeToken', '0', '4', '0', '1', '0', '"a'],
['consumeHiddenToken', '1', '5', '99', '1', '1', '"'],
['location', '6', '8'],
['LT', '1', '2', '4', '0', '1', '2', '"b'],
['LT', '1', '2', '4', '0', '1', '2', '"b'],
['LT', '2', '-1', '-1', '0', '1', '3', '"<EOF>'],
['LT', '1', '2', '4', '0', '1', '2', '"b'],
['LT', '1', '2', '4', '0', '1', '2', '"b'],
['beginResync'],
['consumeToken', '2', '4', '0', '1', '2', '"b'],
['endResync'],
['exception', 'UnwantedTokenException', '2', '1', '2'],
['LT', '1', '-1', '-1', '0', '1', '3', '"<EOF>'],
['consumeToken', '-1', '-1', '0', '1', '3', '"<EOF>'],
['location', '6', '11'],
['exitRule', 'T.g', 'a'],
['terminate']]
self.assertListEqual(debugger.events, expected)
def testSemPred(self):
grammar = textwrap.dedent(
r'''
grammar T;
options {
language=Python;
}
a : {True}? ID EOF;
ID : 'a'..'z'+ ;
WS : (' '|'\n') {$channel=HIDDEN;} ;
''')
debugger = self.execParser(
grammar, 'a',
input="a",
listener=None)
self.assertTrue(debugger.success)
expected = [['enterRule', 'T.g', 'a'],
['location', '6', '1'],
['enterAlt', '1'],
['location', '6', '5'],
['semanticPredicate', '1', 'True'],
['location', '6', '13'],
['LT', '1', '0', '4', '0', '1', '0', '"a'],
['LT', '1', '0', '4', '0', '1', '0', '"a'],
['consumeToken', '0', '4', '0', '1', '0', '"a'],
['location', '6', '16'],
['LT', '1', '-1', '-1', '0', '1', '1', '"<EOF>'],
['LT', '1', '-1', '-1', '0', '1', '1', '"<EOF>'],
['consumeToken', '-1', '-1', '0', '1', '1', '"<EOF>'],
['location', '6', '19'],
['exitRule', 'T.g', 'a'],
['terminate']]
self.assertListEqual(debugger.events, expected)
def testPositiveClosureBlock(self):
grammar = textwrap.dedent(
r'''
grammar T;
options {
language=Python;
}
a : ID ( ID | INT )+ EOF;
ID : 'a'..'z'+ ;
INT : '0'..'9'+ ;
WS : (' '|'\n') {$channel=HIDDEN;} ;
''')
debugger = self.execParser(
grammar, 'a',
input="a 1 b c 3",
listener=None)
self.assertTrue(debugger.success)
expected = [['enterRule', 'T.g', 'a'],
['location', '6', '1'],
['enterAlt', '1'],
['location', '6', '5'],
['LT', '1', '0', '4', '0', '1', '0', '"a'],
['LT', '1', '0', '4', '0', '1', '0', '"a'],
['consumeToken', '0', '4', '0', '1', '0', '"a'],
['consumeHiddenToken', '1', '6', '99', '1', '1', '"'],
['location', '6', '8'],
['enterSubRule', '1'],
['enterDecision', '1', '0'],
['LT', '1', '2', '5', '0', '1', '2', '"1'],
['exitDecision', '1'],
['enterAlt', '1'],
['location', '6', '8'],
['LT', '1', '2', '5', '0', '1', '2', '"1'],
['consumeToken', '2', '5', '0', '1', '2', '"1'],
['consumeHiddenToken', '3', '6', '99', '1', '3', '"'],
['enterDecision', '1', '0'],
['LT', '1', '4', '4', '0', '1', '4', '"b'],
['exitDecision', '1'],
['enterAlt', '1'],
['location', '6', '8'],
['LT', '1', '4', '4', '0', '1', '4', '"b'],
['consumeToken', '4', '4', '0', '1', '4', '"b'],
['consumeHiddenToken', '5', '6', '99', '1', '5', '"'],
['enterDecision', '1', '0'],
['LT', '1', '6', '4', '0', '1', '6', '"c'],
['exitDecision', '1'],
['enterAlt', '1'],
['location', '6', '8'],
['LT', '1', '6', '4', '0', '1', '6', '"c'],
['consumeToken', '6', '4', '0', '1', '6', '"c'],
['consumeHiddenToken', '7', '6', '99', '1', '7', '"'],
['enterDecision', '1', '0'],
['LT', '1', '8', '5', '0', '1', '8', '"3'],
['exitDecision', '1'],
['enterAlt', '1'],
['location', '6', '8'],
['LT', '1', '8', '5', '0', '1', '8', '"3'],
['consumeToken', '8', '5', '0', '1', '8', '"3'],
['enterDecision', '1', '0'],
['LT', '1', '-1', '-1', '0', '1', '9', '"<EOF>'],
['exitDecision', '1'],
['exitSubRule', '1'],
['location', '6', '22'],
['LT', '1', '-1', '-1', '0', '1', '9', '"<EOF>'],
['LT', '1', '-1', '-1', '0', '1', '9', '"<EOF>'],
['consumeToken', '-1', '-1', '0', '1', '9', '"<EOF>'],
['location', '6', '25'],
['exitRule', 'T.g', 'a'],
['terminate']]
self.assertListEqual(debugger.events, expected)
def testClosureBlock(self):
grammar = textwrap.dedent(
r'''
grammar T;
options {
language=Python;
}
a : ID ( ID | INT )* EOF;
ID : 'a'..'z'+ ;
INT : '0'..'9'+ ;
WS : (' '|'\n') {$channel=HIDDEN;} ;
''')
debugger = self.execParser(
grammar, 'a',
input="a 1 b c 3",
listener=None)
self.assertTrue(debugger.success)
expected = [['enterRule', 'T.g', 'a'],
['location', '6', '1'],
['enterAlt', '1'],
['location', '6', '5'],
['LT', '1', '0', '4', '0', '1', '0', '"a'],
['LT', '1', '0', '4', '0', '1', '0', '"a'],
['consumeToken', '0', '4', '0', '1', '0', '"a'],
['consumeHiddenToken', '1', '6', '99', '1', '1', '"'],
['location', '6', '8'],
['enterSubRule', '1'],
['enterDecision', '1', '0'],
['LT', '1', '2', '5', '0', '1', '2', '"1'],
['exitDecision', '1'],
['enterAlt', '1'],
['location', '6', '8'],
['LT', '1', '2', '5', '0', '1', '2', '"1'],
['consumeToken', '2', '5', '0', '1', '2', '"1'],
['consumeHiddenToken', '3', '6', '99', '1', '3', '"'],
['enterDecision', '1', '0'],
['LT', '1', '4', '4', '0', '1', '4', '"b'],
['exitDecision', '1'],
['enterAlt', '1'],
['location', '6', '8'],
['LT', '1', '4', '4', '0', '1', '4', '"b'],
['consumeToken', '4', '4', '0', '1', '4', '"b'],
['consumeHiddenToken', '5', '6', '99', '1', '5', '"'],
['enterDecision', '1', '0'],
['LT', '1', '6', '4', '0', '1', '6', '"c'],
['exitDecision', '1'],
['enterAlt', '1'],
['location', '6', '8'],
['LT', '1', '6', '4', '0', '1', '6', '"c'],
['consumeToken', '6', '4', '0', '1', '6', '"c'],
['consumeHiddenToken', '7', '6', '99', '1', '7', '"'],
['enterDecision', '1', '0'],
['LT', '1', '8', '5', '0', '1', '8', '"3'],
['exitDecision', '1'],
['enterAlt', '1'],
['location', '6', '8'],
['LT', '1', '8', '5', '0', '1', '8', '"3'],
['consumeToken', '8', '5', '0', '1', '8', '"3'],
['enterDecision', '1', '0'],
['LT', '1', '-1', '-1', '0', '1', '9', '"<EOF>'],
['exitDecision', '1'],
['exitSubRule', '1'],
['location', '6', '22'],
['LT', '1', '-1', '-1', '0', '1', '9', '"<EOF>'],
['LT', '1', '-1', '-1', '0', '1', '9', '"<EOF>'],
['consumeToken', '-1', '-1', '0', '1', '9', '"<EOF>'],
['location', '6', '25'],
['exitRule', 'T.g', 'a'],
['terminate']]
self.assertListEqual(debugger.events, expected)
def testMismatchedSetException(self):
grammar = textwrap.dedent(
r'''
grammar T;
options {
language=Python;
}
a : ID ( ID | INT ) EOF;
ID : 'a'..'z'+ ;
INT : '0'..'9'+ ;
WS : (' '|'\n') {$channel=HIDDEN;} ;
''')
debugger = self.execParser(
grammar, 'a',
input="a",
listener=None)
self.assertTrue(debugger.success)
expected = [['enterRule', 'T.g', 'a'],
['location', '6', '1'],
['enterAlt', '1'],
['location', '6', '5'],
['LT', '1', '0', '4', '0', '1', '0', '"a'],
['LT', '1', '0', '4', '0', '1', '0', '"a'],
['consumeToken', '0', '4', '0', '1', '0', '"a'],
['location', '6', '8'],
['LT', '1', '-1', '-1', '0', '1', '1', '"<EOF>'],
['LT', '1', '-1', '-1', '0', '1', '1', '"<EOF>'],
['LT', '1', '-1', '-1', '0', '1', '1', '"<EOF>'],
['exception', 'MismatchedSetException', '1', '1', '1'],
['exception', 'MismatchedSetException', '1', '1', '1'],
['beginResync'],
['LT', '1', '-1', '-1', '0', '1', '1', '"<EOF>'],
['endResync'],
['location', '6', '24'],
['exitRule', 'T.g', 'a'],
['terminate']]
self.assertListEqual(debugger.events, expected)
def testBlock(self):
grammar = textwrap.dedent(
r'''
grammar T;
options {
language=Python;
}
a : ID ( b | c ) EOF;
b : ID;
c : INT;
ID : 'a'..'z'+ ;
INT : '0'..'9'+ ;
WS : (' '|'\n') {$channel=HIDDEN;} ;
''')
debugger = self.execParser(
grammar, 'a',
input="a 1",
listener=None)
self.assertTrue(debugger.success)
expected = [['enterRule', 'T.g', 'a'],
['location', '6', '1'],
['enterAlt', '1'],
['location', '6', '5'],
['LT', '1', '0', '4', '0', '1', '0', '"a'],
['LT', '1', '0', '4', '0', '1', '0', '"a'],
['consumeToken', '0', '4', '0', '1', '0', '"a'],
['consumeHiddenToken', '1', '6', '99', '1', '1', '"'],
['location', '6', '8'],
['enterSubRule', '1'],
['enterDecision', '1', '0'],
['LT', '1', '2', '5', '0', '1', '2', '"1'],
['exitDecision', '1'],
['enterAlt', '2'],
['location', '6', '14'],
['enterRule', 'T.g', 'c'],
['location', '8', '1'],
['enterAlt', '1'],
['location', '8', '5'],
['LT', '1', '2', '5', '0', '1', '2', '"1'],
['LT', '1', '2', '5', '0', '1', '2', '"1'],
['consumeToken', '2', '5', '0', '1', '2', '"1'],
['location', '8', '8'],
['exitRule', 'T.g', 'c'],
['exitSubRule', '1'],
['location', '6', '18'],
['LT', '1', '-1', '-1', '0', '1', '3', '"<EOF>'],
['LT', '1', '-1', '-1', '0', '1', '3', '"<EOF>'],
['consumeToken', '-1', '-1', '0', '1', '3', '"<EOF>'],
['location', '6', '21'],
['exitRule', 'T.g', 'a'],
['terminate']]
self.assertListEqual(debugger.events, expected)
def testNoViableAlt(self):
grammar = textwrap.dedent(
r'''
grammar T;
options {
language=Python;
}
a : ID ( b | c ) EOF;
b : ID;
c : INT;
ID : 'a'..'z'+ ;
INT : '0'..'9'+ ;
BANG : '!' ;
WS : (' '|'\n') {$channel=HIDDEN;} ;
''')
debugger = self.execParser(
grammar, 'a',
input="a !",
listener=None)
self.assertTrue(debugger.success)
expected = [['enterRule', 'T.g', 'a'],
['location', '6', '1'],
['enterAlt', '1'],
['location', '6', '5'],
['LT', '1', '0', '5', '0', '1', '0', '"a'],
['LT', '1', '0', '5', '0', '1', '0', '"a'],
['consumeToken', '0', '5', '0', '1', '0', '"a'],
['consumeHiddenToken', '1', '7', '99', '1', '1', '"'],
['location', '6', '8'],
['enterSubRule', '1'],
['enterDecision', '1', '0'],
['LT', '1', '2', '4', '0', '1', '2', '"!'],
['LT', '1', '2', '4', '0', '1', '2', '"!'],
['LT', '1', '2', '4', '0', '1', '2', '"!'],
['exception', 'NoViableAltException', '2', '1', '2'],
['exitDecision', '1'],
['exitSubRule', '1'],
['exception', 'NoViableAltException', '2', '1', '2'],
['beginResync'],
['LT', '1', '2', '4', '0', '1', '2', '"!'],
['consumeToken', '2', '4', '0', '1', '2', '"!'],
['LT', '1', '-1', '-1', '0', '1', '3', '"<EOF>'],
['endResync'],
['location', '6', '21'],
['exitRule', 'T.g', 'a'],
['terminate']]
self.assertListEqual(debugger.events, expected)
def testRuleBlock(self):
grammar = textwrap.dedent(
r'''
grammar T;
options {
language=Python;
}
a : b | c;
b : ID;
c : INT;
ID : 'a'..'z'+ ;
INT : '0'..'9'+ ;
WS : (' '|'\n') {$channel=HIDDEN;} ;
''')
debugger = self.execParser(
grammar, 'a',
input="1",
listener=None)
self.assertTrue(debugger.success)
expected = [['enterRule', 'T.g', 'a'],
['location', '6', '1'],
['enterDecision', '1', '0'],
['LT', '1', '0', '5', '0', '1', '0', '"1'],
['exitDecision', '1'],
['enterAlt', '2'],
['location', '6', '9'],
['enterRule', 'T.g', 'c'],
['location', '8', '1'],
['enterAlt', '1'],
['location', '8', '5'],
['LT', '1', '0', '5', '0', '1', '0', '"1'],
['LT', '1', '0', '5', '0', '1', '0', '"1'],
['consumeToken', '0', '5', '0', '1', '0', '"1'],
['location', '8', '8'],
['exitRule', 'T.g', 'c'],
['location', '6', '10'],
['exitRule', 'T.g', 'a'],
['terminate']]
self.assertListEqual(debugger.events, expected)
def testRuleBlockSingleAlt(self):
grammar = textwrap.dedent(
r'''
grammar T;
options {
language=Python;
}
a : b;
b : ID;
ID : 'a'..'z'+ ;
INT : '0'..'9'+ ;
WS : (' '|'\n') {$channel=HIDDEN;} ;
''')
debugger = self.execParser(
grammar, 'a',
input="a",
listener=None)
self.assertTrue(debugger.success)
expected = [['enterRule', 'T.g', 'a'],
['location', '6', '1'],
['enterAlt', '1'],
['location', '6', '5'],
['enterRule', 'T.g', 'b'],
['location', '7', '1'],
['enterAlt', '1'],
['location', '7', '5'],
['LT', '1', '0', '4', '0', '1', '0', '"a'],
['LT', '1', '0', '4', '0', '1', '0', '"a'],
['consumeToken', '0', '4', '0', '1', '0', '"a'],
['location', '7', '7'],
['exitRule', 'T.g', 'b'],
['location', '6', '6'],
['exitRule', 'T.g', 'a'],
['terminate']]
self.assertListEqual(debugger.events, expected)
def testBlockSingleAlt(self):
grammar = textwrap.dedent(
r'''
grammar T;
options {
language=Python;
}
a : ( b );
b : ID;
ID : 'a'..'z'+ ;
INT : '0'..'9'+ ;
WS : (' '|'\n') {$channel=HIDDEN;} ;
''')
debugger = self.execParser(
grammar, 'a',
input="a",
listener=None)
self.assertTrue(debugger.success)
expected = [['enterRule', 'T.g', 'a'],
['location', '6', '1'],
['enterAlt', '1'],
['location', '6', '5'],
['enterAlt', '1'],
['location', '6', '7'],
['enterRule', 'T.g', 'b'],
['location', '7', '1'],
['enterAlt', '1'],
['location', '7', '5'],
['LT', '1', '0', '4', '0', '1', '0', '"a'],
['LT', '1', '0', '4', '0', '1', '0', '"a'],
['consumeToken', '0', '4', '0', '1', '0', '"a'],
['location', '7', '7'],
['exitRule', 'T.g', 'b'],
['location', '6', '10'],
['exitRule', 'T.g', 'a'],
['terminate']]
self.assertListEqual(debugger.events, expected)
def testDFA(self):
grammar = textwrap.dedent(
r'''
grammar T;
options {
language=Python;
}
a : ( b | c ) EOF;
b : ID* INT;
c : ID+ BANG;
ID : 'a'..'z'+ ;
INT : '0'..'9'+ ;
BANG : '!';
WS : (' '|'\n') {$channel=HIDDEN;} ;
''')
debugger = self.execParser(
grammar, 'a',
input="a!",
listener=None)
self.assertTrue(debugger.success)
expected = [['enterRule', 'T.g', 'a'],
['location', '6', '1'],
['enterAlt', '1'],
['location', '6', '5'],
['enterSubRule', '1'],
['enterDecision', '1', '0'],
['mark', '0'],
['LT', '1', '0', '5', '0', '1', '0', '"a'],
['consumeToken', '0', '5', '0', '1', '0', '"a'],
['LT', '1', '1', '4', '0', '1', '1', '"!'],
['consumeToken', '1', '4', '0', '1', '1', '"!'],
['rewind', '0'],
['exitDecision', '1'],
['enterAlt', '2'],
['location', '6', '11'],
['enterRule', 'T.g', 'c'],
['location', '8', '1'],
['enterAlt', '1'],
['location', '8', '5'],
['enterSubRule', '3'],
['enterDecision', '3', '0'],
['LT', '1', '0', '5', '0', '1', '0', '"a'],
['exitDecision', '3'],
['enterAlt', '1'],
['location', '8', '5'],
['LT', '1', '0', '5', '0', '1', '0', '"a'],
['LT', '1', '0', '5', '0', '1', '0', '"a'],
['consumeToken', '0', '5', '0', '1', '0', '"a'],
['enterDecision', '3', '0'],
['LT', '1', '1', '4', '0', '1', '1', '"!'],
['exitDecision', '3'],
['exitSubRule', '3'],
['location', '8', '9'],
['LT', '1', '1', '4', '0', '1', '1', '"!'],
['LT', '1', '1', '4', '0', '1', '1', '"!'],
['consumeToken', '1', '4', '0', '1', '1', '"!'],
['location', '8', '13'],
['exitRule', 'T.g', 'c'],
['exitSubRule', '1'],
['location', '6', '15'],
['LT', '1', '-1', '-1', '0', '1', '2', '"<EOF>'],
['LT', '1', '-1', '-1', '0', '1', '2', '"<EOF>'],
['consumeToken', '-1', '-1', '0', '1', '2', '"<EOF>'],
['location', '6', '18'],
['exitRule', 'T.g', 'a'],
['terminate']]
self.assertListEqual(debugger.events, expected)
def testBasicAST(self):
grammar = textwrap.dedent(
r'''
grammar T;
options {
language=Python;
output=AST;
}
a : ( b | c ) EOF!;
b : ID* INT -> ^(INT ID*);
c : ID+ BANG -> ^(BANG ID+);
ID : 'a'..'z'+ ;
INT : '0'..'9'+ ;
BANG : '!';
WS : (' '|'\n') {$channel=HIDDEN;} ;
''')
listener = antlr3.debug.RecordDebugEventListener()
self.execParser(
grammar, 'a',
input="a!",
listener=listener)
# don't check output for now (too dynamic), I'm satisfied if it
# doesn't crash
if __name__ == '__main__':
unittest.main()