aboutsummaryrefslogtreecommitdiff
path: root/runtime/Python/tests/t010lexer.py
blob: 7cd318cea9309f3eef8481e3a9c9ad537506fc9a (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
import antlr3
import testbase
import unittest

class t010lexer(testbase.ANTLRTest):
    def setUp(self):
        self.compileGrammar()
        
        
    def lexerClass(self, base):
        class TLexer(base):
            def emitErrorMessage(self, msg):
                # report errors to /dev/null
                pass

            def reportError(self, re):
                # no error recovery yet, just crash!
                raise re

        return TLexer
    
        
    def testValid(self):
        stream = antlr3.StringStream('foobar _Ab98 \n A12sdf')
        lexer = self.getLexer(stream)

        token = lexer.nextToken()
        assert token.type == self.lexerModule.IDENTIFIER
        assert token.start == 0, token.start
        assert token.stop == 5, token.stop
        assert token.text == 'foobar', token.text

        token = lexer.nextToken()
        assert token.type == self.lexerModule.WS
        assert token.start == 6, token.start
        assert token.stop == 6, token.stop
        assert token.text == ' ', token.text

        token = lexer.nextToken()
        assert token.type == self.lexerModule.IDENTIFIER
        assert token.start == 7, token.start
        assert token.stop == 11, token.stop
        assert token.text == '_Ab98', token.text

        token = lexer.nextToken()
        assert token.type == self.lexerModule.WS
        assert token.start == 12, token.start
        assert token.stop == 14, token.stop
        assert token.text == ' \n ', token.text

        token = lexer.nextToken()
        assert token.type == self.lexerModule.IDENTIFIER
        assert token.start == 15, token.start
        assert token.stop == 20, token.stop
        assert token.text == 'A12sdf', token.text

        token = lexer.nextToken()
        assert token.type == self.lexerModule.EOF


    def testMalformedInput(self):
        stream = antlr3.StringStream('a-b')
        lexer = self.getLexer(stream)

        lexer.nextToken()
        try:
            token = lexer.nextToken()
            raise AssertionError, token

        except antlr3.NoViableAltException, exc:
            assert exc.unexpectedType == '-', repr(exc.unexpectedType)
            assert exc.charPositionInLine == 1, repr(exc.charPositionInLine)
            assert exc.line == 1, repr(exc.line)

            

if __name__ == '__main__':
    unittest.main()