File: tokenizer.py

package info (click to toggle)
python-pegen 0.3.0-2
  • links: PTS, VCS
  • area: main
  • in suites: forky, sid
  • size: 11,148 kB
  • sloc: python: 15,081; makefile: 89
file content (43 lines) | stat: -rw-r--r-- 1,103 bytes parent folder | download | duplicates (2)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
from tokenize import ERRORTOKEN, NL, COMMENT


class Tokenizer:
    """Buffer tokens pulled from a token generator behind a movable cursor.

    Every token that has been fetched is kept in ``self.tokens`` and
    ``self.pos`` indexes the token that will be handed out next, so a
    caller can remember a position with ``mark()`` and later go back to
    it with ``reset()``.
    """

    def __init__(self, tokengen, vis=None):
        """Wrap *tokengen*, e.g. the result of tokenize.generate_tokens(...).

        *vis* is optional; when it is not None its ``vis_tokens`` method is
        called with the token buffer and the position on every report.
        """
        self.tokengen = tokengen
        self.vis = vis
        self.tokens = []
        self.pos = 0

    def mark(self):
        """Return the current position in the token buffer."""
        return self.pos

    def reset(self, pos):
        """Move the position to *pos*, reporting only if it changed."""
        if pos != self.pos:
            self.pos = pos
            self.report()

    def get_token(self):
        """Return the token at the current position and step past it."""
        current = self.peek_token()
        self.pos += 1
        self.report()
        return current

    def peek_token(self):
        """Return the token at the current position without advancing.

        When the position sits at the end of the buffer, tokens are drawn
        from the generator until one is found that is not an NL, a
        COMMENT, or a whitespace-only ERRORTOKEN; that token is appended
        to the buffer and a report is issued.  Any exception raised by
        ``next(self.tokengen)`` (including StopIteration once the
        generator is exhausted) propagates to the caller.
        """
        if self.pos == len(self.tokens):
            while True:
                candidate = next(self.tokengen)
                blank_error = (
                    candidate.type == ERRORTOKEN and candidate.string.isspace()
                )
                # Keep pulling while the token is one of the skipped kinds.
                if not (blank_error or candidate.type in (NL, COMMENT)):
                    break
            self.tokens.append(candidate)
            self.report()
        return self.tokens[self.pos]

    def report(self):
        """Pass the token buffer and position to the visualizer, if any."""
        visualizer = self.vis
        if visualizer is None:
            return
        visualizer.vis_tokens(self.tokens, self.pos)