File: comment_stripper.py

package info (click to toggle)
firefox 143.0.3-1
  • links: PTS, VCS
  • area: main
  • in suites: sid
  • size: 4,617,328 kB
  • sloc: cpp: 7,478,492; javascript: 6,417,157; ansic: 3,720,058; python: 1,396,372; xml: 627,523; asm: 438,677; java: 186,156; sh: 63,477; makefile: 19,171; objc: 13,059; perl: 12,983; yacc: 4,583; cs: 3,846; pascal: 3,405; lex: 1,720; ruby: 1,003; exp: 762; php: 436; lisp: 258; awk: 247; sql: 66; sed: 53; csh: 10
file content (51 lines) | stat: -rw-r--r-- 1,710 bytes parent folder | download | duplicates (51)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
# Copyright (C) 2018 and later: Unicode, Inc. and others.
# License & terms of use: http://www.unicode.org/copyright.html

import io

class CommentStripper(object):
    """Removes lines starting with "//" from a file stream.

    Wraps a text-mode file-like object and exposes a ``read`` method whose
    output omits every line that begins with ``//`` in its very first column,
    together with that line's terminating newline. A ``//`` that follows any
    other character on the line (including leading whitespace) is left alone.

    The parser is a four-state machine that carries its state across calls,
    so comments that straddle two ``read`` chunks are still recognized.
    """

    # Parser states. The numeric values are deliberately the ones this class
    # has always stored in ``state``.
    _LINE_START = 0   # at the first column of a line
    _ONE_SLASH = 1    # saw a single "/" in the first column; not yet emitted
    _MID_LINE = 2     # inside a line that is not a comment
    _IN_COMMENT = 3   # inside a "//" comment line; discard until newline

    def __init__(self, f):
        """Wrap *f*, an object with a ``read(size)`` method returning text."""
        self.f = f
        self.state = self._LINE_START
        # Already-stripped text that did not fit into a previous sized read.
        self._buffer = ""

    def read(self, size=-1):
        """Read from the wrapped stream with comment lines removed.

        With a negative or ``None`` *size*, everything the underlying stream
        returns is stripped and returned in one piece. With a non-negative
        *size*, at most *size* characters are returned; the underlying stream
        is read repeatedly until that many stripped characters are available
        or it is exhausted, so an empty string is only returned at end of
        stream (or when *size* is 0).
        """
        if size is None or size < 0:
            pieces = [self._buffer]
            pieces.extend(self._strip_comments(self.f.read(size)))
            # The underlying stream is drained, so a held-back "/" can no
            # longer turn into a comment and has to be emitted.
            pieces.append(self._flush_pending_slash())
            self._buffer = ""
            return "".join(pieces)

        while len(self._buffer) < size:
            chunk = self.f.read(size - len(self._buffer))
            if not chunk:
                # End of the underlying stream: release a held-back "/".
                self._buffer += self._flush_pending_slash()
                break
            # A chunk made only of comment text contributes nothing; keep
            # reading instead of returning "" and faking end of stream.
            self._buffer += "".join(self._strip_comments(chunk))

        result = self._buffer[:size]
        self._buffer = self._buffer[size:]
        return result

    def _flush_pending_slash(self):
        """Return the "/" held back in the one-slash state, or "" if none."""
        if self.state == self._ONE_SLASH:
            # The slash is now part of an ordinary (non-comment) line.
            self.state = self._MID_LINE
            return "/"
        return ""

    def _strip_comments(self, chunk):
        """Yield the characters of *chunk* that are not part of a comment.

        Updates ``self.state`` as it goes, so it must be consumed fully and
        in order. A first-column "/" is withheld until the next character
        shows whether it starts a comment.
        """
        for char in chunk:
            state = self.state
            if state == self._LINE_START:
                if char == "/":
                    # Might be the start of "//"; decide on the next char.
                    self.state = self._ONE_SLASH
                else:
                    if char != "\n":
                        self.state = self._MID_LINE
                    yield char
            elif state == self._ONE_SLASH:
                if char == "/":
                    self.state = self._IN_COMMENT
                else:
                    if char == "\n":
                        self.state = self._LINE_START
                    else:
                        self.state = self._MID_LINE
                    yield "/"  # the one that was withheld
                    yield char
            elif state == self._MID_LINE:
                if char == "\n":
                    self.state = self._LINE_START
                yield char
            elif state == self._IN_COMMENT:
                # Comment text and its newline are both discarded.
                if char == "\n":
                    self.state = self._LINE_START