File: comment_stripper.py

package info (click to toggle)
firefox-esr 140.4.0esr-1~deb13u1
  • links: PTS, VCS
  • area: main
  • in suites: trixie
  • size: 4,539,284 kB
  • sloc: cpp: 7,381,286; javascript: 6,388,710; ansic: 3,710,139; python: 1,393,780; xml: 628,165; asm: 426,916; java: 184,004; sh: 65,742; makefile: 19,302; objc: 13,059; perl: 12,912; yacc: 4,583; cs: 3,846; pascal: 3,352; lex: 1,720; ruby: 1,226; exp: 762; php: 436; lisp: 258; awk: 247; sql: 66; sed: 54; csh: 10
file content (51 lines) | stat: -rw-r--r-- 1,710 bytes parent folder | download | duplicates (58)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
# Copyright (C) 2018 and later: Unicode, Inc. and others.
# License & terms of use: http://www.unicode.org/copyright.html

import io

class CommentStripper(object):
    """Text-stream wrapper that drops whole-line "//" comments.

    A line is removed, together with its terminating newline, only when
    its first two characters are "//".  A "//" that appears after any
    other character on the line (including leading whitespace) is passed
    through unchanged.

    The wrapped object only needs a ``read(size)`` method returning
    ``str``.  The parser state is kept between calls to ``read()``, so a
    comment may span several chunked reads.
    """

    # Parser states, stored in ``self.state`` between read() calls.
    _LINE_START = 0   # at the first character of a line
    _ONE_SLASH = 1    # a leading "/" was seen and is being held back
    _IN_TEXT = 2      # inside a line that is not a comment
    _IN_COMMENT = 3   # inside a "//" comment line

    def __init__(self, f):
        """Wrap *f*, a text stream exposing ``read(size)``."""
        self.f = f
        self.state = self._LINE_START

    def read(self, size=-1):
        """Read from the wrapped stream and return the text sans comments.

        *size* is forwarded to the wrapped stream's ``read()``; a negative
        value or ``None`` reads to the end of the stream.

        An empty string is returned only at end of stream (or when
        ``size == 0``): if a chunk consisted solely of comment text, more
        data is read rather than returning "" and falsely signalling EOF.
        The result may be shorter than *size* because comments were
        removed, and can be one character longer when a "/" held back
        from the previous chunk turns out not to start a comment.
        """
        read_all = size is None or size < 0
        while True:
            chunk = self.f.read(size)
            stripped = "".join(self._strip_comments(chunk))
            # A read-everything call always ends at EOF; a sized read has
            # reached EOF when the wrapped stream returns nothing.
            at_eof = read_all or (size != 0 and not chunk)
            if at_eof and self.state == self._ONE_SLASH:
                # The input ended right after a lone leading "/": it was
                # never a comment, so emit it instead of dropping it.
                stripped += "/"
                self.state = self._IN_TEXT
            if stripped or at_eof or size == 0:
                return stripped

    def _strip_comments(self, text):
        """Yield the characters of *text* that are not part of a comment.

        Updates ``self.state`` as it goes, so the generator must be fully
        consumed before the next chunk is processed.
        """
        for char in text:
            if self.state == self._IN_COMMENT:
                # Swallow everything up to and including the newline.
                if char == "\n":
                    self.state = self._LINE_START
                continue

            if self.state == self._IN_TEXT:
                if char == "\n":
                    self.state = self._LINE_START
                yield char
                continue

            # Remaining states: start of line, or one "/" held back.
            if char == "/":
                if self.state == self._ONE_SLASH:
                    # Second consecutive slash: the line is a comment and
                    # the held-back slash is discarded with it.
                    self.state = self._IN_COMMENT
                else:
                    # Hold the slash until the next character is known.
                    self.state = self._ONE_SLASH
                continue

            if self.state == self._ONE_SLASH:
                yield "/"  # the slash that was held back
            self.state = self._LINE_START if char == "\n" else self._IN_TEXT
            yield char