File: comment_stripper.py

package info (click to toggle)
firefox-esr 128.13.0esr-1
  • links: PTS, VCS
  • area: main
  • in suites: forky, sid, trixie
  • size: 4,230,012 kB
  • sloc: cpp: 7,103,971; javascript: 6,088,450; ansic: 3,653,980; python: 1,212,330; xml: 594,604; asm: 420,652; java: 182,969; sh: 71,124; makefile: 20,747; perl: 13,449; objc: 12,399; yacc: 4,583; cs: 3,846; pascal: 2,973; lex: 1,720; ruby: 1,194; exp: 762; php: 436; lisp: 258; awk: 247; sql: 66; sed: 54; csh: 10
file content (51 lines) | stat: -rw-r--r-- 1,710 bytes parent folder | download | duplicates (55)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
# Copyright (C) 2018 and later: Unicode, Inc. and others.
# License & terms of use: http://www.unicode.org/copyright.html

import io

class CommentStripper(object):
    """File-like wrapper that removes lines starting with "//" from a text stream.

    A line is dropped, together with its terminating newline, when its first
    two characters are "//".  A "//" that appears later in a line is left
    untouched.  The scanner state lives on the instance, so a comment line
    may be split across several ``read`` calls.
    """

    # Scanner states.  The integer values are what is stored in ``self.state``.
    _LINE_START = 0   # positioned at the first character of a line
    _ONE_SLASH = 1    # the line began with "/", which is being held back
    _IN_LINE = 2      # inside a line that is not a comment
    _IN_COMMENT = 3   # inside a "//" line; discard up to and including "\n"

    def __init__(self, f):
        """Wrap *f*, an object whose ``read(size)`` method returns text."""
        # Underlying stream that the raw text is read from.
        self.f = f
        # Current scanner state (one of the four values above).
        self.state = self._LINE_START

    def read(self, size=-1):
        """Read from the wrapped stream and return the text minus comments.

        *size* is passed through to the wrapped stream's ``read``.  Since
        comment lines are removed after reading, the result is normally
        shorter than *size*; it can be one character longer when a "/" held
        back by an earlier call is released.

        An empty string is returned only at end of stream (or when *size*
        is 0).  A chunk that consists solely of comment text does not end
        the read: the stream is read again, so callers looping until an
        empty result do not stop early.  A lone "/" that is still being
        held back when the stream ends is emitted instead of being lost.
        """
        # A missing or negative size asks the stream for everything up to
        # its end, so there is nothing further to wait for afterwards.
        reads_to_eof = size is None or size < 0
        while True:
            chunk = self.f.read(size)
            pieces = list(self._strip_comments(chunk))
            if size == 0:
                # A zero-length request says nothing about end of stream.
                return "".join(pieces)
            at_eof = reads_to_eof or not chunk
            if at_eof:
                pieces.extend(self._flush_pending())
            if pieces or at_eof:
                return "".join(pieces)
            # Everything read so far was comment text: try the next chunk.

    def _flush_pending(self):
        """Return the held-back "/" (if any) once no more input can follow."""
        if self.state == self._ONE_SLASH:
            # Mark the slash as emitted so that it is not flushed twice.
            self.state = self._IN_LINE
            return ["/"]
        return []

    def _strip_comments(self, chunk):
        """Yield the pieces of *chunk* that are not part of a "//" line.

        Updates ``self.state`` as it goes, so consecutive chunks are treated
        as one continuous stream.
        """
        for char in chunk:
            state = self.state
            if state == self._IN_COMMENT:
                # Discard comment text; the newline ends the comment and is
                # discarded as well, removing the whole line.
                if char == "\n":
                    self.state = self._LINE_START
                continue
            if char == "/" and state == self._LINE_START:
                # Might be the start of "//": hold it back until the next
                # character shows whether this line is a comment.
                self.state = self._ONE_SLASH
                continue
            if char == "/" and state == self._ONE_SLASH:
                self.state = self._IN_COMMENT
                continue
            # Ordinary character: a newline starts a new line, anything else
            # puts (or keeps) the scanner in the middle of a line.
            self.state = self._LINE_START if char == "\n" else self._IN_LINE
            if state == self._ONE_SLASH:
                yield "/"  # the one that was held back
            yield char