File: tokenizer.rb

package info (click to toggle)
ruby-simple-po-parser 1.1.5-2
  • links: PTS, VCS
  • area: main
  • in suites: bookworm, bullseye, forky, sid, trixie
  • size: 224 kB
  • sloc: ruby: 646; makefile: 4
file content (31 lines) | stat: -rw-r--r-- 686 bytes parent folder | download
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
# encoding: utf-8

module SimplePoParser
  # Split a PO file into single PO message entities (a message is seperated by two newline)
  class Tokenizer
    def initialize
      @messages = []
    end

    def parse_file(path)
      file = File.open(path, "r")
      if(file.gets =~ /\r$/)
        # detected windows line ending
        file.close
        file = File.open(path, "rt")
      else
        file.rewind
      end
      file.each_line("\n\n") do |block|
        block.strip! # dont parse empty blocks
        @messages << parse_block(block) if block != ''
      end
      @messages
    end

  private
    def parse_block(block)
      Parser.new.parse(block)
    end
  end
end