1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 163 164 165 166 167 168 169 170 171 172 173 174 175 176 177 178 179 180 181 182 183 184 185 186 187 188 189 190 191 192 193 194 195 196 197 198 199 200 201 202 203 204 205 206 207 208 209 210 211 212 213 214 215 216 217 218 219 220 221 222 223 224 225 226 227 228 229 230 231 232 233 234 235 236 237 238 239 240 241 242 243 244 245 246 247 248 249 250 251 252 253 254 255 256 257 258 259 260 261 262 263 264 265 266 267 268 269 270 271 272 273 274 275 276 277 278 279 280 281 282 283 284 285 286 287 288 289 290 291 292 293 294 295 296 297 298 299 300 301 302 303 304 305 306 307 308 309 310 311 312 313 314 315 316 317 318 319 320 321 322 323 324 325 326 327 328 329 330 331 332 333 334 335 336 337 338 339 340 341 342 343 344 345 346 347 348 349 350 351 352 353 354 355 356 357 358 359 360 361 362 363 364 365 366 367 368 369 370
|
# -*- mode: ruby; coding: utf-8 -*-
#
# po_parser.ry - ruby version of msgfmt
#
# Copyright (C) 2002-2008 Masao Mutoh <mutomasa at gmail.com>
# Copyright (C) 2012-2023 Sutou Kouhei <kou@clear-code.com>
# Copyright (C) 2012-2013 Haruka Yoshihara <yoshihara@clear-code.com>
#
# You may redistribute it and/or modify it under the same
# license terms as Ruby or LGPL.
class GetText::POParser
token COMMENT MSGID MSGCTXT MSGID_PLURAL MSGSTR STRING PLURAL_NUM
rule
msgfmt
: /* empty */
| msgfmt comment
| msgfmt msgctxt
| msgfmt message
;
msgctxt
: MSGCTXT string_list
{
@msgctxt = val[1]
}
;
message
: single_message
| plural_message
;
single_message
: MSGID string_list MSGSTR string_list
{
msgid = val[1]
msgstr = val[3]
use_message_p = true
if @fuzzy and not msgid.empty?
use_message_p = (not ignore_fuzzy?)
if report_warning?
if ignore_fuzzy?
$stderr.print _("Warning: fuzzy message was ignored.\n")
else
$stderr.print _("Warning: fuzzy message was used.\n")
end
$stderr.print " #{@po_file}: msgid '#{msgid}'\n"
end
end
@fuzzy = false
if use_message_p
on_message(msgid, msgstr)
else
clear
end
result = ""
}
plural_message
: MSGID string_list MSGID_PLURAL string_list msgstr_plural
{
if @fuzzy and ignore_fuzzy?
if val[1] != ""
if report_warning?
$stderr.print _("Warning: fuzzy message was ignored.\n")
$stderr.print "msgid = '#{val[1]}\n"
end
else
on_message("", unescape(val[3]))
end
@fuzzy = false
else
@msgid_plural = unescape(val[3])
on_message(unescape(val[1]), unescape(val[4]))
end
result = ""
}
;
msgstr_plural
: msgstr_plural msgstr_plural_line
{
if val[0].size > 0
result = val[0] + "\000" + val[1]
else
result = ""
end
}
| msgstr_plural_line
;
msgstr_plural_line
: MSGSTR PLURAL_NUM string_list
{
result = val[2]
}
;
comment
: COMMENT
{
on_comment(val[0])
}
#| COMMENT
#;
string_list
: string_list STRING
{
result = val.delete_if{|item| item == ""}.join
}
| STRING
{
result = val[0]
}
;
end
---- header
require "gettext/po"
---- inner
# Mix in GetText and bind the "gettext" text domain when
# GetText.bindtextdomain is available. Otherwise define a private
# pass-through _ that returns the message ID unchanged, so the warning
# messages in this parser can always be wrapped in _().
if GetText.respond_to?(:bindtextdomain)
include GetText
GetText.bindtextdomain("gettext")
else
def _(message_id)
message_id
end
private :_
end
# Writers for the options read back by ignore_fuzzy? and report_warning?.
attr_writer :ignore_fuzzy, :report_warning
# Creates a parser that ignores fuzzy messages and reports warnings.
# Both defaults can be changed through the ignore_fuzzy= and
# report_warning= writers.
def initialize
@ignore_fuzzy = true
@report_warning = true
end
# Returns the current ignore_fuzzy setting. When it is true, the grammar
# actions skip fuzzy messages instead of passing them to on_message.
def ignore_fuzzy?
@ignore_fuzzy
end
# Returns the current report_warning setting. When it is true, warnings
# about fuzzy and obsolete entries are printed to $stderr.
def report_warning?
@report_warning
end
# Replaces backslash escape sequences in +string+ and returns the result
# as a new string.
#
# "\t", "\r" and "\n" become tab, carriage return and newline. Any other
# escaped character (for example an escaped double quote or backslash) is
# replaced by the character itself.
def unescape(string)
  control_characters = {"t" => "\t", "r" => "\r", "n" => "\n"}
  string.gsub(/\\(.)/) do
    character = Regexp.last_match(1)
    control_characters.fetch(character, character)
  end
end
private :unescape
# Parses PO formatted text and stores the result into +data+.
#
# +str+ is split into [token_type, value] pairs that are queued in @q and
# handed out by next_token. do_parse is then called to run the grammar
# (it is not defined in this file; presumably it comes from the Racc
# runtime). Comments that remain after the last message are stored with
# the :last key.
#
# Returns +data+.
def parse(str, data)
clear
@data = data
str = str.strip
@q = []
# Consume the input from the front. The order of the patterns matters:
# msgid_plural must be tried before msgid because msgid is its prefix,
# and "#~" must be tried before the generic "#" comment pattern.
until str.empty? do
case str
when /\A\s+/
str = $'
when /\Amsgctxt/
@q.push [:MSGCTXT, $&]
str = $'
when /\Amsgid_plural/
@q.push [:MSGID_PLURAL, $&]
str = $'
when /\Amsgid/
@q.push [:MSGID, $&]
str = $'
when /\Amsgstr/
@q.push [:MSGSTR, $&]
str = $'
when /\A\[(\d+)\]/
@q.push [:PLURAL_NUM, $1]
str = $'
when /\A\#~(.*)/
# Obsolete entry line: optionally warn, then keep the whole line as a
# comment token.
if report_warning?
$stderr.print _("Warning: obsolete msgid exists.\n")
$stderr.print " #{$&}\n"
end
@q.push [:COMMENT, $&]
str = $'
when /\A\#(.*)/
@q.push [:COMMENT, $&]
str = $'
when /\A\"(.*)\"/
# String literal: the token value is the unescaped text between the
# first and the last double quote on the line.
@q.push [:STRING, unescape($1)]
str = $'
else
# Unrecognized input: skip a single character.
#c = str[0,1]
#@q.push [:STRING, c]
str = str[1..-1]
end
end
# End-of-input marker for the parser.
@q.push [false, "$end"]
if $DEBUG
@q.each do |a,b|
puts "[#{a}, #{b}]"
end
end
@yydebug = true if $DEBUG
do_parse
# Comments that were not consumed by any message.
if @comments.size > 0
@data.set_comment(:last, @comments.join("\n"))
end
@data
end
# Removes and returns the first [token_type, value] pair from the queue
# built by parse. Returns nil when the queue is empty.
# NOTE(review): presumably called by the Racc runtime from do_parse;
# the caller is not visible in this file.
def next_token
@q.shift
end
# Stores one parsed message into @data and resets the per-entry state.
#
# An empty +msgstr+ is stored as nil. When @data is exactly a PO instance
# a POEntry carrying the collected comments, flags, references and context
# is registered under the [msgctxt, msgid] key. For any other container
# the message is passed to store with the msgctxt and msgid_plural options,
# and the collected comments are attached with set_comment.
def on_message(msgid, msgstr)
  translation = msgstr.empty? ? nil : msgstr

  if @data.instance_of?(PO)
    entry = POEntry.new(detect_entry_type)
    entry.translator_comment = format_comment(@translator_comments)
    entry.extracted_comment = format_comment(@extracted_comments)
    entry.flags = @flags
    entry.previous = format_comment(@previous)
    entry.references = @references
    entry.msgctxt = @msgctxt
    entry.msgid = msgid
    entry.msgid_plural = @msgid_plural
    entry.msgstr = translation
    @data[@msgctxt, msgid] = entry
  else
    # Passed as an explicit hash so it stays a positional argument.
    options = {
      :msgctxt => @msgctxt,
      :msgid_plural => @msgid_plural,
    }
    @data.store(msgid, translation, options)
    @data.set_comment(msgid, format_comment(@comments))
  end

  clear
end
# Joins comment lines with newlines.
#
# Returns "" for an empty list. When the last line is empty, an extra
# trailing newline is appended to the joined text.
def format_comment(comments)
  return "" if comments.empty?

  joined = comments.join("\n")
  comments.last.empty? ? joined + "\n" : joined
end
# Handles one comment line.
#
# A flag comment updates @fuzzy according to whether its flag list contains
# "fuzzy". When @data is exactly a PO instance the comment is then sorted
# into translator comments, extracted comments, references, flags or
# previous-msgid comments by its two character mark; a comment with any
# other mark is kept as is in @comments. For other containers every
# comment is kept as is in @comments.
def on_comment(comment)
  flags = nil
  if comment.start_with?(POFormat::FLAG_MARK)
    flags = parse_flags_line(comment[POFormat::FLAG_MARK.size..-1])
    @fuzzy = flags.include?("fuzzy")
  end

  return @comments << comment unless @data.instance_of?(PO)
  # A bare "#" is an empty translator comment line.
  return @translator_comments << "" if comment == "#"

  matched = /\A(#.)\s*(.*)\z/.match(comment)
  return nil if matched.nil?

  mark = matched[1]
  content = matched[2]
  case mark
  when POFormat::TRANSLATOR_COMMENT_MARK
    @translator_comments << content
  when POFormat::EXTRACTED_COMMENT_MARK
    @extracted_comments << content
  when POFormat::REFERENCE_COMMENT_MARK
    @references.concat(parse_references_line(content))
  when POFormat::FLAG_MARK
    @flags.concat(flags)
  when POFormat::PREVIOUS_COMMENT_MARK
    @previous << content
  else
    @comments << comment
  end
end
# Reads +po_file+ and parses its content into +data+.
#
# When String supports encode, the file is opened with the encoding
# detected from its header. The path is remembered in @po_file so that
# warnings can mention it. Returns the value returned by parse.
def parse_file(po_file, data)
  open_arguments = [po_file]
  # In Ruby 1.9, we must detect proper encoding of a PO file.
  if String.instance_methods.include?(:encode)
    open_arguments << "r:#{detect_file_encoding(po_file)}"
  end
  @po_file = po_file
  content = File.open(*open_arguments) do |io|
    io.read
  end
  parse(content, data)
end
private
# Detects the encoding declared in the header entry of a PO file.
#
# The file is read as binary, line by line. Scanning stops at the first
# msgid that is not empty, because only the header entry (empty msgid) can
# declare the charset. A Content-Type line is only honored after the
# header msgid has been seen.
#
# @param po_file [String] path of the PO file
# @return [Encoding] the declared encoding, or Encoding.default_external
#   when no charset is declared or the charset is the template placeholder
# @raise [ArgumentError] from Encoding.find when the declared charset is
#   not a known encoding name
def detect_file_encoding(po_file)
  # File.open is used instead of Kernel#open so that the path is always
  # treated as a file name. Kernel#open may run a path that starts with
  # "|" as a command.
  File.open(po_file, :encoding => "ASCII-8BIT") do |input|
    in_header = false
    input.each_line do |line|
      case line.chomp
      when /\Amsgid\s+"(.*)"\z/
        id = $1
        break unless id.empty?
        in_header = true
      when /\A"Content-Type:.*\scharset=(.*)\\n"\z/
        charset = $1
        next unless in_header
        break if template_charset?(charset)
        return Encoding.find(charset)
      end
    end
  end
  Encoding.default_external
end
# Returns true when +charset+ is the literal "CHARSET", in which case
# detect_file_encoding falls back to the default external encoding.
# NOTE(review): presumably the placeholder left in unfilled PO templates.
def template_charset?(charset)
charset == "CHARSET"
end
# Returns the entry type for the message being built, based on whether a
# context and a plural msgid have been seen:
# :normal, :plural, :msgctxt or :msgctxt_plural.
def detect_entry_type
  with_plural = !@msgid_plural.nil?
  if @msgctxt.nil?
    with_plural ? :plural : :normal
  else
    with_plural ? :msgctxt_plural : :msgctxt
  end
end
# Splits the content of a reference comment on runs of whitespace and
# returns the parts as an array of strings.
def parse_references_line(line)
line.split(/\s+/)
end
# Splits the content of a flag comment on commas and returns the flags
# with surrounding whitespace removed.
def parse_flags_line(line)
  line.split(",").map { |flag| flag.strip }
end
# Resets the state collected for the current entry: comments, references,
# flags, the fuzzy marker, msgctxt and msgid_plural.
#
# It is called before parsing starts, after a message has been stored and
# when a fuzzy message is skipped. Returns nil.
def clear
  @translator_comments = []
  @extracted_comments = []
  @references = []
  @flags = []
  @previous = []
  @comments = []
  # The fuzzy marker belongs to a single entry, so it must not survive
  # into the next entry or into the next parse call.
  @fuzzy = false
  @msgctxt = nil
  @msgid_plural = nil
end
---- footer
|