1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77
|
# encoding: UTF-8
# frozen_string_literal: true
require "helper"
module Nokogiri
module XML
class TestNodeEncoding < Nokogiri::TestCase
def test_serialize_encoding_xml
@xml = Nokogiri::XML(File.open(SHIFT_JIS_XML))
assert_equal(@xml.encoding.downcase,
@xml.serialize.encoding.name.downcase)
@doc = Nokogiri::XML(@xml.serialize)
assert_equal(@xml.serialize, @doc.serialize)
end
def test_default_encoding
doc = Nokogiri::XML(VEHICLE_XML)
assert_nil(doc.encoding)
assert_equal("UTF-8", doc.serialize.encoding.name)
end
def test_encoding_GH_1113
utf8 = "<frag>shahid ὡ 𐄣 𢂁</frag>"
hex = "<frag>shahid ὡ 𐄣 𢂁</frag>"
decimal = "<frag>shahid ὡ 𐄣 𢂁</frag>"
expected = Nokogiri.jruby? ? hex : decimal
frag = Nokogiri::XML(utf8, nil, "UTF-8", Nokogiri::XML::ParseOptions::STRICT)
assert_equal(utf8, frag.to_xml.sub(/^<.xml[^>]*>\n/m, "").strip)
frag = Nokogiri::XML(expected, nil, "UTF-8", Nokogiri::XML::ParseOptions::STRICT)
assert_equal(utf8, frag.to_xml.sub(/^<.xml[^>]*>\n/m, "").strip)
frag = Nokogiri::XML(expected, nil, "US-ASCII", Nokogiri::XML::ParseOptions::STRICT)
assert_equal(expected, frag.to_xml.sub(/^<.xml[^>]*>\n/m, "").strip)
end
VEHICLE_XML = <<-eoxml
<root>
<car xmlns:part="http://general-motors.com/">
<part:tire>Michelin Model XGV</part:tire>
</car>
<bicycle xmlns:part="http://schwinn.com/">
<part:tire>I'm a bicycle tire!</part:tire>
</bicycle>
</root>
eoxml
def test_namespace
doc = Nokogiri::XML(VEHICLE_XML.encode("Shift_JIS"), nil, "Shift_JIS")
assert_equal("Shift_JIS", doc.encoding)
n = doc.xpath("//part:tire", { "part" => "http://schwinn.com/" }).first
assert(n)
assert_equal("UTF-8", n.namespace.href.encoding.name)
assert_equal("UTF-8", n.namespace.prefix.encoding.name)
end
def test_namespace_as_hash
doc = Nokogiri::XML(VEHICLE_XML.encode("Shift_JIS"), nil, "Shift_JIS")
assert_equal("Shift_JIS", doc.encoding)
assert(n = doc.xpath("//car").first)
n.namespace_definitions.each do |nd|
assert_equal("UTF-8", nd.href.encoding.name)
assert_equal("UTF-8", nd.prefix.encoding.name)
end
n.namespaces.each do |k, v|
assert_equal("UTF-8", k.encoding.name)
assert_equal("UTF-8", v.encoding.name)
end
end
end
end
end
|