File: test_node_encoding.rb

package info (click to toggle)
ruby-nokogiri 1.13.10%2Bdfsg-2
  • links: PTS, VCS
  • area: main
  • in suites: bookworm
  • size: 7,416 kB
  • sloc: ansic: 38,198; xml: 28,086; ruby: 22,271; java: 15,517; cpp: 7,037; yacc: 244; sh: 148; makefile: 136
file content (77 lines) | stat: -rw-r--r-- 2,655 bytes parent folder | download
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
# encoding: UTF-8
# frozen_string_literal: true

require "helper"

module Nokogiri
  module XML
    class TestNodeEncoding < Nokogiri::TestCase
      def test_serialize_encoding_xml
        @xml = Nokogiri::XML(File.open(SHIFT_JIS_XML))
        assert_equal(@xml.encoding.downcase,
          @xml.serialize.encoding.name.downcase)

        @doc = Nokogiri::XML(@xml.serialize)
        assert_equal(@xml.serialize, @doc.serialize)
      end

      def test_default_encoding
        doc = Nokogiri::XML(VEHICLE_XML)
        assert_nil(doc.encoding)
        assert_equal("UTF-8", doc.serialize.encoding.name)
      end

      def test_encoding_GH_1113
        utf8 = "<frag>shahid ὡ 𐄣 𢂁</frag>"
        hex = "<frag>shahid &#x1f61; &#x10123; &#x22081;</frag>"
        decimal = "<frag>shahid &#8033; &#65827; &#139393;</frag>"
        expected = Nokogiri.jruby? ? hex : decimal

        frag = Nokogiri::XML(utf8, nil, "UTF-8", Nokogiri::XML::ParseOptions::STRICT)
        assert_equal(utf8, frag.to_xml.sub(/^<.xml[^>]*>\n/m, "").strip)

        frag = Nokogiri::XML(expected, nil, "UTF-8", Nokogiri::XML::ParseOptions::STRICT)
        assert_equal(utf8, frag.to_xml.sub(/^<.xml[^>]*>\n/m, "").strip)

        frag = Nokogiri::XML(expected, nil, "US-ASCII", Nokogiri::XML::ParseOptions::STRICT)
        assert_equal(expected, frag.to_xml.sub(/^<.xml[^>]*>\n/m, "").strip)
      end

      VEHICLE_XML = <<-eoxml
        <root>
          <car xmlns:part="http://general-motors.com/">
            <part:tire>Michelin Model XGV</part:tire>
          </car>
          <bicycle xmlns:part="http://schwinn.com/">
            <part:tire>I'm a bicycle tire!</part:tire>
          </bicycle>
        </root>
      eoxml

      def test_namespace
        doc = Nokogiri::XML(VEHICLE_XML.encode("Shift_JIS"), nil, "Shift_JIS")
        assert_equal("Shift_JIS", doc.encoding)
        n = doc.xpath("//part:tire", { "part" => "http://schwinn.com/" }).first
        assert(n)
        assert_equal("UTF-8", n.namespace.href.encoding.name)
        assert_equal("UTF-8", n.namespace.prefix.encoding.name)
      end

      def test_namespace_as_hash
        doc = Nokogiri::XML(VEHICLE_XML.encode("Shift_JIS"), nil, "Shift_JIS")
        assert_equal("Shift_JIS", doc.encoding)
        assert(n = doc.xpath("//car").first)

        n.namespace_definitions.each do |nd|
          assert_equal("UTF-8", nd.href.encoding.name)
          assert_equal("UTF-8", nd.prefix.encoding.name)
        end

        n.namespaces.each do |k, v|
          assert_equal("UTF-8", k.encoding.name)
          assert_equal("UTF-8", v.encoding.name)
        end
      end
    end
  end
end