File: test_node_encoding.rb

package info (click to toggle)
ruby-nokogiri 1.11.1%2Bdfsg-2
  • links: PTS, VCS
  • area: main
  • in suites: bullseye
  • size: 5,576 kB
  • sloc: xml: 28,086; ruby: 18,456; java: 13,067; ansic: 5,138; yacc: 265; sh: 208; makefile: 27
file content (75 lines) | stat: -rw-r--r-- 2,606 bytes parent folder | download | duplicates (2)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
# encoding: UTF-8
require "helper"

module Nokogiri
  module XML
    class TestNodeEncoding < Nokogiri::TestCase
      def test_serialize_encoding_xml
        @xml = Nokogiri::XML(File.open(SHIFT_JIS_XML))
        assert_equal @xml.encoding.downcase,
          @xml.serialize.encoding.name.downcase

        @doc = Nokogiri::XML(@xml.serialize)
        assert_equal @xml.serialize, @doc.serialize
      end

      def test_default_encoding
        doc = Nokogiri::XML(VEHICLE_XML)
        assert_nil doc.encoding
        assert_equal 'UTF-8', doc.serialize.encoding.name
      end

      def test_encoding_GH_1113
        utf8 = '<frag>shahid ὡ 𐄣 𢂁</frag>'
        hex = '<frag>shahid &#x1f61; &#x10123; &#x22081;</frag>'
        decimal = '<frag>shahid &#8033; &#65827; &#139393;</frag>'
        expected = Nokogiri.jruby? ? hex : decimal

        frag = Nokogiri::XML(utf8, nil, 'UTF-8', Nokogiri::XML::ParseOptions::STRICT)
        assert_equal utf8, frag.to_xml.sub(/^<.xml[^>]*>\n/m, '').strip

        frag = Nokogiri::XML(expected, nil, 'UTF-8', Nokogiri::XML::ParseOptions::STRICT)
        assert_equal utf8, frag.to_xml.sub(/^<.xml[^>]*>\n/m, '').strip

        frag = Nokogiri::XML(expected, nil, 'US-ASCII', Nokogiri::XML::ParseOptions::STRICT)
        assert_equal expected, frag.to_xml.sub(/^<.xml[^>]*>\n/m, '').strip
      end

      VEHICLE_XML = <<-eoxml
        <root>
          <car xmlns:part="http://general-motors.com/">
            <part:tire>Michelin Model XGV</part:tire>
          </car>
          <bicycle xmlns:part="http://schwinn.com/">
            <part:tire>I'm a bicycle tire!</part:tire>
          </bicycle>
        </root>
      eoxml

      def test_namespace
        doc = Nokogiri::XML(VEHICLE_XML.encode('Shift_JIS'), nil, 'Shift_JIS')
        assert_equal 'Shift_JIS', doc.encoding
        n = doc.xpath('//part:tire', { 'part' => 'http://schwinn.com/' }).first
        assert n
        assert_equal 'UTF-8', n.namespace.href.encoding.name
        assert_equal 'UTF-8', n.namespace.prefix.encoding.name
      end

      def test_namespace_as_hash
        doc = Nokogiri::XML(VEHICLE_XML.encode('Shift_JIS'), nil, 'Shift_JIS')
        assert_equal 'Shift_JIS', doc.encoding
        assert n = doc.xpath('//car').first

        n.namespace_definitions.each do |nd|
          assert_equal 'UTF-8', nd.href.encoding.name
          assert_equal 'UTF-8', nd.prefix.encoding.name
        end

        n.namespaces.each do |k,v|
          assert_equal 'UTF-8', k.encoding.name
          assert_equal 'UTF-8', v.encoding.name
        end
      end
    end
  end
end