File: helper_test.rb

package info (click to toggle)
libfeedtools-ruby 0.2.29%2Bdfsg1-4
links: PTS, VCS
area: main
in suites: squeeze
size: 2,004 kB
ctags: 1,385
sloc: ruby: 18,815; sql: 39; makefile: 6
file content (237 lines) | stat: -rw-r--r-- 8,153 bytes
parent folder | download | duplicates (2)
require 'test/unit'
require 'feed_tools'
require 'feed_tools/helpers/html_helper'
require 'feed_tools/helpers/xml_helper'
require 'feed_tools/helpers/feed_tools_helper'

class HelperTest < Test::Unit::TestCase
  include FeedTools::FeedToolsHelper

  def setup
    FeedTools.reset_configurations
    FeedTools.configurations[:tidy_enabled] = false
    FeedTools.configurations[:feed_cache] = "FeedTools::DatabaseFeedCache"
    FeedTools::FeedToolsHelper.default_local_path = 
      File.expand_path(
        File.expand_path(File.dirname(__FILE__)) + '/../feeds')
  end

  def test_xpath_case_insensitivity
    FEED_TOOLS_NAMESPACES["testnamespace"] = "http://example.com/ns/"
    
    xml = <<-XML
      <RoOt>
        <ChIlD>Test String #1</ChIlD>
      </RoOt>
    XML
    xml_doc = REXML::Document.new(xml)
    test_string = FeedTools::XmlHelper.try_xpaths(xml_doc, [
      "ROOT/child/text()"
    ], :select_result_value => true)
    assert_equal("Test String #1", test_string)

    xml = <<-XML
      <root xmlns:TESTnAmEsPace="http://example.com/ns/">
        <TESTnAmEsPace:ChIlD>Test String #2</TESTnAmEsPace:ChIlD>
      </root>
    XML
    xml_doc = REXML::Document.new(xml)
    test_string = FeedTools::XmlHelper.try_xpaths(xml_doc, [
      "ROOT/testnamespace:child/text()"
    ], :select_result_value => true)
    assert_equal("Test String #2", test_string)

    xml = <<-XML
      <RoOt>
        <ChIlD AttRib="Test String #3" />
      </RoOt>
    XML
    xml_doc = REXML::Document.new(xml)
    test_string = FeedTools::XmlHelper.try_xpaths(xml_doc, [
      "ROOT/child/@ATTRIB"
    ], :select_result_value => true)
    assert_equal("Test String #3", test_string)

    xml = <<-XML
      <RoOt xmlns:TESTnAmEsPace="http://example.com/ns/">
        <ChIlD TESTnAmEsPace:AttRib="Test String #4" />
      </RoOt>
    XML
    xml_doc = REXML::Document.new(xml)
    test_string = FeedTools::XmlHelper.try_xpaths(xml_doc, [
      "ROOT/child/@testnamespace:ATTRIB"
    ], :select_result_value => true)
    assert_equal("Test String #4", test_string)
  end

  def test_escape_entities
  end

  def test_unescape_entities
  end
  
  def test_normalize_url
    assert_equal("", FeedTools::UriHelper.normalize_url(""))
    assert_equal("http://slashdot.org/",
      FeedTools::UriHelper.normalize_url("slashdot.org"))
    assert_equal("http://example.com/index.php",
      FeedTools::UriHelper.normalize_url("example.com/index.php"))

    # Test windows-style file: protocol normalization
    assert_equal("file:///c:/windows/My%20Documents%20100%20/foo.txt",
      FeedTools::UriHelper.normalize_url("c:\\windows\\My Documents 100%20\\foo.txt"))
    assert_equal("file:///c:/windows/My%20Documents%20100%20/foo.txt",
      FeedTools::UriHelper.normalize_url(
        "file://c:\\windows\\My Documents 100%20\\foo.txt"))
    assert_equal("file:///c:/windows/My%20Documents%20100%20/foo.txt",
      FeedTools::UriHelper.normalize_url(
        "file:///c|/windows/My%20Documents%20100%20/foo.txt"))
    assert_equal("file:///c:/windows/My%20Documents%20100%20/foo.txt",
      FeedTools::UriHelper.normalize_url(
        "file:///c:/windows/My%20Documents%20100%20/foo.txt"))
    if FeedTools::UriHelper.idn_enabled?
      # Test internationalized domain names
      assert_equal(
        "http://www.xn--8ws00zhy3a.com/atomtests/iri/everything.atom",
        FeedTools::UriHelper.normalize_url(
          "http://www.詹姆斯.com/atomtests/iri/everything.atom"))
      assert_equal(
        "http://www.xn--8ws00zhy3a.com/atomtests/iri/%E8%A9%B9.html",
        FeedTools::UriHelper.normalize_url(
          "http://www.詹姆斯.com/atomtests/iri/詹.html"))
    end
  end
  
  def test_tidy_html
    FeedTools.configurations[:tidy_enabled] = true
    unless FeedTools::HtmlHelper.tidy_enabled?
      puts "\nCould not test tidy support.  Libtidy couldn't be found."
    else
      illegal_pre = <<-EOF
        <pre>
         require 'net/http'
         module Net
         class HTTPIO < HTTP
           def request(req, body = nil, &#38;block)
             begin_transport req
             req.exec @socket, @curr_http_version, edit_path(req.path), body
             begin
               res = HTTPResponse.read_new(@socket)
             end while HTTPContinue === res

             res.instance_eval do
               def read len = nil; ... end
               def body; true end
               def close
                 req, res = @req, self
                 @http.instance_eval do
                    end_transport req, res
                    finish
                 end
               end
               def size; 0 end
               def is_a? klass; klass == IO ? true : super(klass); end
             end

             res
           end
         end
        </pre>
      EOF
      illegal_pre_after_tidy = FeedTools::HtmlHelper.tidy_html(illegal_pre)
      assert_not_equal(nil, illegal_pre_after_tidy =~ /class HTTPIO &lt; HTTP/,
        "Tidy failed to clean up illegal chars in <pre> block.")
      
      unescaped_utf8_characters = <<-EOF
        \302\240
      EOF
      unescaped_utf8_characters_after_tidy =
        FeedTools::HtmlHelper.tidy_html(unescaped_utf8_characters)
      assert_not_equal("&#194;&#160;", unescaped_utf8_characters_after_tidy,
        "Tidy failed to escape the unicode characters correctly.")
      assert_not_equal("&Acirc;&nbsp;", unescaped_utf8_characters_after_tidy,
        "Tidy failed to escape the unicode characters correctly.")
    end
    FeedTools.configurations[:tidy_enabled] = false
  end
  
  def test_build_urn_uri
    assert_equal("urn:uuid:fa6d0b87-3f36-517d-b9b7-1349f8c3fc6b",
      FeedTools::UriHelper.build_urn_uri('http://sporkmonger.com/'))
  end
  
  def test_build_merged_feed
    if FeedTools::FEED_TOOLS_VERSION::MINOR == 2 && 
        FeedTools::FEED_TOOLS_VERSION::TINY <= 26
      merged_feed = FeedTools.build_merged_feed([
        "http://rss.slashdot.org/Slashdot/slashdot"
      ])
    end
  end
  
  def test_extract_xhtml
    FeedTools.configurations[:tidy_enabled] = false
    
    xml = <<-XML
      <content>
        <div xmlns='http://www.w3.org/1999/xhtml'><em>Testing.</em></div>
      </content>
    XML
    doc = REXML::Document.new(xml)
    assert_equal(
      "<div><em>Testing.</em></div>",
      FeedTools::HtmlHelper.extract_xhtml(doc.root))
    xml = <<-XML
      <content xmlns:xhtml='http://www.w3.org/1999/xhtml'>
        <xhtml:div><xhtml:em>Testing.</xhtml:em></xhtml:div>
      </content>
    XML
    doc = REXML::Document.new(xml)
    assert_equal(
      "<div><em>Testing.</em></div>",
      FeedTools::HtmlHelper.extract_xhtml(doc.root))
    xml = <<-XML
      <content type="xhtml" xmlns:xhtml='http://www.w3.org/1999/xhtml'>
        <xhtml:div xmlns='http://hsivonen.iki.fi/FooML'>
			    <xhtml:ul>
            <xhtml:li>XHTML List Item</xhtml:li>
          </xhtml:ul>
          <ul>
            <li>FooML List Item</li>
          </ul>
        </xhtml:div>
		  </content>
    XML
    doc = REXML::Document.new(xml)
    xhtml = FeedTools::HtmlHelper.extract_xhtml(doc.root)
    assert((xhtml =~ /<div>/) && (xhtml =~ /<\/div>/),
      "XHTML divs were not normalized properly.")
    assert((xhtml =~ /hsivonen\.iki\.fi/),
      "FooML namespace was not preserved.")
    assert((xhtml =~ /<foo:ul xmlns:foo=/),
      "Namespace was not placed correctly.")

    FeedTools.configurations[:tidy_enabled] = true

    xml = <<-XML
      <content type="xhtml" xmlns:xhtml='http://www.w3.org/1999/xhtml'>
        <xhtml:div xmlns='http://hsivonen.iki.fi/FooML'>
			    <xhtml:ul>
            <xhtml:li>XHTML List Item</xhtml:li>
          </xhtml:ul>
          <ul>
            <li>FooML List Item</li>
          </ul>
        </xhtml:div>
		  </content>
    XML
    doc = REXML::Document.new(xml)
    xhtml = FeedTools::HtmlHelper.extract_xhtml(doc.root)
    assert((xhtml =~ /<div>/) && (xhtml =~ /<\/div>/),
      "XHTML divs were not normalized properly.")
    assert((xhtml =~ /hsivonen\.iki\.fi/),
      "FooML namespace was not preserved.")
    assert((xhtml =~ /<foo:ul xmlns:foo=/),
      "Namespace was not placed correctly.")
  end
end