# Copyright 2012 Google Inc. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
#
"""Tests for Gumbo CTypes bindings."""
__author__ = 'jdtang@google.com (Jonathan Tang)'
import io
import unittest
import gumboc
class CtypesTest(unittest.TestCase):
    """Exercises the parse tree exposed by the ``gumboc`` ctypes bindings."""

    def _assertUnknownFooElement(self, output):
        """Check the tree produced for ``<foo bar=quux>1<p>2</foo>``.

        Looks up the first child of the second root child and verifies it
        is an element with an unknown tag whose original start tag text,
        tag name and single attribute match the input markup.

        Args:
            output: The object yielded by entering ``gumboc.parse(...)``.
        """
        root = output.contents.root.contents
        body = root.children[1]
        foo = body.children[0]
        self.assertEqual(gumboc.NodeType.ELEMENT, foo.type)
        self.assertEqual(gumboc.Tag.UNKNOWN, foo.tag)
        self.assertEqual('<foo bar=quux>', str(foo.original_tag))
        self.assertEqual('', str(foo.original_end_tag))
        self.assertEqual('foo', foo.tag_name.decode('utf-8'))
        self.assertEqual('bar', foo.attributes[0].name)
        self.assertEqual('quux', foo.attributes[0].value)

    def testWordParse(self):
        """Parse the bare word ``Test`` and walk the resulting tree."""
        with gumboc.parse('Test') as output:
            # The document node carries empty doctype-related fields.
            document_node = output.contents.document.contents
            self.assertEqual(gumboc.NodeType.DOCUMENT, document_node.type)
            document = document_node.v.document
            self.assertEqual('', document.name)
            self.assertEqual('', document.public_identifier)
            self.assertEqual('', document.system_identifier)

            # The root is an <html> element with exactly two children.
            root = output.contents.root.contents
            self.assertEqual(gumboc.NodeType.ELEMENT, root.type)
            self.assertEqual(gumboc.Tag.HTML, root.tag)
            self.assertEqual(gumboc.Namespace.HTML, root.tag_namespace)
            self.assertEqual(2, len(root.children))

            # First child: <head>, with no source text and no children.
            head = root.children[0]
            self.assertEqual(gumboc.NodeType.ELEMENT, head.type)
            self.assertEqual(gumboc.Tag.HEAD, head.tag)
            self.assertEqual('head', head.tag_name)
            self.assertEqual(gumboc.Namespace.HTML, head.tag_namespace)
            self.assertEqual(0, len(head.original_tag))
            self.assertEqual('', str(head.original_end_tag))
            self.assertEqual(0, head.children.length)

            # Second child: <body>, holding the single text node.
            body = root.children[1]
            # assertNotEqual: the assertNotEquals alias is gone in 3.12+.
            self.assertNotEqual(body, document_node)
            self.assertEqual(gumboc.NodeType.ELEMENT, body.type)
            self.assertEqual(gumboc.Tag.BODY, body.tag)
            self.assertEqual('body', body.tag_name)
            self.assertEqual(1, len(body.children))

            text_node = body.children[0]
            self.assertEqual(gumboc.NodeType.TEXT, text_node.type)
            self.assertEqual('Test', text_node.text)

    def testBufferThatGoesAway(self):
        """Inspect a tree after the buffer that supplied its text is closed.

        The markup is read from an in-memory buffer which is closed before
        the parse tree is entered; the check is repeated ten times.
        """
        # NOTE(review): presumably this guards against the tree pointing
        # into input memory that is no longer alive - confirm against gumboc.
        for _ in range(10):
            with io.StringIO('<foo bar=quux>1<p>2</foo>') as source:
                parse_tree = gumboc.parse(source.read())
            # The buffer is closed here, before the tree is examined.
            with parse_tree as output:
                self._assertUnknownFooElement(output)

    def testUnknownTag(self):
        """Parse markup containing a tag that maps to ``Tag.UNKNOWN``."""
        with gumboc.parse('<foo bar=quux>1<p>2</foo>') as output:
            self._assertUnknownFooElement(output)

    def testSarcasm(self):
        """Check a nested ``<sarcasm>`` element keeps both original tags."""
        markup = '<div><sarcasm><div></div></sarcasm></div>'
        with gumboc.parse(markup) as output:
            root = output.contents.root.contents
            body = root.children[1]
            div = body.children[0]
            sarcasm = div.children[0]
            self.assertEqual(gumboc.NodeType.ELEMENT, sarcasm.type)
            self.assertEqual(gumboc.Tag.UNKNOWN, sarcasm.tag)
            self.assertEqual('<sarcasm>', str(sarcasm.original_tag))
            self.assertEqual('</sarcasm>', str(sarcasm.original_end_tag))
            self.assertEqual('sarcasm', sarcasm.tag_name.decode('utf-8'))

    def testEnums(self):
        """Enum members equal themselves and hash like their ``value``."""
        self.assertEqual(gumboc.Tag.A, gumboc.Tag.A)
        self.assertEqual(hash(gumboc.Tag.A.value), hash(gumboc.Tag.A))

    def testFragment(self):
        """Parse ``<div></div>`` as a fragment in an SVG ``title`` context."""
        with gumboc.parse(
                '<div></div>',
                fragment_context=gumboc.Tag.TITLE,
                fragment_namespace=gumboc.Namespace.SVG) as output:
            root = output.contents.root.contents
            self.assertEqual(1, len(root.children))
            div = root.children[0]
            self.assertEqual(gumboc.NodeType.ELEMENT, div.type)
            self.assertEqual(gumboc.Tag.DIV, div.tag)
            self.assertEqual(gumboc.Namespace.HTML, div.tag_namespace)
# Run the test suite when this module is executed directly as a script.
if __name__ == '__main__':
    unittest.main()
|