File: customxml.py

package info (click to toggle)
linkchecker 10.6.0-2
  • links: PTS, VCS
  • area: main
  • in suites: forky, sid
  • size: 3,132 kB
  • sloc: python: 13,154; makefile: 134; sh: 71; xml: 36; sql: 20; javascript: 19; php: 2
file content (102 lines) | stat: -rw-r--r-- 3,814 bytes parent folder | download | duplicates (4)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
# Copyright (C) 2000-2014 Bastian Kleineidam
#
# This program is free software; you can redistribute it and/or modify
# it under the terms of the GNU General Public License as published by
# the Free Software Foundation; either version 2 of the License, or
# (at your option) any later version.
#
# This program is distributed in the hope that it will be useful,
# but WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
# GNU General Public License for more details.
#
# You should have received a copy of the GNU General Public License along
# with this program; if not, write to the Free Software Foundation, Inc.,
# 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA.
"""
An XML logger.
"""
from . import xmllog
from .. import strformat


class CustomXMLLogger(xmllog._XMLLogger):
    """
    XML custom output for easy post-processing.
    """

    LoggerName = "xml"

    LoggerArgs = {
        "filename": "linkchecker-out.xml",
    }

    def start_output(self):
        """
        Write start of checking info as xml comment.
        """
        super().start_output()
        self.xml_start_output()
        attrs = {"created": strformat.strtime(self.starttime)}
        self.xml_starttag('linkchecker', attrs)
        self.flush()

    def log_url(self, url_data):
        """
        Log URL data in custom XML format.
        """
        self.xml_starttag('urldata')
        if self.has_part('url'):
            self.xml_tag("url", url_data.base_url)
        if url_data.name and self.has_part('name'):
            self.xml_tag("name", url_data.name)
        if url_data.parent_url and self.has_part('parenturl'):
            attrs = {
                'line': "%s" % url_data.line,
                'column': "%s" % url_data.column,
            }
            self.xml_tag("parent", url_data.parent_url, attrs=attrs)
        if url_data.base_ref and self.has_part('base'):
            self.xml_tag("baseref", url_data.base_ref)
        if self.has_part("realurl"):
            self.xml_tag("realurl", url_data.url)
        if self.has_part("extern"):
            self.xml_tag("extern", "%d" % (1 if url_data.extern else 0))
        if url_data.dltime >= 0 and self.has_part("dltime"):
            self.xml_tag("dltime", "%f" % url_data.dltime)
        if url_data.size >= 0 and self.has_part("dlsize"):
            self.xml_tag("dlsize", "%d" % url_data.size)
        if url_data.checktime and self.has_part("checktime"):
            self.xml_tag("checktime", "%f" % url_data.checktime)
        if self.has_part("level"):
            self.xml_tag("level", "%d" % url_data.level)
        if url_data.info and self.has_part('info'):
            self.xml_starttag("infos")
            for info in url_data.info:
                self.xml_tag("info", info)
            self.xml_endtag("infos")
        if url_data.modified and self.has_part('modified'):
            self.xml_tag("modified", self.format_modified(url_data.modified))
        if url_data.warnings and self.has_part('warning'):
            self.xml_starttag("warnings")
            for tag, data in url_data.warnings:
                attrs = {}
                if tag:
                    attrs["tag"] = tag
                self.xml_tag("warning", data, attrs)
            self.xml_endtag("warnings")
        if self.has_part("result"):
            attrs = {}
            if url_data.result:
                attrs["result"] = url_data.result
            self.xml_tag("valid", "%d" % (1 if url_data.valid else 0), attrs)
        self.xml_endtag('urldata')
        self.flush()

    def end_output(self, **kwargs):
        """
        Write XML end tag.
        """
        self.xml_endtag("linkchecker")
        self.xml_end_output()
        self.close_fileoutput()