1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139
|
#!/usr/bin/env python
# -*- Mode: Python; py-indent-offset: 4 -*-
#
# This little script outputs the C doc comments to an XML format.
# So far it's only used by gtkmm (The C++ bindings). Murray Cumming.
# Usage example:
# # ./docextract_to_xml.py -s /gnome/head/cvs/gtk+/gtk/ -s /gnome/head/cvs/gtk+/docs/reference/gtk/tmpl/ > gtk_docs.xml
import getopt
import re
import string
import sys
import docextract
def usage():
    """Write the command-line synopsis to stderr and exit with status 1."""
    synopsis = (
        'usage: docextract_to_xml.py '
        '[-s /src/dir | --source-dir=/src/dir] '
        '[-a | --with-annotations] [-p | --with-properties] '
        '[-i | --with-signals ]\n'
    )
    sys.stderr.write(synopsis)
    # A non-zero status tells the caller that the invocation was rejected.
    sys.exit(1)
# Translates special texts to &... HTML acceptable format. Also replace
# occurrences of '/*' and '*/' with '/ *' and '* /' respectively to avoid
# comment errors (note the spaces). Some function descriptions include C++
# multi-line comments which cause errors when the description is included in a
# C++ Doxygen comment block.
def escape_text(unescaped_text):
    """Return unescaped_text escaped for the XML output and for Doxygen.

    The text is processed in a fixed order:

    1. Every '&' that does not start a named entity reference (letters
       followed by ';') becomes '&amp;'.
    2. A handful of named entities are rewritten, either to a numeric
       character reference or to the plain character they stand for.
    3. '<', '>' and '"' are escaped so the result can be used both as tag
       content and inside a double-quoted attribute value.
    4. '/*' and '*/' get a space inserted so the text cannot open or close
       a comment when it is later pasted into a C++ Doxygen comment block.

    unescaped_text -- the raw documentation string.
    Returns the escaped string; an empty string is returned unchanged.
    """
    # Escape every "&" not part of an entity reference
    escaped_text = re.sub(r'&(?![A-Za-z]+;)', '&amp;', unescaped_text)

    # Applied strictly in this order: the entity rewrites must run before
    # '<', '>' and '"' are turned into entities themselves, and the comment
    # delimiter rules must run last.
    replacements = (
        # These weird entities turn up in the output...
        ('&mdash;', '&#8212;'),
        ('&ast;', '*'),
        ('&percnt;', '%'),
        ('&commat;', '@'),
        ('&num;', '&#35;'),
        ('&nbsp;', '&#160;'),
        # This represents a '/' before or after an '*' so replace with slash
        # but with spaces.
        ('&sol;', ' / '),
        # Escape for both tag contents and attribute values
        ('<', '&lt;'),
        ('>', '&gt;'),
        ('"', '&quot;'),
        # Replace C++ comment begin and ends to ones that don't affect
        # Doxygen.
        ('/*', '/ *'),
        ('*/', '* /'),
    )
    for old, new in replacements:
        # str.replace() works on Python 2 and 3; the module-level
        # string.replace() exists only on Python 2.
        escaped_text = escaped_text.replace(old, new)

    return escaped_text
def print_annotations(annotations):
    """Print one <annotation> element per entry of annotations to stdout.

    annotations -- an iterable of sequences; item 0 is used as the value of
                   the "name" attribute and item 1 as the element text.
    """
    for annotation in annotations:
        # NOTE(review): the name is emitted without surrounding quotes and
        # without escaping, unlike the other attributes this script writes.
        # Presumably annotation[0] already carries what is needed - confirm
        # against docextract before changing the output format.
        #
        # The parenthesised single-argument form prints identically on
        # Python 2 and Python 3.
        print("<annotation name=" + annotation[0] + ">" +
              escape_text(annotation[1]) + "</annotation>")
if __name__ == '__main__':
    # Script entry point: parse the command line, extract the documentation
    # blocks from the given source directories and print them to stdout as
    # a single <root> XML document.
    try:
        # NOTE: the short options 'd:' and 'o:' are accepted by getopt here
        # but are not acted upon by the option loop below.
        opts, args = getopt.getopt(sys.argv[1:], "d:s:o:api",
                                   ["source-dir=", "with-annotations",
                                    "with-properties", "with-signals"])
    except getopt.error as e:
        sys.stderr.write('docextract_to_xml.py: %s\n' % e)
        usage()  # Exits the process, so opts/args are always bound below.

    source_dirs = []
    with_annotations = False
    with_signals = False
    with_properties = False

    for opt, arg in opts:
        if opt in ('-s', '--source-dir'):
            source_dirs.append(arg)
        elif opt in ('-a', '--with-annotations'):
            with_annotations = True
        elif opt in ('-p', '--with-properties'):
            with_properties = True
        elif opt in ('-i', '--with-signals'):
            with_signals = True

    # Positional arguments are not supported.
    if args:
        usage()

    docs = docextract.extract(source_dirs)
    docextract.extract_tmpl(source_dirs, docs)  # Try the tmpl sgml files too.

    # Nothing at all is printed (not even an empty <root>) when no
    # documentation was found.
    if docs:
        print("<root>")

        # Sorted so that the output order is stable between runs.
        for name, value in sorted(docs.items()):
            # Get the type of comment block ('function', 'signal' or
            # 'property') (the value is a GtkDoc).
            block_type = value.get_type()

            # Skip signals if the option was not specified.
            if block_type == 'signal' and not with_signals:
                continue
            # Likewise for properties.
            if block_type == 'property' and not with_properties:
                continue

            print("<" + block_type + " name=\"" + escape_text(name) + "\">")

            print("<description>")
            print(escape_text(value.get_description()))
            print("</description>")

            # Loop through the parameters if not dealing with a property:
            if block_type != 'property':
                print("<parameters>")
                for param_name, description, annotations in value.params:
                    print("<parameter name=\"" + escape_text(param_name) +
                          "\">")
                    print("<parameter_description>" +
                          escape_text(description) +
                          "</parameter_description>")

                    if with_annotations:
                        print_annotations(annotations)

                    print("</parameter>")

                print("</parameters>")

                # Show the return-type (also if not dealing with a property):
                if with_annotations:
                    print("<return>")
                    print("<return_description>" +
                          escape_text(value.ret[0]) +
                          "</return_description>")
                    print_annotations(value.ret[1])
                    print("</return>")
                else:
                    print("<return>" + escape_text(value.ret[0]) +
                          "</return>")

            if with_annotations:
                print_annotations(value.get_annotations())

            # The embedded "\n" leaves a blank line between blocks.
            print("</" + block_type + ">\n")

        print("</root>")
|