#!/usr/bin/env python
#
# Process a list of Python and/or XML files containing SCons documentation.
#
# This script creates formatted lists of the Builders, functions, Tools
# or construction variables documented in the specified XML files.
#
# Dependening on the options, the lists are output in either
# DocBook-formatted generated XML files containing the summary text
# and/or .mod files contining the ENTITY definitions for each item,
# or in man-page-formatted output.
#
import getopt
import os
import re
import string
import sys
import xml.sax
try:
from io import StringIO # usable as of 2.6; takes unicode only
except ImportError:
# No 'io' module or no StringIO in io
exec('from cStringIO import StringIO')
import SConsDoc
base_sys_path = [os.getcwd() + '/build/test-tar-gz/lib/scons'] + sys.path
helpstr = """\
Usage: scons-proc.py [--man|--xml]
[-b file(s)] [-f file(s)] [-t file(s)] [-v file(s)]
[infile ...]
Options:
-b file(s) dump builder information to the specified file(s)
-f file(s) dump function information to the specified file(s)
-t file(s) dump tool information to the specified file(s)
-v file(s) dump variable information to the specified file(s)
--man print info in man page format, each -[btv] argument
is a single file name
--xml (default) print info in SML format, each -[btv] argument
is a pair of comma-separated .gen,.mod file names
"""
opts, args = getopt.getopt(sys.argv[1:],
"b:f:ht:v:",
['builders=', 'help',
'man', 'xml', 'tools=', 'variables='])
buildersfiles = None
functionsfiles = None
output_type = '--xml'
toolsfiles = None
variablesfiles = None
for o, a in opts:
if o in ['-b', '--builders']:
buildersfiles = a
elif o in ['-f', '--functions']:
functionsfiles = a
elif o in ['-h', '--help']:
sys.stdout.write(helpstr)
sys.exit(0)
elif o in ['--man', '--xml']:
output_type = o
elif o in ['-t', '--tools']:
toolsfiles = a
elif o in ['-v', '--variables']:
variablesfiles = a
h = SConsDoc.SConsDocHandler()
saxparser = xml.sax.make_parser()
saxparser.setContentHandler(h)
saxparser.setErrorHandler(h)
xml_preamble = """\
"""
xml_postamble = """\
"""
for f in args:
_, ext = os.path.splitext(f)
if ext == '.py':
dir, _ = os.path.split(f)
if dir:
sys.path = [dir] + base_sys_path
module = SConsDoc.importfile(f)
h.set_file_info(f, len(xml_preamble.split('\n')))
try:
content = module.__scons_doc__
except AttributeError:
content = None
else:
del module.__scons_doc__
else:
h.set_file_info(f, len(xml_preamble.split('\n')))
content = open(f).read()
if content:
content = content.replace('&', '&')
# Strip newlines after comments so they don't turn into
# spurious paragraph separators.
content = content.replace('-->\n', '-->')
input = xml_preamble + content + xml_postamble
try:
saxparser.parse(StringIO(unicode(input)))
except:
sys.stderr.write("error in %s\n" % f)
raise
Warning = """\
"""
Regular_Entities_Header = """\
"""
Link_Entities_Header = """\
"""
class SCons_XML(object):
def __init__(self, entries, **kw):
self.values = entries
for k, v in kw.items():
setattr(self, k, v)
def fopen(self, name):
if name == '-':
return sys.stdout
return open(name, 'w')
class SCons_XML_to_XML(SCons_XML):
def write(self, files):
gen, mod = files.split(',')
g.write_gen(gen)
g.write_mod(mod)
def write_gen(self, filename):
if not filename:
return
f = self.fopen(filename)
for v in self.values:
f.write('\n\n' %
(v.prefix, v.idfunc()))
f.write('%s\n' % v.xml_term())
f.write('\n')
for chunk in v.summary.body:
f.write(str(chunk))
if v.sets:
s = ['&cv-link-%s;' % x for x in v.sets]
f.write('\n')
f.write('Sets: ' + ', '.join(s) + '.\n')
f.write('\n')
if v.uses:
u = ['&cv-link-%s;' % x for x in v.uses]
f.write('\n')
f.write('Uses: ' + ', '.join(u) + '.\n')
f.write('\n')
f.write('\n')
f.write('\n')
def write_mod(self, filename):
description = self.values[0].description
if not filename:
return
f = self.fopen(filename)
f.write(Warning)
f.write('\n')
f.write(Regular_Entities_Header % description)
f.write('\n')
for v in self.values:
f.write('%s%s>">\n' %
(v.prefix, v.idfunc(),
v.tag, v.entityfunc(), v.tag))
if self.env_signatures:
f.write('\n')
for v in self.values:
f.write('env.%s%s>">\n' %
(v.prefix, v.idfunc(),
v.tag, v.entityfunc(), v.tag))
f.write('\n')
f.write(Warning)
f.write('\n')
f.write(Link_Entities_Header % description)
f.write('\n')
for v in self.values:
f.write('<%s>%s%s>\'>\n' %
(v.prefix, v.idfunc(),
v.prefix, v.idfunc(),
v.tag, v.entityfunc(), v.tag))
if self.env_signatures:
f.write('\n')
for v in self.values:
f.write('<%s>env.%s%s>\'>\n' %
(v.prefix, v.idfunc(),
v.prefix, v.idfunc(),
v.tag, v.entityfunc(), v.tag))
f.write('\n')
f.write(Warning)
class SCons_XML_to_man(SCons_XML):
def write(self, filename):
"""
Converts the contents of the specified filename from DocBook XML
to man page macros.
This does not do an intelligent job. In particular, it doesn't
actually use the structured nature of XML to handle arbitrary
input. Instead, we're using text replacement and regular
expression substitutions to convert observed patterns into the
macros we want. To the extent that we're relatively consistent
with our input .xml, this works, but could easily break if handed
input that doesn't match these specific expectations.
"""
if not filename:
return
f = self.fopen(filename)
chunks = []
for v in self.values:
chunks.extend(v.man_separator())
chunks.extend(v.initial_man_chunks())
chunks.extend(list(map(str, v.summary.body)))
body = ''.join(chunks)
# Simple transformation of examples into our defined macros for those.
body = body.replace('', '.ES')
body = body.replace('', '.EE')
# Replace groupings of tags and surrounding newlines
# with single blank lines.
body = body.replace('\n\n\n', '\n\n')
body = body.replace('\n', '')
body = body.replace('', '\n')
body = body.replace('\n', '')
# Convert and its child tags.
body = body.replace('\n', '.RS 10\n')
# Handling needs to be rationalized and made
# consistent. Right now, the values map to arbitrary,
# ad-hoc idioms in the current man page.
body = re.compile(r'\n([^<]*)\n\n').sub(r'.TP 6\n.B \1\n', body)
body = re.compile(r'\n([^<]*)\n\n').sub(r'.IP \1\n', body)
body = re.compile(r'\n([^<]*)\n\n').sub(r'.HP 6\n.B \1\n', body)
body = body.replace('\n', '')
body = body.replace('\n', '')
body = body.replace('\n', '.RE\n')
# Get rid of unnecessary .IP macros, and unnecessary blank lines
# in front of .IP macros.
body = re.sub(r'\.EE\n\n+(?!\.IP)', '.EE\n.IP\n', body)
body = body.replace('\n.EE\n.IP\n.ES\n', '\n.EE\n\n.ES\n')
body = body.replace('\n.IP\n\'\\"', '\n\n\'\\"')
# Convert various named entities and tagged names to nroff
# in-line font conversions (\fB, \fI, \fP).
body = re.sub('&(scons|SConstruct|SConscript|Dir|jar|Make|lambda);',
r'\\fB\1\\fP', body)
body = re.sub('&(TARGET|TARGETS|SOURCE|SOURCES);', r'\\fB$\1\\fP', body)
body = re.sub('&(target|source);', r'\\fI\1\\fP', body)
body = re.sub('&b(-link)?-([^;]*);', r'\\fB\2\\fP()', body)
body = re.sub('&cv(-link)?-([^;]*);', r'\\fB$\2\\fP', body)
body = re.sub('&f(-link)?-env-([^;]*);', r'\\fBenv.\2\\fP()', body)
body = re.sub('&f(-link)?-([^;]*);', r'\\fB\2\\fP()', body)
body = re.sub(r'<(application|command|envar|filename|function|literal|option)>([^<]*)\1>',
r'\\fB\2\\fP', body)
body = re.sub(r'<(classname|emphasis|varname)>([^<]*)\1>',
r'\\fI\2\\fP', body)
# Convert groupings of font conversions (\fB, \fI, \fP) to
# man page .B, .BR, .I, .IR, .R, .RB and .RI macros.
body = re.compile(r'^\\f([BI])([^\\]* [^\\]*)\\fP\s*$', re.M).sub(r'.\1 "\2"', body)
body = re.compile(r'^\\f([BI])(.*)\\fP\s*$', re.M).sub(r'.\1 \2', body)
body = re.compile(r'^\\f([BI])(.*)\\fP(\S+)$', re.M).sub(r'.\1R \2 \3', body)
body = re.compile(r'^(\.B)( .*)\\fP(.*)\\fB(.*)$', re.M).sub(r'\1R\2 \3 \4', body)
body = re.compile(r'^(\.B)R?( .*)\\fP(.*)\\fI(.*)$', re.M).sub(r'\1I\2\3 \4', body)
body = re.compile(r'^(\.I)( .*)\\fP\\fB(.*)\\fP\\fI(.*)$', re.M).sub(r'\1R\2 \3 \4', body)
body = re.compile(r'^(\S+)\\f([BI])(.*)\\fP$', re.M).sub(r'.R\2 \1 \3', body)
body = re.compile(r'^(\S+)\\f([BI])(.*)\\fP([^\s\\]+)$', re.M).sub(r'.R\2 \1 \3 \4', body)
body = re.compile(r'^(\.R[BI].*[\S])\s+$;', re.M).sub(r'\1', body)
# Convert < and > entities to literal < and > characters.
body = body.replace('<', '<')
body = body.replace('>', '>')
# Backslashes. Oh joy.
body = re.sub(r'\\(?=[^f])', r'\\\\', body)
body = re.compile("^'\\\\\\\\", re.M).sub("'\\\\", body)
body = re.compile(r'^\.([BI]R?) ([^"]\S*\\\\\S+[^"])$', re.M).sub(r'.\1 "\2"', body)
# Put backslashes in front of various hyphens that need
# to be long em-dashes.
body = re.compile(r'^\.([BI]R?) --', re.M).sub(r'.\1 \-\-', body)
body = re.compile(r'^\.([BI]R?) -', re.M).sub(r'.\1 \-', body)
body = re.compile(r'\\f([BI])-', re.M).sub(r'\\f\1\-', body)
f.write(body)
class Proxy(object):
def __init__(self, subject):
"""Wrap an object as a Proxy object"""
self.__subject = subject
def __getattr__(self, name):
"""Retrieve an attribute from the wrapped object. If the named
attribute doesn't exist, AttributeError is raised"""
return getattr(self.__subject, name)
def get(self):
"""Retrieve the entire wrapped object"""
return self.__subject
def __cmp__(self, other):
if issubclass(other.__class__, self.__subject.__class__):
return cmp(self.__subject, other)
return cmp(self.__dict__, other.__dict__)
class SConsThing(Proxy):
def idfunc(self):
return self.name
def xml_term(self):
return '%s' % self.name
class Builder(SConsThing):
description = 'builder'
prefix = 'b-'
tag = 'function'
def xml_term(self):
return ('<%s>%s()%s>\n<%s>env.%s()%s>' %
(self.tag, self.name, self.tag, self.tag, self.name, self.tag))
def entityfunc(self):
return self.name
def man_separator(self):
return ['\n', "'\\" + '"'*69 + '\n']
def initial_man_chunks(self):
return [ '.IP %s()\n.IP env.%s()\n' % (self.name, self.name) ]
class Function(SConsThing):
description = 'function'
prefix = 'f-'
tag = 'function'
def args_to_xml(self, arg):
s = ''.join(arg.body).strip()
result = []
for m in re.findall('([a-zA-Z/_]+=?|[^a-zA-Z/_]+)', s):
if m[0] in string.letters:
if m[-1] == '=':
result.append('%s=' % m[:-1])
else:
result.append('%s' % m)
else:
result.append(m)
return ''.join(result)
def xml_term(self):
try:
arguments = self.arguments
except AttributeError:
arguments = ['()']
result = ['']
for arg in arguments:
try:
signature = arg.signature
except AttributeError:
signature = "both"
s = self.args_to_xml(arg)
if signature in ('both', 'global'):
result.append('%s%s\n' % (self.name, s)) #
if signature in ('both', 'env'):
result.append('env.%s%s' % (self.name, s))
result.append('')
return ''.join(result)
def entityfunc(self):
return self.name
def man_separator(self):
return ['\n', "'\\" + '"'*69 + '\n']
def args_to_man(self, arg):
"""Converts the contents of an tag, which
specifies a function's calling signature, into a series
of tokens that alternate between literal tokens
(to be displayed in roman or bold face) and variable
names (to be displayed in italics).
This is complicated by the presence of Python "keyword=var"
arguments, where "keyword=" should be displayed literally,
and "var" should be displayed in italics. We do this by
detecting the keyword= var portion and appending it to the
previous string, if any.
"""
s = ''.join(arg.body).strip()
result = []
for m in re.findall('([a-zA-Z/_]+=?|[^a-zA-Z/_]+)', s):
if m[-1] == '=' and result:
if result[-1][-1] == '"':
result[-1] = result[-1][:-1] + m + '"'
else:
result[-1] += m
else:
if ' ' in m:
m = '"%s"' % m
result.append(m)
return ' '.join(result)
def initial_man_chunks(self):
try:
arguments = self.arguments
except AttributeError:
arguments = ['()']
result = []
for arg in arguments:
try:
signature = arg.signature
except AttributeError:
signature = "both"
s = self.args_to_man(arg)
if signature in ('both', 'global'):
result.append('.TP\n.RI %s%s\n' % (self.name, s))
if signature in ('both', 'env'):
result.append('.TP\n.IR env .%s%s\n' % (self.name, s))
return result
class Tool(SConsThing):
description = 'tool'
prefix = 't-'
tag = 'literal'
def idfunc(self):
return self.name.replace('+', 'X')
def entityfunc(self):
return self.name
def man_separator(self):
return ['\n']
def initial_man_chunks(self):
return ['.IP %s\n' % self.name]
class Variable(SConsThing):
description = 'construction variable'
prefix = 'cv-'
tag = 'envar'
def entityfunc(self):
return '$' + self.name
def man_separator(self):
return ['\n']
def initial_man_chunks(self):
return ['.IP %s\n' % self.name]
if output_type == '--man':
processor_class = SCons_XML_to_man
elif output_type == '--xml':
processor_class = SCons_XML_to_XML
else:
sys.stderr.write("Unknown output type '%s'\n" % output_type)
sys.exit(1)
if buildersfiles:
g = processor_class([ Builder(b) for b in sorted(h.builders.values()) ],
env_signatures=True)
g.write(buildersfiles)
if functionsfiles:
g = processor_class([ Function(b) for b in sorted(h.functions.values()) ],
env_signatures=True)
g.write(functionsfiles)
if toolsfiles:
g = processor_class([ Tool(t) for t in sorted(h.tools.values()) ],
env_signatures=False)
g.write(toolsfiles)
if variablesfiles:
g = processor_class([ Variable(v) for v in sorted(h.cvars.values()) ],
env_signatures=False)
g.write(variablesfiles)
# Local Variables:
# tab-width:4
# indent-tabs-mode:nil
# End:
# vim: set expandtab tabstop=4 shiftwidth=4: