2011-04-15 19:43:06 +02:00
|
|
|
#!/usr/bin/env python
|
|
|
|
|
|
|
|
import os
|
|
|
|
import re
|
|
|
|
import sys
|
|
|
|
|
|
|
|
from file_types import *
|
|
|
|
|
|
|
|
cpp_c_headers = {
|
|
|
|
'assert.h' : 'cassert',
|
|
|
|
'ctype.h' : 'cctype',
|
|
|
|
'errno.h' : 'cerrno',
|
|
|
|
'float.h' : 'cfloat',
|
|
|
|
'limits.h' : 'climits',
|
|
|
|
'locale.h' : 'clocale',
|
|
|
|
'math.h' : 'cmath',
|
|
|
|
'setjmp.h' : 'csetjmp',
|
|
|
|
'signal.h' : 'csignal',
|
|
|
|
'stdarg.h' : 'cstdarg',
|
|
|
|
'stddef.h' : 'cstddef',
|
|
|
|
'stdio.h' : 'cstdio',
|
|
|
|
'stdlib.h' : 'cstdlib',
|
|
|
|
'string.h' : 'cstring',
|
|
|
|
'time.h' : 'ctime',
|
|
|
|
'wchar.h' : 'cwchar',
|
|
|
|
'wctype.h' : 'cwctype',
|
|
|
|
}
|
|
|
|
|
|
|
|
include_re = re.compile(r'([#%])(include|import).*[<"](.*)[">]')
|
|
|
|
def include_key(line):
|
|
|
|
'''Mark directories with a leading space so directories
|
|
|
|
are sorted before files'''
|
|
|
|
|
|
|
|
match = include_re.match(line)
|
|
|
|
assert match, line
|
|
|
|
keyword = match.group(2)
|
|
|
|
include = match.group(3)
|
|
|
|
|
|
|
|
# Everything but the file part needs to have a space prepended
|
|
|
|
parts = include.split('/')
|
|
|
|
if len(parts) == 2 and parts[0] == 'dnet':
|
|
|
|
# Don't sort the dnet includes with respect to each other, but
|
|
|
|
# make them sorted with respect to non dnet includes. Python
|
|
|
|
# guarantees that sorting is stable, so just clear the
|
|
|
|
# basename part of the filename.
|
|
|
|
parts[1] = ' '
|
|
|
|
parts[0:-1] = [ ' ' + s for s in parts[0:-1] ]
|
|
|
|
key = '/'.join(parts)
|
|
|
|
|
|
|
|
return key
|
|
|
|
|
2015-02-03 20:25:50 +01:00
|
|
|
|
|
|
|
def _include_matcher(keyword="#include", delim="<>"):
|
|
|
|
"""Match an include statement and return a (keyword, file, extra)
|
|
|
|
duple, or a touple of None values if there isn't a match."""
|
|
|
|
|
|
|
|
rex = re.compile(r'^(%s)\s*%s(.*)%s(.*)$' % (keyword, delim[0], delim[1]))
|
|
|
|
|
|
|
|
def matcher(context, line):
|
|
|
|
m = rex.match(line)
|
|
|
|
return m.groups() if m else (None, ) * 3
|
|
|
|
|
|
|
|
return matcher
|
|
|
|
|
|
|
|
def _include_matcher_fname(fname, **kwargs):
|
|
|
|
"""Match an include of a specific file name. Any keyword arguments
|
|
|
|
are forwarded to _include_matcher, which is used to match the
|
|
|
|
actual include line."""
|
|
|
|
|
|
|
|
rex = re.compile(fname)
|
|
|
|
base_matcher = _include_matcher(**kwargs)
|
|
|
|
|
|
|
|
def matcher(context, line):
|
|
|
|
(keyword, fname, extra) = base_matcher(context, line)
|
|
|
|
if fname and rex.match(fname):
|
|
|
|
return (keyword, fname, extra)
|
|
|
|
else:
|
|
|
|
return (None, ) * 3
|
|
|
|
|
|
|
|
return matcher
|
|
|
|
|
|
|
|
|
|
|
|
def _include_matcher_main():
|
|
|
|
"""Match a C/C++ source file's primary header (i.e., a file with
|
|
|
|
the same base name, but a header extension)."""
|
|
|
|
|
|
|
|
base_matcher = _include_matcher(delim='""')
|
|
|
|
rex = re.compile(r"^src/(.*)\.([^.]+)$")
|
|
|
|
header_map = {
|
|
|
|
"c" : "h",
|
|
|
|
"cc" : "hh",
|
|
|
|
"cpp" : "hh",
|
|
|
|
}
|
|
|
|
def matcher(context, line):
|
|
|
|
m = rex.match(context["filename"])
|
|
|
|
if not m:
|
|
|
|
return (None, ) * 3
|
|
|
|
base, ext = m.groups()
|
|
|
|
(keyword, fname, extra) = base_matcher(context, line)
|
|
|
|
try:
|
|
|
|
if fname == "%s.%s" % (base, header_map[ext]):
|
|
|
|
return (keyword, fname, extra)
|
|
|
|
except KeyError:
|
|
|
|
pass
|
|
|
|
|
|
|
|
return (None, ) * 3
|
|
|
|
|
|
|
|
return matcher
|
|
|
|
|
2011-04-15 19:43:06 +02:00
|
|
|
class SortIncludes(object):
|
|
|
|
# different types of includes for different sorting of headers
|
|
|
|
# <Python.h> - Python header needs to be first if it exists
|
|
|
|
# <*.h> - system headers (directories before files)
|
|
|
|
# <*> - STL headers
|
|
|
|
# <*.(hh|hxx|hpp|H)> - C++ Headers (directories before files)
|
|
|
|
# "*" - M5 headers (directories before files)
|
|
|
|
includes_re = (
|
2015-02-03 20:25:50 +01:00
|
|
|
('main', '""', _include_matcher_main()),
|
|
|
|
('python', '<>', _include_matcher_fname("^Python\.h$")),
|
|
|
|
('c', '<>', _include_matcher_fname("^.*\.h$")),
|
|
|
|
('stl', '<>', _include_matcher_fname("^\w+$")),
|
|
|
|
('cc', '<>', _include_matcher_fname("^.*\.(hh|hxx|hpp|H)$")),
|
|
|
|
('m5header', '""', _include_matcher_fname("^.*\.h{1,2}$", delim='""')),
|
|
|
|
('swig0', '<>', _include_matcher(keyword="%import")),
|
|
|
|
('swig1', '<>', _include_matcher(keyword="%include")),
|
|
|
|
('swig2', '""', _include_matcher(keyword="%import", delim='""')),
|
|
|
|
('swig3', '""', _include_matcher(keyword="%include", delim='""')),
|
2011-04-15 19:43:06 +02:00
|
|
|
)
|
|
|
|
|
2015-02-03 20:25:50 +01:00
|
|
|
block_order = (
|
|
|
|
('main', ),
|
|
|
|
('python', ),
|
|
|
|
('c', ),
|
|
|
|
('stl', ),
|
|
|
|
('cc', ),
|
|
|
|
('m5header', ),
|
|
|
|
('swig0', 'swig1', 'swig2', 'swig3', ),
|
|
|
|
)
|
2011-04-15 19:43:06 +02:00
|
|
|
|
|
|
|
def __init__(self):
|
2015-02-03 20:25:50 +01:00
|
|
|
self.block_priority = {}
|
|
|
|
for prio, keys in enumerate(self.block_order):
|
|
|
|
for key in keys:
|
|
|
|
self.block_priority[key] = prio
|
2011-04-15 19:43:06 +02:00
|
|
|
|
|
|
|
def reset(self):
|
|
|
|
# clear all stored headers
|
|
|
|
self.includes = {}
|
|
|
|
|
2015-02-03 20:25:50 +01:00
|
|
|
def dump_blocks(self, block_types):
|
|
|
|
"""Merge includes of from several block types into one large
|
|
|
|
block of sorted includes. This is useful when we have multiple
|
|
|
|
include block types (e.g., swig includes) with the same
|
|
|
|
priority."""
|
|
|
|
|
|
|
|
includes = []
|
|
|
|
for block_type in block_types:
|
|
|
|
try:
|
|
|
|
includes += self.includes[block_type]
|
|
|
|
except KeyError:
|
|
|
|
pass
|
|
|
|
|
|
|
|
return sorted(set(includes))
|
|
|
|
|
|
|
|
def dump_includes(self):
|
|
|
|
blocks = []
|
|
|
|
# Create a list of blocks in the prescribed include
|
|
|
|
# order. Each entry in the list is a multi-line string with
|
|
|
|
# multiple includes.
|
|
|
|
for types in self.block_order:
|
|
|
|
block = "\n".join(self.dump_blocks(types))
|
|
|
|
if block:
|
|
|
|
blocks.append(block)
|
|
|
|
|
|
|
|
self.reset()
|
|
|
|
return "\n\n".join(blocks)
|
2011-04-15 19:43:06 +02:00
|
|
|
|
|
|
|
def __call__(self, lines, filename, language):
|
2014-08-13 12:57:25 +02:00
|
|
|
self.reset()
|
2011-04-15 19:43:06 +02:00
|
|
|
|
2015-02-03 20:25:50 +01:00
|
|
|
context = {
|
|
|
|
"filename" : filename,
|
|
|
|
"language" : language,
|
|
|
|
}
|
2011-04-15 19:43:06 +02:00
|
|
|
|
2015-02-03 20:25:50 +01:00
|
|
|
def match_line(line):
|
|
|
|
if not line:
|
|
|
|
return (None, line)
|
2011-04-15 19:43:06 +02:00
|
|
|
|
2015-02-03 20:25:50 +01:00
|
|
|
for include_type, (ldelim, rdelim), matcher in self.includes_re:
|
|
|
|
keyword, include, extra = matcher(context, line)
|
|
|
|
if keyword:
|
|
|
|
# if we've got a match, clean up the #include line,
|
|
|
|
# fix up stl headers and store it in the proper category
|
|
|
|
if include_type == 'c' and language == 'C++':
|
|
|
|
stl_inc = cpp_c_headers.get(include, None)
|
|
|
|
if stl_inc:
|
|
|
|
include = stl_inc
|
|
|
|
include_type = 'stl'
|
2011-04-15 19:43:06 +02:00
|
|
|
|
2015-02-03 20:25:50 +01:00
|
|
|
return (include_type,
|
|
|
|
keyword + ' ' + ldelim + include + rdelim + extra)
|
2011-04-15 19:43:06 +02:00
|
|
|
|
2015-02-03 20:25:50 +01:00
|
|
|
return (None, line)
|
2011-04-15 19:43:06 +02:00
|
|
|
|
2015-02-03 20:25:50 +01:00
|
|
|
processing_includes = False
|
|
|
|
for line in lines:
|
|
|
|
include_type, line = match_line(line)
|
|
|
|
if include_type:
|
|
|
|
try:
|
|
|
|
self.includes[include_type].append(line)
|
|
|
|
except KeyError:
|
|
|
|
self.includes[include_type] = [ line ]
|
|
|
|
|
|
|
|
processing_includes = True
|
|
|
|
elif processing_includes and not line.strip():
|
|
|
|
# Skip empty lines while processing includes
|
|
|
|
pass
|
|
|
|
elif processing_includes:
|
|
|
|
# We are now exiting an include block
|
|
|
|
processing_includes = False
|
|
|
|
|
|
|
|
# Output pending includes, a new line between, and the
|
|
|
|
# current l.
|
|
|
|
yield self.dump_includes()
|
|
|
|
yield ''
|
|
|
|
yield line
|
|
|
|
else:
|
|
|
|
# We are not in an include block, so just emit the line
|
2011-04-15 19:43:06 +02:00
|
|
|
yield line
|
|
|
|
|
2015-02-03 20:25:50 +01:00
|
|
|
# We've reached EOF, so dump any pending includes
|
|
|
|
if processing_includes:
|
|
|
|
yield self.dump_includes()
|
2011-04-15 19:43:06 +02:00
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
# default language types to try to apply our sorting rules to
|
|
|
|
default_languages = frozenset(('C', 'C++', 'isa', 'python', 'scons', 'swig'))
|
|
|
|
|
|
|
|
def options():
|
|
|
|
import optparse
|
|
|
|
options = optparse.OptionParser()
|
|
|
|
add_option = options.add_option
|
|
|
|
add_option('-d', '--dir_ignore', metavar="DIR[,DIR]", type='string',
|
|
|
|
default=','.join(default_dir_ignore),
|
|
|
|
help="ignore directories")
|
|
|
|
add_option('-f', '--file_ignore', metavar="FILE[,FILE]", type='string',
|
|
|
|
default=','.join(default_file_ignore),
|
|
|
|
help="ignore files")
|
|
|
|
add_option('-l', '--languages', metavar="LANG[,LANG]", type='string',
|
|
|
|
default=','.join(default_languages),
|
|
|
|
help="languages")
|
|
|
|
add_option('-n', '--dry-run', action='store_true',
|
|
|
|
help="don't overwrite files")
|
|
|
|
|
|
|
|
return options
|
|
|
|
|
|
|
|
def parse_args(parser):
|
|
|
|
opts,args = parser.parse_args()
|
|
|
|
|
|
|
|
opts.dir_ignore = frozenset(opts.dir_ignore.split(','))
|
|
|
|
opts.file_ignore = frozenset(opts.file_ignore.split(','))
|
|
|
|
opts.languages = frozenset(opts.languages.split(','))
|
|
|
|
|
|
|
|
return opts,args
|
|
|
|
|
|
|
|
if __name__ == '__main__':
|
|
|
|
parser = options()
|
|
|
|
opts, args = parse_args(parser)
|
|
|
|
|
|
|
|
for base in args:
|
|
|
|
for filename,language in find_files(base, languages=opts.languages,
|
|
|
|
file_ignore=opts.file_ignore, dir_ignore=opts.dir_ignore):
|
|
|
|
if opts.dry_run:
|
|
|
|
print "%s: %s" % (filename, language)
|
|
|
|
else:
|
|
|
|
update_file(filename, filename, language, SortIncludes())
|