1#!/usr/bin/env python
2# -*- coding: utf-8 -*-
3
4# Check for stylistic and formal issues in .rst and .py
5# files included in the documentation.
6#
7# 01/2009, Georg Brandl
8
9# TODO: - wrong versions in versionadded/changed
10#       - wrong markup after versionchanged directive
11
12from __future__ import with_statement
13
14import os
15import re
16import sys
17import getopt
18from os.path import join, splitext, abspath, exists
19from collections import defaultdict
20
21directives = [
22    # standard docutils ones
23    'admonition', 'attention', 'caution', 'class', 'compound', 'container',
24    'contents', 'csv-table', 'danger', 'date', 'default-role', 'epigraph',
25    'error', 'figure', 'footer', 'header', 'highlights', 'hint', 'image',
26    'important', 'include', 'line-block', 'list-table', 'meta', 'note',
27    'parsed-literal', 'pull-quote', 'raw', 'replace',
28    'restructuredtext-test-directive', 'role', 'rubric', 'sectnum', 'sidebar',
29    'table', 'target-notes', 'tip', 'title', 'topic', 'unicode', 'warning',
30    # Sphinx and Python docs custom ones
31    'acks', 'attribute', 'autoattribute', 'autoclass', 'autodata',
32    'autoexception', 'autofunction', 'automethod', 'automodule', 'centered',
33    'cfunction', 'class', 'classmethod', 'cmacro', 'cmdoption', 'cmember',
34    'code-block', 'confval', 'cssclass', 'ctype', 'currentmodule', 'cvar',
35    'data', 'decorator', 'decoratormethod', 'deprecated-removed',
36    'deprecated(?!-removed)', 'describe', 'directive', 'doctest', 'envvar',
37    'event', 'exception', 'function', 'glossary', 'highlight', 'highlightlang',
38    'impl-detail', 'index', 'literalinclude', 'method', 'miscnews', 'module',
39    'moduleauthor', 'opcode', 'pdbcommand', 'productionlist',
40    'tabularcolumns', 'testcode', 'testoutput', 'testsetup', 'toctree', 'todo',
41    'todolist', 'versionadded', 'versionchanged'
42]
43
44all_directives = '(' + '|'.join(directives) + ')'
45seems_directive_re = re.compile(r'(?<!\.)\.\. %s([^a-z:]|:(?!:))' % all_directives)
46default_role_re = re.compile(r'(^| )`\w([^`]*?\w)?`($| )')
47leaked_markup_re = re.compile(r'[a-z]::\s|`|\.\.\s*\w+:')
48
49
50checkers = {}
51
52checker_props = {'severity': 1, 'falsepositives': False}
53
54def checker(*suffixes, **kwds):
55    """Decorator to register a function as a checker."""
56    def deco(func):
57        for suffix in suffixes:
58            checkers.setdefault(suffix, []).append(func)
59        for prop in checker_props:
60            setattr(func, prop, kwds.get(prop, checker_props[prop]))
61        return func
62    return deco
63
64
65@checker('.py', severity=4)
66def check_syntax(fn, lines):
67    """Check Python examples for valid syntax."""
68    code = ''.join(lines)
69    if '\r' in code:
70        if os.name != 'nt':
71            yield 0, '\\r in code file'
72        code = code.replace('\r', '')
73    try:
74        compile(code, fn, 'exec')
75    except SyntaxError, err:
76        yield err.lineno, 'not compilable: %s' % err
77
78
79@checker('.rst', severity=2)
80def check_suspicious_constructs(fn, lines):
81    """Check for suspicious reST constructs."""
82    inprod = False
83    for lno, line in enumerate(lines):
84        if seems_directive_re.search(line):
85            yield lno+1, 'comment seems to be intended as a directive'
86        if '.. productionlist::' in line:
87            inprod = True
88        elif not inprod and default_role_re.search(line):
89            yield lno+1, 'default role used'
90        elif inprod and not line.strip():
91            inprod = False
92
93
94@checker('.py', '.rst')
95def check_whitespace(fn, lines):
96    """Check for whitespace and line length issues."""
97    for lno, line in enumerate(lines):
98        if '\r' in line:
99            yield lno+1, '\\r in line'
100        if '\t' in line:
101            yield lno+1, 'OMG TABS!!!1'
102        if line[:-1].rstrip(' \t') != line[:-1]:
103            yield lno+1, 'trailing whitespace'
104
105
106@checker('.rst', severity=0)
107def check_line_length(fn, lines):
108    """Check for line length; this checker is not run by default."""
109    for lno, line in enumerate(lines):
110        if len(line) > 81:
111            # don't complain about tables, links and function signatures
112            if line.lstrip()[0] not in '+|' and \
113               'http://' not in line and \
114               not line.lstrip().startswith(('.. function',
115                                             '.. method',
116                                             '.. cfunction')):
117                yield lno+1, "line too long"
118
119
120@checker('.html', severity=2, falsepositives=True)
121def check_leaked_markup(fn, lines):
122    """Check HTML files for leaked reST markup; this only works if
123    the HTML files have been built.
124    """
125    for lno, line in enumerate(lines):
126        if leaked_markup_re.search(line):
127            yield lno+1, 'possibly leaked markup: %r' % line
128
129
130def main(argv):
131    usage = '''\
132Usage: %s [-v] [-f] [-s sev] [-i path]* [path]
133
134Options:  -v       verbose (print all checked file names)
135          -f       enable checkers that yield many false positives
136          -s sev   only show problems with severity >= sev
137          -i path  ignore subdir or file path
138''' % argv[0]
139    try:
140        gopts, args = getopt.getopt(argv[1:], 'vfs:i:')
141    except getopt.GetoptError:
142        print usage
143        return 2
144
145    verbose = False
146    severity = 1
147    ignore = []
148    falsepos = False
149    for opt, val in gopts:
150        if opt == '-v':
151            verbose = True
152        elif opt == '-f':
153            falsepos = True
154        elif opt == '-s':
155            severity = int(val)
156        elif opt == '-i':
157            ignore.append(abspath(val))
158
159    if len(args) == 0:
160        path = '.'
161    elif len(args) == 1:
162        path = args[0]
163    else:
164        print usage
165        return 2
166
167    if not exists(path):
168        print 'Error: path %s does not exist' % path
169        return 2
170
171    count = defaultdict(int)
172    out = sys.stdout
173
174    for root, dirs, files in os.walk(path):
175        # ignore subdirs controlled by svn
176        if '.svn' in dirs:
177            dirs.remove('.svn')
178
179        # ignore subdirs in ignore list
180        if abspath(root) in ignore:
181            del dirs[:]
182            continue
183
184        for fn in files:
185            fn = join(root, fn)
186            if fn[:2] == './':
187                fn = fn[2:]
188
189            # ignore files in ignore list
190            if abspath(fn) in ignore:
191                continue
192
193            ext = splitext(fn)[1]
194            checkerlist = checkers.get(ext, None)
195            if not checkerlist:
196                continue
197
198            if verbose:
199                print 'Checking %s...' % fn
200
201            try:
202                with open(fn, 'r') as f:
203                    lines = list(f)
204            except (IOError, OSError), err:
205                print '%s: cannot open: %s' % (fn, err)
206                count[4] += 1
207                continue
208
209            for checker in checkerlist:
210                if checker.falsepositives and not falsepos:
211                    continue
212                csev = checker.severity
213                if csev >= severity:
214                    for lno, msg in checker(fn, lines):
215                        print >>out, '[%d] %s:%d: %s' % (csev, fn, lno, msg)
216                        count[csev] += 1
217    if verbose:
218        print
219    if not count:
220        if severity > 1:
221            print 'No problems with severity >= %d found.' % severity
222        else:
223            print 'No problems found.'
224    else:
225        for severity in sorted(count):
226            number = count[severity]
227            print '%d problem%s with severity %d found.' % \
228                  (number, number > 1 and 's' or '', severity)
229    return int(bool(count))
230
231
232if __name__ == '__main__':
233    sys.exit(main(sys.argv))
234