summaryrefslogtreecommitdiff
path: root/scripts/check_whitespace_token.py
blob: cc3d1aa628a8ad10816664c7fd51b4b3e6365a5b (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
#!/usr/bin/env python
"""
    Checker for whitespace tokens
    ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~

    Helper script to find whitespace which is not of token type `Whitespace`

    :copyright: Copyright 2006-2022 by the Pygments team, see AUTHORS.
    :license: BSD, see LICENSE for details.
"""
import argparse
import sys
import re

from utility import unpack_output_file, process_output_files


def check_file(path):
    whitespace_re = re.compile('\s+')

    for value, token, linenumber in unpack_output_file(path):
        if whitespace_re.fullmatch(value):
            # We allow " " if it's inside a Literal.String for example
            if 'Literal' in token:
                continue

            if 'Whitespace' in token:
                continue

            print(f'{path}:{linenumber}')
            return False

    return True


def main(args):
    if process_output_files(args.TEST_ROOT, check_file) > 0:
        return 1
    return 0


if __name__ == '__main__':
    parser = argparse.ArgumentParser()
    parser.add_argument('TEST_ROOT',
                        help='Root directory containing the tests')
    args = parser.parse_args()
    sys.exit(main(args))