Add another check script for whitespace.

Add a script which checks for whitespace tokens, similar to the script checking for repeated tokens. Also move some functionality shared between them into a utility file, and make check_repeated_token PEP8 compliant.
author: Matthäus G. Chajdas <dev@anteru.net> 2022-12-04 15:12:42 +0100
committer: Matthäus G. Chajdas <dev@anteru.net> 2022-12-04 15:12:42 +0100
commit: d98309343786205a34b483c559be5eefcfd7eade (patch)
tree: 27dd9bd9102b00ba3b453d9dfd96d4f8963f7b97 /scripts/utility.py
parent: dc492aea253a33f3335177dda23066aaf85050a3 (diff)
download: pygments-git-d98309343786205a34b483c559be5eefcfd7eade.tar.gz
1 files changed, 49 insertions, 0 deletions
diff --git a/scripts/utility.py b/scripts/utility.py
new file mode 100644
index 00000000..6ce225b4
--- /dev/null
+++ b/scripts/utility.py
@@ -0,0 +1,49 @@
+"""
+    Utility functions for test scripts
+    ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
+
+    :copyright: Copyright 2006-2022 by the Pygments team, see AUTHORS.
+    :license: BSD, see LICENSE for details.
+"""
+
+import os
+
+def unpack_output_file(path):
+    """
+    Unpack an output file into objects contining the line number, the text,
+    and the token name.
+    """
+    from collections import namedtuple
+    entry = namedtuple('OutputEntry', ['text', 'token', 'linenumber'])
+    for linenumber, line in enumerate(open(path).readlines()):
+        line = line.strip()
+        if line:
+            # Line can start with ' or ", so let's check which one it is
+            # and find the matching one
+            quotation_start = 0
+            quotation_end = line.rfind(line[0])
+            text = line[quotation_start+1:quotation_end]
+            token = line.split()[-1]
+            text = text.replace('\\n', '\n')
+            text = text.replace('\\t', '\t')
+            yield entry(text, token, linenumber + 1)
+
+def process_output_files(root_directory, callback):
+    """
+    Process all output files in a directory using the provided callback.
+    The callback should return `True` in case of success, `False` otherwise.
+
+    The function returns the number of files for which the callback returned
+    `False`.
+    """
+    errors = 0
+    for dir, _, files in os.walk(root_directory):
+        for file in files:
+            if not file.endswith('.output'):
+                continue
+            
+            path = os.path.join(dir, file)
+            if not callback(path):
+                errors += 1
+
+    return errors
author	Matthäus G. Chajdas <dev@anteru.net>	2022-12-04 15:12:42 +0100
committer	Matthäus G. Chajdas <dev@anteru.net>	2022-12-04 15:12:42 +0100
commit	d98309343786205a34b483c559be5eefcfd7eade (patch)
tree	27dd9bd9102b00ba3b453d9dfd96d4f8963f7b97 /scripts/utility.py
parent	dc492aea253a33f3335177dda23066aaf85050a3 (diff)
download	pygments-git-d98309343786205a34b483c559be5eefcfd7eade.tar.gz