summaryrefslogtreecommitdiff
path: root/tests/test_unistring.py
blob: a4b58827ce295f259876de454aae8380bc0d8444 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
# -*- coding: utf-8 -*-
"""
    Test suite for the unistring module
    ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~

    :copyright: Copyright 2006-2019 by the Pygments team, see AUTHORS.
    :license: BSD, see LICENSE for details.
"""

import re
import random

from pygments import unistring as uni
from pygments.util import unichr


def test_cats_exist_and_compilable():
    for cat in uni.cats:
        s = getattr(uni, cat)
        if s == '':  # Probably Cs on Jython
            continue
        print("%s %r" % (cat, s))
        re.compile('[%s]' % s)


def _cats_that_match(c):
    matching_cats = []
    for cat in uni.cats:
        s = getattr(uni, cat)
        if s == '':  # Probably Cs on Jython
            continue
        if re.compile('[%s]' % s).match(c):
            matching_cats.append(cat)
    return matching_cats


def test_spot_check_types():
    # Each char should match one, and precisely one, category
    random.seed(0)
    for i in range(1000):
        o = random.randint(0, 65535)
        c = unichr(o)
        if o > 0xd800 and o <= 0xdfff and not uni.Cs:
            continue  # Bah, Jython.
        print(hex(o))
        cats = _cats_that_match(c)
        assert len(cats) == 1, "%d (%s): %s" % (o, c, cats)