tests/test_sql.py


1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118

# -*- coding: utf-8 -*-
"""
    Pygments SQL lexers tests
    ~~~~~~~~~~~~~~~~~~~~~~~~~

    :copyright: Copyright 2006-2016 by the Pygments team, see AUTHORS.
    :license: BSD, see LICENSE for details.
"""
import unittest

from pygments.lexers.sql import name_between_bracket_re, \
    name_between_backtick_re, tsql_go_re, tsql_declare_re, \
    tsql_variable_re, MySqlLexer, SqlLexer, TransactSqlLexer

from pygments.token import Comment, Name, Number, Punctuation, Whitespace


class TransactSqlLexerTest(unittest.TestCase):
    """Check how ``TransactSqlLexer`` tokenizes numbers, names and comments."""

    def setUp(self):
        self.lexer = TransactSqlLexer()

    def _assertAreTokensOfType(self, examples, expected_token_type):
        """
        Assert that every whitespace separated item in ``examples`` is lexed
        into exactly one non-whitespace token of ``expected_token_type``.
        """
        for test_number, example in enumerate(examples.split(), 1):
            token_count = 0
            for token_type, token_value in self.lexer.get_tokens(example):
                # Whitespace tokens are neither counted nor type checked.
                if token_type != Whitespace:
                    token_count += 1
                    self.assertEqual(
                        token_type, expected_token_type,
                        'token_type #%d for %s is %s but must be %s' %
                        (test_number, token_value, token_type,
                         expected_token_type))
            self.assertEqual(
                token_count, 1,
                '%s must yield exactly 1 token instead of %d' %
                (example, token_count))

    def _assertTokensMatch(self, text, expected_tokens_without_trailing_newline):
        """
        Assert that lexing ``text`` yields the expected tuple of
        ``(token_type, token_value)`` pairs.

        A final ``(Whitespace, '\\n')`` token in the lexer output is dropped
        before comparing, so the expected tokens must not include it.
        """
        actual_tokens = tuple(self.lexer.get_tokens(text))
        if actual_tokens and actual_tokens[-1] == (Whitespace, '\n'):
            # Slicing a tuple already yields a tuple.
            actual_tokens = actual_tokens[:-1]
        self.assertEqual(
            expected_tokens_without_trailing_newline, actual_tokens,
            'text must yield expected tokens: %s' % text)

    def test_can_lex_float(self):
        """Float literals with optional fraction and exponent are one token."""
        self._assertAreTokensOfType(
            '1. 1.e1 .1 1.2 1.2e3 1.2e+3 1.2e-3 1e2', Number.Float)
        # Two adjacent floats without a separator must be split in two.
        self._assertTokensMatch(
            '1e2.1e2',
            ((Number.Float, '1e2'), (Number.Float, '.1e2'))
        )

    def test_can_reject_almost_float(self):
        """A dot followed by an exponent only is punctuation plus a name."""
        self._assertTokensMatch(
            '.e1',
            ((Punctuation, '.'), (Name, 'e1')))

    def test_can_lex_integer(self):
        """Plain digit sequences are integer tokens."""
        self._assertAreTokensOfType(
            '1 23 456', Number.Integer)

    def test_can_lex_names(self):
        """Names may contain underscores, digits, umlauts and leading ``#``."""
        self._assertAreTokensOfType(
            u'thingy thingy123 _thingy _ _123 Ähnliches Müll #temp1 ##temp2', Name)

    def test_can_lex_comments(self):
        """Single line, empty multiline and nested multiline comments."""
        self._assertTokensMatch('--\n', ((Comment.Single, '--\n'),))
        self._assertTokensMatch('/**/', (
            (Comment.Multiline, '/*'), (Comment.Multiline, '*/')
        ))
        # Nested comment: each opening and closing marker is its own token.
        self._assertTokensMatch('/*/**/*/', (
            (Comment.Multiline, '/*'),
            (Comment.Multiline, '/*'),
            (Comment.Multiline, '*/'),
            (Comment.Multiline, '*/'),
        ))


class SqlAnalyzeTextTest(unittest.TestCase):
    """Check the regular expressions and ratings used to pick a SQL lexer."""

    def test_can_match_analyze_text_res(self):
        """The regular expressions from ``pygments.lexers.sql`` match samples."""
        self.assertEqual(
            ['`a`', '`bc`'],
            name_between_backtick_re.findall('select `a`, `bc` from some'))
        self.assertEqual(
            ['[a]', '[bc]'],
            name_between_bracket_re.findall('select [a], [bc] from some'))
        self.assertTrue(tsql_declare_re.search('--\nDeClaRe @some int;'))
        self.assertTrue(tsql_go_re.search('select 1\ngo\n--'))
        self.assertTrue(tsql_variable_re.search(
            'create procedure dbo.usp_x @a int, @b int'))

    def test_can_analyze_text(self):
        """
        For each code sample, the expected lexer must get the best
        ``analyse_text()`` rating among the MySQL, SQL and Transact-SQL lexers.
        """
        mysql_lexer = MySqlLexer()
        sql_lexer = SqlLexer()
        tsql_lexer = TransactSqlLexer()
        code_to_expected_lexer_map = {
            'select `a`, `bc` from some': mysql_lexer,
            'select a, bc from some': sql_lexer,
            'select [a], [bc] from some': tsql_lexer,
            '-- `a`, `bc`\nselect [a], [bc] from some': tsql_lexer,
            '-- `a`, `bc`\nselect [a], [bc] from some; go': tsql_lexer,
        }
        sql_lexers = set(code_to_expected_lexer_map.values())
        for code, expected_lexer in code_to_expected_lexer_map.items():
            # Tuples compare by rating first and by lexer name on equal
            # ratings, so max() yields the same winner a descending sort would.
            best_rating, best_lexer_name = max(
                (lexer.analyse_text(code), lexer.name) for lexer in sql_lexers)
            expected_rating = expected_lexer.analyse_text(code)
            message = (
                'lexer must be %s (rating %.2f) instead of '
                '%s (rating %.2f) for analyse_text() on code:\n%s') % (
                expected_lexer.name,
                expected_rating,
                best_lexer_name,
                best_rating,
                code
            )
            self.assertEqual(
                expected_lexer.name, best_lexer_name, message
            )