summary | refs | log | tree | commit | diff
path: root/simple_unit_tests.py
diff options
context:
space:
mode:
author: Kyle Lahnakoski <klahnakoski@mozilla.com>, 2019-10-21 23:42:51 -0400
committer: Paul McGuire <ptmcg@users.noreply.github.com>, 2019-10-21 22:42:51 -0500
commit: 3481b6f3f9bb2dae7e9d88ed08989b5f71238e4b (patch)
tree: 7c8174b8d9b45ab39cb9119c579fe12c819c6dd2 /simple_unit_tests.py
parent: 87d14e7ef563263417d3fddccd25636741c5b6c2 (diff)
download: pyparsing-git-3481b6f3f9bb2dae7e9d88ed08989b5f71238e4b.tar.gz
refactor tests into tests directory (#130)
Diffstat (limited to 'simple_unit_tests.py')
-rw-r--r-- simple_unit_tests.py 461
1 files changed, 0 insertions, 461 deletions
diff --git a/simple_unit_tests.py b/simple_unit_tests.py
deleted file mode 100644
index f0493cf..0000000
--- a/simple_unit_tests.py
+++ /dev/null
@@ -1,461 +0,0 @@
-#
-# simple_unit_tests.py
-#
-# While these unit tests *do* perform low-level unit testing of the classes in pyparsing,
-# this testing module should also serve an instructional purpose, to clearly show simple passing
-# and failing parse cases of some basic pyparsing expressions.
-#
-# Copyright (c) 2018 Paul T. McGuire
-#
-import unittest
-import pyparsing as pp
-from collections import namedtuple
-from datetime import datetime
-ppt = pp.pyparsing_test
-
-# Test spec data class for specifying simple pyparsing test cases
-PpTestSpec = namedtuple("PpTestSpec", "desc expr text parse_fn "
- "expected_list expected_dict expected_fail_locn")
-PpTestSpec.__new__.__defaults__ = ('', pp.Empty(), '', 'parseString', None, None, None)
-
-
-class PyparsingExpressionTestCase(ppt.ParseResultsAsserts, unittest.TestCase):
- """
- Base pyparsing testing class to parse various pyparsing expressions against
- given text strings. Subclasses must define a class attribute 'tests' which
- is a list of PpTestSpec instances.
- """
- tests = []
- def runTest(self):
- if self.__class__ is PyparsingExpressionTestCase:
- return
-
- for test_spec in self.tests:
- # for each spec in the class's tests list, create a subtest
- # that will either:
- # - parse the string with expected success, display the
- # results, and validate the returned ParseResults
- # - or parse the string with expected failure, display the
- # error message and mark the error location, and validate
- # the location against an expected value
- with self.subTest(test_spec=test_spec):
- test_spec.expr.streamline()
- print("\n{0} - {1}({2})".format(test_spec.desc,
- type(test_spec.expr).__name__,
- test_spec.expr))
-
- parsefn = getattr(test_spec.expr, test_spec.parse_fn)
- if test_spec.expected_fail_locn is None:
- # expect success
- result = parsefn(test_spec.text)
- if test_spec.parse_fn == 'parseString':
- print(result.dump())
- # compare results against given list and/or dict
- self.assertParseResultsEquals(result,
- expected_list=test_spec.expected_list,
- expected_dict=test_spec.expected_dict)
- elif test_spec.parse_fn == 'transformString':
- print(result)
- # compare results against given list and/or dict
- if test_spec.expected_list is not None:
- self.assertEqual([result], test_spec.expected_list)
- elif test_spec.parse_fn == 'searchString':
- print(result)
- # compare results against given list and/or dict
- if test_spec.expected_list is not None:
- self.assertEqual([result], test_spec.expected_list)
- else:
- # expect fail
- with self.assertRaisesParseException():
- try:
- parsefn(test_spec.text)
- except Exception as exc:
- print(pp.ParseException.explain(exc))
- self.assertEqual(exc.loc, test_spec.expected_fail_locn)
- raise
-
-
-# =========== TEST DEFINITIONS START HERE ==============
-
-class TestLiteral(PyparsingExpressionTestCase):
- tests = [
- PpTestSpec(
- desc = "Simple match",
- expr = pp.Literal("xyz"),
- text = "xyz",
- expected_list = ["xyz"],
- ),
- PpTestSpec(
- desc = "Simple match after skipping whitespace",
- expr = pp.Literal("xyz"),
- text = " xyz",
- expected_list = ["xyz"],
- ),
- PpTestSpec(
- desc = "Simple fail - parse an empty string",
- expr = pp.Literal("xyz"),
- text = "",
- expected_fail_locn = 0,
- ),
- PpTestSpec(
- desc = "Simple fail - parse a mismatching string",
- expr = pp.Literal("xyz"),
- text = "xyu",
- expected_fail_locn = 0,
- ),
- PpTestSpec(
- desc = "Simple fail - parse a partially matching string",
- expr = pp.Literal("xyz"),
- text = "xy",
- expected_fail_locn = 0,
- ),
- PpTestSpec(
- desc = "Fail - parse a partially matching string by matching individual letters",
- expr = pp.Literal("x") + pp.Literal("y") + pp.Literal("z"),
- text = "xy",
- expected_fail_locn = 2,
- ),
- ]
-
-class TestCaselessLiteral(PyparsingExpressionTestCase):
- tests = [
- PpTestSpec(
- desc = "Match colors, converting to consistent case",
- expr = (pp.CaselessLiteral("RED")
- | pp.CaselessLiteral("GREEN")
- | pp.CaselessLiteral("BLUE"))[...],
- text = "red Green BluE blue GREEN green rEd",
- expected_list = ['RED', 'GREEN', 'BLUE', 'BLUE', 'GREEN', 'GREEN', 'RED'],
- ),
- ]
-
-class TestWord(PyparsingExpressionTestCase):
- tests = [
- PpTestSpec(
- desc = "Simple Word match",
- expr = pp.Word("xy"),
- text = "xxyxxyy",
- expected_list = ["xxyxxyy"],
- ),
- PpTestSpec(
- desc = "Simple Word match of two separate Words",
- expr = pp.Word("x") + pp.Word("y"),
- text = "xxxxxyy",
- expected_list = ["xxxxx", "yy"],
- ),
- PpTestSpec(
- desc = "Simple Word match of two separate Words - implicitly skips whitespace",
- expr = pp.Word("x") + pp.Word("y"),
- text = "xxxxx yy",
- expected_list = ["xxxxx", "yy"],
- ),
- ]
-
-class TestCombine(PyparsingExpressionTestCase):
- tests = [
- PpTestSpec(
- desc="Parsing real numbers - fail, parsed numbers are in pieces",
- expr=(pp.Word(pp.nums) + '.' + pp.Word(pp.nums))[...],
- text="1.2 2.3 3.1416 98.6",
- expected_list=['1', '.', '2', '2', '.', '3', '3', '.', '1416', '98', '.', '6'],
- ),
- PpTestSpec(
- desc="Parsing real numbers - better, use Combine to combine multiple tokens into one",
- expr=pp.Combine(pp.Word(pp.nums) + '.' + pp.Word(pp.nums))[...],
- text="1.2 2.3 3.1416 98.6",
- expected_list=['1.2', '2.3', '3.1416', '98.6'],
- ),
- ]
-
-class TestRepetition(PyparsingExpressionTestCase):
- tests = [
- PpTestSpec(
- desc = "Match several words",
- expr = (pp.Word("x") | pp.Word("y"))[...],
- text = "xxyxxyyxxyxyxxxy",
- expected_list = ['xx', 'y', 'xx', 'yy', 'xx', 'y', 'x', 'y', 'xxx', 'y'],
- ),
- PpTestSpec(
- desc = "Match several words, skipping whitespace",
- expr = (pp.Word("x") | pp.Word("y"))[...],
- text = "x x y xxy yxx y xyx xxy",
- expected_list = ['x', 'x', 'y', 'xx', 'y', 'y', 'xx', 'y', 'x', 'y', 'x', 'xx', 'y'],
- ),
- PpTestSpec(
- desc = "Match several words, skipping whitespace (old style)",
- expr = pp.OneOrMore(pp.Word("x") | pp.Word("y")),
- text = "x x y xxy yxx y xyx xxy",
- expected_list = ['x', 'x', 'y', 'xx', 'y', 'y', 'xx', 'y', 'x', 'y', 'x', 'xx', 'y'],
- ),
- PpTestSpec(
- desc = "Match words and numbers - show use of results names to collect types of tokens",
- expr = (pp.Word(pp.alphas)("alpha*")
- | pp.pyparsing_common.integer("int*"))[...],
- text = "sdlfj23084ksdfs08234kjsdlfkjd0934",
- expected_list = ['sdlfj', 23084, 'ksdfs', 8234, 'kjsdlfkjd', 934],
- expected_dict = { 'alpha': ['sdlfj', 'ksdfs', 'kjsdlfkjd'], 'int': [23084, 8234, 934] }
- ),
- PpTestSpec(
- desc = "Using delimitedList (comma is the default delimiter)",
- expr = pp.delimitedList(pp.Word(pp.alphas)),
- text = "xxyx,xy,y,xxyx,yxx, xy",
- expected_list = ['xxyx', 'xy', 'y', 'xxyx', 'yxx', 'xy'],
- ),
- PpTestSpec(
- desc = "Using delimitedList, with ':' delimiter",
- expr = pp.delimitedList(pp.Word(pp.hexnums, exact=2), delim=':', combine=True),
- text = "0A:4B:73:21:FE:76",
- expected_list = ['0A:4B:73:21:FE:76'],
- ),
- ]
-
-class TestResultsName(PyparsingExpressionTestCase):
- tests = [
- PpTestSpec(
- desc = "Match with results name",
- expr = pp.Literal("xyz").setResultsName("value"),
- text = "xyz",
- expected_dict = {'value': 'xyz'},
- expected_list = ['xyz'],
- ),
- PpTestSpec(
- desc = "Match with results name - using naming short-cut",
- expr = pp.Literal("xyz")("value"),
- text = "xyz",
- expected_dict = {'value': 'xyz'},
- expected_list = ['xyz'],
- ),
- PpTestSpec(
- desc = "Define multiple results names",
- expr = pp.Word(pp.alphas, pp.alphanums)("key") + '=' + pp.pyparsing_common.integer("value"),
- text = "range=5280",
- expected_dict = {'key': 'range', 'value': 5280},
- expected_list = ['range', '=', 5280],
- ),
- ]
-
-class TestGroups(PyparsingExpressionTestCase):
- EQ = pp.Suppress('=')
- tests = [
- PpTestSpec(
- desc = "Define multiple results names in groups",
- expr = pp.Group(pp.Word(pp.alphas)("key")
- + EQ
- + pp.pyparsing_common.number("value"))[...],
- text = "range=5280 long=-138.52 lat=46.91",
- expected_list = [['range', 5280], ['long', -138.52], ['lat', 46.91]],
- ),
- PpTestSpec(
- desc = "Define multiple results names in groups - use Dict to define results names using parsed keys",
- expr = pp.Dict(pp.Group(pp.Word(pp.alphas)
- + EQ
- + pp.pyparsing_common.number)[...]),
- text = "range=5280 long=-138.52 lat=46.91",
- expected_list = [['range', 5280], ['long', -138.52], ['lat', 46.91]],
- expected_dict = {'lat': 46.91, 'long': -138.52, 'range': 5280}
- ),
- PpTestSpec(
- desc = "Define multiple value types",
- expr = pp.Dict(pp.Group(pp.Word(pp.alphas)
- + EQ
- + (pp.pyparsing_common.number | pp.oneOf("True False") | pp.QuotedString("'"))
- )[...]
- ),
- text = "long=-122.47 lat=37.82 public=True name='Golden Gate Bridge'",
- expected_list = [['long', -122.47], ['lat', 37.82], ['public', 'True'], ['name', 'Golden Gate Bridge']],
- expected_dict = {'long': -122.47, 'lat': 37.82, 'public': 'True', 'name': 'Golden Gate Bridge'}
- ),
- ]
-
-class TestParseAction(PyparsingExpressionTestCase):
- tests = [
- PpTestSpec(
- desc="Parsing real numbers - use parse action to convert to float at parse time",
- expr=pp.Combine(pp.Word(pp.nums) + '.' + pp.Word(pp.nums)).addParseAction(lambda t: float(t[0]))[...],
- text="1.2 2.3 3.1416 98.6",
- expected_list= [1.2, 2.3, 3.1416, 98.6], # note, these are now floats, not strs
- ),
- PpTestSpec(
- desc = "Match with numeric string converted to int",
- expr = pp.Word("0123456789").addParseAction(lambda t: int(t[0])),
- text = "12345",
- expected_list = [12345], # note - result is type int, not str
- ),
- PpTestSpec(
- desc = "Use two parse actions to convert numeric string, then convert to datetime",
- expr = pp.Word(pp.nums).addParseAction(lambda t: int(t[0]),
- lambda t: datetime.utcfromtimestamp(t[0])),
- text = "1537415628",
- expected_list = [datetime(2018, 9, 20, 3, 53, 48)],
- ),
- PpTestSpec(
- desc = "Use tokenMap for parse actions that operate on a single-length token",
- expr = pp.Word(pp.nums).addParseAction(pp.tokenMap(int),
- pp.tokenMap(datetime.utcfromtimestamp)),
- text = "1537415628",
- expected_list = [datetime(2018, 9, 20, 3, 53, 48)],
- ),
- PpTestSpec(
- desc = "Using a built-in function that takes a sequence of strs as a parse action",
- expr = pp.Word(pp.hexnums, exact=2)[...].addParseAction(':'.join),
- text = "0A4B7321FE76",
- expected_list = ['0A:4B:73:21:FE:76'],
- ),
- PpTestSpec(
- desc = "Using a built-in function that takes a sequence of strs as a parse action",
- expr = pp.Word(pp.hexnums, exact=2)[...].addParseAction(sorted),
- text = "0A4B7321FE76",
- expected_list = ['0A', '21', '4B', '73', '76', 'FE'],
- ),
- ]
-
-class TestResultsModifyingParseAction(PyparsingExpressionTestCase):
- def compute_stats_parse_action(t):
- # by the time this parse action is called, parsed numeric words
- # have been converted to ints by a previous parse action, so
- # they can be treated as ints
- t['sum'] = sum(t)
- t['ave'] = sum(t) / len(t)
- t['min'] = min(t)
- t['max'] = max(t)
-
- tests = [
- PpTestSpec(
- desc = "A parse action that adds new key-values",
- expr = pp.pyparsing_common.integer[...].addParseAction(compute_stats_parse_action),
- text = "27 1 14 22 89",
- expected_list = [27, 1, 14, 22, 89],
- expected_dict = {'ave': 30.6, 'max': 89, 'min': 1, 'sum': 153}
- ),
- ]
-
-class TestRegex(PyparsingExpressionTestCase):
- tests = [
- PpTestSpec(
- desc="Parsing real numbers - using Regex instead of Combine",
- expr=pp.Regex(r'\d+\.\d+').addParseAction(lambda t: float(t[0]))[...],
- text="1.2 2.3 3.1416 98.6",
- expected_list=[1.2, 2.3, 3.1416, 98.6], # note, these are now floats, not strs
- ),
- ]
-
-class TestParseCondition(PyparsingExpressionTestCase):
- tests = [
- PpTestSpec(
- desc = "Define a condition to only match numeric values that are multiples of 7",
- expr = pp.Word(pp.nums).addCondition(lambda t: int(t[0]) % 7 == 0)[...],
- text = "14 35 77 12 28",
- expected_list = ['14', '35', '77'],
- ),
- PpTestSpec(
- desc = "Separate conversion to int and condition into separate parse action/conditions",
- expr = pp.Word(pp.nums).addParseAction(lambda t: int(t[0]))
- .addCondition(lambda t: t[0] % 7 == 0)[...],
- text = "14 35 77 12 28",
- expected_list = [14, 35, 77],
- ),
- ]
-
-class TestTransformStringUsingParseActions(PyparsingExpressionTestCase):
- markup_convert_map = {
- '*' : 'B',
- '_' : 'U',
- '/' : 'I',
- }
- def markup_convert(t):
- htmltag = TestTransformStringUsingParseActions.markup_convert_map[t.markup_symbol]
- return "<{0}>{1}</{2}>".format(htmltag, t.body, htmltag)
-
- tests = [
- PpTestSpec(
- desc = "Use transformString to convert simple markup to HTML",
- expr = (pp.oneOf(markup_convert_map)('markup_symbol')
- + "(" + pp.CharsNotIn(")")('body') + ")").addParseAction(markup_convert),
- text = "Show in *(bold), _(underscore), or /(italic) type",
- expected_list = ['Show in <B>bold</B>, <U>underscore</U>, or <I>italic</I> type'],
- parse_fn = 'transformString',
- ),
- ]
-
-class TestCommonHelperExpressions(PyparsingExpressionTestCase):
- tests = [
- PpTestSpec(
- desc = "A comma-delimited list of words",
- expr = pp.delimitedList(pp.Word(pp.alphas)),
- text = "this, that, blah,foo, bar",
- expected_list = ['this', 'that', 'blah', 'foo', 'bar'],
- ),
- PpTestSpec(
- desc = "A counted array of words",
- expr = pp.countedArray(pp.Word('ab'))[...],
- text = "2 aaa bbb 0 3 abab bbaa abbab",
- expected_list = [['aaa', 'bbb'], [], ['abab', 'bbaa', 'abbab']],
- ),
- PpTestSpec(
- desc = "skipping comments with ignore",
- expr = (pp.pyparsing_common.identifier('lhs')
- + '='
- + pp.pyparsing_common.fnumber('rhs')).ignore(pp.cppStyleComment),
- text = "abc_100 = /* value to be tested */ 3.1416",
- expected_list = ['abc_100', '=', 3.1416],
- expected_dict = {'lhs': 'abc_100', 'rhs': 3.1416},
- ),
- PpTestSpec(
- desc = "some pre-defined expressions in pyparsing_common, and building a dotted identifier with delimted_list",
- expr = (pp.pyparsing_common.number("id_num")
- + pp.delimitedList(pp.pyparsing_common.identifier, '.', combine=True)("name")
- + pp.pyparsing_common.ipv4_address("ip_address")
- ),
- text = "1001 www.google.com 192.168.10.199",
- expected_list = [1001, 'www.google.com', '192.168.10.199'],
- expected_dict = {'id_num': 1001, 'name': 'www.google.com', 'ip_address': '192.168.10.199'},
- ),
- PpTestSpec(
- desc = "using oneOf (shortcut for Literal('a') | Literal('b') | Literal('c'))",
- expr = pp.oneOf("a b c")[...],
- text = "a b a b b a c c a b b",
- expected_list = ['a', 'b', 'a', 'b', 'b', 'a', 'c', 'c', 'a', 'b', 'b'],
- ),
- PpTestSpec(
- desc = "parsing nested parentheses",
- expr = pp.nestedExpr(),
- text = "(a b (c) d (e f g ()))",
- expected_list = [['a', 'b', ['c'], 'd', ['e', 'f', 'g', []]]],
- ),
- PpTestSpec(
- desc = "parsing nested braces",
- expr = (pp.Keyword('if')
- + pp.nestedExpr()('condition')
- + pp.nestedExpr('{', '}')('body')),
- text = 'if ((x == y) || !z) {printf("{}");}',
- expected_list = ['if', [['x', '==', 'y'], '||', '!z'], ['printf(', '"{}"', ');']],
- expected_dict = {'condition': [[['x', '==', 'y'], '||', '!z']],
- 'body': [['printf(', '"{}"', ');']]},
- ),
- ]
-
-
-def _get_decl_line_no(cls):
- import inspect
- return inspect.getsourcelines(cls)[1]
-
-
-# get all test case classes defined in this module and sort them by decl line no
-test_case_classes = list(PyparsingExpressionTestCase.__subclasses__())
-test_case_classes.sort(key=_get_decl_line_no)
-
-# make into a suite and run it - this will run the tests in the same order
-# they are declared in this module
-#
-# runnable from setup.py using "python setup.py test -s simple_unit_tests.suite"
-#
-suite = unittest.TestSuite(cls() for cls in test_case_classes)
-
-
-# ============ MAIN ================
-
-if __name__ == '__main__':
-
- result = unittest.TextTestRunner().run(suite)
-
- exit(0 if result.wasSuccessful() else 1)