summaryrefslogtreecommitdiff
path: root/buildscripts/config_diff.py
blob: f82522cd21a2bc61677f37448fd11dedfa5fb7bf (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
492
493
494
495
496
497
498
499
500
501
502
503
504
505
506
507
508
509
510
511
512
513
514
515
516
517
518
519
520
521
522
523
524
525
526
527
528
529
530
531
532
533
534
535
536
537
538
539
540
541
542
543
544
545
546
547
#!/usr/bin/env python3
"""Compares IDL server parameters and configs between MongoDB server versions.

The comparison is computed by scanning through `base_version_dirs` and `incremented_version_dirs` looking for all configs and setParameters in each tree.
It then compares these looking for additions, removals, and deltas.  Finally it outputs a summary to the console.
"""

import argparse
from enum import Enum
import io
import os
import pprint
import unittest
import yaml

# Per-mode lists of property fields that are compared between the base and incremented
# versions. get_properties_diffs() hands the list matching the selected mode to
# build_diff_fn(); fields not listed here never show up as modifications.
_COMPARE_FIELDS_SERVER_PARAMETERS = ['default', 'set_at', 'validator', 'test_only']
_COMPARE_FIELDS_CONFIGS = ['arg_vartype', 'requires', 'hidden', 'redact']


class ComparisonType(str, Enum):
    """Kinds of IDL properties that can be compared.

    Each member's value is the key of the top-level section that the handlers read from a
    parsed .idl document, and is also the spelling accepted for the `mode` CLI argument.
    """
    CONFIGS = 'configs'
    SERVER_PARAMETERS = 'server_parameters'


class PropertyDiff:
    """Holds the two sides of a single changed field.

    `base` is the field's value in the base version and `inc` its value in the incremented
    version.
    """

    def __init__(self, base, inc):
        self.base, self.inc = base, inc


class PropertiesDiffs:
    """Groups the outcome of a comparison into three partitions.

    The three arguments are stored as given (no copies are made):
      removed  -- properties only present in the base version
      added    -- properties only present in the incremented version
      modified -- properties present in both versions whose compared fields differ
    """

    def __init__(self, removed, added, modified):
        self.removed, self.added, self.modified = removed, added, modified


def build_diff_fn(compare_fields: list) -> callable:
    """Creates a function that diffs two property dictionaries on `compare_fields` only.

    The returned function takes the base-version property followed by the incremented-version
    property and returns a dictionary mapping each differing field name to a PropertyDiff.
    Values are stored as strings; a field that is absent on one side is stored as "".
    """

    def diff_fn(prop_base: dict, prop_inc: dict) -> dict:
        return {
            name: PropertyDiff(str(prop_base.get(name, "")), str(prop_inc.get(name, "")))
            for name in compare_fields
            if prop_base.get(name) != prop_inc.get(name)
        }

    return diff_fn


class BuildBasePropertiesForComparisonHandler:
    """Collects the properties of a "base" version from parsed .idl documents.

    Nothing is compared here. The handler only accumulates the base-version properties so that
    a later pass over the incremented version has something to diff against.
    """

    def __init__(self, handler_type: ComparisonType):
        # Key of the document section this handler reads its properties from.
        self.handler_type = handler_type
        # Maps (property name, file name) to the property's parsed definition.
        self.properties = {}

    def handle(self, yaml_obj: dict, yaml_file_name: str) -> None:
        """Records every property found in this handler's section of `yaml_obj`.

        Documents without that section (or with an empty one) leave `properties` untouched.
        """
        section = yaml_obj.get(self.handler_type)
        if section is None:
            return

        self.properties.update({(prop_name, yaml_file_name): definition
                                for prop_name, definition in section.items()})


class ComputeDiffsFromIncrementedVersionHandler:
    """Interprets an .idl file representing an "incremented" version containing changes from a "base" version.

    This handler performs comparison between the "incremented" state and a base state, and thus
    requires knowledge of a base dictionary of properties (base_properties) to execute.

    Every base property starts out in `properties_diff.removed`. As incremented-version files are
    handled, each property is either recorded in `added` (unknown to the base version) or taken
    out of `removed` and, when a compared field differs, recorded in `modified`. Whatever is still
    in `removed` once all files have been handled was dropped by the incremented version.
    """

    def __init__(self, handler_type: ComparisonType, base_properties: dict, calc_diff_fn: callable):
        """Prepares the handler.

        handler_type    -- which section of each document to compare
        base_properties -- mapping of (property name, file name) to the base-version property
        calc_diff_fn    -- function called as calc_diff_fn(base_property, incremented_property),
                           returning a dictionary of the fields that differ
        """
        self.calc_diff = calc_diff_fn
        self.handler_type = handler_type
        # Work on a shallow copy: entries are popped from `removed` during comparison, and the
        # caller's dictionary must not shrink as a side effect of computing the diff.
        self.properties_diff = PropertiesDiffs(dict(base_properties), {}, {})

    def _compare_and_partition(self, yaml_props: dict, yaml_file_name: str) -> None:
        """Sorts the incremented-version properties of one file into added / modified."""

        for yaml_key, inc_prop in yaml_props.items():
            compare_key = (yaml_key, yaml_file_name)

            # If the yaml file property does not exist in "removed" base version properties,
            # it must have been added in the incremented version
            if compare_key not in self.properties_diff.removed:
                self.properties_diff.added[compare_key] = inc_prop
                continue

            # Otherwise, we can remove it from 'removed' since it exists in both
            # version properties, and check if there is a diff
            # This will leave properties_diff.removed containing only entries that were
            # present in the base version properties, but not in the incremented version properties,
            # which means they were removed in the incremented version
            base_prop = self.properties_diff.removed.pop(compare_key)

            # The diff function takes the base property first and the incremented one second;
            # passing them the other way round reverses every reported "from ... to ..." pair.
            changed_properties = self.calc_diff(base_prop, inc_prop)

            if changed_properties:
                self.properties_diff.modified[compare_key] = changed_properties

    def handle(self, yaml_obj: dict, yaml_file_name: str) -> None:
        """Compares the handler's section of `yaml_obj`, if present, against the base properties."""
        yaml_props = yaml_obj.get(self.handler_type.value)
        if yaml_props is not None:
            self._compare_and_partition(yaml_props, yaml_file_name)


def load_yaml(dirs: list, exclusions: list, idl_yaml_handlers: list) -> None:
    """Walks each path from top to bottom, applying each handler in idl_yaml_handlers to any .idl files encountered.

    If a directory encountered contains any string in exclusions, it is skipped and will not
    be included in the walk. Matching is by substring against the directory's path as seen
    during the walk; empty exclusion strings are ignored.

    Handlers are called as handler.handle(parsed_document, file_name), where file_name is the
    bare name of the .idl file without its directory. Files that do not parse to a mapping
    (for example empty files) are skipped.
    """
    # The empty string is a substring of every path, so it would exclude the whole tree.
    active_exclusions = [exclusion for exclusion in exclusions if exclusion]

    for directory in dirs:
        for dirpath, dirnames, filenames in os.walk(directory):
            # Prune through slice assignment so that os.walk sees the change. Removing entries
            # from `dirnames` while looping over that same list skips the entry following each
            # removal, which let excluded directories slip through.
            dirnames[:] = [
                dirname for dirname in dirnames
                if not any(exclusion in dirpath + os.path.sep + dirname
                           for exclusion in active_exclusions)
            ]

            for name in filenames:
                if not name.endswith('.idl'):
                    continue

                with io.open(os.path.join(dirpath, name), 'r', encoding='utf-8') as idl_yaml_stream:
                    idl_yaml = yaml.safe_load(idl_yaml_stream)

                # safe_load returns None for an empty document; the handlers need a mapping.
                if not isinstance(idl_yaml, dict):
                    continue

                for handler in idl_yaml_handlers:
                    handler.handle(idl_yaml, name)


def get_properties_diffs(mode: ComparisonType, base_version_dirs: list, inc_version_dirs: list,
                         exclude: list) -> PropertiesDiffs:
    """Returns a PropertiesDiffs object containing the changes between properties in base_version_dirs and inc_version_dirs.

    `mode` selects both the document section that is read and the fields that are compared.
    Raises an Exception when `mode` is not a known ComparisonType.
    """
    fields_by_mode = (
        (ComparisonType.SERVER_PARAMETERS, _COMPARE_FIELDS_SERVER_PARAMETERS),
        (ComparisonType.CONFIGS, _COMPARE_FIELDS_CONFIGS),
    )
    compare_fields = next((fields for known_mode, fields in fields_by_mode if mode == known_mode),
                          None)
    if compare_fields is None:
        raise Exception(f'Unknown option {mode}')

    # First pass: gather every property of the base version.
    base_handler = BuildBasePropertiesForComparisonHandler(mode)
    load_yaml(base_version_dirs, exclude, [base_handler])

    # Second pass: partition the incremented version's properties against the base ones.
    increment_handler = ComputeDiffsFromIncrementedVersionHandler(
        mode, base_handler.properties, build_diff_fn(compare_fields))
    load_yaml(inc_version_dirs, exclude, [increment_handler])

    return increment_handler.properties_diff


def output_diffs(mode: ComparisonType, diff: PropertiesDiffs) -> None:
    """Prints the added, removed and modified properties in `diff` to the console.

    Added and removed properties flagged `test_only` are not printed.
    Raises an Exception when `mode` is not a known ComparisonType.
    """
    if mode == ComparisonType.CONFIGS:
        label = "config"
    elif mode == ComparisonType.SERVER_PARAMETERS:
        label = "server parameter"
    else:
        raise Exception(f'Unknown option {mode}')

    printer = pprint.PrettyPrinter()

    # Added and removed entries carry the full property definition, which is dumped as-is.
    for verb, entries in (("Added", diff.added), ("Removed", diff.removed)):
        for key, prop in entries.items():
            if prop.get('test_only'):
                continue
            print(f'{verb} {label} {str(key)}')
            printer.pprint(prop)
            print()

    for key, field_diffs in diff.modified.items():
        # NOTE(review): `field_diffs` maps field names to PropertyDiff objects, so this lookup is
        # truthy whenever the test_only field itself changed, not when the property is test-only.
        if field_diffs.get('test_only'):
            continue
        print(f'Modified {label} {str(key)}')
        for property_name, delta in field_diffs.items():
            print(f'<{property_name}> changed from [{delta.base}] to [{delta.inc}]')
        print()


def _split_colon_separated(value: str) -> list:
    """Splits a colon-separated command line value into its non-empty entries."""
    return [entry for entry in value.split(':') if entry]


def main():
    """Parses the command line, computes the requested diff and prints it to the console."""

    arg_parser = argparse.ArgumentParser(prog="Core Server IDL Parameter/Config Diff")

    arg_parser.add_argument(
        'mode', choices=[ComparisonType.SERVER_PARAMETERS.value, ComparisonType.CONFIGS.value])
    arg_parser.add_argument(
        '-b', '--base_version_dirs',
        help='A colon-separated list of paths to the base version for comparison', required=True)

    arg_parser.add_argument(
        '-i', '--incremented_version_dirs',
        help='A colon-separated list of paths to the incremented version for comparison',
        required=True)
    arg_parser.add_argument(
        '-e', '--exclude_dirs',
        help='A colon-separated list of directory path strings to exclude from comparison, ' +
        'e.g. a path /foo/bar/dir will be excluded by an argument of any of foo/bar/dir, ' +
        'bar/dir, foo, bar, or dir', required=False)

    args = arg_parser.parse_args()

    incremented_version_dirs = _split_colon_separated(args.incremented_version_dirs)
    base_version_dirs = _split_colon_separated(args.base_version_dirs)
    # Empty entries (e.g. from a trailing ':') have to be dropped: exclusions are matched by
    # substring and the empty string is a substring of every path, which would exclude
    # every directory from the comparison.
    exclude = set(_split_colon_separated(args.exclude_dirs)) if args.exclude_dirs else set()
    mode = ComparisonType(args.mode)

    diffs = get_properties_diffs(mode, base_version_dirs, incremented_version_dirs, exclude)
    output_diffs(mode, diffs)


# Script entry point. When the file is executed directly, main() runs here, before the
# unittest classes defined further down in this file are created.
if __name__ == "__main__":
    main()


#########################################################################################
#  python3 -m unittest buildscripts/config_diff.py
#########################################################################################
class TestBuildBasePropertiesForComparisonHandler(unittest.TestCase):
    """Tests for the handler that collects base-version properties."""

    def test_yaml_obj_filters_comparison_types_correctly(self):
        """Only the section matching the handler's comparison type is collected."""
        filename = "test.yml"
        document = """
            global:
              cpp_namespace: "mongo"

            server_parameters:
              changeStreamOptions:
                description: "Cluster server parameter for change stream options"
                set_at: cluster
                cpp_class:
                  name: ChangeStreamOptionsParameter
                  override_set: true
                  override_validate: true

            configs:
              "net.compression.compressors":
                description: 'Comma-separated list of compressors to use for network messages'
                source: [ cli, ini, yaml ]
                arg_vartype: String
                short_name: networkMessageCompressors
                default: 'snappy,zstd,zlib' 
        """
        # safe_load instead of load: calling yaml.load() without an explicit Loader is rejected
        # by PyYAML 6 and later, and the script itself parses .idl files with safe_load.
        yaml_obj = yaml.safe_load(document)

        fixture = BuildBasePropertiesForComparisonHandler(ComparisonType.SERVER_PARAMETERS)
        fixture.handle(yaml_obj, filename)

        # should filter out configs, but parse server parameters
        self.assertIsNone(fixture.properties.get(("net.compression.compressors", filename)))
        self.assertIsNotNone(fixture.properties[("changeStreamOptions", filename)])

        fixture = BuildBasePropertiesForComparisonHandler(ComparisonType.CONFIGS)
        fixture.handle(yaml_obj, filename)

        # should filter out server parameters, but parse configs
        self.assertIsNone(fixture.properties.get(("changeStreamOptions", filename)))
        self.assertIsNotNone(fixture.properties.get(("net.compression.compressors", filename)))

    def test_empty_yaml_obj_does_nothing(self):
        """A document with neither section leaves the collected properties empty."""
        filename = "test.yml"
        document = """
            global:
              cpp_namespace: "mongo"
        """

        yaml_obj = yaml.safe_load(document)

        fixture = BuildBasePropertiesForComparisonHandler(ComparisonType.SERVER_PARAMETERS)
        fixture.handle(yaml_obj, filename)
        self.assertEqual(len(fixture.properties), 0)

        fixture = BuildBasePropertiesForComparisonHandler(ComparisonType.CONFIGS)
        fixture.handle(yaml_obj, filename)
        self.assertEqual(len(fixture.properties), 0)


class TestComputeDiffsFromIncrementedVersionHandler(unittest.TestCase):
    """Tests for the handler that partitions incremented-version properties against a base."""

    def setUp(self):
        self.parameter_diff_function = build_diff_fn(_COMPARE_FIELDS_SERVER_PARAMETERS)
        self.config_diff_function = build_diff_fn(_COMPARE_FIELDS_CONFIGS)

    def test_yaml_obj_filtered_correctly(self):
        """Only the section matching the handler's comparison type is looked at."""
        filename = "inc.yml"
        document = """
            server_parameters:
              testOptions:
                description: "Cluster server parameter for change stream options"
                set_at: cluster
                cpp_class:
                  name: ChangeStreamOptionsParameter
                  override_set: true
                  override_validate: true
              helloMorld:
                description: "yep"
                set_at: allthetime
                cpp_class:
                  name: ChangeStreamOptionsParameter
                  override_set: true
                  override_validate: true

            configs:
              "asdf":
                description: 'Comma-separated list of compressors to use for network messages'
                source: [ cli, ini, yaml ]
                arg_vartype: String
                short_name: networkMessageCompressors
                default: 'snappy,zstd,zlib' 
              "qwer":
                description: 'ok'
                source: [ cli, yaml ]
                arg_vartype: String
                short_name: networkMessageCompressors
                default: 'zlib' 
        """

        # safe_load instead of load: calling yaml.load() without an explicit Loader is rejected
        # by PyYAML 6 and later, and the script itself parses .idl files with safe_load.
        inc_yaml_obj = yaml.safe_load(document)

        inc_fixture = ComputeDiffsFromIncrementedVersionHandler(ComparisonType.CONFIGS, {},
                                                                self.config_diff_function)
        inc_fixture.handle(inc_yaml_obj, filename)

        properties_diffs = inc_fixture.properties_diff
        self.assertIsNotNone(properties_diffs.added.get(("asdf", filename)))
        self.assertIsNotNone(properties_diffs.added.get(("qwer", filename)))

        self.assertIsNone(properties_diffs.added.get(("testOptions", filename)))
        self.assertIsNone(properties_diffs.added.get(("helloMorld", filename)))

        inc_fixture = ComputeDiffsFromIncrementedVersionHandler(ComparisonType.SERVER_PARAMETERS,
                                                                {}, self.parameter_diff_function)
        inc_fixture.handle(inc_yaml_obj, filename)

        properties_diffs = inc_fixture.properties_diff

        self.assertIsNone(properties_diffs.added.get(("asdf", filename)))
        self.assertIsNone(properties_diffs.added.get(("qwer", filename)))

        self.assertIsNotNone(properties_diffs.added.get(("testOptions", filename)))
        self.assertIsNotNone(properties_diffs.added.get(("helloMorld", filename)))

    def test_added_works_correctly(self):
        """With an empty base, every property of the selected section is reported as added."""
        filename = "test.yaml"
        document = """
            server_parameters:
              testOptions:
                description: "Cluster server parameter for change stream options"
                set_at: cluster
                cpp_class:
                  name: ChangeStreamOptionsParameter
                  override_set: true
                  override_validate: true

            configs:
              "asdf":
                description: 'Comma-separated list of compressors to use for network messages'
                source: [ cli, ini, yaml ]
                arg_vartype: String
                short_name: networkMessageCompressors
                default: 'snappy,zstd,zlib' 
        """

        inc_yaml_obj = yaml.safe_load(document)

        inc_fixture = ComputeDiffsFromIncrementedVersionHandler(ComparisonType.CONFIGS, {},
                                                                self.config_diff_function)
        inc_fixture.handle(inc_yaml_obj, filename)

        properties_diffs = inc_fixture.properties_diff

        self.assertIsNotNone(properties_diffs.added.get(("asdf", filename)))
        self.assertEqual(len(properties_diffs.added), 1)
        self.assertEqual(len(properties_diffs.removed), 0)
        self.assertEqual(len(properties_diffs.modified), 0)

        inc_fixture = ComputeDiffsFromIncrementedVersionHandler(ComparisonType.SERVER_PARAMETERS,
                                                                {}, self.parameter_diff_function)
        inc_fixture.handle(inc_yaml_obj, filename)

        properties_diffs = inc_fixture.properties_diff
        self.assertEqual(len(properties_diffs.added), 1)
        self.assertIsNotNone(properties_diffs.added.get(("testOptions", filename)))
        self.assertEqual(len(properties_diffs.removed), 0)
        self.assertEqual(len(properties_diffs.modified), 0)

    def test_removed_works_correctly(self):
        """Base properties that the incremented version no longer has stay in `removed`."""
        filename = "test.yaml"
        document = """
            server_parameters:
            configs:
        """

        def get_base_data():
            return {("ok", "test.yaml"): {"yes": "no"}, ("also_ok", "blah.yaml"): {"no": "yes"}}

        inc_yaml_obj = yaml.safe_load(document)

        inc_fixture = ComputeDiffsFromIncrementedVersionHandler(ComparisonType.CONFIGS,
                                                                get_base_data(),
                                                                self.config_diff_function)
        inc_fixture.handle(inc_yaml_obj, filename)

        properties_diffs = inc_fixture.properties_diff

        self.assertIsNotNone(properties_diffs.removed.get(("ok", filename)))
        self.assertIsNotNone(properties_diffs.removed.get(("also_ok", "blah.yaml")))

        self.assertEqual(len(properties_diffs.removed), 2)
        self.assertEqual(len(properties_diffs.added), 0)
        self.assertEqual(len(properties_diffs.modified), 0)

        inc_fixture = ComputeDiffsFromIncrementedVersionHandler(ComparisonType.SERVER_PARAMETERS,
                                                                get_base_data(),
                                                                self.parameter_diff_function)
        inc_fixture.handle(inc_yaml_obj, filename)

        properties_diffs = inc_fixture.properties_diff

        self.assertIsNotNone(properties_diffs.removed.get(("ok", filename)))
        self.assertIsNotNone(properties_diffs.removed.get(("also_ok", "blah.yaml")))

        self.assertEqual(len(properties_diffs.removed), 2)
        self.assertEqual(len(properties_diffs.added), 0)
        self.assertEqual(len(properties_diffs.modified), 0)

    def test_modified_works_correctly(self):
        """Properties present in both versions are reported as modified only when they differ."""
        filename = "test.yaml"
        document = """
            server_parameters:
              testOptions:
                description: "Cluster server parameter for change stream options"
                set_at: cluster
                cpp_class:
                  name: ChangeStreamOptionsParameter
                  override_set: true
                  override_validate: true

              testParameter:
                description: "Some parameter"
                set_at: cluster
                cpp_class:
                  name: ChangeStreamOptionsParameter
                  override_set: true
                  override_validate: true

            configs:
              "asdf":
                description: 'Comma-separated list of compressors to use for network messages'
                source: [ cli, ini, yaml ]
                arg_vartype: String
                short_name: networkMessageCompressors
                default: 'snappy,zstd,zlib' 

              "zxcv":
                description: 'Comma-separated list of compressors to use for network messages'
                source: [ cli, ini, yaml ]
                arg_vartype: String
                short_name: networkMessageCompressors
                default: 'snappy,zstd,zlib' 
        """

        inc_yaml_obj = yaml.safe_load(document)

        inc_fixture = ComputeDiffsFromIncrementedVersionHandler(ComparisonType.CONFIGS, {},
                                                                build_diff_fn(['default']))
        inc_fixture.handle(inc_yaml_obj, filename)

        properties_diffs = inc_fixture.properties_diff

        self.assertIsNotNone(properties_diffs.added.get(("asdf", filename)))
        self.assertEqual(len(properties_diffs.removed), 0)
        self.assertEqual(len(properties_diffs.modified), 0)

        inc_fixture = ComputeDiffsFromIncrementedVersionHandler(ComparisonType.SERVER_PARAMETERS,
                                                                {}, build_diff_fn(['set_at']))
        inc_fixture.handle(inc_yaml_obj, filename)

        properties_diffs = inc_fixture.properties_diff

        self.assertIsNotNone(properties_diffs.added.get(("testOptions", filename)))
        self.assertEqual(len(properties_diffs.removed), 0)
        self.assertEqual(len(properties_diffs.modified), 0)

        # With a populated base, a property whose compared field differs has to end up in
        # `modified`, while an unchanged one must not appear in any partition.
        base_data = {
            ("asdf", filename): {"default": "zlib"},
            ("zxcv", filename): {"default": "snappy,zstd,zlib"},
        }
        inc_fixture = ComputeDiffsFromIncrementedVersionHandler(ComparisonType.CONFIGS, base_data,
                                                                build_diff_fn(['default']))
        inc_fixture.handle(inc_yaml_obj, filename)

        properties_diffs = inc_fixture.properties_diff

        self.assertEqual(len(properties_diffs.added), 0)
        self.assertEqual(len(properties_diffs.removed), 0)
        self.assertEqual(list(properties_diffs.modified), [("asdf", filename)])
        self.assertIn('default', properties_diffs.modified[("asdf", filename)])


class TestPropertiesDiffFunction(unittest.TestCase):
    """Tests for the diff functions produced by build_diff_fn."""

    def test_empty_returns_empty(self):
        """Without any compare fields nothing is ever reported."""
        diff_props = build_diff_fn([])
        result = diff_props({"same": "different"}, {"same": "different"})
        self.assertEqual(len(result), 0)

    def test_return_one_diff(self):
        """A single differing field yields a single entry holding both values."""
        diff_props = build_diff_fn(["same"])
        result = diff_props({"same": "dofferent"}, {"same": "different"})
        self.assertEqual(len(result), 1)
        self.assertEqual(result["same"].base, "dofferent")
        self.assertEqual(result["same"].inc, "different")

    def test_return_two_diffs(self):
        """Every differing compare field gets its own entry."""
        diff_props = build_diff_fn(["same", "a"])
        result = diff_props({"same": "dofferent", "a": "1"}, {"same": "different", "a": "2"})
        self.assertEqual(len(result), 2)
        self.assertEqual(result["same"].base, "dofferent")
        self.assertEqual(result["same"].inc, "different")
        self.assertEqual(result["a"].base, "1")
        self.assertEqual(result["a"].inc, "2")

    def test_only_base_returns_diff(self):
        """A field missing from the incremented side is reported with an empty inc value."""
        diff_props = build_diff_fn(["a"])
        result = diff_props({"a": "1"}, {})
        self.assertEqual(len(result), 1)
        self.assertEqual(result["a"].base, "1")
        self.assertEqual(result["a"].inc, "")

    def test_only_inc_returns_diff(self):
        """A field missing from the base side is reported with an empty base value."""
        diff_props = build_diff_fn(["a"])
        result = diff_props({}, {"a": "1"})
        self.assertEqual(len(result), 1)
        self.assertEqual(result["a"].inc, "1")
        self.assertEqual(result["a"].base, "")

    def test_nonincluided_field_is_not_diff(self):
        """Fields outside the compare list are ignored."""
        diff_props = build_diff_fn(["b"])
        result = diff_props({}, {"a": "1"})
        self.assertEqual(len(result), 0)

    def test_base_version_nexist_added_none(self):
        """The string "None" on the incremented side still counts as a difference."""
        diff_props = build_diff_fn(["a"])
        result = diff_props({}, {"a": "None"})
        self.assertEqual(result["a"].inc, "None")
        self.assertEqual(result["a"].base, "")
        self.assertEqual(len(result), 1)


class TestCLIFunctions(unittest.TestCase):
    """Tests for the top-level functions that main() calls."""
    def test_unknown_comparison_type_throws(self):
        """Both functions raise when given a mode that is not a known ComparisonType."""
        with self.assertRaises(Exception):
            output_diffs(None, PropertiesDiffs({}, {}, {}))

        with self.assertRaises(Exception):
            get_properties_diffs(None, [], [], [])