1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
|
#
# (c) Simon Marlow 2002
#
from my_typing import *
from pathlib import Path
from perf_notes import MetricChange, PerfStat, Baseline, MetricOracles, GitRef
from datetime import datetime
# -----------------------------------------------------------------------------
# Configuration info
# There is a single global instance of this structure, stored in the
# variable config below. The fields of the structure are filled in by
# the appropriate config script(s) for this compiler/platform, in
# ../config.
#
# Bits of the structure may also be filled in from the command line,
# via the build system, using the '-e' option to runtests.
class TestConfig:
    """
    Configuration of a testsuite run.

    Every setting is a plain instance attribute that __init__ initialises to
    a default value. The values are meant to be overwritten afterwards (by
    the config scripts and by the command line, per the comment preceding
    this class). Call validate() once the fields have been filled in to
    check that the dynamic-linking related flags are mutually consistent.
    """

    def __init__(self) -> None:
        # Where the testsuite root is
        self.top = Path('.')

        # Directories below which to look for test description files (foo.T)
        self.rootdirs = []

        # Run these tests only (run all tests if empty)
        self.run_only_some_tests = False
        self.only = set()

        # Don't fail on out-of-tolerance stat failures
        self.ignore_perf_increases = False
        self.ignore_perf_decreases = False

        # Accept new output which differs from the sample?
        self.accept = False
        self.accept_platform = False
        self.accept_os = False

        # File in which to save the performance metrics.
        self.metrics_file = ''

        # File in which to save the summary
        self.summary_file = ''

        # Path to Ghostscript
        self.gs = None  # type: Optional[Path]

        # Run tests requiring Haddock
        self.haddock = False

        # Compiler has native code generator?
        self.have_ncg = False

        # Is compiler unregisterised?
        self.unregisterised = False

        # Was the compiler executable compiled with profiling?
        self.compiler_profiled = False

        # Was the compiler compiled with DEBUG?
        self.compiler_debugged = False

        # Was the compiler compiled with LLVM?
        self.ghc_built_by_llvm = False

        # Should we print the summary?
        # Disabling this is useful for Phabricator/Harbormaster
        # logfiles, which are truncated to 30 lines. TODO. Revise if
        # this is still true.
        # Note that we have a separate flag for this, instead of
        # overloading --verbose, as you might want to see the summary
        # with --verbose=0.
        self.no_print_summary = False

        # What platform are we running on?
        self.platform = ''
        self.os = ''
        self.arch = ''
        self.msys = False
        self.cygwin = False

        # What is the wordsize (in bits) of this platform?
        # NOTE: the default is an empty string, not an integer.
        self.wordsize = ''

        # Verbosity level
        self.verbose = 2

        # See Note [validate and testsuite speed] in toplevel Makefile.
        self.speed = 1

        self.list_broken = False

        # Path to the compiler (stage2 by default)
        self.compiler = ''
        # and ghc-pkg
        self.ghc_pkg = ''

        # Is self.compiler a stage 1, 2 or 3 compiler?
        self.stage = 2

        # Flags we always give to this compiler
        self.compiler_always_flags = []

        # Which ways to run tests (when compiling and running respectively)
        # Other ways are added from the command line if we have the
        # appropriate libraries.
        self.compile_ways = []  # type: List[WayName]
        self.run_ways = []  # type: List[WayName]
        self.other_ways = []  # type: List[WayName]

        # The ways selected via the command line.
        self.cmdline_ways = []  # type: List[WayName]

        # Lists of flags for each way
        self.way_flags = {}  # type: Dict[WayName, List[str]]
        self.way_rts_flags = {}  # type: Dict[WayName, List[str]]

        # Do we have a functional LLVM toolchain?
        self.have_llvm = False

        # Do we have vanilla libraries?
        self.have_vanilla = False

        # Do we have dynamic libraries?
        self.have_dynamic = False

        # Do we have profiling support?
        self.have_profiling = False

        # Do we have interpreter support?
        self.have_interp = False

        # Does the platform support loading of dynamic shared libraries? e.g.
        # some musl-based environments do not.
        self.supports_dynamic_libs = True

        # Does GHC support dynamic linking of Haskell objects (i.e. the
        # dynamic way)?
        self.supports_dynamic_hs = True

        # Is the compiler dynamically linked?
        self.ghc_dynamic = False

        # Do we have SMP support?
        self.have_smp = False

        # Is gdb available?
        self.have_gdb = False

        # Is readelf available?
        self.have_readelf = False

        # Do we use a fast backend for bignum (e.g. GMP)
        self.have_fast_bignum = True

        # Are we testing an in-tree compiler?
        self.in_tree_compiler = True

        # Are we running in a ThreadSanitizer-instrumented build?
        self.have_thread_sanitizer = False

        # Do symbols use leading underscores?
        self.leading_underscore = False

        # the timeout program
        self.timeout_prog = ''
        self.timeout = 300

        # threads
        self.threads = 1
        self.use_threads = False

        # tests which should be considered to be broken during this testsuite
        # run.
        self.broken_tests = set()  # type: Set[TestName]

        # Baseline commit for performance metric comparisons.
        self.baseline_commit = None  # type: Optional[GitRef]

        # Additional package dbs to inspect for test dependencies.
        self.test_package_db = []  # type: List[PathToPackageDb]

        # Should we skip performance tests
        self.skip_perf_tests = False

        # Only do performance tests
        self.only_perf_tests = False

        # Allowed performance changes (see
        # perf_notes.get_allowed_perf_changes())
        self.allowed_perf_changes = {}

        # The test environment.
        self.test_env = 'local'

        # terminal supports colors
        self.supports_colors = False

        # Where to look up runtime stats produced by haddock, needed for
        # the haddock perf tests in testsuite/tests/perf/haddock/.
        # See Note [Haddock runtime stats files] at the bottom of this file.
        # The default is a deliberately bogus placeholder path.
        self.stats_files_dir = Path('/please_set_stats_files_dir')

        # Should we cleanup after test runs?
        self.cleanup = True

        # Purpose not documented in this file (the original author's comment
        # was "I have no idea what this does").
        self.package_conf_cache_file = None  # type: Optional[Path]

        # The extra hadrian dependencies we need for all configured tests
        self.hadrian_deps = set()  # type: Set[str]

        # Are we only reporting hadrian dependencies?
        # The path specifies the file in which to write the dependencies
        self.only_report_hadrian_deps = None  # type: Optional[Path]

    def validate(self) -> None:
        """
        Check the TestConfig for self-consistency.

        Raises AssertionError if any of these implications does not hold:

          supports_dynamic_hs  implies  supports_dynamic_libs
          have_dynamic         implies  supports_dynamic_hs
          ghc_dynamic          implies  have_dynamic
        """
        def assert_implies(a: bool, b: bool, what: str) -> None:
            # Raise explicitly instead of using an `assert` statement:
            # `assert` is compiled away under `python -O`, which would
            # silently turn this whole validation into a no-op.
            if a and not b:
                raise AssertionError(what)

        assert_implies(self.supports_dynamic_hs, self.supports_dynamic_libs,
                       'supports_dynamic_hs requires supports_dynamic_libs')
        assert_implies(self.have_dynamic, self.supports_dynamic_hs,
                       'have_dynamic requires supports_dynamic_hs')
        assert_implies(self.ghc_dynamic, self.have_dynamic,
                       'ghc_dynamic requires have_dynamic')
# The single, module-wide TestConfig instance. Its fields start out at the
# defaults set by TestConfig.__init__.
config = TestConfig()  # type: TestConfig
def getConfig() -> TestConfig:
    """Return the module-level TestConfig instance, `config`."""
    return config
import os
# Hold our modified GHC testrunning environment so we don't poison the current
# python's environment.
global ghc_env
ghc_env = os.environ.copy()
# -----------------------------------------------------------------------------
# Information about the current test run
class TestResult:
    """
    A result from the execution of a test.

    Instances are stored in the result lists of TestRun: expected_passes,
    framework_failures, framework_warnings, unexpected_passes,
    unexpected_failures, unexpected_stat_failures, fragile_passes and
    fragile_failures.

    The class declares __slots__, so only the six attributes below can be
    set on an instance.
    """
    __slots__ = (
        'directory',
        'testname',
        'reason',
        'way',
        'stdout',
        'stderr',
    )

    def __init__(self,
                 directory: str,
                 testname: TestName,
                 reason: str,
                 way: WayName,
                 stdout: Optional[str]=None,
                 stderr: Optional[str]=None) -> None:
        # Identification of the test this result belongs to.
        self.directory = directory
        self.testname = testname
        self.way = way

        # Explanation attached to the result.
        self.reason = reason

        # Optional output text; both default to None.
        self.stdout = stdout
        self.stderr = stderr
# A performance metric measured in this test run: the measured stat, how it
# changed, and the baseline it was compared against (None if there is none).
PerfMetric = NamedTuple('PerfMetric', [
    ('change', MetricChange),
    ('stat', PerfStat),
    ('baseline', Optional[Baseline]),
])
class TestRun:
    """
    Counters and result lists accumulated over one run of the testsuite.

    A fresh instance has no start time, all counters at zero and all result
    lists empty.
    """

    def __init__(self) -> None:
        # When the run started; None until it is set.
        self.start_time = None  # type: Optional[datetime]

        # Counters
        self.total_tests = 0
        self.total_test_cases = 0

        self.n_tests_skipped = 0
        self.n_missing_libs = 0
        self.n_expected_passes = 0
        self.n_expected_failures = 0

        # Problems with the test framework itself
        self.framework_failures = []  # type: List[TestResult]
        self.framework_warnings = []  # type: List[TestResult]

        # Results, grouped by outcome
        self.expected_passes = []  # type: List[TestResult]
        self.unexpected_passes = []  # type: List[TestResult]
        self.unexpected_failures = []  # type: List[TestResult]
        self.unexpected_stat_failures = []  # type: List[TestResult]

        # Results from tests that have been marked as fragile
        self.fragile_passes = []  # type: List[TestResult]
        self.fragile_failures = []  # type: List[TestResult]

        # List of all metrics measured in this test run.
        # Each entry is a PerfMetric (change, stat, baseline) where change
        # is one of the MetricChange constants: NewMetric, NoChange,
        # Increase, Decrease.
        # NewMetric happens when the previous git commit has no metric
        # recorded.
        self.metrics = []  # type: List[PerfMetric]
# The module-wide TestRun instance, created empty at import time.
t = TestRun()  # type: TestRun
def getTestRun() -> TestRun:
    """Return the module-level TestRun instance, `t`."""
    return t
# -----------------------------------------------------------------------------
# Information about the current test
class TestOptions:
    """
    The options that apply to a single test.

    Every option is a plain instance attribute that __init__ sets to its
    default value.
    """

    def __init__(self) -> None:
        # --- Which ways to run, and what result to expect ---------------

        # skip this test?
        self.skip = False

        # the test is known to be fragile in these ways
        self.fragile_ways = []  # type: List[WayName]

        # skip these ways
        self.omit_ways = []  # type: List[WayName]

        # skip all ways except these (None == do all ways)
        self.only_ways = None  # type: Optional[List[WayName]]

        # add these ways to the default set
        self.extra_ways = []  # type: List[WayName]

        # the result we normally expect for this test
        self.expect = 'pass'

        # override the expected result for certain ways
        self.expect_fail_for = []  # type: List[WayName]

        # --- Inputs and expected outputs --------------------------------

        # NOTE(review): the comment originally attached to srcdir was a
        # verbatim copy of the stdin comment below. Presumably this is the
        # directory holding the test's sources -- confirm against the users
        # of this field.
        self.srcdir = None  # type: Optional[Path]

        # the stdin file that this test will use (None for <name>.stdin)
        self.stdin = None  # type: Optional[Path]

        # Set the expected stderr/stdout. '' means infer from test name.
        self.use_specs = {}  # type: Dict[str, Path]

        # don't compare output
        self.ignore_stdout = False
        self.ignore_stderr = False

        # Backpack test
        self.compile_backpack = False

        # --- Compiler and run-time options ------------------------------

        # We sometimes want to modify the compiler_always_flags, so they
        # are meant to be copied from config.compiler_always_flags when a
        # new instance of TestOptions is made. (The copy is not done here;
        # this constructor only creates an empty list.)
        self.compiler_always_flags = []  # type: List[str]

        # extra compiler opts for this test
        self.extra_hc_opts = ''

        # extra run opts for this test
        self.extra_run_opts = ''

        # expected exit code
        self.exit_code = 0  # type: int

        # extra files to clean afterward
        self.clean_files = []  # type: List[str]

        # extra files to copy to the testdir
        self.extra_files = []  # type: List[str]

        # --- Performance testing ----------------------------------------

        # Map from metric to (function from way and commit to baseline
        # value, allowed percentage deviation), e.g.
        #
        #     { 'bytes allocated': (
        #           lambda way commit:
        #               ...
        #               if way1: return None ...
        #               elif way2: return 9300000000 ...
        #               ...
        #           , 10) }
        #
        # This means no baseline is available for way1. For way 2, allow a
        # 10% deviation from 9300000000.
        self.stats_range_fields = {}  # type: Dict[MetricName, MetricOracles]

        # Is the test testing performance?
        self.is_stats_test = False

        # Does this test the compiler's performance as opposed to the
        # generated code.
        self.is_compiler_stats_test = False

        # --- Scheduling -------------------------------------------------

        # should we run this test alone, i.e. not run it in parallel with
        # any other threads
        self.alone = False

        # --- Kind of source files ---------------------------------------

        # Does this test use a literate (.lhs) file?
        self.literate = False

        # Does this test use a .c, .m or .mm file?
        self.c_src = False
        self.objc_src = False
        self.objcpp_src = False

        # Does this test use a .cmm file?
        self.cmm_src = False

        # --- Commands ---------------------------------------------------

        # Should we put .hi/.o files in a subdirectory?
        self.outputdir = None

        # Command to run before the test
        self.pre_cmd = None

        # Command wrapper: a function to apply to the command before
        # running it
        self.cmd_wrapper = None

        # Prefix to put on the command before compiling it
        self.compile_cmd_prefix = ''

        # --- Output checking --------------------------------------------

        # Extra output normalisation (the default leaves its argument
        # unchanged)
        self.extra_normaliser = lambda x: x  # type: OutputNormalizer

        # Custom output checker, otherwise do a comparison with expected
        # stdout file. Accepts two arguments: filename of actual stdout
        # output, and a normaliser function given other test options
        self.check_stdout = None  # type: Optional[Callable[[Path, OutputNormalizer], bool]]

        # Check .hp file when profiling libraries are available?
        self.check_hp = True

        # Extra normalisation for compiler error messages (the default
        # leaves its argument unchanged)
        self.extra_errmsg_normaliser = lambda x: x

        # Keep profiling callstacks.
        self.keep_prof_callstacks = False

        # --- Where and how the test runs --------------------------------

        # The directory the test is in
        self.testdir = Path('.')

        # Should we redirect stdout and stderr to a single file?
        self.combined_output = False

        # How should the timeout be adjusted on this test?
        self.compile_timeout_multiplier = 1.0
        self.run_timeout_multiplier = 1.0

        # Should we run tests in a local subdirectory (<testname>-run) or
        # in temporary directory in /tmp? See Note [Running tests in /tmp].
        self.local = True

        # Should we copy the files or symlink the files for the test?
        self.copy_files = False

        # The extra hadrian dependencies we need for this particular test
        self.hadrian_deps = set()  # type: Set[str]
# The default set of options: a TestOptions instance with every field left
# at its constructor default.
default_testopts = TestOptions()  # type: TestOptions
# Tests marked broken, as (bug, directory, name) triples. Starts out empty.
# Used by the config.list_broken feature.
brokens = []  # type: List[Tuple[IssueNumber, str, str]]
|