summaryrefslogtreecommitdiff
path: root/rts
diff options
context:
space:
mode:
authorNiklas Hambüchen <mail@nh2.me>2019-10-29 12:54:10 +0100
committerMarge Bot <ben+marge-bot@smart-cactus.org>2019-11-01 23:12:17 -0400
commit9980fb58f613ee3363c7e4cb86453e542c6c69aa (patch)
tree67f0e195dd71510d1d797ce5e07f422401269b90 /rts
parent01006bc79582616c9bbc842b397e85437a57ac18 (diff)
downloadhaskell-9980fb58f613ee3363c7e4cb86453e542c6c69aa.tar.gz
Add +RTS --disable-delayed-os-memory-return. Fixes #17411.
Sets `MiscFlags.disableDelayedOsMemoryReturn`. See the added `Note [MADV_FREE and MADV_DONTNEED]` for details.
Diffstat (limited to 'rts')
-rw-r--r--rts/RtsFlags.c6
-rw-r--r--rts/posix/OSMem.c50
2 files changed, 43 insertions, 13 deletions
diff --git a/rts/RtsFlags.c b/rts/RtsFlags.c
index 0e28b980ac..7949d401db 100644
--- a/rts/RtsFlags.c
+++ b/rts/RtsFlags.c
@@ -243,6 +243,7 @@ void initRtsFlagsDefaults(void)
RtsFlags.MiscFlags.generate_stack_trace = true;
RtsFlags.MiscFlags.generate_dump_file = false;
RtsFlags.MiscFlags.machineReadable = false;
+ RtsFlags.MiscFlags.disableDelayedOsMemoryReturn = false;
RtsFlags.MiscFlags.internalCounters = false;
RtsFlags.MiscFlags.linkerAlwaysPic = DEFAULT_LINKER_ALWAYS_PIC;
RtsFlags.MiscFlags.linkerMemBase = 0;
@@ -914,6 +915,11 @@ error = true;
OPTION_UNSAFE;
RtsFlags.MiscFlags.machineReadable = true;
}
+ else if (strequal("disable-delayed-os-memory-return",
+ &rts_argv[arg][2])) {
+ OPTION_UNSAFE;
+ RtsFlags.MiscFlags.disableDelayedOsMemoryReturn = true;
+ }
else if (strequal("internal-counters",
&rts_argv[arg][2])) {
OPTION_SAFE;
diff --git a/rts/posix/OSMem.c b/rts/posix/OSMem.c
index dc8c4122f7..15f1b62dc9 100644
--- a/rts/posix/OSMem.c
+++ b/rts/posix/OSMem.c
@@ -602,6 +602,26 @@ void osCommitMemory(void *at, W_ size)
}
}
+/* Note [MADV_FREE and MADV_DONTNEED]
+ *
+ * madvise() provides flags with which one can release no longer needed pages
+ * back to the kernel without having to munmap() (which is expensive).
+ *
+ * On Linux, MADV_FREE is newer and faster because it can avoid zeroing
+ * pages if they are re-used by the process later (see `man 2 madvise`),
+ * but for the trade-off that memory inspection tools like `top` will
+ * not immediately reflect the freeing in their display of resident memory
+ * (RSS column): Only under memory pressure will Linux actually remove
+ * the freed pages from the process and update its RSS statistics.
+ * Until then, the pages show up as `LazyFree` in `/proc/PID/smaps`
+ * (see `man 5 proc`).
+ * The delayed RSS update can confuse programmers debugging memory issues,
+ * production memory monitoring tools, and end users who may complain about
+ * undue memory usage shown in reporting tools, so with
+ * `disableDelayedOsMemoryReturn` we provide an RTS flag that allows forcing
+ * usage of MADV_DONTNEED instead of MADV_FREE.
+ */
+
void osDecommitMemory(void *at, W_ size)
{
int r;
@@ -618,21 +638,25 @@ void osDecommitMemory(void *at, W_ size)
#endif
#if defined(MADV_FREE)
- // Try MADV_FREE first, FreeBSD has both and MADV_DONTNEED
- // just swaps memory out. Linux >= 4.5 has both DONTNEED and FREE; either
- // will work as they both allow the system to free anonymous pages.
- // It is important that we try both methods as the kernel which we were
- // built on may differ from the kernel we are now running on.
- r = madvise(at, size, MADV_FREE);
- if(r < 0) {
- if (errno == EINVAL) {
- // Perhaps the system doesn't support MADV_FREE; fall-through and
- // try MADV_DONTNEED.
+ // See Note [MADV_FREE and MADV_DONTNEED].
+ // If MADV_FREE is disabled, fall-through to MADV_DONTNEED.
+ if (!RtsFlags.MiscFlags.disableDelayedOsMemoryReturn) {
+ // Try MADV_FREE first, FreeBSD has both and MADV_DONTNEED
+ // just swaps memory out. Linux >= 4.5 has both DONTNEED and FREE; either
+ // will work as they both allow the system to free anonymous pages.
+ // It is important that we try both methods as the kernel which we were
+ // built on may differ from the kernel we are now running on.
+ r = madvise(at, size, MADV_FREE);
+ if(r < 0) {
+ if (errno == EINVAL) {
+ // Perhaps the system doesn't support MADV_FREE; fall-through and
+ // try MADV_DONTNEED.
+ } else {
+ sysErrorBelch("unable to decommit memory");
+ }
} else {
- sysErrorBelch("unable to decommit memory");
+ return;
}
- } else {
- return;
}
#endif