From 3b305defa04bf01add8c30b61bd13d8ae8364ace Mon Sep 17 00:00:00 2001 From: Sean Quah Date: Thu, 18 May 2023 18:52:09 +0100 Subject: [PATCH 1/3] Fix `HomeServer`s leaking after tests that touch inbound federation Signed-off-by: Sean Quah --- synapse/util/ratelimitutils.py | 6 +++++- 1 file changed, 5 insertions(+), 1 deletion(-) diff --git a/synapse/util/ratelimitutils.py b/synapse/util/ratelimitutils.py index f262bf95a0fd..2ad55ac13e3b 100644 --- a/synapse/util/ratelimitutils.py +++ b/synapse/util/ratelimitutils.py @@ -25,10 +25,12 @@ Iterator, List, Mapping, + MutableSet, Optional, Set, Tuple, ) +from weakref import WeakSet from prometheus_client.core import Counter from typing_extensions import ContextManager @@ -86,7 +88,9 @@ ) -_rate_limiter_instances: Set["FederationRateLimiter"] = set() +# This must be a `WeakSet`, otherwise we indirectly hold on to entire `HomeServer`s +# during trial test runs and leak a lot of memory. +_rate_limiter_instances: MutableSet["FederationRateLimiter"] = WeakSet() # Protects the _rate_limiter_instances set from concurrent access _rate_limiter_instances_lock = threading.Lock() From cc480e10f4ff31cde7911df822c6c7758db34c6b Mon Sep 17 00:00:00 2001 From: Sean Quah Date: Thu, 18 May 2023 18:54:01 +0100 Subject: [PATCH 2/3] Fix `HomeServer`s leaking due to #15334 When the gen-0 GC is run at the end of each test, the `TestCase` object usually still holds references to the `HomeServer` used during the test. As a result, the `HomeServer` gets promoted to gen-1 and then never garbage collected. Fix this by periodically running full GCs. Signed-off-by: Sean Quah --- tests/unittest.py | 11 +++++++++-- 1 file changed, 9 insertions(+), 2 deletions(-) diff --git a/tests/unittest.py b/tests/unittest.py index b6fdf69635b1..623c5a75a2f4 100644 --- a/tests/unittest.py +++ b/tests/unittest.py @@ -229,13 +229,20 @@ def tearDown(orig: Callable[[], R]) -> R: # # The easiest way to do this would be to do a full GC after each test # run, but that is very expensive. Instead, we disable GC (above) for - # the duration of the test so that we only need to run a gen-0 GC, which - # is a lot quicker. + # the duration of the test and only run a gen-0 GC, which is a lot + # quicker. This doesn't clean up everything, since the TestCase + # instance still holds references to objects created during the test, + # such as HomeServers, so we do a full GC every so often. @around(self) def tearDown(orig: Callable[[], R]) -> R: ret = orig() gc.collect(0) + # Run a full GC every 50 gen-0 GCs. + gen0_stats = gc.get_stats()[0] + gen0_collections = gen0_stats["collections"] + if gen0_collections % 50 == 0: + gc.collect() gc.enable() set_current_context(SENTINEL_CONTEXT) From 8e94932d4c2f3b5829b4b9ab9f67b59db05e9271 Mon Sep 17 00:00:00 2001 From: Sean Quah Date: Thu, 18 May 2023 18:56:48 +0100 Subject: [PATCH 3/3] Add newsfile --- changelog.d/15630.misc | 1 + 1 file changed, 1 insertion(+) create mode 100644 changelog.d/15630.misc diff --git a/changelog.d/15630.misc b/changelog.d/15630.misc new file mode 100644 index 000000000000..a30304bfd6ab --- /dev/null +++ b/changelog.d/15630.misc @@ -0,0 +1 @@ +Fix two memory leaks in `trial` test runs.