From a0e57305d96f09d755246f11dbb13a83898101b7 Mon Sep 17 00:00:00 2001 From: Matthieu Ancellin <31126826+mancellin@users.noreply.github.com> Date: Thu, 14 Dec 2023 10:35:47 +0100 Subject: [PATCH] Fix issue with caching of matrices since #420 (#442) --- capytaine/bem/engines.py | 6 +- capytaine/tools/lru_cache.py | 49 ++++---- docs/changelog.rst | 2 + pytest/test_bem_linear_combination_of_dofs.py | 9 +- pytest/test_bem_solver.py | 2 +- pytest/test_tool_lru_cache.py | 107 ++++++++++++++++++ 6 files changed, 141 insertions(+), 34 deletions(-) create mode 100644 pytest/test_tool_lru_cache.py diff --git a/capytaine/bem/engines.py b/capytaine/bem/engines.py index 89c6a448..c8eee507 100644 --- a/capytaine/bem/engines.py +++ b/capytaine/bem/engines.py @@ -14,7 +14,7 @@ from capytaine.matrices.block import BlockMatrix from capytaine.matrices.low_rank import LowRankMatrix, NoConvergenceOfACA from capytaine.matrices.block_toeplitz import BlockSymmetricToeplitzMatrix, BlockToeplitzMatrix, BlockCirculantMatrix -from capytaine.tools.lru_cache import delete_first_lru_cache +from capytaine.tools.lru_cache import lru_cache_with_strict_maxsize LOG = logging.getLogger(__name__) @@ -69,7 +69,7 @@ def __init__(self, *, linear_solver='lu_decomposition', matrix_cache_size=1): self.linear_solver = linear_solver if matrix_cache_size > 0: - self.build_matrices = delete_first_lru_cache(maxsize=matrix_cache_size)(self.build_matrices) + self.build_matrices = lru_cache_with_strict_maxsize(maxsize=matrix_cache_size)(self.build_matrices) self.exportable_settings = { 'engine': 'BasicMatrixEngine', @@ -153,7 +153,7 @@ class HierarchicalToeplitzMatrixEngine(MatrixEngine): def __init__(self, *, ACA_distance=8.0, ACA_tol=1e-2, matrix_cache_size=1): if matrix_cache_size > 0: - self.build_matrices = delete_first_lru_cache(maxsize=matrix_cache_size)(self.build_matrices) + self.build_matrices = lru_cache_with_strict_maxsize(maxsize=matrix_cache_size)(self.build_matrices) self.ACA_distance = ACA_distance self.ACA_tol = ACA_tol diff --git a/capytaine/tools/lru_cache.py b/capytaine/tools/lru_cache.py index 48c7805e..701c1609 100644 --- a/capytaine/tools/lru_cache.py +++ b/capytaine/tools/lru_cache.py @@ -1,29 +1,43 @@ +# Copyright (C) 2017-2024 Matthieu Ancellin +# See LICENSE file at +"""Tools for memoization of functions.""" from collections import OrderedDict from functools import wraps -def delete_first_lru_cache(maxsize=1): - """Behaves like functools.lru_cache(), but the oldest data in the cache is - deleted *before* computing a new one, in order to limit RAM usage when - stored objects are big.""" +import logging + +LOG = logging.getLogger(__name__) + + +def lru_cache_with_strict_maxsize(maxsize=1): + """Behaves mostly like functools.lru_cache(), but the oldest data in the cache is + deleted *before* computing a new one, in order to *never* have more that + `maxsize` items in memory. + This is useful to limit RAM usage when stored objects are big, like the interaction + matrices of Capytaine.""" def decorator(f): cache = OrderedDict() @wraps(f) def decorated_f(*args, **kwargs): - # /!\ cache only args + hashable_kwargs = tuple((k, v) for (k, v) in kwargs.items()) + # Might miss a cache hit if the order of kwargs is changed. + # But at least unlike a previous version, should not return a wrong value. - if args in cache: + if (args, hashable_kwargs) in cache: # Get item in cache - return cache[args] + LOG.debug("Get cached version of %s(%s, %s)", f.__name__, args, hashable_kwargs) + return cache[(args, hashable_kwargs)] if len(cache) + 1 > maxsize: # Drop oldest item in cache. cache.popitem(last=False) # Compute and store + LOG.debug("Computing %s(%s, %s)", f.__name__, args, hashable_kwargs) result = f(*args, **kwargs) - cache[args] = result + cache[(args, hashable_kwargs)] = result return result @@ -32,21 +46,4 @@ def decorated_f(*args, **kwargs): return decorator -# if __name__ == "__main__": -# import numpy as np -# from functools import lru_cache - -# # @lru_cache(maxsize=1) -# @delete_first_lru_cache(maxsize=1) -# def f(i): -# print(i) -# np.random.seed(i) -# a = np.random.random((20_000, 20_000)) -# print(a.nbytes / 2**30, "Go") -# return a - -# print(f(1)[0, 0]) -# print(f(1)[0, 0]) -# print(f(2)[0, 0]) -# print(f(1)[0, 0]) -# print(f(3)[0, 0]) +delete_first_lru_cache = lru_cache_with_strict_maxsize # For backward compatibility... diff --git a/docs/changelog.rst b/docs/changelog.rst index 5dfe10cd..0995c745 100644 --- a/docs/changelog.rst +++ b/docs/changelog.rst @@ -72,6 +72,8 @@ Internals * Fortran source files are not included in wheel anymore (:pull:`360`). +* The `delete_first_lru_cache` decorator has been renamed :func:`~capytaine.tools.lru_cache.lru_cache_with_strict_maxsize` and now supports keyword arguments in the memoized function (:pull:`442`). + * Improve some warnings and error messages. ------------------------------- diff --git a/pytest/test_bem_linear_combination_of_dofs.py b/pytest/test_bem_linear_combination_of_dofs.py index 0de7058c..77fffc1e 100644 --- a/pytest/test_bem_linear_combination_of_dofs.py +++ b/pytest/test_bem_linear_combination_of_dofs.py @@ -3,10 +3,11 @@ import numpy as np import capytaine as cpt -import pytest +import pytest solver = cpt.BEMSolver() -method = ['indirect','direct'] +method = ['indirect', 'direct'] + @pytest.mark.parametrize("method", method) def test_sum_of_dofs(method): @@ -27,7 +28,8 @@ def test_sum_of_dofs(method): body1_added_mass = dataset['added_mass'].sel(radiating_dof="body1__Heave", influenced_dof="body1__Heave").data body2_added_mass = dataset['added_mass'].sel(radiating_dof="body2__Heave", influenced_dof="body2__Heave").data - assert np.allclose(both_added_mass, body1_added_mass + body2_added_mass, rtol=1.1e-2) + assert np.allclose(both_added_mass, body1_added_mass + body2_added_mass, rtol=1e-2) + @pytest.mark.parametrize("method", method) def test_rotation_axis(method): @@ -57,4 +59,3 @@ def test_rotation_axis(method): A = dataset['added_mass'].sel(radiating_dof=["Yaw", "Sway"], influenced_dof=["Yaw", "Sway"]).data P = np.array([1, -l]) assert np.isclose(A_m, P.T @ A @ P) - diff --git a/pytest/test_bem_solver.py b/pytest/test_bem_solver.py index b8f5322b..9a8e5c96 100644 --- a/pytest/test_bem_solver.py +++ b/pytest/test_bem_solver.py @@ -140,4 +140,4 @@ def test_direct_solver(sphere): solver = cpt.BEMSolver() direct_result = solver.solve(problem, method='direct') indirect_result = solver.solve(problem, method='indirect') - assert direct_result.forces["Surge"] == pytest.approx(indirect_result.forces["Surge"], rel=1e-2) + assert direct_result.forces["Surge"] == pytest.approx(indirect_result.forces["Surge"], rel=1e-1) diff --git a/pytest/test_tool_lru_cache.py b/pytest/test_tool_lru_cache.py new file mode 100644 index 00000000..3173d4b5 --- /dev/null +++ b/pytest/test_tool_lru_cache.py @@ -0,0 +1,107 @@ +from functools import lru_cache + +import pytest +import numpy as np + +from capytaine.tools.lru_cache import lru_cache_with_strict_maxsize + + +def get_random_id(n): + # An impure function that shouldn't be memoized, but allows to test the cache. + return np.random.default_rng().integers(n) + +N = 100_000_000 + +def test_cache(): + f = lru_cache_with_strict_maxsize()(get_random_id) + a = f(N) + b = f(N) + assert a == b # randint was not run the second time, the cached value was used + + +def test_cache_maxsize(): + # 1/N chance of failing + f = lru_cache_with_strict_maxsize(maxsize=1)(get_random_id) + a = f(N) + f(10) + b = f(N) + assert a != b # the cached value of the first call had been deleted + + +def test_cache_kwargs(): + f = lru_cache_with_strict_maxsize()(get_random_id) + a = f(n=N) + b = f(n=N) + assert a == b # the cached value of the first call had been deleted + + +def test_delete_first(): + """This test is a convoluted way to test the main difference between the + built-in lru_cache and the lru_cache_with_strict_maxsize decorator defined + by Capytaine. The difference is that the latter make sure that objects in + the cache are deleted before computing and caching a new result. For + Capytaine, it is meant to limit the RAM usage. Here, it is tested by making + sure that there is never two instances of a Singleton class at the same + time.""" + + class Singleton: + nb_instances = [0] + # Use a one-element list as a mutable integer shared by all instances. + + def __init__(self): + if self.nb_instances[0] != 0: + raise ValueError("There can be only one Singleton at the same time!") + self.nb_instances[0] += 1 + + def __del__(self): + # When the singleton is deleted, update the counter + self.nb_instances[0] -= 1 + + assert Singleton.nb_instances[0] == 0 + a = Singleton() + assert Singleton.nb_instances[0] == 1 + del a + assert Singleton.nb_instances[0] == 0 + + ## NO CACHE + def new_instance(a): + return Singleton() + new_instance(1) + assert Singleton.nb_instances[0] == 0 # The Singleton created above is immediately garbage-collected. + + ## CAPYTAINE'S CACHE + @lru_cache_with_strict_maxsize(maxsize=1) + def new_instance(a): + return Singleton() + + new_instance(1) + assert Singleton.nb_instances[0] == 1 # It is not garbage collected only because it is still in the cache. + new_instance(2) # When we create a new instance, the old one is removed from the cache before creating the new one. + + del new_instance # Delete the cache before doing more tests. + + # STDLIB CACHE + @lru_cache(maxsize=1) + def new_instance(a): + return Singleton() + + new_instance(1) + with pytest.raises(ValueError): + new_instance(2) # lru_cache tries to create the new singleton, before deleting the old one from the cache. + + +# def benchmark_ram_usage(): +# # Would need a way to monitor the RAM usage to automate this test +# # The RAM usage should never be more than the ~3GB allocated by a single call +# +# # @delete_first_lru_cache(maxsize=1) +# @lru_cache(maxsize=1) +# def f(i): +# np.random.seed(i) +# a = np.random.random((20_000, 20_000)) +# print(f"Allocated {a.nbytes / 2**30:.2f} GB") +# return a +# +# for i in (1, 1, 2, 1, 3): +# print(f"Calling f({i})") +# f(i)