tests: Add initial tests for memory check function

EdCaunt · EdCaunt · commit 09c54069d0c1 · 2025-08-04T09:42:22.000+01:00
diff --git a/devito/operator/operator.py b/devito/operator/operator.py
@@ -1416,9 +1416,10 @@ def get_nbytes(obj):
             # FIXME: Probably wrong for streamed functions
             # Will overreport memory usage currently
             try:
+                # TODO: is _obj even needed?
                 v = get_nbytes(self[i.name]._obj)
             except AttributeError:
-                v = get_nbytes(i)
+                v = get_nbytes(self.get(i.name, i))
 
             if i._mem_host:
                 host += v
diff --git a/devito/types/sparse.py b/devito/types/sparse.py
@@ -905,9 +905,8 @@ def _decomposition(self):
         mapper = {self._sparse_dim: self._distributor.decomposition[self._sparse_dim]}
         return tuple(mapper.get(d) for d in self.dimensions)
 
-    def _arg_defaults(self, alias=None, estimate_memory=False, **kwargs):
-        defaults = super()._arg_defaults(alias=alias, **kwargs)
-        # FIXME: Repeated use of this structure is ugly
+    def _arg_defaults(self, alias=None, estimate_memory=False):
+        defaults = super()._arg_defaults(alias=alias, estimate_memory=estimate_memory)
         if estimate_memory:
             return defaults
 
diff --git a/tests/test_operator.py b/tests/test_operator.py
@@ -1,4 +1,7 @@
 from itertools import permutations
+from functools import reduce
+from operator import mul
+import logging
 
 import numpy as np
 import sympy
@@ -9,7 +12,7 @@
                     SparseFunction, SparseTimeFunction, Dimension, error, SpaceDimension,
                     NODE, CELL, dimensions, configuration, TensorFunction,
                     TensorTimeFunction, VectorFunction, VectorTimeFunction,
-                    div, grad, switchconfig, exp)
+                    div, grad, switchconfig, exp, Buffer)
 from devito import  Inc, Le, Lt, Ge, Gt  # noqa
 from devito.exceptions import InvalidOperator
 from devito.finite_differences.differentiable import diff2sympy
@@ -2051,3 +2054,167 @@ def test_indirection(self):
 
         assert np.all(f.data[0] == 0.)
         assert np.all(f.data[i] == 3. for i in range(1, 10))
+
+
+class TestEstimateMemory:
+    """Tests for the Operator.estimate_memory() utility"""
+
+    def parse_output(self, output, expected):
+        """Compare the last log record to ``expected`` (name, disk, host, device)"""
+        # estimate_memory should not touch data: no "Allocating" in the captured text
+        assert "Allocating" not in output.text
+
+        name, disk, host, device = output.records[-1].message.split()
+        extracted = (name, int(disk), int(host), int(device))
+
+        assert extracted == expected
+
+    @pytest.mark.parametrize('shape', [(11,), (101, 101), (101, 101, 101)])
+    @pytest.mark.parametrize('dtype', [np.int8, np.int16, np.float32,
+                                       np.float64, np.complex64])
+    @pytest.mark.parametrize('so', [0, 2, 4, 6])
+    def test_basic_usage(self, caplog, shape, dtype, so):
+        """Estimate for a single Function across shapes, dtypes and space orders"""
+        grid = Grid(shape=shape)
+        f = Function(name='f', grid=grid, space_order=so, dtype=dtype)
+        with switchconfig(log_level='DEBUG'), caplog.at_level(logging.DEBUG):
+            op = Operator(Eq(f, 1))
+            # Machine-readable output for parsing
+            op.estimate_memory(human_readable=False)
+
+            # Expected host bytes: each dimension grown by `so` on both sides
+            host = reduce(mul, [s + 2*so for s in shape])*np.dtype(dtype).itemsize
+            expected = ("Kernel", 0, host, 0)
+            self.parse_output(caplog, expected)
+
+    def test_multiple_objects(self, caplog):
+        """Estimate for two Functions with different space orders and dtypes"""
+        grid = Grid(shape=(101, 101))
+        f = Function(name='f', grid=grid, space_order=2, dtype=np.float32)
+        g = Function(name='g', grid=grid, space_order=4, dtype=np.float64)
+        with switchconfig(log_level='DEBUG'), caplog.at_level(logging.DEBUG):
+            op = Operator([Eq(f, 1), Eq(g, 1)])
+            op.estimate_memory(human_readable=False)
+
+            check = sum(reduce(mul, func.shape_allocated)*np.dtype(func.dtype).itemsize
+                        for func in (f, g))
+            expected = ("Kernel", 0, check, 0)
+            self.parse_output(caplog, expected)
+
+    @pytest.mark.parametrize('time', [True, False])
+    def test_sparse(self, caplog, time):
+        """Estimate counts the field, the sparse function and its coordinates"""
+        grid = Grid(shape=(101, 101))
+        f = Function(name='f', grid=grid, space_order=2)
+        if time:
+            src = SparseTimeFunction(name='src', grid=grid, npoint=1000, nt=10)
+        else:
+            src = SparseFunction(name='src', grid=grid, npoint=1000)
+        src_term = src.inject(field=f, expr=src)
+        with switchconfig(log_level='DEBUG'), caplog.at_level(logging.DEBUG):
+            op = Operator(src_term)
+            op.estimate_memory(human_readable=False)
+
+            check = sum(reduce(mul, func.shape_allocated)*np.dtype(func.dtype).itemsize
+                        for func in (f, src, src.coordinates))
+            expected = ("Kernel", 0, check, 0)
+            self.parse_output(caplog, expected)
+
+    @pytest.mark.parametrize('save', [None, Buffer(3), 10])
+    def test_timefunction(self, caplog, save):
+        """Estimate for a TimeFunction with default, Buffer and integer ``save``"""
+        grid = Grid(shape=(101, 101))
+        f = TimeFunction(name='f', grid=grid, space_order=2, save=save)
+        with switchconfig(log_level='DEBUG'), caplog.at_level(logging.DEBUG):
+            op = Operator(Eq(f, 1))
+            op.estimate_memory(human_readable=False)
+            check = reduce(mul, f.shape_allocated)*np.dtype(f.dtype).itemsize
+            expected = ("Kernel", 0, check, 0)
+            self.parse_output(caplog, expected)
+
+    def test_mashup(self, caplog):
+        """Estimate for Function, TimeFunction and two SparseFunctions combined"""
+        grid = Grid(shape=(101, 101))
+        f = Function(name='f', grid=grid, space_order=4)
+        g = TimeFunction(name='g', grid=grid, space_order=4)
+        src0 = SparseFunction(name='src0', grid=grid, npoint=100)
+        src1 = SparseFunction(name='src1', grid=grid, npoint=100)
+
+        eq0 = Eq(f, 1)
+        eq1 = Eq(g, 1)
+
+        src_term0 = src0.inject(field=f, expr=src0)
+        src_term1 = src1.inject(field=f, expr=src1)
+
+        with switchconfig(log_level='DEBUG'), caplog.at_level(logging.DEBUG):
+            op = Operator([eq0, eq1] + src_term0 + src_term1)
+            op.estimate_memory(human_readable=False)
+
+            check = sum(reduce(mul, func.shape_allocated)*np.dtype(func.dtype).itemsize
+                        for func in (f, g, src0, src0.coordinates,
+                                     src1, src1.coordinates))
+            expected = ("Kernel", 0, check, 0)
+            self.parse_output(caplog, expected)
+
+    def test_temp_array(self, caplog):
+        """Check that temporary arrays will be factored into the memory calculation"""
+        grid = Grid(shape=(101, 101))
+        f = TimeFunction(name='f', grid=grid, space_order=2)
+        g = TimeFunction(name='g', grid=grid, space_order=2)
+        a = Function(name='a', grid=grid, space_order=2)
+
+        # sin(a) appears in both equations to encourage generation of an array temp
+        eq0 = Eq(f.forward, g + sympy.sin(a))
+        eq1 = Eq(g.forward, f + sympy.sin(a))
+
+        with switchconfig(log_level='DEBUG'), caplog.at_level(logging.DEBUG):
+            op = Operator([eq0, eq1])
+
+            # Sanity check: this test is only meaningful if an array temporary exists,
+            # so require `r0[x][y]` to appear in the generated code
+            assert "r0[x][y]" in str(op.ccode)
+
+            op.estimate_memory(human_readable=False)
+
+            check = sum(reduce(mul, func.shape_allocated)*np.dtype(func.dtype).itemsize
+                        for func in (f, g, a))
+
+            # Factor in the temp array, sized by `a.shape` rather than `shape_allocated`
+            check += reduce(mul, a.shape)*np.dtype(a.dtype).itemsize
+
+            expected = ("Kernel", 0, check, 0)
+            self.parse_output(caplog, expected)
+
+    def test_overrides(self, caplog):
+        """Estimate uses runtime overrides instead of the Operator's original fields"""
+        grid0 = Grid(shape=(101, 101))
+        # Original fields
+        f0 = Function(name='f0', grid=grid0, space_order=4)
+        tf0 = TimeFunction(name='tf0', grid=grid0, space_order=4)
+        s0 = SparseFunction(name='s0', grid=grid0, npoint=100)
+        st0 = SparseTimeFunction(name='st0', grid=grid0, npoint=100, nt=10)
+
+        grid1 = Grid(shape=(201, 201))  # Bigger grid so overrides are distinct
+        # Replacement fields
+        f1 = Function(name='f1', grid=grid1, space_order=4)
+        tf1 = TimeFunction(name='tf1', grid=grid1, space_order=4)
+        s1 = SparseFunction(name='s1', grid=grid1, npoint=200)
+        st1 = SparseTimeFunction(name='st1', grid=grid1, npoint=200, nt=20)
+
+        eq0 = Eq(f0, 1)
+        eq1 = Eq(tf0, 1)
+        s0_term = s0.inject(field=f0, expr=s0)
+        st0_term = st0.inject(field=tf0, expr=st0)
+
+        with switchconfig(log_level='DEBUG'), caplog.at_level(logging.DEBUG):
+            op = Operator([eq0, eq1] + s0_term + st0_term)
+            # Apply overrides for the check
+            op.estimate_memory(f0=f1, tf0=tf1, s0=s1, st0=st1, human_readable=False)
+
+            check = sum(reduce(mul, func.shape_allocated)*np.dtype(func.dtype).itemsize
+                        for func in (f1, tf1, s1, s1.coordinates, st1, st1.coordinates))
+
+            expected = ("Kernel", 0, check, 0)
+            self.parse_output(caplog, expected)
+
+    # Test with OpenACC