From fdb1abfa2ed0ac8d4823bc41c2d9111152d24ac8 Mon Sep 17 00:00:00 2001 From: Pablo Galindo Date: Fri, 3 Nov 2023 21:54:36 +0000 Subject: [PATCH] Limit the number of memory records reported For very big files, the generated reporters will hang when trying to process all of the memory records produced. This happens quite a lot in flamegraphs produced from very big files, where the browser cannot display the plot with millions of points. To help here, add a new parameter to the FileReader class that limits the number of memory records (and therefore temporal snapshots) stored and reported. This should not affect most regular capture files but will help with the very big ones. Signed-off-by: Pablo Galindo Co-authored-by: Matt Wozniski --- news/491.bugfix.rst | 1 + src/memray/_memray.pyi | 6 +++++- src/memray/_memray.pyx | 16 +++++++++++++++- src/memray/commands/common.py | 10 +++++++++- src/memray/commands/flamegraph.py | 7 +++++++ tests/integration/test_tracking.py | 28 ++++++++++++++++++++++++++++ 6 files changed, 65 insertions(+), 3 deletions(-) create mode 100644 news/491.bugfix.rst diff --git a/news/491.bugfix.rst b/news/491.bugfix.rst new file mode 100644 index 0000000000..33a885f590 --- /dev/null +++ b/news/491.bugfix.rst @@ -0,0 +1 @@ +Limit the number of memory records displayed in reporters by default. This will help display flamegraphs for long capture sessions. diff --git a/src/memray/_memray.pyi b/src/memray/_memray.pyi index 09c818ab4b..90411c2a39 100644 --- a/src/memray/_memray.pyi +++ b/src/memray/_memray.pyi @@ -133,7 +133,11 @@ class FileReader: @property def metadata(self) -> Metadata: ... def __init__( - self, file_name: Union[str, Path], *, report_progress: bool = False + self, + file_name: Union[str, Path], + *, + report_progress: bool = False, + max_memory_records: int = 10000, ) -> None: ... def get_allocation_records(self) -> Iterable[AllocationRecord]: ... 
def get_temporal_allocation_records( diff --git a/src/memray/_memray.pyx b/src/memray/_memray.pyx index f961cf699e..a52eb72f62 100644 --- a/src/memray/_memray.pyx +++ b/src/memray/_memray.pyx @@ -55,6 +55,7 @@ from _memray.source cimport SocketSource from _memray.tracking_api cimport Tracker as NativeTracker from _memray.tracking_api cimport install_trace_function from cpython cimport PyErr_CheckSignals +from libc.math cimport ceil from libc.stdint cimport uint64_t from libcpp cimport bool from libcpp.limits cimport numeric_limits @@ -855,8 +856,9 @@ cdef class FileReader: cdef HighWatermark _high_watermark cdef object _header cdef bool _report_progress + cdef int _memory_snapshot_stride - def __cinit__(self, object file_name, *, bool report_progress=False): + def __cinit__(self, object file_name, *, bool report_progress=False, int max_memory_records=10000): try: self._file = open(file_name) except OSError as exc: @@ -881,6 +883,9 @@ cdef class FileReader: n_memory_snapshots_approx = 2048 if 0 < stats["start_time"] < stats["end_time"]: n_memory_snapshots_approx = (stats["end_time"] - stats["start_time"]) / 10 + + if n_memory_snapshots_approx > max_memory_records: + n_memory_snapshots_approx = max_memory_records self._memory_snapshots.reserve(n_memory_snapshots_approx) cdef object total = stats['n_allocations'] or None @@ -891,6 +896,7 @@ cdef class FileReader: total=total, report_progress=self._report_progress ) + self._memory_snapshot_stride = 0 cdef MemoryRecord memory_record with progress_indicator: while True: @@ -917,6 +923,10 @@ cdef class FileReader: self._memory_snapshots.push_back(reader.getLatestMemorySnapshot()) else: break + + if len(self._memory_snapshots) > max_memory_records: + self._memory_snapshot_stride = int(ceil(len(self._memory_snapshots) / max_memory_records)) + self._memory_snapshots = self._memory_snapshots[::self._memory_snapshot_stride] self._high_watermark = finder.getHighWatermark() stats["n_allocations"] = 
progress_indicator.num_processed @@ -1100,6 +1110,7 @@ cdef class FileReader: cdef AllocationLifetimeAggregator aggregator cdef _Allocation allocation + cdef int memory_records_seen with progress_indicator: while records_to_process > 0: @@ -1113,6 +1124,9 @@ cdef class FileReader: records_to_process -= 1 progress_indicator.update(1) elif ret == RecordResult.RecordResultMemoryRecord: + memory_records_seen += 1 + if self._memory_snapshot_stride and memory_records_seen % self._memory_snapshot_stride != 0: + continue aggregator.captureSnapshot() else: assert ret != RecordResult.RecordResultMemorySnapshot diff --git a/src/memray/commands/common.py b/src/memray/commands/common.py index 7edff5d18e..4986097e53 100644 --- a/src/memray/commands/common.py +++ b/src/memray/commands/common.py @@ -127,9 +127,13 @@ def write_report( merge_threads: Optional[bool] = None, inverted: Optional[bool] = None, temporal: bool = False, + max_memory_records: Optional[int] = None, ) -> None: try: - reader = FileReader(os.fspath(result_path), report_progress=True) + kwargs = {} + if max_memory_records is not None: + kwargs["max_memory_records"] = max_memory_records + reader = FileReader(os.fspath(result_path), report_progress=True, **kwargs) merge_threads = True if merge_threads is None else merge_threads inverted = False if inverted is None else inverted @@ -271,6 +275,10 @@ def run(self, args: argparse.Namespace, parser: argparse.ArgumentParser) -> None if hasattr(args, "inverted"): kwargs["inverted"] = args.inverted + + if hasattr(args, "max_memory_records"): + kwargs["max_memory_records"] = args.max_memory_records + self.write_report( result_path, output_file, diff --git a/src/memray/commands/flamegraph.py b/src/memray/commands/flamegraph.py index 075ffc3ba3..113ebe39f7 100644 --- a/src/memray/commands/flamegraph.py +++ b/src/memray/commands/flamegraph.py @@ -29,3 +29,10 @@ def prepare_parser(self, parser: argparse.ArgumentParser) -> None: action="store_true", default=False, ) + + 
parser.add_argument( + "--max-memory-records", + help="Maximum number of memory records to display", + type=int, + default=None, + ) diff --git a/tests/integration/test_tracking.py b/tests/integration/test_tracking.py index 5e17500154..4bcb7920c4 100644 --- a/tests/integration/test_tracking.py +++ b/tests/integration/test_tracking.py @@ -1672,6 +1672,34 @@ def test_memory_snapshots_tick_interval(self, tmp_path): for prev, _next in zip(memory_snapshots, memory_snapshots[1:]) ) + def test_memory_snapshots_limit_when_reading(self, tmp_path): + # GIVEN + allocator = MemoryAllocator() + output = tmp_path / "test.bin" + + # WHEN + with Tracker(output): + for _ in range(2): + allocator.valloc(ALLOC_SIZE) + time.sleep(0.11) + allocator.free() + + reader = FileReader(output) + memory_snapshots = list(reader.get_memory_snapshots()) + temporal_records = list(reader.get_temporal_allocation_records()) + + assert memory_snapshots + n_snapshots = len(memory_snapshots) + n_temporal_records = len(temporal_records) + + reader = FileReader(output, max_memory_records=n_snapshots // 2) + memory_snapshots = list(reader.get_memory_snapshots()) + temporal_records = list(reader.get_temporal_allocation_records()) + + assert memory_snapshots + assert len(memory_snapshots) <= n_snapshots // 2 + 1 + assert len(temporal_records) <= n_temporal_records // 2 + 1 + def test_temporary_allocations_when_filling_vector_without_preallocating( self, tmp_path ):