From 4322d29b6a03d8c2fcd8ba71079cbe63c55fa1f1 Mon Sep 17 00:00:00 2001
From: Stephen Brennan <stephen.s.brennan@oracle.com>
Date: Tue, 25 Nov 2025 16:28:33 -0800
Subject: [PATCH 1/2] pstack: improve generation of DSO ranges

We generate a single address range for each DSO in the userspace
program. However, the method is a bit convoluted: we select the largest
"vm_end" value, and we use a start address computed from the start of
the executable VMA and its vm_pgoff. The result of this is that, if a
DSO file is mapped multiple times in different locations, we may produce
an address range that spans other DSO address ranges. This is exactly
what happened in osandov/drgn#574.

Simplify this by just using the start address of the lowest VMA (the one
which has vm_pgoff==0), and computing the end address by taking the file
size, or the start of the next DSO address range, whichever is lower.
This ensures there are no address range overlaps. It does not provide
drgn with any additional information about the file address mappings,
but as far as I can tell, that's just fine: drgn can't use multiple
address ranges, because it doesn't know which file offsets they
correspond to.

To ensure this behavior is used by both the "dump" and "pstack" modes,
factor out the DSO range generation code into a helper and use it in
both places.

Signed-off-by: Stephen Brennan <stephen.s.brennan@oracle.com>
---
 drgn_tools/pstack.py | 108 ++++++++++++++++++++++---------------------
 1 file changed, 55 insertions(+), 53 deletions(-)

diff --git a/drgn_tools/pstack.py b/drgn_tools/pstack.py
index 2b3efea4..9957b937 100644
--- a/drgn_tools/pstack.py
+++ b/drgn_tools/pstack.py
@@ -269,30 +269,52 @@ def add_task_args(group: argparse.ArgumentParser) -> None:
     )
 
 
+def task_dsos(mm: Object) -> List[Tuple[str, int, int, int]]:
+    """
+    Return the executable DSOs mapped by a task's ``mm_struct``, as a list of
+    non-overlapping ``(path, start, end, ino)`` tuples sorted by ``start``.
+    """
+    # For the first pass, find any mapping which starts at offset 0 within the
+    # file, and record the full range of the file (even if it's not actually
+    # mapped for its full size). Also, record which file mappings have an
+    # executable VMA, since we'll only care about those.
+    file_range: Dict[str, Tuple[int, int, int]] = {}
+    file_exec = set()
+    VM_EXEC = 0x4
+    for vma in for_each_vma(mm):
+        if not vma.vm_file:
+            continue
+        path = os.fsdecode(d_path(vma.vm_file.f_path))
+        if vma.vm_pgoff == 0:
+            file_range[path] = (
+                vma.vm_start.value_(),
+                (vma.vm_start + vma.vm_file.f_inode.i_size).value_(),
+                vma.vm_file.f_inode.i_ino.value_(),
+            )
+        if vma.vm_flags & VM_EXEC:
+            file_exec.add(path)
+
+    # For the second pass, ensure there is no overlap between the ranges we
+    # created previously. Since the whole file is not necessarily mapped, we
+    # want to avoid creating overlapping ranges that drgn is not expecting (see
+    # https://github.com/osandov/drgn/issues/574). So clamp each range's end to
+    # the start of the next range; then emit files with an executable mapping.
+    ranges = sorted(file_range.items(), key=lambda t: t[1][0])
+    result = []
+    for i, (path, (start, end, ino)) in enumerate(ranges):
+        if i + 1 < len(ranges):
+            end = min(end, ranges[i + 1][1][0])
+        if path in file_exec:
+            result.append((path, start, end, ino))
+    return result
+
+
 def task_metadata(prog: Program, task: Object) -> Dict[str, Any]:
     """Return JSON metadata about a task, for later use."""
-    VM_EXEC = 0x4
     load_addrs = {}
-    file_vm_end: Dict[str, int] = {}
     if task.mm:
-        for vma in for_each_vma(task.mm):
-            if not vma.vm_file:
-                continue
-            path = os.fsdecode(d_path(vma.vm_file.f_path))
-            file_vm_end[path] = max(
-                vma.vm_end.value_(),
-                file_vm_end.get(path, 0),
-            )
-            if vma.vm_flags & VM_EXEC and vma.vm_file:
-                file_start = (
-                    vma.vm_start - vma.vm_pgoff * task.mm.prog_["PAGE_SIZE"]
-                ).value_()
-                inode = vma.vm_file.f_inode.i_ino.value_()
-                load_addrs[path] = [file_start, vma.vm_end.value_(), inode]
-
-        # use the largest vm_end we find for the end of the address range
-        for path in load_addrs:
-            load_addrs[path][1] = file_vm_end[path]
+        for path, start, end, inode in task_dsos(task.mm):
+            load_addrs[path] = [start, end, inode]
     return {
         "pid": task.pid.value_(),
         "comm": task.comm.string_().decode("utf-8", errors="replace"),
@@ -709,39 +731,19 @@ def read_fn(_, count, offset, __):
 
     up.add_memory_segment(0, 0xFFFFFFFFFFFFFFFF, read_fn, False)
 
-    # Do one pass where we record the maximum extent of the mapping for each
-    # file, and we also detect each executable mapping, for which we prepare
-    # modules.
-    file_vm_end: Dict[str, int] = {}
-    VM_EXEC = 0x4
-    for vma in for_each_vma(mm):
-        if vma.vm_file:
-            path = os.fsdecode(d_path(vma.vm_file.f_path))
-            file_vm_end[path] = max(
-                vma.vm_end.value_(), file_vm_end.get(path, 0)
-            )
-        if vma.vm_flags & VM_EXEC and vma.vm_file:
-            try:
-                statbuf = os.stat(path)
-                if statbuf.st_ino != vma.vm_file.f_inode.i_ino.value_():
-                    log.warning(
-                        "file %s doesn't match the inode on-disk, it may"
-                        " have been updated",
-                        path,
-                    )
-            except OSError:
-                pass
-            file_start = (
-                vma.vm_start - vma.vm_pgoff * mm.prog_["PAGE_SIZE"]
-            ).value_()
-            mod = up.extra_module(path, create=True)
-            mod.address_range = (file_start, vma.vm_end.value_())
-
-    # Now set the address ranges based on the observed file end, then load the
-    # ELF files.
-    for mod in up.modules():
-        path = mod.name
-        mod.address_range = (mod.address_range[0], file_vm_end[path])
+    for path, start, end, ino in task_dsos(mm):
+        try:
+            statbuf = os.stat(path)
+            if statbuf.st_ino != ino:
+                log.warning(
+                    "file %s doesn't match the inode on-disk, it may"
+                    " have been updated",
+                    path,
+                )
+        except OSError:
+            pass
+        mod = up.extra_module(path, create=True)
+        mod.address_range = (start, end)
         mod.try_file(path)
 
     return up

From 607487ed895adb96cfe7f803f729c973d9e03925 Mon Sep 17 00:00:00 2001
From: Stephen Brennan <stephen.s.brennan@oracle.com>
Date: Tue, 25 Nov 2025 16:31:42 -0800
Subject: [PATCH 2/2] pstack: avoid unwinding running tasks

Signed-off-by: Stephen Brennan <stephen.s.brennan@oracle.com>
---
 drgn_tools/pstack.py | 21 +++++++++++++++++++--
 1 file changed, 19 insertions(+), 2 deletions(-)

diff --git a/drgn_tools/pstack.py b/drgn_tools/pstack.py
index 9957b937..575bf5c7 100644
--- a/drgn_tools/pstack.py
+++ b/drgn_tools/pstack.py
@@ -47,6 +47,7 @@
 from drgn import FaultError
 from drgn import Object
 from drgn import Program
+from drgn import ProgramFlags
 from drgn import sizeof
 from drgn import StackTrace
 from drgn.helpers.linux import access_remote_vm
@@ -56,6 +57,7 @@
 from drgn.helpers.linux import for_each_online_cpu
 from drgn.helpers.linux import for_each_task
 from drgn.helpers.linux import for_each_vma
+from drgn.helpers.linux import task_on_cpu
 from drgn.helpers.linux import task_state_to_char
 from drgn.helpers.linux import vma_find
 
@@ -765,9 +767,17 @@ def pstack_print_process(task: Object) -> None:
         tcomm = thread.comm.string_().decode("utf-8", errors="replace")
         st = task_state_to_char(thread)
         cpu = task_cpu(thread)
-        cpunote = "RUNNING ON " if cpu_curr(prog, cpu) == thread else ""
+        on_cpu = task_on_cpu(thread)
+        cpunote = "RUNNING ON " if on_cpu else ""
         print(f"  Thread {i} TID={tid} [{st}] {cpunote}CPU={cpu} ('{tcomm}')")
-        kstack = prog.stack_trace(thread)
+        try:
+            kstack = prog.stack_trace(thread)
+        except ValueError as e:
+            if "cannot unwind stack of running task" in str(e):
+                print(f"    {str(e)}")
+                continue
+            else:
+                raise
         if len(kstack) > 0 and (kstack[0].pc & (1 << 63)):
             # Kernel stack is indeed a kernel stack, print it
             print(
@@ -786,6 +796,8 @@ def pstack(prog: Program) -> None:
     parser = argparse.ArgumentParser(description="print stack traces")
     add_task_args(parser)
     args = parser.parse_args(sys.argv[2:])
+    if args.online and prog.flags & ProgramFlags.IS_LIVE:
+        sys.exit("error: --online: cannot unwind running tasks on live system")
     for task in get_tasks(prog, args):
         pstack_print_process(task)
         print()
@@ -801,6 +813,11 @@ def add_args(self, parser: argparse.ArgumentParser) -> None:
         add_task_args(parser)
 
     def run(self, prog: Program, args: argparse.Namespace) -> None:
+        if args.online and prog.flags & ProgramFlags.IS_LIVE:
+            print(
+                "--online: cannot unwind running tasks on live system, skipping"
+            )
+            return
         for task in get_tasks(prog, args):
             pstack_print_process(task)
             print()