From bffb3fc06ffa44209c201321c88d112563cdb687 Mon Sep 17 00:00:00 2001 From: andrewjcg Date: Mon, 28 Oct 2024 15:55:22 -0400 Subject: [PATCH 1/3] Upgrade from memmap to memmap2 (#678) The former appears to be unmaintained: https://github.com/danburkert/memmap-rs/issues/90 --- Cargo.lock | 13 +++++++++++-- Cargo.toml | 2 +- src/binary_parser.rs | 2 +- 3 files changed, 13 insertions(+), 4 deletions(-) diff --git a/Cargo.lock b/Cargo.lock index 35f0a049..6d6acf0c 100644 --- a/Cargo.lock +++ b/Cargo.lock @@ -11,7 +11,7 @@ dependencies = [ "cpp_demangle", "fallible-iterator", "gimli", - "memmap2", + "memmap2 0.5.10", "object", "rustc-demangle", "smallvec", @@ -912,6 +912,15 @@ dependencies = [ "libc", ] +[[package]] +name = "memmap2" +version = "0.9.4" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "fe751422e4a8caa417e13c3ea66452215d7d63e19e604f4980461212f3ae1322" +dependencies = [ + "libc", +] + [[package]] name = "minimal-lexical" version = "0.2.1" @@ -1125,7 +1134,7 @@ dependencies = [ "libc", "log", "lru", - "memmap", + "memmap2 0.9.4", "proc-maps", "py-spy-testdata", "rand", diff --git a/Cargo.toml b/Cargo.toml index 59482f68..388dbd9e 100644 --- a/Cargo.toml +++ b/Cargo.toml @@ -31,7 +31,7 @@ lru = "0.10" regex = ">=1.6.0" tempfile = "3.6.0" proc-maps = "0.3.2" -memmap = "0.7.0" +memmap2 = "0.9.4" cpp_demangle = "0.4" serde = {version="1.0", features=["rc"]} serde_derive = "1.0" diff --git a/src/binary_parser.rs b/src/binary_parser.rs index ace9ab45..76584475 100644 --- a/src/binary_parser.rs +++ b/src/binary_parser.rs @@ -4,7 +4,7 @@ use std::path::Path; use anyhow::Error; use goblin::Object; -use memmap::Mmap; +use memmap2::Mmap; pub struct BinaryInfo { pub symbols: HashMap, From 78f9a1f4d264f6b6c2927e1b7791d9d1dbc4d1f6 Mon Sep 17 00:00:00 2001 From: Ben Frederickson Date: Mon, 28 Oct 2024 14:20:43 -0700 Subject: [PATCH 2/3] Update remoteprocess/proc-maps/goblin dependencies (#712) --- Cargo.lock | 144 ++++++++++++----------------------------------------- Cargo.toml | 8 +-- 2 files changed, 37 insertions(+), 115 deletions(-) diff --git a/Cargo.lock b/Cargo.lock index 6d6acf0c..a6af5e6b 100644 --- a/Cargo.lock +++ b/Cargo.lock @@ -4,17 +4,18 @@ version = 3 [[package]] name = "addr2line" -version = "0.21.0" +version = "0.24.2" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "8a30b2e23b9e17a9f90641c7ab1549cd9b44f296d3ccbf309d2863cfe398a0cb" +checksum = "dfbe277e56a376000877090da837660b4427aad530e3028d44e0bffe4f89a1c1" dependencies = [ "cpp_demangle", "fallible-iterator", "gimli", - "memmap2 0.5.10", + "memmap2", "object", "rustc-demangle", "smallvec", + "typed-arena", ] [[package]] @@ -138,29 +139,6 @@ version = "1.4.0" source = "registry+https://github.com/rust-lang/crates.io-index" checksum = "ace50bade8e6234aa140d9a2f552bbee1db4d353f69b8217bc503490fc1a9f26" -[[package]] -name = "bindgen" -version = "0.68.1" -source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "726e4313eb6ec35d2730258ad4e15b547ee75d6afaa1361a922e78e59b7d8078" -dependencies = [ - "bitflags 2.6.0", - "cexpr", - "clang-sys", - "lazy_static", - "lazycell", - "log", - "peeking_take_while", - "prettyplease", - "proc-macro2", - "quote", - "regex", - "rustc-hash", - "shlex", - "syn 2.0.79", - "which", -] - [[package]] name = "bindgen" version = "0.70.1" @@ -171,6 +149,8 @@ dependencies = [ "cexpr", "clang-sys", "itertools", + "log", + "prettyplease", "proc-macro2", "quote", "regex", @@ -435,17 +415,6 @@ dependencies = [ "parking_lot_core", ] -[[package]] -name = "derive_more" -version = "0.99.18" -source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "5f33878137e4dafd7fa914ad4e259e18a4e8e532b9617a2d0150262bf53abfce" -dependencies = [ - "proc-macro2", - "quote", - "syn 2.0.79", -] - [[package]] name = "either" version = "1.13.0" @@ -541,9 +510,9 @@ dependencies = [ [[package]] name = "gimli" -version = "0.28.1" +version = "0.31.1" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "4271d37baee1b8c7e4b708028c57d816cf9d2434acb33a549475f78c181f6253" +checksum = "07e28edb80900c19c28f1072f2e8aeca7fa06b23cd4169cefe1af5aa3260783f" dependencies = [ "fallible-iterator", "stable_deref_trait", @@ -557,9 +526,9 @@ checksum = "d2fabcfbdc87f4758337ca535fb41a6d701b65693ce38287d856d1674551ec9b" [[package]] name = "goblin" -version = "0.7.1" +version = "0.9.2" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "f27c1b4369c2cd341b5de549380158b105a04c331be5db9110eef7b6d2742134" +checksum = "53ab3f32d1d77146981dea5d6b1e8fe31eedcb7013e5e00d6ccd1259a4b4d923" dependencies = [ "log", "plain", @@ -626,15 +595,6 @@ version = "0.4.0" source = "registry+https://github.com/rust-lang/crates.io-index" checksum = "fbf6a919d6cf397374f7dfeeea91d974c7c0a7221d0d0f4f20d859d329e53fcc" -[[package]] -name = "home" -version = "0.5.9" -source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "e3d1354bf6b7235cb4a0576c2619fd4ed18183f689b12b006a0ee7329eeff9a5" -dependencies = [ - "windows-sys 0.52.0", -] - [[package]] name = "humantime" version = "2.1.0" @@ -787,12 +747,6 @@ version = "1.5.0" source = "registry+https://github.com/rust-lang/crates.io-index" checksum = "bbd2bcb4c963f2ddae06a2efc7e9f3591312473c50c6685e1f298068316e66fe" -[[package]] -name = "lazycell" -version = "1.3.0" -source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "830d08ce1d1d941e6b30645f1a0eb5643013d835ce3779a5fc208261dbe10f55" - [[package]] name = "libc" version = "0.2.159" @@ -821,7 +775,7 @@ version = "0.14.10" source = "registry+https://github.com/rust-lang/crates.io-index" checksum = "e78a09b56be5adbcad5aa1197371688dc6bb249a26da3bca2011ee2fb987ebfb" dependencies = [ - "bindgen 0.70.1", + "bindgen", "errno", "libc", ] @@ -893,25 +847,6 @@ version = "2.7.4" source = "registry+https://github.com/rust-lang/crates.io-index" checksum = "78ca9ab1a0babb1e7d5695e3530886289c18cf2f87ec19a575a0abdce112e3a3" -[[package]] -name = "memmap" -version = "0.7.0" -source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "6585fd95e7bb50d6cc31e20d4cf9afb4e2ba16c5846fc76793f11218da9c475b" -dependencies = [ - "libc", - "winapi", -] - -[[package]] -name = "memmap2" -version = "0.5.10" -source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "83faa42c0a078c393f6b29d5db232d8be22776a891f8f56e5284faee4a20b327" -dependencies = [ - "libc", -] - [[package]] name = "memmap2" version = "0.9.4" @@ -997,9 +932,9 @@ checksum = "830b246a0e5f20af87141b25c173cd1b609bd7779a4617d6ec582abaf90870f3" [[package]] name = "object" -version = "0.32.2" +version = "0.36.5" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "a6a622008b6e321afc04970976f62ee297fdbaa6f95318ca343e3eebb9648441" +checksum = "aedf0a2d09c573ed1d8d85b30c119153926a2b36dce0ab28322c09a117a4683e" dependencies = [ "flate2", "memchr", @@ -1031,12 +966,6 @@ dependencies = [ "windows-targets 0.52.6", ] -[[package]] -name = "peeking_take_while" -version = "0.1.2" -source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "19b17cddbe7ec3f8bc800887bab5e717348c95ea2ca0b1bf0837fb964dc67099" - [[package]] name = "plain" version = "0.2.3" @@ -1103,12 +1032,12 @@ dependencies = [ [[package]] name = "proc-maps" -version = "0.3.2" +version = "0.4.0" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "0ec8fdc22cb95c02f6a26a91fb1cd60a7a115916c2ed3b09d0a312e11785bd57" +checksum = "3db44c5aa60e193a25fcd93bb9ed27423827e8f118897866f946e2cf936c44fb" dependencies = [ "anyhow", - "bindgen 0.68.1", + "bindgen", "libc", "libproc", "mach2", @@ -1134,7 +1063,7 @@ dependencies = [ "libc", "log", "lru", - "memmap2 0.9.4", + "memmap2", "proc-maps", "py-spy-testdata", "rand", @@ -1265,11 +1194,12 @@ checksum = "2b15c43186be67a4fd63bee50d0303afffcef381492ebe2c5d87f324e1b8815c" [[package]] name = "remoteprocess" -version = "0.4.13" +version = "0.5.0" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "8928e7901c7fc6f1f8d697d77a9da0f749f96454714a8d097662531640647409" +checksum = "e6194770c7afc1d2ca42acde19267938eb7d52ccb5b727f1a2eafa8d4d00ff20" dependencies = [ "addr2line", + "cfg-if", "goblin", "lazy_static", "libc", @@ -1277,7 +1207,7 @@ dependencies = [ "log", "mach", "mach_o_sys", - "memmap", + "memmap2", "nix 0.26.4", "object", "proc-maps", @@ -1336,12 +1266,10 @@ dependencies = [ [[package]] name = "ruzstd" -version = "0.5.0" +version = "0.7.2" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "58c4eb8a81997cf040a091d1f7e1938aeab6749d3a0dfa73af43cdc32393483d" +checksum = "99c3938e133aac070997ddc684d4b393777d293ba170f2988c8fd5ea2ad4ce21" dependencies = [ - "byteorder", - "derive_more", "twox-hash", ] @@ -1359,18 +1287,18 @@ checksum = "94143f37725109f92c262ed2cf5e59bce7498c01bcc1502d7b9afe439a4e9f49" [[package]] name = "scroll" -version = "0.11.0" +version = "0.12.0" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "04c565b551bafbef4157586fa379538366e4385d42082f255bfd96e4fe8519da" +checksum = "6ab8598aa408498679922eff7fa985c25d58a90771bd6be794434c5277eab1a6" dependencies = [ "scroll_derive", ] [[package]] name = "scroll_derive" -version = "0.11.1" +version = "0.12.0" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "1db149f81d46d2deba7cd3c50772474707729550221e69588478ebf9ada425ae" +checksum = "7f81c2fde025af7e69b1d1420531c8a8811ca898919db177141a85313b1cb932" dependencies = [ "proc-macro2", "quote", @@ -1533,6 +1461,12 @@ dependencies = [ "static_assertions", ] +[[package]] +name = "typed-arena" +version = "2.0.2" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "6af6ae20167a9ece4bcb41af5b80f8a1f1df981f6391189ce00fd257af04126a" + [[package]] name = "unicode-ident" version = "1.0.13" @@ -1618,18 +1552,6 @@ version = "0.2.95" source = "registry+https://github.com/rust-lang/crates.io-index" checksum = "65fc09f10666a9f147042251e0dda9c18f166ff7de300607007e96bdebc1068d" -[[package]] -name = "which" -version = "4.4.2" -source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "87ba24419a2078cd2b0f2ede2691b6c66d8e47836da3b6db8265ebad47afbfc7" -dependencies = [ - "either", - "home", - "once_cell", - "rustix 0.38.37", -] - [[package]] name = "winapi" version = "0.3.9" diff --git a/Cargo.toml b/Cargo.toml index 388dbd9e..187464fb 100644 --- a/Cargo.toml +++ b/Cargo.toml @@ -22,15 +22,15 @@ console = "0.15" ctrlc = "3" indicatif = "0.17" env_logger = "0.10" -goblin = "0.7.1" -inferno = "0.11.17" +goblin = "0.9.2" +inferno = "0.11.21" lazy_static = "1.4.0" libc = "0.2" log = "0.4" lru = "0.10" regex = ">=1.6.0" tempfile = "3.6.0" -proc-maps = "0.3.2" +proc-maps = "0.4.0" memmap2 = "0.9.4" cpp_demangle = "0.4" serde = {version="1.0", features=["rc"]} @@ -38,7 +38,7 @@ serde_derive = "1.0" serde_json = "1.0" rand = "0.8" rand_distr = "0.4" -remoteprocess = {version="0.4.12", features=["unwind"]} +remoteprocess = {version="0.5.0", features=["unwind"]} chrono = "0.4.26" [dev-dependencies] From 114e6981d0f7263019c16d7d477e5e13b6f8b56a Mon Sep 17 00:00:00 2001 From: Ben Frederickson Date: Wed, 30 Oct 2024 13:33:04 -0700 Subject: [PATCH 3/3] Detect GIL on python 3.12 (#713) Use the InterpreterState._gil member to figure out both if the gil is locked, and if so which thread is holding the GIL --- src/coredump.rs | 3 ++- src/python_interpreters.rs | 18 ++++++++++++++---- src/python_process_info.rs | 12 +++++++++++- src/python_spy.rs | 16 +++++++++------- src/stack_trace.rs | 6 +++++- src/utils.rs | 4 ++++ 6 files changed, 45 insertions(+), 14 deletions(-) diff --git a/src/coredump.rs b/src/coredump.rs index 7df1e010..e0118437 100644 --- a/src/coredump.rs +++ b/src/coredump.rs @@ -246,7 +246,8 @@ impl PythonCoreDump { // lets us figure out which thread has the GIL let config = Config::default(); - let threadstate_address = get_threadstate_address(&python_info, &version, &config)?; + let threadstate_address = + get_threadstate_address(interpreter_address, &python_info, &version, &config)?; info!("found threadstate at 0x{:016x}", threadstate_address); Ok(PythonCoreDump { diff --git a/src/python_interpreters.rs b/src/python_interpreters.rs index 609ca7ba..bd055791 100644 --- a/src/python_interpreters.rs +++ b/src/python_interpreters.rs @@ -14,6 +14,7 @@ This means we can't dereference them directly. use crate::python_bindings::{ v2_7_15, v3_10_0, v3_11_0, v3_12_0, v3_3_7, v3_5_5, v3_6_6, v3_7_0, v3_8_0, v3_9_5, }; +use crate::utils::offset_of; pub trait InterpreterState { type ThreadState: ThreadState; @@ -22,6 +23,7 @@ pub trait InterpreterState { type ListObject: ListObject; type TupleObject: TupleObject; fn head(&self) -> *mut Self::ThreadState; + fn gil_locked(&self) -> Option; fn modules(&self) -> *mut Self::Object; } @@ -100,10 +102,6 @@ pub trait TypeObject { fn flags(&self) -> usize; } -fn offset_of(object: *const T, member: *const M) -> usize { - member as usize - object as usize -} - /// This macro provides a common impl for PyThreadState/PyFrameObject/PyCodeObject traits /// (this code is identical across python versions, we are only abstracting the struct layouts here). /// String handling changes substantially between python versions, and is handled separately. @@ -115,9 +113,13 @@ macro_rules! PythonCommonImpl { type StringObject = $py::$stringobject; type ListObject = $py::PyListObject; type TupleObject = $py::PyTupleObject; + fn head(&self) -> *mut Self::ThreadState { self.tstate_head } + fn gil_locked(&self) -> Option { + None + } fn modules(&self) -> *mut Self::Object { self.modules } @@ -415,9 +417,14 @@ impl InterpreterState for v3_12_0::PyInterpreterState { type StringObject = v3_12_0::PyUnicodeObject; type ListObject = v3_12_0::PyListObject; type TupleObject = v3_12_0::PyTupleObject; + fn head(&self) -> *mut Self::ThreadState { self.threads.head } + fn gil_locked(&self) -> Option { + Some(self._gil.locked._value != 0) + } + fn modules(&self) -> *mut Self::Object { self.imports.modules } @@ -506,6 +513,9 @@ impl InterpreterState for v3_11_0::PyInterpreterState { fn head(&self) -> *mut Self::ThreadState { self.threads.head } + fn gil_locked(&self) -> Option { + None + } fn modules(&self) -> *mut Self::Object { self.modules } diff --git a/src/python_process_info.rs b/src/python_process_info.rs index 2270556c..5ecb4cc2 100644 --- a/src/python_process_info.rs +++ b/src/python_process_info.rs @@ -529,6 +529,7 @@ where } pub fn get_threadstate_address( + interpreter_address: usize, python_info: &PythonProcessInfo, version: &Version, config: &Config, @@ -536,7 +537,16 @@ pub fn get_threadstate_address( let threadstate_address = match version { Version { major: 3, - minor: 7..=12, + minor: 12, + .. + } => { + let interp: v3_12_0::_is = Default::default(); + let offset = crate::utils::offset_of(&interp, &interp._gil.last_holder._value); + interpreter_address + offset + } + Version { + major: 3, + minor: 7..=11, .. } => match python_info.get_symbol("_PyRuntime") { Some(&addr) => { diff --git a/src/python_spy.rs b/src/python_spy.rs index 531616ab..40361577 100644 --- a/src/python_spy.rs +++ b/src/python_spy.rs @@ -62,7 +62,8 @@ impl PythonSpy { info!("Found interpreter at 0x{:016x}", interpreter_address); // lets us figure out which thread has the GIL - let threadstate_address = get_threadstate_address(&python_info, &version, config)?; + let threadstate_address = + get_threadstate_address(interpreter_address, &python_info, &version, config)?; #[cfg(feature = "unwind")] let native = if config.native { @@ -206,18 +207,19 @@ impl PythonSpy { None }; - // TODO: hoist most of this code out to stack_trace.rs, and - // then annotate the output of that with things like native stack traces etc - // have moved in gil / locals etc - let gil_thread_id = - get_gil_threadid::(self.threadstate_address, &self.process)?; - // Get the python interpreter, and loop over all the python threads let interp: I = self .process .copy_struct(self.interpreter_address) .context("Failed to copy PyInterpreterState from process")?; + // get the threadid of the gil if appropriate + let gil_thread_id = if interp.gil_locked().unwrap_or(true) { + get_gil_threadid::(self.threadstate_address, &self.process)? + } else { + 0 + }; + let mut traces = Vec::new(); let mut threads = interp.head(); while !threads.is_null() { diff --git a/src/stack_trace.rs b/src/stack_trace.rs index dce648e9..27d44a96 100644 --- a/src/stack_trace.rs +++ b/src/stack_trace.rs @@ -77,7 +77,11 @@ where I: InterpreterState, P: ProcessMemory, { - let gil_thread_id = get_gil_threadid::(threadstate_address, process)?; + let gil_thread_id = if interpreter.gil_locked().unwrap_or(true) { + get_gil_threadid::(threadstate_address, process)? + } else { + 0 + }; let mut ret = Vec::new(); let mut threads = interpreter.head(); diff --git a/src/utils.rs b/src/utils.rs index 2ca1374f..a354f151 100644 --- a/src/utils.rs +++ b/src/utils.rs @@ -20,3 +20,7 @@ pub fn resolve_filename(filename: &str, modulename: &str) -> Option { None } + +pub fn offset_of(object: *const T, member: *const M) -> usize { + member as usize - object as usize +}