diff --git a/.vscode/settings.json b/.vscode/settings.json
new file mode 100644
index 000000000..1b5f3234a
--- /dev/null
+++ b/.vscode/settings.json
@@ -0,0 +1,7 @@
+{
+    "[rust]": {
+        "editor.defaultFormatter": "rust-lang.rust-analyzer",
+        "editor.formatOnSave": true,
+    },
+    "rust-analyzer.cargo.features": "all",
+}
\ No newline at end of file
diff --git a/Cargo.toml b/Cargo.toml
index ec359edd3..49f3716f2 100644
--- a/Cargo.toml
+++ b/Cargo.toml
@@ -23,6 +23,7 @@ num-integer = "0.1"
 num-traits = "0.2"
 ndarray = ">= 0.15, < 0.17"
 pyo3 = { version = "0.25.0", default-features = false, features = ["macros"] }
+rand_core = { version = "0.9.3", default-features = false, optional = true }
 rustc-hash = "2.0"
 
 [dev-dependencies]
@@ -32,6 +33,7 @@ pyo3 = { version = "0.25", default-features = false, features = [
 nalgebra = { version = ">=0.30, <0.34", default-features = false, features = [
     "std",
 ] }
+rand = { version = "0.9.1", default-features = false }
 
 [build-dependencies]
 pyo3-build-config = { version = "0.25", features = ["resolve-config"] }
diff --git a/examples/simple/src/lib.rs b/examples/simple/src/lib.rs
index 3bb29e3e1..b9cb28907 100644
--- a/examples/simple/src/lib.rs
+++ b/examples/simple/src/lib.rs
@@ -113,7 +113,7 @@ fn rust_ext<'py>(m: &Bound<'py, PyModule>) -> PyResult<()> {
     // This crate follows a strongly-typed approach to wrapping NumPy arrays
     // while Python API are often expected to work with multiple element types.
     //
-    // That kind of limited polymorphis can be recovered by accepting an enumerated type
+    // That kind of limited polymorphism can be recovered by accepting an enumerated type
     // covering the supported element types and dispatching into a generic implementation.
     #[derive(FromPyObject)]
     enum SupportedArray<'py> {
diff --git a/src/lib.rs b/src/lib.rs
index 195465022..219f7efe1 100644
--- a/src/lib.rs
+++ b/src/lib.rs
@@ -79,6 +79,7 @@ pub mod datetime;
 mod dtype;
 mod error;
 pub mod npyffi;
+pub mod random;
 mod slice_container;
 mod strings;
 mod sum_products;
diff --git a/src/npyffi/mod.rs b/src/npyffi/mod.rs
index bf846f8e2..efd214a80 100644
--- a/src/npyffi/mod.rs
+++ b/src/npyffi/mod.rs
@@ -94,11 +94,13 @@ macro_rules! impl_api {
 pub mod array;
 pub mod flags;
 pub mod objects;
+pub mod random;
 pub mod types;
 pub mod ufunc;
 
 pub use self::array::*;
 pub use self::flags::*;
 pub use self::objects::*;
+pub use self::random::*;
 pub use self::types::*;
 pub use self::ufunc::*;
diff --git a/src/npyffi/objects.rs b/src/npyffi/objects.rs
index d28e88b7e..5a00539fa 100644
--- a/src/npyffi/objects.rs
+++ b/src/npyffi/objects.rs
@@ -1,4 +1,4 @@
-//! Low-Lebel binding for NumPy C API C-objects
+//! Low-Level binding for NumPy C API C-objects
 //!
 //! <https://numpy.org/doc/stable/reference/c-api/types-and-structures.html>
 #![allow(non_camel_case_types)]
diff --git a/src/npyffi/random.rs b/src/npyffi/random.rs
new file mode 100644
index 000000000..e618768aa
--- /dev/null
+++ b/src/npyffi/random.rs
@@ -0,0 +1,11 @@
+use std::ffi::c_void;
+
+#[repr(C)]
+#[derive(Debug)]
+pub struct bitgen_t {
+    pub state: *mut c_void,
+    pub next_uint64: unsafe extern "C" fn(*mut c_void) -> super::npy_uint64, //nogil
+    pub next_uint32: unsafe extern "C" fn(*mut c_void) -> super::npy_uint32, //nogil
+    pub next_double: unsafe extern "C" fn(*mut c_void) -> libc::c_double,    //nogil
+    pub next_raw: unsafe extern "C" fn(*mut c_void) -> super::npy_uint64,    //nogil
+}
diff --git a/src/random.rs b/src/random.rs
new file mode 100644
index 000000000..db0012a24
--- /dev/null
+++ b/src/random.rs
@@ -0,0 +1,317 @@
+//! Safe interface for NumPy's random [`BitGenerator`][bg].
+//!
+//! Using the patterns described in [“Extending `numpy.random`”][ext],
+//! you can generate random numbers without holding the GIL,
+//! by [acquiring][`PyBitGeneratorMethods::lock`] a lock [guard][`PyBitGeneratorGuard`] for the [`PyBitGenerator`]:
+//!
+//! ```
+//! use pyo3::prelude::*;
+//! use numpy::random::{PyBitGenerator, PyBitGeneratorMethods as _};
+//!
+//! fn default_bit_gen<'py>(py: Python<'py>) -> PyResult<Bound<'py, PyBitGenerator>> {
+//!     let default_rng = py.import("numpy.random")?.call_method0("default_rng")?;
+//!     let bit_generator = default_rng.getattr("bit_generator")?.downcast_into()?;
+//!     Ok(bit_generator)
+//! }
+//!
+//! let random_number = Python::with_gil(|py| -> PyResult<_> {
+//!     let mut bitgen = default_bit_gen(py)?.lock()?;
+//!     // use bitgen without holding the GIL
+//!     let r = py.allow_threads(|| bitgen.next_u64());
+//!     // release the lock manually while holding the GIL again
+//!     bitgen.release(py)?;
+//!     Ok(r)
+//! })?;
+//! # Ok::<(), PyErr>(())
+//! ```
+//!
+//! With the [`rand`] crate installed, you can also use the [`rand::Rng`] APIs from the [`PyBitGeneratorGuard`]:
+//!
+//! ```
+//! # use pyo3::prelude::*;
+//! use rand::Rng as _;
+//! # use numpy::random::{PyBitGenerator, PyBitGeneratorMethods as _};
+//! # // TODO: reuse function definition from above?
+//! # fn default_bit_gen<'py>(py: Python<'py>) -> PyResult<Bound<'py, PyBitGenerator>> {
+//! #     let default_rng = py.import("numpy.random")?.call_method0("default_rng")?;
+//! #     let bit_generator = default_rng.getattr("bit_generator")?.downcast_into()?;
+//! #     Ok(bit_generator)
+//! # }
+//!
+//! Python::with_gil(|py| -> PyResult<_> {
+//!     let mut bitgen = default_bit_gen(py)?.lock()?;
+//!     if bitgen.random_ratio(1, 1_000_000) {
+//!         println!("a sure thing");
+//!     }
+//!     bitgen.release(py)?;
+//!     Ok(())
+//! })?;
+//! # Ok::<(), PyErr>(())
+//! ```
+//!
+//! [bg]: https://numpy.org/doc/stable//reference/random/bit_generators/generated/numpy.random.BitGenerator.html
+//! [ext]: https://numpy.org/doc/stable/reference/random/extending.html
+
+use std::ptr::NonNull;
+
+use pyo3::{
+    exceptions::PyRuntimeError,
+    ffi, intern,
+    prelude::*,
+    sync::GILOnceCell,
+    types::{DerefToPyAny, PyCapsule, PyType},
+    PyTypeInfo,
+};
+
+use crate::npyffi::bitgen_t;
+
+/// Wrapper for [`np.random.BitGenerator`][bg].
+///
+/// See also [`PyBitGeneratorMethods`].
+///
+/// [bg]: https://numpy.org/doc/stable//reference/random/bit_generators/generated/numpy.random.BitGenerator.html
+#[repr(transparent)]
+pub struct PyBitGenerator(PyAny);
+
+impl DerefToPyAny for PyBitGenerator {}
+
+unsafe impl PyTypeInfo for PyBitGenerator {
+    const NAME: &'static str = "PyBitGenerator";
+    const MODULE: Option<&'static str> = Some("numpy.random");
+
+    fn type_object_raw<'py>(py: Python<'py>) -> *mut ffi::PyTypeObject {
+        static CLS: GILOnceCell<Py<PyType>> = GILOnceCell::new();
+        let cls = CLS
+            .import(py, "numpy.random", "BitGenerator")
+            .expect("Failed to get BitGenerator type object");
+        cls.as_type_ptr()
+    }
+}
+
+/// Methods for [`PyBitGenerator`].
+pub trait PyBitGeneratorMethods {
+    /// Acquire a lock on the BitGenerator to allow calling its methods in.
+    fn lock(&self) -> PyResult<PyBitGeneratorGuard>;
+}
+
+impl<'py> PyBitGeneratorMethods for Bound<'py, PyBitGenerator> {
+    fn lock(&self) -> PyResult<PyBitGeneratorGuard> {
+        let py = self.py();
+        let capsule = self
+            .getattr(intern!(py, "capsule"))?
+            .downcast_into::<PyCapsule>()?;
+        assert_eq!(capsule.name()?, Some(ffi::c_str!("BitGenerator")));
+        let lock = self.getattr(intern!(py, "lock"))?;
+        // Acquire the lock in non-blocking mode or return an error
+        if !lock
+            .call_method(intern!(py, "acquire"), (false,), None)?
+            .extract()?
+        {
+            return Err(PyRuntimeError::new_err(
+                "Failed to acquire BitGenerator lock",
+            ));
+        }
+        // Return the guard or release the lock if the capsule is invalid
+        let ptr = capsule.pointer() as *mut bitgen_t;
+        let non_null = match NonNull::new(ptr) {
+            Some(non_null) => non_null,
+            None => {
+                lock.call_method0(intern!(py, "release"))?;
+                return Err(PyRuntimeError::new_err("Invalid BitGenerator capsule"));
+            }
+        };
+        Ok(PyBitGeneratorGuard {
+            raw_bitgen: non_null,
+            released: false,
+            _capsule: capsule.unbind(),
+            lock: lock.unbind(),
+        })
+    }
+}
+
+impl<'py> TryFrom<&Bound<'py, PyBitGenerator>> for PyBitGeneratorGuard {
+    type Error = PyErr;
+    fn try_from(value: &Bound<'py, PyBitGenerator>) -> Result<Self, Self::Error> {
+        value.lock()
+    }
+}
+
+/// [`PyBitGenerator`] lock allowing to access its methods without holding the GIL.
+///
+/// Since [dropping](`Drop::drop`) this acquires the GIL,
+/// prefer to call [`release`][`PyBitGeneratorGuard::release`] manually to release the lock.
+pub struct PyBitGeneratorGuard {
+    raw_bitgen: NonNull<bitgen_t>,
+    /// Whether this guard has been manually released.
+    released: bool,
+    /// This field makes sure the `raw_bitgen` inside the capsule doesn’t get deallocated.
+    _capsule: Py<PyCapsule>,
+    /// This lock makes sure no other threads try to use the BitGenerator while we do.
+    lock: Py<PyAny>,
+}
+
+// SAFETY: 1. We don’t hold the GIL, so we can’t access the Python objects.
+//         2. We only access `raw_bitgen` from `&mut self`, which protects it from parallel access.
+unsafe impl Send for PyBitGeneratorGuard {}
+
+impl Drop for PyBitGeneratorGuard {
+    fn drop(&mut self) {
+        if self.released {
+            return;
+        }
+        // ignore errors because `drop` can’t fail
+        let _ = Python::with_gil(|py| -> PyResult<_> {
+            self.lock.bind(py).call_method0(intern!(py, "release"))?;
+            Ok(())
+        });
+    }
+}
+
+// SAFETY: 1. We hold the `BitGenerator.lock`, so nothing apart from us is allowed to change its state.
+//         2. We hold the `BitGenerator.capsule`, so it can’t be deallocated.
+impl<'py> PyBitGeneratorGuard {
+    /// Release the lock, allowing for checking for errors.
+    pub fn release(mut self, py: Python<'py>) -> PyResult<()> {
+        self.released = true; // only ever read by drop at the end of a scope (like this one).
+        self.lock.bind(py).call_method0(intern!(py, "release"))?;
+        Ok(())
+    }
+
+    /// Returns the next random unsigned 64 bit integer.
+    pub fn next_u64(&mut self) -> u64 {
+        unsafe {
+            let bitgen = self.raw_bitgen.as_ptr();
+            debug_assert_ne!((*bitgen).state, std::ptr::null_mut());
+            ((*bitgen).next_uint64)((*bitgen).state)
+        }
+    }
+    /// Returns the next random unsigned 32 bit integer.
+    pub fn next_u32(&mut self) -> u32 {
+        unsafe {
+            let bitgen = self.raw_bitgen.as_ptr();
+            debug_assert_ne!((*bitgen).state, std::ptr::null_mut());
+            ((*bitgen).next_uint32)((*bitgen).state)
+        }
+    }
+    /// Returns the next random double.
+    pub fn next_double(&mut self) -> f64 {
+        unsafe {
+            let bitgen = self.raw_bitgen.as_ptr();
+            debug_assert_ne!((*bitgen).state, std::ptr::null_mut());
+            ((*bitgen).next_double)((*bitgen).state)
+        }
+    }
+    /// Returns the next raw value (can be used for testing).
+    pub fn next_raw(&mut self) -> u64 {
+        unsafe {
+            let bitgen = self.raw_bitgen.as_ptr();
+            debug_assert_ne!((*bitgen).state, std::ptr::null_mut());
+            ((*bitgen).next_raw)((*bitgen).state)
+        }
+    }
+}
+
+#[cfg(feature = "rand_core")]
+impl rand_core::RngCore for PyBitGeneratorGuard {
+    fn next_u32(&mut self) -> u32 {
+        PyBitGeneratorGuard::next_u32(self)
+    }
+    fn next_u64(&mut self) -> u64 {
+        PyBitGeneratorGuard::next_u64(self)
+    }
+    fn fill_bytes(&mut self, dst: &mut [u8]) {
+        rand_core::impls::fill_bytes_via_next(self, dst)
+    }
+}
+
+#[cfg(test)]
+mod tests {
+    use super::*;
+
+    fn get_bit_generator<'py>(py: Python<'py>) -> PyResult<Bound<'py, PyBitGenerator>> {
+        let default_rng = py.import("numpy.random")?.call_method0("default_rng")?;
+        let bit_generator = default_rng
+            .getattr("bit_generator")?
+            .downcast_into::<PyBitGenerator>()?;
+        Ok(bit_generator)
+    }
+
+    /// Test the primary use case: acquire the lock, release the GIL, then use the lock
+    #[test]
+    fn use_outside_gil() -> PyResult<()> {
+        Python::with_gil(|py| {
+            let mut bitgen = get_bit_generator(py)?.lock()?;
+            py.allow_threads(|| {
+                let _ = bitgen.next_raw();
+            });
+            assert!(bitgen.release(py).is_ok());
+            Ok(())
+        })
+    }
+
+    /// More complex version of primary use case: use from multiple threads
+    #[cfg(feature = "rand_core")]
+    #[test]
+    fn use_parallel() -> PyResult<()> {
+        use crate::array::{PyArray2, PyArrayMethods as _};
+        use ndarray::Dimension;
+        use rand::Rng;
+        use std::sync::{Arc, Mutex};
+
+        Python::with_gil(|py| -> PyResult<_> {
+            let mut arr = PyArray2::<u32>::zeros(py, (2, 300), false).readwrite();
+            let bitgen = get_bit_generator(py)?.lock()?;
+            let bitgen = Arc::new(Mutex::new(bitgen));
+
+            let (_n_threads, chunk_size) = arr.dims().into_pattern();
+            let slice = arr.as_slice_mut()?;
+
+            py.allow_threads(|| {
+                std::thread::scope(|s| {
+                    for chunk in slice.chunks_exact_mut(chunk_size) {
+                        let bitgen = Arc::clone(&bitgen);
+                        s.spawn(move || {
+                            let mut bitgen = bitgen.lock().unwrap();
+                            chunk.fill_with(|| bitgen.random_range(10..200));
+                        });
+                    }
+                })
+            });
+
+            Arc::into_inner(bitgen)
+                .unwrap()
+                .into_inner()
+                .unwrap()
+                .release(py)?;
+            Ok(())
+        })
+    }
+
+    /// Test that the `rand::Rng` APIs work
+    #[cfg(feature = "rand_core")]
+    #[test]
+    fn rand() -> PyResult<()> {
+        use rand::Rng as _;
+
+        Python::with_gil(|py| {
+            let mut bitgen = get_bit_generator(py)?.lock()?;
+            py.allow_threads(|| {
+                assert!(bitgen.random_ratio(1, 1));
+                assert!(!bitgen.random_ratio(0, 1));
+            });
+            assert!(bitgen.release(py).is_ok());
+            Ok(())
+        })
+    }
+
+    #[test]
+    fn double_lock_fails() -> PyResult<()> {
+        Python::with_gil(|py| {
+            let generator = get_bit_generator(py)?;
+            let bitgen = generator.lock()?;
+            assert!(generator.lock().is_err());
+            assert!(bitgen.release(py).is_ok());
+            Ok(())
+        })
+    }
+}