2021-06-30 10:03:53 +00:00
|
|
|
//! A write-once cell mediated by the Python GIL.
|
2022-06-01 08:07:00 +00:00
|
|
|
use crate::{types::PyString, Py, Python};
|
2020-06-14 15:29:40 +00:00
|
|
|
use std::cell::UnsafeCell;
|
|
|
|
|
|
|
|
/// A cell that can be written at most once, modelled on
/// [`once_cell::OnceCell`](https://docs.rs/once_cell/1.4.0/once_cell/).
///
/// Where `once_cell::sync` achieves thread safety by blocking threads, this type relies on the
/// Python GIL to mediate concurrent access. That makes it a good fit for situations in which the
/// synchronization strategy of `once_cell` or `lazy_static` can deadlock when interacting with
/// the Python GIL. For an example, see [the FAQ section](https://pyo3.rs/latest/faq.html) of the
/// guide.
///
/// # Examples
///
/// The following example uses a `GILOnceCell` to share a reference to a Python list between
/// threads:
///
/// ```
/// use pyo3::once_cell::GILOnceCell;
/// use pyo3::prelude::*;
/// use pyo3::types::PyList;
///
/// static LIST_CELL: GILOnceCell<Py<PyList>> = GILOnceCell::new();
///
/// pub fn get_shared_list(py: Python<'_>) -> &PyList {
///     LIST_CELL
///         .get_or_init(py, || PyList::empty(py).into())
///         .as_ref(py)
/// }
/// # Python::with_gil(|py| assert_eq!(get_shared_list(py).len(), 0));
/// ```
pub struct GILOnceCell<T>(UnsafeCell<Option<T>>);
|
|
|
|
|
|
|
|
// T: Send is needed for Sync because the thread which drops the GILOnceCell can be different
|
|
|
|
// to the thread which fills it.
|
|
|
|
unsafe impl<T: Send + Sync> Sync for GILOnceCell<T> {}
|
|
|
|
unsafe impl<T: Send> Send for GILOnceCell<T> {}
|
|
|
|
|
|
|
|
impl<T> GILOnceCell<T> {
|
|
|
|
/// Create a `GILOnceCell` which does not yet contain a value.
|
|
|
|
pub const fn new() -> Self {
|
|
|
|
Self(UnsafeCell::new(None))
|
|
|
|
}
|
|
|
|
|
|
|
|
/// Get a reference to the contained value, or `None` if the cell has not yet been written.
|
2022-04-03 14:21:37 +00:00
|
|
|
#[inline]
|
2022-03-23 07:07:28 +00:00
|
|
|
pub fn get(&self, _py: Python<'_>) -> Option<&T> {
|
2020-06-14 15:29:40 +00:00
|
|
|
// Safe because if the cell has not yet been written, None is returned.
|
|
|
|
unsafe { &*self.0.get() }.as_ref()
|
|
|
|
}
|
|
|
|
|
|
|
|
/// Get a reference to the contained value, initializing it if needed using the provided
|
|
|
|
/// closure.
|
|
|
|
///
|
|
|
|
/// Note that:
|
|
|
|
/// 1) reentrant initialization can cause a stack overflow.
|
|
|
|
/// 2) if f() temporarily releases the GIL (e.g. by calling `Python::import`) then it is
|
|
|
|
/// possible (and well-defined) that a second thread may also call get_or_init and begin
|
|
|
|
/// calling `f()`. Even when this happens `GILOnceCell` guarantees that only **one** write
|
|
|
|
/// to the cell ever occurs - other threads will simply discard the value they compute and
|
|
|
|
/// return the result of the first complete computation.
|
2020-06-22 21:13:23 +00:00
|
|
|
/// 3) if f() does not release the GIL and does not panic, it is guaranteed to be called
|
|
|
|
/// exactly once, even if multiple threads attempt to call `get_or_init`
|
|
|
|
/// 4) if f() can panic but still does not release the GIL, it may be called multiple times,
|
|
|
|
/// but it is guaranteed that f() will never be called concurrently
|
2022-04-03 14:21:37 +00:00
|
|
|
#[inline]
|
2022-03-23 07:07:28 +00:00
|
|
|
pub fn get_or_init<F>(&self, py: Python<'_>, f: F) -> &T
|
2020-06-14 15:29:40 +00:00
|
|
|
where
|
|
|
|
F: FnOnce() -> T,
|
|
|
|
{
|
2022-04-03 14:21:37 +00:00
|
|
|
if let Some(value) = self.get(py) {
|
2020-06-14 15:29:40 +00:00
|
|
|
return value;
|
|
|
|
}
|
|
|
|
|
2022-04-03 14:21:37 +00:00
|
|
|
self.init(py, f)
|
|
|
|
}
|
|
|
|
|
|
|
|
#[cold]
|
|
|
|
fn init<F>(&self, py: Python<'_>, f: F) -> &T
|
|
|
|
where
|
|
|
|
F: FnOnce() -> T,
|
|
|
|
{
|
2020-06-14 15:29:40 +00:00
|
|
|
// Note that f() could temporarily release the GIL, so it's possible that another thread
|
|
|
|
// writes to this GILOnceCell before f() finishes. That's fine; we'll just have to discard
|
|
|
|
// the value computed here and accept a bit of wasted computation.
|
|
|
|
let value = f();
|
|
|
|
let _ = self.set(py, value);
|
|
|
|
|
|
|
|
self.get(py).unwrap()
|
|
|
|
}
|
|
|
|
|
|
|
|
/// Get the contents of the cell mutably. This is only possible if the reference to the cell is
|
|
|
|
/// unique.
|
|
|
|
pub fn get_mut(&mut self) -> Option<&mut T> {
|
|
|
|
// Safe because we have &mut self
|
|
|
|
unsafe { &mut *self.0.get() }.as_mut()
|
|
|
|
}
|
|
|
|
|
|
|
|
/// Set the value in the cell.
|
|
|
|
///
|
|
|
|
/// If the cell has already been written, `Err(value)` will be returned containing the new
|
|
|
|
/// value which was not written.
|
2022-03-23 07:07:28 +00:00
|
|
|
pub fn set(&self, _py: Python<'_>, value: T) -> Result<(), T> {
|
2020-06-14 15:29:40 +00:00
|
|
|
// Safe because GIL is held, so no other thread can be writing to this cell concurrently.
|
|
|
|
let inner = unsafe { &mut *self.0.get() };
|
|
|
|
if inner.is_some() {
|
|
|
|
return Err(value);
|
|
|
|
}
|
|
|
|
|
|
|
|
*inner = Some(value);
|
|
|
|
Ok(())
|
|
|
|
}
|
|
|
|
}
|
2022-04-03 10:27:34 +00:00
|
|
|
|
2022-04-03 18:58:51 +00:00
|
|
|
/// Interns `text` as a Python string and stores a reference to it in static storage.
///
/// A reference to the same Python string is returned on each invocation.
///
/// `text` is used to initialize a `static`, so it must be a constant expression evaluating to a
/// `&'static str` (for example a string literal or `stringify!(...)`). A trailing comma after
/// `text` is accepted.
///
/// # Example: Using `intern!` to avoid needlessly recreating the same Python string
///
/// ```
/// use pyo3::intern;
/// # use pyo3::{pyfunction, types::PyDict, wrap_pyfunction, PyResult, Python};
///
/// #[pyfunction]
/// fn create_dict(py: Python<'_>) -> PyResult<&PyDict> {
///     let dict = PyDict::new(py);
///     //             👇 A new `PyString` is created
///     //                for every call of this function.
///     dict.set_item("foo", 42)?;
///     Ok(dict)
/// }
///
/// #[pyfunction]
/// fn create_dict_faster(py: Python<'_>) -> PyResult<&PyDict> {
///     let dict = PyDict::new(py);
///     //               👇 A `PyString` is created once and reused
///     //                  for the lifetime of the program.
///     dict.set_item(intern!(py, "foo"), 42)?;
///     Ok(dict)
/// }
/// #
/// # Python::with_gil(|py| {
/// #     let fun_slow = wrap_pyfunction!(create_dict, py).unwrap();
/// #     let dict = fun_slow.call0().unwrap();
/// #     assert!(dict.contains("foo").unwrap());
/// #     let fun = wrap_pyfunction!(create_dict_faster, py).unwrap();
/// #     let dict = fun.call0().unwrap();
/// #     assert!(dict.contains("foo").unwrap());
/// # });
/// ```
#[macro_export]
macro_rules! intern {
    ($py: expr, $text: expr $(,)?) => {{
        // Each expansion site gets its own block-scoped static, so every distinct call site
        // caches its own interned string.
        static INTERNED: $crate::once_cell::Interned = $crate::once_cell::Interned::new($text);
        INTERNED.get($py)
    }};
}
|
2022-04-04 16:44:19 +00:00
|
|
|
|
2022-06-01 08:07:00 +00:00
|
|
|
/// Implementation detail for `intern!` macro.
|
|
|
|
#[doc(hidden)]
|
|
|
|
pub struct Interned(&'static str, GILOnceCell<Py<PyString>>);
|
|
|
|
|
|
|
|
impl Interned {
|
|
|
|
pub const fn new(value: &'static str) -> Self {
|
|
|
|
Interned(value, GILOnceCell::new())
|
|
|
|
}
|
|
|
|
|
|
|
|
#[inline]
|
|
|
|
pub fn get<'py>(&'py self, py: Python<'py>) -> &'py PyString {
|
|
|
|
self.1
|
|
|
|
.get_or_init(py, || PyString::intern(py, self.0).into())
|
|
|
|
.as_ref(py)
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2022-04-04 16:44:19 +00:00
|
|
|
#[cfg(test)]
mod tests {
    use super::*;

    use crate::types::PyDict;

    /// A key stored as a plain `&str` must be found again through strings produced by
    /// `intern!`, whether the text is a literal or comes from `stringify!`.
    #[test]
    fn test_intern() {
        Python::with_gil(|py| {
            let plain_key = "foo";
            let interned_literal = intern!(py, "foo");
            let interned_stringified = intern!(py, stringify!(foo));

            let dict = PyDict::new(py);
            dict.set_item(plain_key, 42_usize).unwrap();

            let has_key = dict.contains(interned_literal).unwrap();
            assert!(has_key);

            let stored = dict
                .get_item(interned_stringified)
                .unwrap()
                .extract::<usize>()
                .unwrap();
            assert_eq!(stored, 42);
        });
    }
}
|