Show More
@@ -1,173 +1,186 | |||
|
1 | 1 | //! This module takes care of all conversions involving `rusthg` (hg-cpython) |
|
2 | 2 | //! objects in the PyO3 call context. |
|
3 | 3 | //! |
|
4 | 4 | //! For source code clarity, we only import (`use`) [`cpython`] traits and not |
|
5 | 5 | //! any of its data objects. We are instead using full qualifiers, such as |
|
6 | 6 | //! `cpython::PyObject`, and believe that the added heaviness is an acceptatble |
|
7 | 7 | //! price to pay to avoid confusion. |
|
8 | 8 | //! |
|
9 | 9 | //! Also it, is customary in [`cpython`] to label the GIL lifetime as `'p`, |
|
10 | 10 | //! whereas it is `'py` in PyO3 context. We keep both these conventions in |
|
11 | 11 | //! the arguments side of function signatures when they are not simply elided. |
|
12 | 12 | use pyo3::exceptions::PyTypeError; |
|
13 | 13 | use pyo3::prelude::*; |
|
14 | 14 | |
|
15 | 15 | use cpython::ObjectProtocol; |
|
16 | 16 | use cpython::PythonObject; |
|
17 | 17 | use lazy_static::lazy_static; |
|
18 | 18 | |
|
19 | use hg::revlog::index::Index as CoreIndex; | |
|
19 | 20 | use rusthg::revlog::{InnerRevlog, PySharedIndex}; |
|
20 | 21 | |
|
21 | 22 | /// Force cpython's GIL handle with the appropriate lifetime |
|
22 | 23 | /// |
|
23 | 24 | /// In `pyo3`, the fact that we have the GIL is expressed by the lifetime of |
|
24 | 25 | /// the incoming [`Bound`] smart pointer. We therefore simply instantiate |
|
25 | 26 | /// the `cpython` handle and coerce its lifetime by the function signature. |
|
26 | 27 | /// |
|
27 | 28 | /// Reacquiring the GIL is also a possible alternative, as the CPython |
|
28 | 29 | /// documentation explicitely states that "recursive calls are allowed" |
|
29 | 30 | /// (we interpret that as saying that acquiring the GIL within a thread that |
|
30 | 31 | /// already has it works) *as long as it is properly released* |
|
31 | 32 | /// reference: |
|
32 | 33 | /// <https://docs.python.org/3.8/c-api/init.html#c.PyGILState_Ensure> |
|
33 | 34 | pub(crate) fn cpython_handle<'py, T>( |
|
34 | 35 | _bound: &Bound<'py, T>, |
|
35 | 36 | ) -> cpython::Python<'py> { |
|
36 | 37 | // safety: this is safe because the returned object has the 'py lifetime |
|
37 | 38 | unsafe { cpython::Python::assume_gil_acquired() } |
|
38 | 39 | } |
|
39 | 40 | |
|
40 | 41 | /// Force PyO3 GIL handle from cpython's. |
|
41 | 42 | /// |
|
42 | 43 | /// Very similar to [`cpython_handle`] |
|
43 | 44 | pub fn pyo3_handle(_py: cpython::Python<'_>) -> Python<'_> { |
|
44 | 45 | // safety: this is safe because the returned object has the same lifetime |
|
45 | 46 | // as the incoming object. |
|
46 | 47 | unsafe { Python::assume_gil_acquired() } |
|
47 | 48 | } |
|
48 | 49 | |
|
49 | 50 | /// Convert a PyO3 [`PyObject`] into a [`cpython::PyObject`] |
|
50 | 51 | /// |
|
51 | 52 | /// During this process, the reference count is increased, then decreased. |
|
52 | 53 | /// This means that the GIL (symbolized by the lifetime on the `obj` |
|
53 | 54 | /// argument) is needed. |
|
54 | 55 | /// |
|
55 | 56 | /// We could make something perhaps more handy by simply stealing the |
|
56 | 57 | /// pointer, forgetting the incoming and then implement `From` with "newtype". |
|
57 | 58 | /// It would be worth the effort for a generic cpython-to-pyo3 crate, perhaps |
|
58 | 59 | /// not for the current endeavour. |
|
59 | 60 | pub(crate) fn to_cpython_py_object<'py>( |
|
60 | 61 | obj: &Bound<'py, PyAny>, |
|
61 | 62 | ) -> (cpython::Python<'py>, cpython::PyObject) { |
|
62 | 63 | let py = cpython_handle(obj); |
|
63 | 64 | // public alias of the private cpython::fii::PyObject (!) |
|
64 | 65 | let raw = obj.as_ptr() as *mut python3_sys::PyObject; |
|
65 | 66 | // both pyo3 and rust-cpython will decrement the refcount on drop. |
|
66 | 67 | // If we use from_owned_ptr, that's a segfault. |
|
67 | 68 | (py, unsafe { cpython::PyObject::from_borrowed_ptr(py, raw) }) |
|
68 | 69 | } |
|
69 | 70 | |
|
70 | 71 | /// Convert a [`cpython::PyObject`] into a PyO3 [`PyObject`] |
|
71 | 72 | /// |
|
72 | 73 | /// During this process, the reference count is increased, then decreased. |
|
73 | 74 | /// This means that the GIL (symbolized by the PyO3 [`Python`] handle is |
|
74 | 75 | /// needed. |
|
75 | 76 | /// |
|
76 | 77 | /// We could make something perhaps more handy by simply stealing the |
|
77 | 78 | /// pointer, forgetting the incoming and then implement `From` with "newtype". |
|
78 | 79 | /// It would be worth the effort for a generic cpython-to-pyo3 crate, perhaps |
|
79 | 80 | /// not for the current endeavour. |
|
80 | 81 | pub(crate) fn from_cpython_py_object( |
|
81 | 82 | py: Python<'_>, |
|
82 | 83 | obj: cpython::PyObject, |
|
83 | 84 | ) -> PyObject { |
|
84 | 85 | let raw = obj.as_ptr() as *mut pyo3::ffi::PyObject; |
|
85 | 86 | unsafe { Py::from_borrowed_ptr(py, raw) } |
|
86 | 87 | } |
|
87 | 88 | |
|
88 | 89 | /// Convert [`cpython::PyErr`] into [`pyo3::PyErr`] |
|
89 | 90 | /// |
|
90 | 91 | /// The exception class remains the same as the original exception, |
|
91 | 92 | /// hence if it is also defined in another dylib based on `cpython` crate, |
|
92 | 93 | /// it will need to be converted to be downcasted in this crate. |
|
93 | 94 | pub(crate) fn from_cpython_pyerr( |
|
94 | 95 | py: cpython::Python<'_>, |
|
95 | 96 | mut e: cpython::PyErr, |
|
96 | 97 | ) -> PyErr { |
|
97 | 98 | let pyo3_py = pyo3_handle(py); |
|
98 | 99 | let cpython_exc_obj = e.instance(py); |
|
99 | 100 | let pyo3_exc_obj = from_cpython_py_object(pyo3_py, cpython_exc_obj); |
|
100 | 101 | PyErr::from_value(pyo3_exc_obj.into_bound(pyo3_py)) |
|
101 | 102 | } |
|
102 | 103 | |
|
103 | 104 | /// Retrieve the PyType for objects from the `mercurial.rustext` crate. |
|
104 | 105 | fn retrieve_cpython_py_type( |
|
105 | 106 | submodule_name: &str, |
|
106 | 107 | type_name: &str, |
|
107 | 108 | ) -> cpython::PyResult<cpython::PyType> { |
|
108 | 109 | let guard = cpython::Python::acquire_gil(); |
|
109 | 110 | let py = guard.python(); |
|
110 | 111 | let module = py.import(&format!("mercurial.rustext.{submodule_name}"))?; |
|
111 | 112 | module.get(py, type_name)?.extract::<cpython::PyType>(py) |
|
112 | 113 | } |
|
113 | 114 | |
|
114 | 115 | lazy_static! { |
|
115 | 116 | static ref INNER_REVLOG_PY_TYPE: cpython::PyType = { |
|
116 | 117 | retrieve_cpython_py_type("revlog", "InnerRevlog") |
|
117 | 118 | .expect("Could not import InnerRevlog in Python") |
|
118 | 119 | }; |
|
119 | 120 | } |
|
120 | 121 | |
|
121 | 122 | /// Downcast [`InnerRevlog`], with the appropriate Python type checking. |
|
122 | 123 | /// |
|
123 | 124 | /// The PyType object representing the `InnerRevlog` Python class is not the |
|
124 | 125 | /// the same in this dylib as it is in the `mercurial.rustext` module. |
|
125 | 126 | /// This is because the code created with the [`cpython::py_class!`] |
|
126 | 127 | /// macro is itself duplicated in both dylibs. In the case of this crate, this |
|
127 | 128 | /// happens by linking to the [`rusthg`] crate and provides the `InnerRevlog` |
|
128 | 129 | /// that is visible from this crate. The `InnerRevlog::get_type` associated |
|
129 | 130 | /// function turns out to return a `static mut` (look for `TYPE_OBJECT` in |
|
130 | 131 | /// `py_class_impl3.rs`), which obviously is different in both dylibs. |
|
131 | 132 | /// |
|
132 | 133 | /// The consequence of that is that downcasting an `InnerRevlog` originally |
|
133 | 134 | /// from the `mecurial.rustext` module to our `InnerRevlog` cannot be done with |
|
134 | 135 | /// the usual `extract::<InnerRevlog>(py)`, as it would perform the type |
|
135 | 136 | /// checking with the `PyType` that is embedded in `mercurial.pyo3_rustext`. |
|
136 | 137 | /// We must check the `PyType` that is within `mercurial.rustext` instead. |
|
137 | 138 | /// This is what this function does. |
|
138 | 139 | fn extract_inner_revlog( |
|
139 | 140 | py: cpython::Python, |
|
140 | 141 | inner_revlog: cpython::PyObject, |
|
141 | 142 | ) -> PyResult<InnerRevlog> { |
|
142 | 143 | if !(*INNER_REVLOG_PY_TYPE).is_instance(py, &inner_revlog) { |
|
143 | 144 | return Err(PyTypeError::new_err("Not an InnerRevlog instance")); |
|
144 | 145 | } |
|
145 | 146 | // Safety: this is safe because we checked the PyType already, with the |
|
146 | 147 | // value embedded in `mercurial.rustext`. |
|
147 | 148 | Ok(unsafe { InnerRevlog::unchecked_downcast_from(inner_revlog) }) |
|
148 | 149 | } |
|
149 | 150 | |
|
150 | 151 | /// This is similar to [`rusthg.py_rust_index_to_graph`], with difference in |
|
151 | 152 | /// how we retrieve the [`InnerRevlog`]. |
|
152 | 153 | pub fn py_rust_index_to_graph( |
|
153 | 154 | py: cpython::Python, |
|
154 | 155 | index_proxy: cpython::PyObject, |
|
155 | 156 | ) -> PyResult<cpython::UnsafePyLeaked<PySharedIndex>> { |
|
156 | 157 | let inner_revlog = extract_inner_revlog( |
|
157 | 158 | py, |
|
158 | 159 | index_proxy |
|
159 | 160 | .getattr(py, "inner") |
|
160 | 161 | .map_err(|e| from_cpython_pyerr(py, e))?, |
|
161 | 162 | )?; |
|
162 | 163 | |
|
163 | 164 | let leaked = inner_revlog.pub_inner(py).leak_immutable(); |
|
164 | 165 | // Safety: we don't leak the "faked" reference out of the `UnsafePyLeaked` |
|
165 | 166 | Ok(unsafe { leaked.map(py, |idx| PySharedIndex { inner: &idx.index }) }) |
|
166 | 167 | } |
|
167 | 168 | |
|
168 | pub(crate) fn proxy_index_extract<'py>( | |
|
169 | /// Full extraction of the proxy index object as received in PyO3 to a | |
|
170 | /// [`CoreIndex`] reference. | |
|
171 | /// | |
|
172 | /// The safety invariants to maintain are those of the underlying | |
|
173 | /// [`UnsafePyLeaked::try_borrow`]: the caller must not leak the inner | |
|
174 | /// reference. | |
|
175 | pub(crate) unsafe fn proxy_index_extract<'py>( | |
|
169 | 176 | index_proxy: &Bound<'py, PyAny>, |
|
170 | ) -> PyResult<(cpython::Python<'py>, cpython::UnsafePyLeaked<PySharedIndex>)> { | |
|
177 | ) -> PyResult<&'py CoreIndex> { | |
|
171 | 178 | let (py, idx_proxy) = to_cpython_py_object(index_proxy); |
|
172 |
|
|
|
179 | let py_leaked = py_rust_index_to_graph(py, idx_proxy)?; | |
|
180 | let py_shared = &*unsafe { | |
|
181 | py_leaked | |
|
182 | .try_borrow(py) | |
|
183 | .map_err(|e| from_cpython_pyerr(py, e))? | |
|
184 | }; | |
|
185 | Ok(py_shared.inner) | |
|
173 | 186 | } |
@@ -1,73 +1,67 | |||
|
1 | 1 | // dagops.rs |
|
2 | 2 | // |
|
3 | 3 | // Copyright 2024 Georges Racinet <georges.racinet@cloudcrane.io> |
|
4 | 4 | // |
|
5 | 5 | // This software may be used and distributed according to the terms of the |
|
6 | 6 | // GNU General Public License version 2 or any later version. |
|
7 | 7 | |
|
8 | 8 | //! Bindings for the `hg::dagops` module provided by the |
|
9 | 9 | //! `hg-core` package. |
|
10 | 10 | //! |
|
11 | 11 | //! From Python, this will be seen as `mercurial.pyo3-rustext.dagop` |
|
12 | 12 | use pyo3::prelude::*; |
|
13 | 13 | |
|
14 | 14 | use std::collections::HashSet; |
|
15 | 15 | |
|
16 | 16 | use hg::{dagops, Revision}; |
|
17 | 17 | |
|
18 |
use crate::convert_cpython:: |
|
|
18 | use crate::convert_cpython::proxy_index_extract; | |
|
19 | 19 | use crate::exceptions::GraphError; |
|
20 | 20 | use crate::revision::{rev_pyiter_collect, PyRevision}; |
|
21 | 21 | use crate::util::new_submodule; |
|
22 | 22 | |
|
23 | 23 | /// Using the the `index_proxy`, return heads out of any Python iterable of |
|
24 | 24 | /// Revisions |
|
25 | 25 | /// |
|
26 | 26 | /// This is the Rust counterpart for `mercurial.dagop.headrevs` |
|
27 | 27 | #[pyfunction] |
|
28 | 28 | pub fn headrevs( |
|
29 | 29 | index_proxy: &Bound<'_, PyAny>, |
|
30 | 30 | revs: &Bound<'_, PyAny>, |
|
31 | 31 | ) -> PyResult<HashSet<PyRevision>> { |
|
32 | let (py, py_leaked) = proxy_index_extract(index_proxy)?; | |
|
33 | 32 | // Safety: we don't leak the "faked" reference out of `UnsafePyLeaked` |
|
34 | let index = &*unsafe { | |
|
35 | py_leaked | |
|
36 | .try_borrow(py) | |
|
37 | .map_err(|e| from_cpython_pyerr(py, e))? | |
|
38 | }; | |
|
39 | ||
|
33 | let index = unsafe { proxy_index_extract(index_proxy)? }; | |
|
40 | 34 | let mut as_set: HashSet<Revision> = rev_pyiter_collect(revs, index)?; |
|
41 | 35 | dagops::retain_heads(index, &mut as_set).map_err(GraphError::from_hg)?; |
|
42 | 36 | Ok(as_set.into_iter().map(Into::into).collect()) |
|
43 | 37 | } |
|
44 | 38 | |
|
45 | 39 | /// Computes the rank, i.e. the number of ancestors including itself, |
|
46 | 40 | /// of a node represented by its parents. |
|
47 | 41 | /// |
|
48 | 42 | /// Currently, the pure Rust index supports only the REVLOGV1 format, hence |
|
49 | 43 | /// the only possible return value is that the rank is unknown. |
|
50 | 44 | /// |
|
51 | 45 | /// References: |
|
52 | 46 | /// - C implementation, function `index_fast_rank()`. |
|
53 | 47 | /// - `impl vcsgraph::graph::RankedGraph for Index` in `crate::cindex`. |
|
54 | 48 | #[pyfunction] |
|
55 | 49 | pub fn rank( |
|
56 | 50 | _index: &Bound<'_, PyAny>, |
|
57 | 51 | _p1r: PyRevision, |
|
58 | 52 | _p2r: PyRevision, |
|
59 | 53 | ) -> PyResult<()> { |
|
60 | 54 | Err(GraphError::from_vcsgraph( |
|
61 | 55 | vcsgraph::graph::GraphReadError::InconsistentGraphData, |
|
62 | 56 | )) |
|
63 | 57 | } |
|
64 | 58 | |
|
65 | 59 | pub fn init_module<'py>( |
|
66 | 60 | py: Python<'py>, |
|
67 | 61 | package: &str, |
|
68 | 62 | ) -> PyResult<Bound<'py, PyModule>> { |
|
69 | 63 | let m = new_submodule(py, package, "dagop")?; |
|
70 | 64 | m.add_function(wrap_pyfunction!(headrevs, &m)?)?; |
|
71 | 65 | m.add_function(wrap_pyfunction!(rank, &m)?)?; |
|
72 | 66 | Ok(m) |
|
73 | 67 | } |
General Comments 0
You need to be logged in to leave comments.
Login now