##// END OF EJS Templates
rust-cpython: leverage py_shared_iterator::from_inner() where appropriate
Yuya Nishihara -
r43161:5ccc08d0 default
parent child Browse files
Show More
@@ -1,130 +1,130 b''
1 1 // dirs_multiset.rs
2 2 //
3 3 // Copyright 2019 Raphaël Gomès <rgomes@octobus.net>
4 4 //
5 5 // This software may be used and distributed according to the terms of the
6 6 // GNU General Public License version 2 or any later version.
7 7
8 8 //! Bindings for the `hg::dirstate::dirs_multiset` file provided by the
9 9 //! `hg-core` package.
10 10
11 11 use std::cell::RefCell;
12 12 use std::convert::TryInto;
13 13
14 14 use cpython::{
15 15 exc, ObjectProtocol, PyBytes, PyClone, PyDict, PyErr, PyObject, PyResult,
16 16 Python,
17 17 };
18 18
19 19 use crate::dirstate::extract_dirstate;
20 20 use crate::ref_sharing::{PySharedRefCell, PySharedState};
21 21 use hg::{
22 22 DirsMultiset, DirsMultisetIter, DirstateMapError, DirstateParseError,
23 23 EntryState,
24 24 };
25 25
26 26 py_class!(pub class Dirs |py| {
27 27 data inner: PySharedRefCell<DirsMultiset>;
28 28 data py_shared_state: PySharedState;
29 29
30 30 // `map` is either a `dict` or a flat iterator (usually a `set`, sometimes
31 31 // a `list`)
32 32 def __new__(
33 33 _cls,
34 34 map: PyObject,
35 35 skip: Option<PyObject> = None
36 36 ) -> PyResult<Self> {
37 37 let mut skip_state: Option<EntryState> = None;
38 38 if let Some(skip) = skip {
39 39 skip_state = Some(
40 40 skip.extract::<PyBytes>(py)?.data(py)[0]
41 41 .try_into()
42 42 .map_err(|e: DirstateParseError| {
43 43 PyErr::new::<exc::ValueError, _>(py, e.to_string())
44 44 })?,
45 45 );
46 46 }
47 47 let inner = if let Ok(map) = map.cast_as::<PyDict>(py) {
48 48 let dirstate = extract_dirstate(py, &map)?;
49 49 DirsMultiset::from_dirstate(&dirstate, skip_state)
50 50 } else {
51 51 let map: Result<Vec<Vec<u8>>, PyErr> = map
52 52 .iter(py)?
53 53 .map(|o| Ok(o?.extract::<PyBytes>(py)?.data(py).to_owned()))
54 54 .collect();
55 55 DirsMultiset::from_manifest(&map?)
56 56 };
57 57
58 58 Self::create_instance(
59 59 py,
60 60 PySharedRefCell::new(inner),
61 61 PySharedState::default()
62 62 )
63 63 }
64 64
65 65 def addpath(&self, path: PyObject) -> PyResult<PyObject> {
66 66 self.borrow_mut(py)?.add_path(
67 67 path.extract::<PyBytes>(py)?.data(py),
68 68 );
69 69 Ok(py.None())
70 70 }
71 71
72 72 def delpath(&self, path: PyObject) -> PyResult<PyObject> {
73 73 self.borrow_mut(py)?.delete_path(
74 74 path.extract::<PyBytes>(py)?.data(py),
75 75 )
76 76 .and(Ok(py.None()))
77 77 .or_else(|e| {
78 78 match e {
79 79 DirstateMapError::PathNotFound(_p) => {
80 80 Err(PyErr::new::<exc::ValueError, _>(
81 81 py,
82 82 "expected a value, found none".to_string(),
83 83 ))
84 84 }
85 85 DirstateMapError::EmptyPath => {
86 86 Ok(py.None())
87 87 }
88 88 }
89 89 })
90 90 }
91 91 def __iter__(&self) -> PyResult<DirsMultisetKeysIterator> {
92 92 let (leak_handle, leaked_ref) = unsafe { self.leak_immutable(py)? };
93 DirsMultisetKeysIterator::create_instance(
93 DirsMultisetKeysIterator::from_inner(
94 94 py,
95 RefCell::new(Some(leak_handle)),
96 RefCell::new(leaked_ref.iter()),
95 leak_handle,
96 leaked_ref.iter(),
97 97 )
98 98 }
99 99
100 100 def __contains__(&self, item: PyObject) -> PyResult<bool> {
101 101 Ok(self
102 102 .inner(py)
103 103 .borrow()
104 104 .contains(item.extract::<PyBytes>(py)?.data(py).as_ref()))
105 105 }
106 106 });
107 107
108 108 py_shared_ref!(Dirs, DirsMultiset, inner, DirsMultisetLeakedRef,);
109 109
110 110 impl Dirs {
111 111 pub fn from_inner(py: Python, d: DirsMultiset) -> PyResult<Self> {
112 112 Self::create_instance(
113 113 py,
114 114 PySharedRefCell::new(d),
115 115 PySharedState::default(),
116 116 )
117 117 }
118 118
119 119 fn translate_key(py: Python, res: &Vec<u8>) -> PyResult<Option<PyBytes>> {
120 120 Ok(Some(PyBytes::new(py, res)))
121 121 }
122 122 }
123 123
124 124 py_shared_iterator!(
125 125 DirsMultisetKeysIterator,
126 126 DirsMultisetLeakedRef,
127 127 DirsMultisetIter<'static>,
128 128 Dirs::translate_key,
129 129 Option<PyBytes>
130 130 );
@@ -1,392 +1,392 b''
1 1 // macros.rs
2 2 //
3 3 // Copyright 2019 Raphaël Gomès <rgomes@octobus.net>
4 4 //
5 5 // This software may be used and distributed according to the terms of the
6 6 // GNU General Public License version 2 or any later version.
7 7
8 8 //! Macros for use in the `hg-cpython` bridge library.
9 9
10 10 use crate::exceptions::AlreadyBorrowed;
11 11 use cpython::{PyResult, Python};
12 12 use std::cell::{Cell, Ref, RefCell, RefMut};
13 13
14 14 /// Manages the shared state between Python and Rust
15 15 #[derive(Default)]
16 16 pub struct PySharedState {
17 17 leak_count: Cell<usize>,
18 18 mutably_borrowed: Cell<bool>,
19 19 }
20 20
21 21 impl PySharedState {
22 22 pub fn borrow_mut<'a, T>(
23 23 &'a self,
24 24 py: Python<'a>,
25 25 pyrefmut: RefMut<'a, T>,
26 26 ) -> PyResult<PyRefMut<'a, T>> {
27 27 if self.mutably_borrowed.get() {
28 28 return Err(AlreadyBorrowed::new(
29 29 py,
30 30 "Cannot borrow mutably while there exists another \
31 31 mutable reference in a Python object",
32 32 ));
33 33 }
34 34 match self.leak_count.get() {
35 35 0 => {
36 36 self.mutably_borrowed.replace(true);
37 37 Ok(PyRefMut::new(py, pyrefmut, self))
38 38 }
39 39 // TODO
40 40 // For now, this works differently than Python references
41 41 // in the case of iterators.
42 42 // Python does not complain when the data an iterator
43 43 // points to is modified if the iterator is never used
44 44 // afterwards.
45 45 // Here, we are stricter than this by refusing to give a
46 46 // mutable reference if it is already borrowed.
47 47 // While the additional safety might be argued for, it
48 48 // breaks valid programming patterns in Python and we need
49 49 // to fix this issue down the line.
50 50 _ => Err(AlreadyBorrowed::new(
51 51 py,
52 52 "Cannot borrow mutably while there are \
53 53 immutable references in Python objects",
54 54 )),
55 55 }
56 56 }
57 57
58 58 /// Return a reference to the wrapped data with an artificial static
59 59 /// lifetime.
60 60 /// We need to be protected by the GIL for thread-safety.
61 61 ///
62 62 /// # Safety
63 63 ///
64 64 /// This is highly unsafe since the lifetime of the given data can be
65 65 /// extended. Do not call this function directly.
66 66 pub unsafe fn leak_immutable<T>(
67 67 &self,
68 68 py: Python,
69 69 data: &PySharedRefCell<T>,
70 70 ) -> PyResult<&'static T> {
71 71 if self.mutably_borrowed.get() {
72 72 return Err(AlreadyBorrowed::new(
73 73 py,
74 74 "Cannot borrow immutably while there is a \
75 75 mutable reference in Python objects",
76 76 ));
77 77 }
78 78 let ptr = data.as_ptr();
79 79 self.leak_count.replace(self.leak_count.get() + 1);
80 80 Ok(&*ptr)
81 81 }
82 82
83 83 /// # Safety
84 84 ///
85 85 /// It's unsafe to update the reference count without knowing the
86 86 /// reference is deleted. Do not call this function directly.
87 87 pub unsafe fn decrease_leak_count(&self, _py: Python, mutable: bool) {
88 88 self.leak_count
89 89 .replace(self.leak_count.get().saturating_sub(1));
90 90 if mutable {
91 91 self.mutably_borrowed.replace(false);
92 92 }
93 93 }
94 94 }
95 95
96 96 /// `RefCell` wrapper to be safely used in conjunction with `PySharedState`.
97 97 ///
98 98 /// Only immutable operation is allowed through this interface.
99 99 #[derive(Debug)]
100 100 pub struct PySharedRefCell<T> {
101 101 inner: RefCell<T>,
102 102 }
103 103
104 104 impl<T> PySharedRefCell<T> {
105 105 pub const fn new(value: T) -> PySharedRefCell<T> {
106 106 Self {
107 107 inner: RefCell::new(value),
108 108 }
109 109 }
110 110
111 111 pub fn borrow(&self) -> Ref<T> {
112 112 // py_shared_state isn't involved since
113 113 // - inner.borrow() would fail if self is mutably borrowed,
114 114 // - and inner.borrow_mut() would fail while self is borrowed.
115 115 self.inner.borrow()
116 116 }
117 117
118 118 pub fn as_ptr(&self) -> *mut T {
119 119 self.inner.as_ptr()
120 120 }
121 121
122 122 pub unsafe fn borrow_mut(&self) -> RefMut<T> {
123 123 // must be borrowed by self.py_shared_state(py).borrow_mut().
124 124 self.inner.borrow_mut()
125 125 }
126 126 }
127 127
128 128 /// Holds a mutable reference to data shared between Python and Rust.
129 129 pub struct PyRefMut<'a, T> {
130 130 inner: RefMut<'a, T>,
131 131 py_shared_state: &'a PySharedState,
132 132 }
133 133
134 134 impl<'a, T> PyRefMut<'a, T> {
135 135 // Must be constructed by PySharedState after checking its leak_count.
136 136 // Otherwise, drop() would incorrectly update the state.
137 137 fn new(
138 138 _py: Python<'a>,
139 139 inner: RefMut<'a, T>,
140 140 py_shared_state: &'a PySharedState,
141 141 ) -> Self {
142 142 Self {
143 143 inner,
144 144 py_shared_state,
145 145 }
146 146 }
147 147 }
148 148
149 149 impl<'a, T> std::ops::Deref for PyRefMut<'a, T> {
150 150 type Target = RefMut<'a, T>;
151 151
152 152 fn deref(&self) -> &Self::Target {
153 153 &self.inner
154 154 }
155 155 }
156 156 impl<'a, T> std::ops::DerefMut for PyRefMut<'a, T> {
157 157 fn deref_mut(&mut self) -> &mut Self::Target {
158 158 &mut self.inner
159 159 }
160 160 }
161 161
162 162 impl<'a, T> Drop for PyRefMut<'a, T> {
163 163 fn drop(&mut self) {
164 164 let gil = Python::acquire_gil();
165 165 let py = gil.python();
166 166 unsafe {
167 167 self.py_shared_state.decrease_leak_count(py, true);
168 168 }
169 169 }
170 170 }
171 171
172 172 /// Allows a `py_class!` generated struct to share references to one of its
173 173 /// data members with Python.
174 174 ///
175 175 /// # Warning
176 176 ///
177 177 /// The targeted `py_class!` needs to have the
178 178 /// `data py_shared_state: PySharedState;` data attribute to compile.
179 179 /// A better, more complicated macro is needed to automatically insert it,
180 180 /// but this one is not yet really battle tested (what happens when
181 181 /// multiple references are needed?). See the example below.
182 182 ///
183 183 /// TODO allow Python container types: for now, integration with the garbage
184 184 /// collector does not extend to Rust structs holding references to Python
185 185 /// objects. Should the need surface, `__traverse__` and `__clear__` will
186 186 /// need to be written as per the `rust-cpython` docs on GC integration.
187 187 ///
188 188 /// # Parameters
189 189 ///
190 190 /// * `$name` is the same identifier used in for `py_class!` macro call.
191 191 /// * `$inner_struct` is the identifier of the underlying Rust struct
192 192 /// * `$data_member` is the identifier of the data member of `$inner_struct`
193 193 /// that will be shared.
194 194 /// * `$leaked` is the identifier to give to the struct that will manage
195 195 /// references to `$name`, to be used for example in other macros like
196 196 /// `py_shared_iterator`.
197 197 ///
198 198 /// # Example
199 199 ///
200 200 /// ```
201 201 /// struct MyStruct {
202 202 /// inner: Vec<u32>;
203 203 /// }
204 204 ///
205 205 /// py_class!(pub class MyType |py| {
206 206 /// data inner: PySharedRefCell<MyStruct>;
207 207 /// data py_shared_state: PySharedState;
208 208 /// });
209 209 ///
210 210 /// py_shared_ref!(MyType, MyStruct, inner, MyTypeLeakedRef);
211 211 /// ```
212 212 macro_rules! py_shared_ref {
213 213 (
214 214 $name: ident,
215 215 $inner_struct: ident,
216 216 $data_member: ident,
217 217 $leaked: ident,
218 218 ) => {
219 219 impl $name {
220 220 fn borrow_mut<'a>(
221 221 &'a self,
222 222 py: Python<'a>,
223 223 ) -> PyResult<crate::ref_sharing::PyRefMut<'a, $inner_struct>>
224 224 {
225 225 // assert $data_member type
226 226 use crate::ref_sharing::PySharedRefCell;
227 227 let data: &PySharedRefCell<_> = self.$data_member(py);
228 228 self.py_shared_state(py)
229 229 .borrow_mut(py, unsafe { data.borrow_mut() })
230 230 }
231 231
232 232 /// Returns a leaked reference and its management object.
233 233 ///
234 234 /// # Safety
235 235 ///
236 236 /// It's up to you to make sure that the management object lives
237 237 /// longer than the leaked reference. Otherwise, you'll get a
238 238 /// dangling reference.
239 239 unsafe fn leak_immutable<'a>(
240 240 &'a self,
241 241 py: Python<'a>,
242 242 ) -> PyResult<($leaked, &'static $inner_struct)> {
243 243 // assert $data_member type
244 244 use crate::ref_sharing::PySharedRefCell;
245 245 let data: &PySharedRefCell<_> = self.$data_member(py);
246 246 let static_ref =
247 247 self.py_shared_state(py).leak_immutable(py, data)?;
248 248 let leak_handle = $leaked::new(py, self);
249 249 Ok((leak_handle, static_ref))
250 250 }
251 251 }
252 252
253 253 /// Manage immutable references to `$name` leaked into Python
254 254 /// iterators.
255 255 ///
256 256 /// In truth, this does not represent leaked references themselves;
257 257 /// it is instead useful alongside them to manage them.
258 258 pub struct $leaked {
259 259 inner: $name,
260 260 }
261 261
262 262 impl $leaked {
263 263 // Marked as unsafe so client code wouldn't construct $leaked
264 264 // struct by mistake. Its drop() is unsafe.
265 265 unsafe fn new(py: Python, inner: &$name) -> Self {
266 266 Self {
267 267 inner: inner.clone_ref(py),
268 268 }
269 269 }
270 270 }
271 271
272 272 impl Drop for $leaked {
273 273 fn drop(&mut self) {
274 274 let gil = Python::acquire_gil();
275 275 let py = gil.python();
276 276 let state = self.inner.py_shared_state(py);
277 277 unsafe {
278 278 state.decrease_leak_count(py, false);
279 279 }
280 280 }
281 281 }
282 282 };
283 283 }
284 284
285 285 /// Defines a `py_class!` that acts as a Python iterator over a Rust iterator.
286 286 ///
287 287 /// TODO: this is a bit awkward to use, and a better (more complicated)
288 288 /// procedural macro would simplify the interface a lot.
289 289 ///
290 290 /// # Parameters
291 291 ///
292 292 /// * `$name` is the identifier to give to the resulting Rust struct.
293 293 /// * `$leaked` corresponds to `$leaked` in the matching `py_shared_ref!` call.
294 294 /// * `$iterator_type` is the type of the Rust iterator.
295 295 /// * `$success_func` is a function for processing the Rust `(key, value)`
296 296 /// tuple on iteration success, turning it into something Python understands.
297 297 /// * `$success_func` is the return type of `$success_func`
298 298 ///
299 299 /// # Example
300 300 ///
301 301 /// ```
302 302 /// struct MyStruct {
303 303 /// inner: HashMap<Vec<u8>, Vec<u8>>;
304 304 /// }
305 305 ///
306 306 /// py_class!(pub class MyType |py| {
307 307 /// data inner: PySharedRefCell<MyStruct>;
308 308 /// data py_shared_state: PySharedState;
309 309 ///
310 310 /// def __iter__(&self) -> PyResult<MyTypeItemsIterator> {
311 311 /// let (leak_handle, leaked_ref) = unsafe { self.leak_immutable(py)? };
312 /// MyTypeItemsIterator::create_instance(
312 /// MyTypeItemsIterator::from_inner(
313 313 /// py,
314 /// RefCell::new(Some(leak_handle)),
315 /// RefCell::new(leaked_ref.iter()),
314 /// leak_handle,
315 /// leaked_ref.iter(),
316 316 /// )
317 317 /// }
318 318 /// });
319 319 ///
320 320 /// impl MyType {
321 321 /// fn translate_key_value(
322 322 /// py: Python,
323 323 /// res: (&Vec<u8>, &Vec<u8>),
324 324 /// ) -> PyResult<Option<(PyBytes, PyBytes)>> {
325 325 /// let (f, entry) = res;
326 326 /// Ok(Some((
327 327 /// PyBytes::new(py, f),
328 328 /// PyBytes::new(py, entry),
329 329 /// )))
330 330 /// }
331 331 /// }
332 332 ///
333 333 /// py_shared_ref!(MyType, MyStruct, inner, MyTypeLeakedRef);
334 334 ///
335 335 /// py_shared_iterator!(
336 336 /// MyTypeItemsIterator,
337 337 /// MyTypeLeakedRef,
338 338 /// HashMap<'static, Vec<u8>, Vec<u8>>,
339 339 /// MyType::translate_key_value,
340 340 /// Option<(PyBytes, PyBytes)>
341 341 /// );
342 342 /// ```
343 343 macro_rules! py_shared_iterator {
344 344 (
345 345 $name: ident,
346 346 $leaked: ident,
347 347 $iterator_type: ty,
348 348 $success_func: expr,
349 349 $success_type: ty
350 350 ) => {
351 351 py_class!(pub class $name |py| {
352 352 data inner: RefCell<Option<$leaked>>;
353 353 data it: RefCell<$iterator_type>;
354 354
355 355 def __next__(&self) -> PyResult<$success_type> {
356 356 let mut inner_opt = self.inner(py).borrow_mut();
357 357 if inner_opt.is_some() {
358 358 match self.it(py).borrow_mut().next() {
359 359 None => {
360 360 // replace Some(inner) by None, drop $leaked
361 361 inner_opt.take();
362 362 Ok(None)
363 363 }
364 364 Some(res) => {
365 365 $success_func(py, res)
366 366 }
367 367 }
368 368 } else {
369 369 Ok(None)
370 370 }
371 371 }
372 372
373 373 def __iter__(&self) -> PyResult<Self> {
374 374 Ok(self.clone_ref(py))
375 375 }
376 376 });
377 377
378 378 impl $name {
379 379 pub fn from_inner(
380 380 py: Python,
381 381 leaked: $leaked,
382 382 it: $iterator_type
383 383 ) -> PyResult<Self> {
384 384 Self::create_instance(
385 385 py,
386 386 RefCell::new(Some(leaked)),
387 387 RefCell::new(it)
388 388 )
389 389 }
390 390 }
391 391 };
392 392 }
General Comments 0
You need to be logged in to leave comments. Login now