pyo3/types/
bytearray.rs

1use crate::err::{PyErr, PyResult};
2use crate::ffi_ptr_ext::FfiPtrExt;
3use crate::instance::{Borrowed, Bound};
4use crate::py_result_ext::PyResultExt;
5use crate::types::any::PyAnyMethods;
6use crate::{ffi, PyAny, Python};
7use std::slice;
8
9/// Represents a Python `bytearray`.
10///
11/// Values of this type are accessed via PyO3's smart pointers, e.g. as
12/// [`Py<PyByteArray>`][crate::Py] or [`Bound<'py, PyByteArray>`][Bound].
13///
14/// For APIs available on `bytearray` objects, see the [`PyByteArrayMethods`] trait which is implemented for
15/// [`Bound<'py, PyByteArray>`][Bound].
16#[repr(transparent)]
17pub struct PyByteArray(PyAny);
18
19pyobject_native_type_core!(PyByteArray, pyobject_native_static_type_object!(ffi::PyByteArray_Type), #checkfunction=ffi::PyByteArray_Check);
20
21impl PyByteArray {
22    /// Creates a new Python bytearray object.
23    ///
24    /// The byte string is initialized by copying the data from the `&[u8]`.
25    pub fn new<'py>(py: Python<'py>, src: &[u8]) -> Bound<'py, PyByteArray> {
26        let ptr = src.as_ptr().cast();
27        let len = src.len() as ffi::Py_ssize_t;
28        unsafe {
29            ffi::PyByteArray_FromStringAndSize(ptr, len)
30                .assume_owned(py)
31                .downcast_into_unchecked()
32        }
33    }
34
35    /// Creates a new Python `bytearray` object with an `init` closure to write its contents.
36    /// Before calling `init` the bytearray is zero-initialised.
37    /// * If Python raises a MemoryError on the allocation, `new_with` will return
38    ///   it inside `Err`.
39    /// * If `init` returns `Err(e)`, `new_with` will return `Err(e)`.
40    /// * If `init` returns `Ok(())`, `new_with` will return `Ok(&PyByteArray)`.
41    ///
42    /// # Examples
43    ///
44    /// ```
45    /// use pyo3::{prelude::*, types::PyByteArray};
46    ///
47    /// # fn main() -> PyResult<()> {
48    /// Python::with_gil(|py| -> PyResult<()> {
49    ///     let py_bytearray = PyByteArray::new_with(py, 10, |bytes: &mut [u8]| {
50    ///         bytes.copy_from_slice(b"Hello Rust");
51    ///         Ok(())
52    ///     })?;
53    ///     let bytearray: &[u8] = unsafe { py_bytearray.as_bytes() };
54    ///     assert_eq!(bytearray, b"Hello Rust");
55    ///     Ok(())
56    /// })
57    /// # }
58    /// ```
59    pub fn new_with<F>(py: Python<'_>, len: usize, init: F) -> PyResult<Bound<'_, PyByteArray>>
60    where
61        F: FnOnce(&mut [u8]) -> PyResult<()>,
62    {
63        unsafe {
64            // Allocate buffer and check for an error
65            let pybytearray: Bound<'_, Self> =
66                ffi::PyByteArray_FromStringAndSize(std::ptr::null(), len as ffi::Py_ssize_t)
67                    .assume_owned_or_err(py)?
68                    .downcast_into_unchecked();
69
70            let buffer: *mut u8 = ffi::PyByteArray_AsString(pybytearray.as_ptr()).cast();
71            debug_assert!(!buffer.is_null());
72            // Zero-initialise the uninitialised bytearray
73            std::ptr::write_bytes(buffer, 0u8, len);
74            // (Further) Initialise the bytearray in init
75            // If init returns an Err, pypybytearray will automatically deallocate the buffer
76            init(std::slice::from_raw_parts_mut(buffer, len)).map(|_| pybytearray)
77        }
78    }
79
80    /// Creates a new Python `bytearray` object from another Python object that
81    /// implements the buffer protocol.
82    pub fn from<'py>(src: &Bound<'py, PyAny>) -> PyResult<Bound<'py, PyByteArray>> {
83        unsafe {
84            ffi::PyByteArray_FromObject(src.as_ptr())
85                .assume_owned_or_err(src.py())
86                .downcast_into_unchecked()
87        }
88    }
89}
90
91/// Implementation of functionality for [`PyByteArray`].
92///
93/// These methods are defined for the `Bound<'py, PyByteArray>` smart pointer, so to use method call
94/// syntax these methods are separated into a trait, because stable Rust does not yet support
95/// `arbitrary_self_types`.
96#[doc(alias = "PyByteArray")]
97pub trait PyByteArrayMethods<'py>: crate::sealed::Sealed {
98    /// Gets the length of the bytearray.
99    fn len(&self) -> usize;
100
101    /// Checks if the bytearray is empty.
102    fn is_empty(&self) -> bool;
103
104    /// Gets the start of the buffer containing the contents of the bytearray.
105    ///
106    /// # Safety
107    ///
108    /// See the safety requirements of [`PyByteArrayMethods::as_bytes`] and [`PyByteArrayMethods::as_bytes_mut`].
109    fn data(&self) -> *mut u8;
110
111    /// Extracts a slice of the `ByteArray`'s entire buffer.
112    ///
113    /// # Safety
114    ///
115    /// Mutation of the `bytearray` invalidates the slice. If it is used afterwards, the behavior is
116    /// undefined.
117    ///
118    /// These mutations may occur in Python code as well as from Rust:
119    /// - Calling methods like [`PyByteArrayMethods::as_bytes_mut`] and [`PyByteArrayMethods::resize`] will
120    ///   invalidate the slice.
121    /// - Actions like dropping objects or raising exceptions can invoke `__del__`methods or signal
122    ///   handlers, which may execute arbitrary Python code. This means that if Python code has a
123    ///   reference to the `bytearray` you cannot safely use the vast majority of PyO3's API whilst
124    ///   using the slice.
125    ///
126    /// As a result, this slice should only be used for short-lived operations without executing any
127    /// Python code, such as copying into a Vec.
128    ///
129    /// # Examples
130    ///
131    /// ```rust
132    /// use pyo3::prelude::*;
133    /// use pyo3::exceptions::PyRuntimeError;
134    /// use pyo3::types::PyByteArray;
135    ///
136    /// #[pyfunction]
137    /// fn a_valid_function(bytes: &Bound<'_, PyByteArray>) -> PyResult<()> {
138    ///     let section = {
139    ///         // SAFETY: We promise to not let the interpreter regain control
140    ///         // or invoke any PyO3 APIs while using the slice.
141    ///         let slice = unsafe { bytes.as_bytes() };
142    ///
143    ///         // Copy only a section of `bytes` while avoiding
144    ///         // `to_vec` which copies the entire thing.
145    ///         let section = slice
146    ///             .get(6..11)
147    ///             .ok_or_else(|| PyRuntimeError::new_err("input is not long enough"))?;
148    ///         Vec::from(section)
149    ///     };
150    ///
151    ///     // Now we can do things with `section` and call PyO3 APIs again.
152    ///     // ...
153    ///     # assert_eq!(&section, b"world");
154    ///
155    ///     Ok(())
156    /// }
157    /// # fn main() -> PyResult<()> {
158    /// #     Python::with_gil(|py| -> PyResult<()> {
159    /// #         let fun = wrap_pyfunction!(a_valid_function, py)?;
160    /// #         let locals = pyo3::types::PyDict::new(py);
161    /// #         locals.set_item("a_valid_function", fun)?;
162    /// #
163    /// #         py.run(pyo3::ffi::c_str!(
164    /// # r#"b = bytearray(b"hello world")
165    /// # a_valid_function(b)
166    /// #
167    /// # try:
168    /// #     a_valid_function(bytearray())
169    /// # except RuntimeError as e:
170    /// #     assert str(e) == 'input is not long enough'"#),
171    /// #             None,
172    /// #             Some(&locals),
173    /// #         )?;
174    /// #
175    /// #         Ok(())
176    /// #     })
177    /// # }
178    /// ```
179    ///
180    /// # Incorrect usage
181    ///
182    /// The following `bug` function is unsound ⚠️
183    ///
184    /// ```rust,no_run
185    /// # use pyo3::prelude::*;
186    /// # use pyo3::types::PyByteArray;
187    ///
188    /// # #[allow(dead_code)]
189    /// #[pyfunction]
190    /// fn bug(py: Python<'_>, bytes: &Bound<'_, PyByteArray>) {
191    ///     let slice = unsafe { bytes.as_bytes() };
192    ///
193    ///     // This explicitly yields control back to the Python interpreter...
194    ///     // ...but it's not always this obvious. Many things do this implicitly.
195    ///     py.allow_threads(|| {
196    ///         // Python code could be mutating through its handle to `bytes`,
197    ///         // which makes reading it a data race, which is undefined behavior.
198    ///         println!("{:?}", slice[0]);
199    ///     });
200    ///
201    ///     // Python code might have mutated it, so we can not rely on the slice
202    ///     // remaining valid. As such this is also undefined behavior.
203    ///     println!("{:?}", slice[0]);
204    /// }
205    /// ```
206    unsafe fn as_bytes(&self) -> &[u8];
207
208    /// Extracts a mutable slice of the `ByteArray`'s entire buffer.
209    ///
210    /// # Safety
211    ///
212    /// Any other accesses of the `bytearray`'s buffer invalidate the slice. If it is used
213    /// afterwards, the behavior is undefined. The safety requirements of [`PyByteArrayMethods::as_bytes`]
214    /// apply to this function as well.
215    #[allow(clippy::mut_from_ref)]
216    unsafe fn as_bytes_mut(&self) -> &mut [u8];
217
218    /// Copies the contents of the bytearray to a Rust vector.
219    ///
220    /// # Examples
221    ///
222    /// ```
223    /// # use pyo3::prelude::*;
224    /// # use pyo3::types::PyByteArray;
225    /// # Python::with_gil(|py| {
226    /// let bytearray = PyByteArray::new(py, b"Hello World.");
227    /// let mut copied_message = bytearray.to_vec();
228    /// assert_eq!(b"Hello World.", copied_message.as_slice());
229    ///
230    /// copied_message[11] = b'!';
231    /// assert_eq!(b"Hello World!", copied_message.as_slice());
232    ///
233    /// pyo3::py_run!(py, bytearray, "assert bytearray == b'Hello World.'");
234    /// # });
235    /// ```
236    fn to_vec(&self) -> Vec<u8>;
237
238    /// Resizes the bytearray object to the new length `len`.
239    ///
240    /// Note that this will invalidate any pointers obtained by [PyByteArrayMethods::data], as well as
241    /// any (unsafe) slices obtained from [PyByteArrayMethods::as_bytes] and [PyByteArrayMethods::as_bytes_mut].
242    fn resize(&self, len: usize) -> PyResult<()>;
243}
244
245impl<'py> PyByteArrayMethods<'py> for Bound<'py, PyByteArray> {
246    #[inline]
247    fn len(&self) -> usize {
248        // non-negative Py_ssize_t should always fit into Rust usize
249        unsafe { ffi::PyByteArray_Size(self.as_ptr()) as usize }
250    }
251
252    fn is_empty(&self) -> bool {
253        self.len() == 0
254    }
255
256    fn data(&self) -> *mut u8 {
257        self.as_borrowed().data()
258    }
259
260    unsafe fn as_bytes(&self) -> &[u8] {
261        unsafe { self.as_borrowed().as_bytes() }
262    }
263
264    #[allow(clippy::mut_from_ref)]
265    unsafe fn as_bytes_mut(&self) -> &mut [u8] {
266        unsafe { self.as_borrowed().as_bytes_mut() }
267    }
268
269    fn to_vec(&self) -> Vec<u8> {
270        unsafe { self.as_bytes() }.to_vec()
271    }
272
273    fn resize(&self, len: usize) -> PyResult<()> {
274        unsafe {
275            let result = ffi::PyByteArray_Resize(self.as_ptr(), len as ffi::Py_ssize_t);
276            if result == 0 {
277                Ok(())
278            } else {
279                Err(PyErr::fetch(self.py()))
280            }
281        }
282    }
283}
284
285impl<'a> Borrowed<'a, '_, PyByteArray> {
286    fn data(&self) -> *mut u8 {
287        unsafe { ffi::PyByteArray_AsString(self.as_ptr()).cast() }
288    }
289
290    #[allow(clippy::wrong_self_convention)]
291    unsafe fn as_bytes(self) -> &'a [u8] {
292        unsafe { slice::from_raw_parts(self.data(), self.len()) }
293    }
294
295    #[allow(clippy::wrong_self_convention)]
296    unsafe fn as_bytes_mut(self) -> &'a mut [u8] {
297        unsafe { slice::from_raw_parts_mut(self.data(), self.len()) }
298    }
299}
300
301impl<'py> TryFrom<&Bound<'py, PyAny>> for Bound<'py, PyByteArray> {
302    type Error = crate::PyErr;
303
304    /// Creates a new Python `bytearray` object from another Python object that
305    /// implements the buffer protocol.
306    fn try_from(value: &Bound<'py, PyAny>) -> Result<Self, Self::Error> {
307        PyByteArray::from(value)
308    }
309}
310
311#[cfg(test)]
312mod tests {
313    use crate::types::{PyAnyMethods, PyByteArray, PyByteArrayMethods};
314    use crate::{exceptions, Bound, PyAny, PyObject, Python};
315
316    #[test]
317    fn test_len() {
318        Python::with_gil(|py| {
319            let src = b"Hello Python";
320            let bytearray = PyByteArray::new(py, src);
321            assert_eq!(src.len(), bytearray.len());
322        });
323    }
324
325    #[test]
326    fn test_as_bytes() {
327        Python::with_gil(|py| {
328            let src = b"Hello Python";
329            let bytearray = PyByteArray::new(py, src);
330
331            let slice = unsafe { bytearray.as_bytes() };
332            assert_eq!(src, slice);
333            assert_eq!(bytearray.data() as *const _, slice.as_ptr());
334        });
335    }
336
337    #[test]
338    fn test_as_bytes_mut() {
339        Python::with_gil(|py| {
340            let src = b"Hello Python";
341            let bytearray = PyByteArray::new(py, src);
342
343            let slice = unsafe { bytearray.as_bytes_mut() };
344            assert_eq!(src, slice);
345            assert_eq!(bytearray.data(), slice.as_mut_ptr());
346
347            slice[0..5].copy_from_slice(b"Hi...");
348
349            assert_eq!(bytearray.str().unwrap(), "bytearray(b'Hi... Python')");
350        });
351    }
352
353    #[test]
354    fn test_to_vec() {
355        Python::with_gil(|py| {
356            let src = b"Hello Python";
357            let bytearray = PyByteArray::new(py, src);
358
359            let vec = bytearray.to_vec();
360            assert_eq!(src, vec.as_slice());
361        });
362    }
363
364    #[test]
365    fn test_from() {
366        Python::with_gil(|py| {
367            let src = b"Hello Python";
368            let bytearray = PyByteArray::new(py, src);
369
370            let ba: PyObject = bytearray.into();
371            let bytearray = PyByteArray::from(ba.bind(py)).unwrap();
372
373            assert_eq!(src, unsafe { bytearray.as_bytes() });
374        });
375    }
376
377    #[test]
378    fn test_from_err() {
379        Python::with_gil(|py| {
380            if let Err(err) = PyByteArray::from(py.None().bind(py)) {
381                assert!(err.is_instance_of::<exceptions::PyTypeError>(py));
382            } else {
383                panic!("error");
384            }
385        });
386    }
387
388    #[test]
389    fn test_try_from() {
390        Python::with_gil(|py| {
391            let src = b"Hello Python";
392            let bytearray: &Bound<'_, PyAny> = &PyByteArray::new(py, src);
393            let bytearray: Bound<'_, PyByteArray> = TryInto::try_into(bytearray).unwrap();
394
395            assert_eq!(src, unsafe { bytearray.as_bytes() });
396        });
397    }
398
399    #[test]
400    fn test_resize() {
401        Python::with_gil(|py| {
402            let src = b"Hello Python";
403            let bytearray = PyByteArray::new(py, src);
404
405            bytearray.resize(20).unwrap();
406            assert_eq!(20, bytearray.len());
407        });
408    }
409
410    #[test]
411    fn test_byte_array_new_with() -> super::PyResult<()> {
412        Python::with_gil(|py| -> super::PyResult<()> {
413            let py_bytearray = PyByteArray::new_with(py, 10, |b: &mut [u8]| {
414                b.copy_from_slice(b"Hello Rust");
415                Ok(())
416            })?;
417            let bytearray: &[u8] = unsafe { py_bytearray.as_bytes() };
418            assert_eq!(bytearray, b"Hello Rust");
419            Ok(())
420        })
421    }
422
423    #[test]
424    fn test_byte_array_new_with_zero_initialised() -> super::PyResult<()> {
425        Python::with_gil(|py| -> super::PyResult<()> {
426            let py_bytearray = PyByteArray::new_with(py, 10, |_b: &mut [u8]| Ok(()))?;
427            let bytearray: &[u8] = unsafe { py_bytearray.as_bytes() };
428            assert_eq!(bytearray, &[0; 10]);
429            Ok(())
430        })
431    }
432
433    #[test]
434    fn test_byte_array_new_with_error() {
435        use crate::exceptions::PyValueError;
436        Python::with_gil(|py| {
437            let py_bytearray_result = PyByteArray::new_with(py, 10, |_b: &mut [u8]| {
438                Err(PyValueError::new_err("Hello Crustaceans!"))
439            });
440            assert!(py_bytearray_result.is_err());
441            assert!(py_bytearray_result
442                .err()
443                .unwrap()
444                .is_instance_of::<PyValueError>(py));
445        })
446    }
447}
⚠️ Internal Docs ⚠️ Not Public API 👉 Official Docs Here