pyo3/types/bytearray.rs
1use crate::err::{PyErr, PyResult};
2use crate::ffi_ptr_ext::FfiPtrExt;
3use crate::instance::{Borrowed, Bound};
4use crate::py_result_ext::PyResultExt;
5use crate::types::any::PyAnyMethods;
6use crate::{ffi, PyAny, Python};
7use std::slice;
8
9/// Represents a Python `bytearray`.
10///
11/// Values of this type are accessed via PyO3's smart pointers, e.g. as
12/// [`Py<PyByteArray>`][crate::Py] or [`Bound<'py, PyByteArray>`][Bound].
13///
14/// For APIs available on `bytearray` objects, see the [`PyByteArrayMethods`] trait which is implemented for
15/// [`Bound<'py, PyByteArray>`][Bound].
16#[repr(transparent)]
17pub struct PyByteArray(PyAny);
18
19pyobject_native_type_core!(PyByteArray, pyobject_native_static_type_object!(ffi::PyByteArray_Type), #checkfunction=ffi::PyByteArray_Check);
20
21impl PyByteArray {
22 /// Creates a new Python bytearray object.
23 ///
24 /// The byte string is initialized by copying the data from the `&[u8]`.
25 pub fn new<'py>(py: Python<'py>, src: &[u8]) -> Bound<'py, PyByteArray> {
26 let ptr = src.as_ptr().cast();
27 let len = src.len() as ffi::Py_ssize_t;
28 unsafe {
29 ffi::PyByteArray_FromStringAndSize(ptr, len)
30 .assume_owned(py)
31 .downcast_into_unchecked()
32 }
33 }
34
35 /// Creates a new Python `bytearray` object with an `init` closure to write its contents.
36 /// Before calling `init` the bytearray is zero-initialised.
37 /// * If Python raises a MemoryError on the allocation, `new_with` will return
38 /// it inside `Err`.
39 /// * If `init` returns `Err(e)`, `new_with` will return `Err(e)`.
40 /// * If `init` returns `Ok(())`, `new_with` will return `Ok(&PyByteArray)`.
41 ///
42 /// # Examples
43 ///
44 /// ```
45 /// use pyo3::{prelude::*, types::PyByteArray};
46 ///
47 /// # fn main() -> PyResult<()> {
48 /// Python::with_gil(|py| -> PyResult<()> {
49 /// let py_bytearray = PyByteArray::new_with(py, 10, |bytes: &mut [u8]| {
50 /// bytes.copy_from_slice(b"Hello Rust");
51 /// Ok(())
52 /// })?;
53 /// let bytearray: &[u8] = unsafe { py_bytearray.as_bytes() };
54 /// assert_eq!(bytearray, b"Hello Rust");
55 /// Ok(())
56 /// })
57 /// # }
58 /// ```
59 pub fn new_with<F>(py: Python<'_>, len: usize, init: F) -> PyResult<Bound<'_, PyByteArray>>
60 where
61 F: FnOnce(&mut [u8]) -> PyResult<()>,
62 {
63 unsafe {
64 // Allocate buffer and check for an error
65 let pybytearray: Bound<'_, Self> =
66 ffi::PyByteArray_FromStringAndSize(std::ptr::null(), len as ffi::Py_ssize_t)
67 .assume_owned_or_err(py)?
68 .downcast_into_unchecked();
69
70 let buffer: *mut u8 = ffi::PyByteArray_AsString(pybytearray.as_ptr()).cast();
71 debug_assert!(!buffer.is_null());
72 // Zero-initialise the uninitialised bytearray
73 std::ptr::write_bytes(buffer, 0u8, len);
74 // (Further) Initialise the bytearray in init
75 // If init returns an Err, pypybytearray will automatically deallocate the buffer
76 init(std::slice::from_raw_parts_mut(buffer, len)).map(|_| pybytearray)
77 }
78 }
79
80 /// Creates a new Python `bytearray` object from another Python object that
81 /// implements the buffer protocol.
82 pub fn from<'py>(src: &Bound<'py, PyAny>) -> PyResult<Bound<'py, PyByteArray>> {
83 unsafe {
84 ffi::PyByteArray_FromObject(src.as_ptr())
85 .assume_owned_or_err(src.py())
86 .downcast_into_unchecked()
87 }
88 }
89}
90
91/// Implementation of functionality for [`PyByteArray`].
92///
93/// These methods are defined for the `Bound<'py, PyByteArray>` smart pointer, so to use method call
94/// syntax these methods are separated into a trait, because stable Rust does not yet support
95/// `arbitrary_self_types`.
96#[doc(alias = "PyByteArray")]
97pub trait PyByteArrayMethods<'py>: crate::sealed::Sealed {
98 /// Gets the length of the bytearray.
99 fn len(&self) -> usize;
100
101 /// Checks if the bytearray is empty.
102 fn is_empty(&self) -> bool;
103
104 /// Gets the start of the buffer containing the contents of the bytearray.
105 ///
106 /// # Safety
107 ///
108 /// See the safety requirements of [`PyByteArrayMethods::as_bytes`] and [`PyByteArrayMethods::as_bytes_mut`].
109 fn data(&self) -> *mut u8;
110
111 /// Extracts a slice of the `ByteArray`'s entire buffer.
112 ///
113 /// # Safety
114 ///
115 /// Mutation of the `bytearray` invalidates the slice. If it is used afterwards, the behavior is
116 /// undefined.
117 ///
118 /// These mutations may occur in Python code as well as from Rust:
119 /// - Calling methods like [`PyByteArrayMethods::as_bytes_mut`] and [`PyByteArrayMethods::resize`] will
120 /// invalidate the slice.
121 /// - Actions like dropping objects or raising exceptions can invoke `__del__`methods or signal
122 /// handlers, which may execute arbitrary Python code. This means that if Python code has a
123 /// reference to the `bytearray` you cannot safely use the vast majority of PyO3's API whilst
124 /// using the slice.
125 ///
126 /// As a result, this slice should only be used for short-lived operations without executing any
127 /// Python code, such as copying into a Vec.
128 ///
129 /// # Examples
130 ///
131 /// ```rust
132 /// use pyo3::prelude::*;
133 /// use pyo3::exceptions::PyRuntimeError;
134 /// use pyo3::types::PyByteArray;
135 ///
136 /// #[pyfunction]
137 /// fn a_valid_function(bytes: &Bound<'_, PyByteArray>) -> PyResult<()> {
138 /// let section = {
139 /// // SAFETY: We promise to not let the interpreter regain control
140 /// // or invoke any PyO3 APIs while using the slice.
141 /// let slice = unsafe { bytes.as_bytes() };
142 ///
143 /// // Copy only a section of `bytes` while avoiding
144 /// // `to_vec` which copies the entire thing.
145 /// let section = slice
146 /// .get(6..11)
147 /// .ok_or_else(|| PyRuntimeError::new_err("input is not long enough"))?;
148 /// Vec::from(section)
149 /// };
150 ///
151 /// // Now we can do things with `section` and call PyO3 APIs again.
152 /// // ...
153 /// # assert_eq!(§ion, b"world");
154 ///
155 /// Ok(())
156 /// }
157 /// # fn main() -> PyResult<()> {
158 /// # Python::with_gil(|py| -> PyResult<()> {
159 /// # let fun = wrap_pyfunction!(a_valid_function, py)?;
160 /// # let locals = pyo3::types::PyDict::new(py);
161 /// # locals.set_item("a_valid_function", fun)?;
162 /// #
163 /// # py.run(pyo3::ffi::c_str!(
164 /// # r#"b = bytearray(b"hello world")
165 /// # a_valid_function(b)
166 /// #
167 /// # try:
168 /// # a_valid_function(bytearray())
169 /// # except RuntimeError as e:
170 /// # assert str(e) == 'input is not long enough'"#),
171 /// # None,
172 /// # Some(&locals),
173 /// # )?;
174 /// #
175 /// # Ok(())
176 /// # })
177 /// # }
178 /// ```
179 ///
180 /// # Incorrect usage
181 ///
182 /// The following `bug` function is unsound ⚠️
183 ///
184 /// ```rust,no_run
185 /// # use pyo3::prelude::*;
186 /// # use pyo3::types::PyByteArray;
187 ///
188 /// # #[allow(dead_code)]
189 /// #[pyfunction]
190 /// fn bug(py: Python<'_>, bytes: &Bound<'_, PyByteArray>) {
191 /// let slice = unsafe { bytes.as_bytes() };
192 ///
193 /// // This explicitly yields control back to the Python interpreter...
194 /// // ...but it's not always this obvious. Many things do this implicitly.
195 /// py.allow_threads(|| {
196 /// // Python code could be mutating through its handle to `bytes`,
197 /// // which makes reading it a data race, which is undefined behavior.
198 /// println!("{:?}", slice[0]);
199 /// });
200 ///
201 /// // Python code might have mutated it, so we can not rely on the slice
202 /// // remaining valid. As such this is also undefined behavior.
203 /// println!("{:?}", slice[0]);
204 /// }
205 /// ```
206 unsafe fn as_bytes(&self) -> &[u8];
207
208 /// Extracts a mutable slice of the `ByteArray`'s entire buffer.
209 ///
210 /// # Safety
211 ///
212 /// Any other accesses of the `bytearray`'s buffer invalidate the slice. If it is used
213 /// afterwards, the behavior is undefined. The safety requirements of [`PyByteArrayMethods::as_bytes`]
214 /// apply to this function as well.
215 #[allow(clippy::mut_from_ref)]
216 unsafe fn as_bytes_mut(&self) -> &mut [u8];
217
218 /// Copies the contents of the bytearray to a Rust vector.
219 ///
220 /// # Examples
221 ///
222 /// ```
223 /// # use pyo3::prelude::*;
224 /// # use pyo3::types::PyByteArray;
225 /// # Python::with_gil(|py| {
226 /// let bytearray = PyByteArray::new(py, b"Hello World.");
227 /// let mut copied_message = bytearray.to_vec();
228 /// assert_eq!(b"Hello World.", copied_message.as_slice());
229 ///
230 /// copied_message[11] = b'!';
231 /// assert_eq!(b"Hello World!", copied_message.as_slice());
232 ///
233 /// pyo3::py_run!(py, bytearray, "assert bytearray == b'Hello World.'");
234 /// # });
235 /// ```
236 fn to_vec(&self) -> Vec<u8>;
237
238 /// Resizes the bytearray object to the new length `len`.
239 ///
240 /// Note that this will invalidate any pointers obtained by [PyByteArrayMethods::data], as well as
241 /// any (unsafe) slices obtained from [PyByteArrayMethods::as_bytes] and [PyByteArrayMethods::as_bytes_mut].
242 fn resize(&self, len: usize) -> PyResult<()>;
243}
244
245impl<'py> PyByteArrayMethods<'py> for Bound<'py, PyByteArray> {
246 #[inline]
247 fn len(&self) -> usize {
248 // non-negative Py_ssize_t should always fit into Rust usize
249 unsafe { ffi::PyByteArray_Size(self.as_ptr()) as usize }
250 }
251
252 fn is_empty(&self) -> bool {
253 self.len() == 0
254 }
255
256 fn data(&self) -> *mut u8 {
257 self.as_borrowed().data()
258 }
259
260 unsafe fn as_bytes(&self) -> &[u8] {
261 unsafe { self.as_borrowed().as_bytes() }
262 }
263
264 #[allow(clippy::mut_from_ref)]
265 unsafe fn as_bytes_mut(&self) -> &mut [u8] {
266 unsafe { self.as_borrowed().as_bytes_mut() }
267 }
268
269 fn to_vec(&self) -> Vec<u8> {
270 unsafe { self.as_bytes() }.to_vec()
271 }
272
273 fn resize(&self, len: usize) -> PyResult<()> {
274 unsafe {
275 let result = ffi::PyByteArray_Resize(self.as_ptr(), len as ffi::Py_ssize_t);
276 if result == 0 {
277 Ok(())
278 } else {
279 Err(PyErr::fetch(self.py()))
280 }
281 }
282 }
283}
284
285impl<'a> Borrowed<'a, '_, PyByteArray> {
286 fn data(&self) -> *mut u8 {
287 unsafe { ffi::PyByteArray_AsString(self.as_ptr()).cast() }
288 }
289
290 #[allow(clippy::wrong_self_convention)]
291 unsafe fn as_bytes(self) -> &'a [u8] {
292 unsafe { slice::from_raw_parts(self.data(), self.len()) }
293 }
294
295 #[allow(clippy::wrong_self_convention)]
296 unsafe fn as_bytes_mut(self) -> &'a mut [u8] {
297 unsafe { slice::from_raw_parts_mut(self.data(), self.len()) }
298 }
299}
300
301impl<'py> TryFrom<&Bound<'py, PyAny>> for Bound<'py, PyByteArray> {
302 type Error = crate::PyErr;
303
304 /// Creates a new Python `bytearray` object from another Python object that
305 /// implements the buffer protocol.
306 fn try_from(value: &Bound<'py, PyAny>) -> Result<Self, Self::Error> {
307 PyByteArray::from(value)
308 }
309}
310
311#[cfg(test)]
312mod tests {
313 use crate::types::{PyAnyMethods, PyByteArray, PyByteArrayMethods};
314 use crate::{exceptions, Bound, PyAny, PyObject, Python};
315
316 #[test]
317 fn test_len() {
318 Python::with_gil(|py| {
319 let src = b"Hello Python";
320 let bytearray = PyByteArray::new(py, src);
321 assert_eq!(src.len(), bytearray.len());
322 });
323 }
324
325 #[test]
326 fn test_as_bytes() {
327 Python::with_gil(|py| {
328 let src = b"Hello Python";
329 let bytearray = PyByteArray::new(py, src);
330
331 let slice = unsafe { bytearray.as_bytes() };
332 assert_eq!(src, slice);
333 assert_eq!(bytearray.data() as *const _, slice.as_ptr());
334 });
335 }
336
337 #[test]
338 fn test_as_bytes_mut() {
339 Python::with_gil(|py| {
340 let src = b"Hello Python";
341 let bytearray = PyByteArray::new(py, src);
342
343 let slice = unsafe { bytearray.as_bytes_mut() };
344 assert_eq!(src, slice);
345 assert_eq!(bytearray.data(), slice.as_mut_ptr());
346
347 slice[0..5].copy_from_slice(b"Hi...");
348
349 assert_eq!(bytearray.str().unwrap(), "bytearray(b'Hi... Python')");
350 });
351 }
352
353 #[test]
354 fn test_to_vec() {
355 Python::with_gil(|py| {
356 let src = b"Hello Python";
357 let bytearray = PyByteArray::new(py, src);
358
359 let vec = bytearray.to_vec();
360 assert_eq!(src, vec.as_slice());
361 });
362 }
363
364 #[test]
365 fn test_from() {
366 Python::with_gil(|py| {
367 let src = b"Hello Python";
368 let bytearray = PyByteArray::new(py, src);
369
370 let ba: PyObject = bytearray.into();
371 let bytearray = PyByteArray::from(ba.bind(py)).unwrap();
372
373 assert_eq!(src, unsafe { bytearray.as_bytes() });
374 });
375 }
376
377 #[test]
378 fn test_from_err() {
379 Python::with_gil(|py| {
380 if let Err(err) = PyByteArray::from(py.None().bind(py)) {
381 assert!(err.is_instance_of::<exceptions::PyTypeError>(py));
382 } else {
383 panic!("error");
384 }
385 });
386 }
387
388 #[test]
389 fn test_try_from() {
390 Python::with_gil(|py| {
391 let src = b"Hello Python";
392 let bytearray: &Bound<'_, PyAny> = &PyByteArray::new(py, src);
393 let bytearray: Bound<'_, PyByteArray> = TryInto::try_into(bytearray).unwrap();
394
395 assert_eq!(src, unsafe { bytearray.as_bytes() });
396 });
397 }
398
399 #[test]
400 fn test_resize() {
401 Python::with_gil(|py| {
402 let src = b"Hello Python";
403 let bytearray = PyByteArray::new(py, src);
404
405 bytearray.resize(20).unwrap();
406 assert_eq!(20, bytearray.len());
407 });
408 }
409
410 #[test]
411 fn test_byte_array_new_with() -> super::PyResult<()> {
412 Python::with_gil(|py| -> super::PyResult<()> {
413 let py_bytearray = PyByteArray::new_with(py, 10, |b: &mut [u8]| {
414 b.copy_from_slice(b"Hello Rust");
415 Ok(())
416 })?;
417 let bytearray: &[u8] = unsafe { py_bytearray.as_bytes() };
418 assert_eq!(bytearray, b"Hello Rust");
419 Ok(())
420 })
421 }
422
423 #[test]
424 fn test_byte_array_new_with_zero_initialised() -> super::PyResult<()> {
425 Python::with_gil(|py| -> super::PyResult<()> {
426 let py_bytearray = PyByteArray::new_with(py, 10, |_b: &mut [u8]| Ok(()))?;
427 let bytearray: &[u8] = unsafe { py_bytearray.as_bytes() };
428 assert_eq!(bytearray, &[0; 10]);
429 Ok(())
430 })
431 }
432
433 #[test]
434 fn test_byte_array_new_with_error() {
435 use crate::exceptions::PyValueError;
436 Python::with_gil(|py| {
437 let py_bytearray_result = PyByteArray::new_with(py, 10, |_b: &mut [u8]| {
438 Err(PyValueError::new_err("Hello Crustaceans!"))
439 });
440 assert!(py_bytearray_result.is_err());
441 assert!(py_bytearray_result
442 .err()
443 .unwrap()
444 .is_instance_of::<PyValueError>(py));
445 })
446 }
447}