pyo3/types/
bytes.rs

1use crate::ffi_ptr_ext::FfiPtrExt;
2use crate::instance::{Borrowed, Bound};
3use crate::types::any::PyAnyMethods;
4use crate::{ffi, Py, PyAny, PyResult, Python};
5use std::ops::Index;
6use std::slice::SliceIndex;
7use std::str;
8
9/// Represents a Python `bytes` object.
10///
11/// This type is immutable.
12///
13/// Values of this type are accessed via PyO3's smart pointers, e.g. as
14/// [`Py<PyBytes>`][crate::Py] or [`Bound<'py, PyBytes>`][Bound].
15///
16/// For APIs available on `bytes` objects, see the [`PyBytesMethods`] trait which is implemented for
17/// [`Bound<'py, PyBytes>`][Bound].
18///
19/// # Equality
20///
21/// For convenience, [`Bound<'py, PyBytes>`][Bound] implements [`PartialEq<[u8]>`][PartialEq] to allow comparing the
22/// data in the Python bytes to a Rust `[u8]` byte slice.
23///
24/// This is not always the most appropriate way to compare Python bytes, as Python bytes subclasses
25/// may have different equality semantics. In situations where subclasses overriding equality might be
26/// relevant, use [`PyAnyMethods::eq`], at cost of the additional overhead of a Python method call.
27///
28/// ```rust
29/// # use pyo3::prelude::*;
30/// use pyo3::types::PyBytes;
31///
32/// # Python::with_gil(|py| {
33/// let py_bytes = PyBytes::new(py, b"foo".as_slice());
34/// // via PartialEq<[u8]>
35/// assert_eq!(py_bytes, b"foo".as_slice());
36///
37/// // via Python equality
38/// let other = PyBytes::new(py, b"foo".as_slice());
39/// assert!(py_bytes.as_any().eq(other).unwrap());
40///
41/// // Note that `eq` will convert its argument to Python using `IntoPyObject`.
42/// // Byte collections are specialized, so that the following slice will indeed
43/// // convert into a `bytes` object and not a `list`:
44/// assert!(py_bytes.as_any().eq(b"foo".as_slice()).unwrap());
45/// # });
46/// ```
47#[repr(transparent)]
48pub struct PyBytes(PyAny);
49
50pyobject_native_type_core!(PyBytes, pyobject_native_static_type_object!(ffi::PyBytes_Type), #checkfunction=ffi::PyBytes_Check);
51
52impl PyBytes {
53    /// Creates a new Python bytestring object.
54    /// The bytestring is initialized by copying the data from the `&[u8]`.
55    ///
56    /// Panics if out of memory.
57    pub fn new<'p>(py: Python<'p>, s: &[u8]) -> Bound<'p, PyBytes> {
58        let ptr = s.as_ptr().cast();
59        let len = s.len() as ffi::Py_ssize_t;
60        unsafe {
61            ffi::PyBytes_FromStringAndSize(ptr, len)
62                .assume_owned(py)
63                .downcast_into_unchecked()
64        }
65    }
66
67    /// Creates a new Python `bytes` object with an `init` closure to write its contents.
68    /// Before calling `init` the bytes' contents are zero-initialised.
69    /// * If Python raises a MemoryError on the allocation, `new_with` will return
70    ///   it inside `Err`.
71    /// * If `init` returns `Err(e)`, `new_with` will return `Err(e)`.
72    /// * If `init` returns `Ok(())`, `new_with` will return `Ok(&PyBytes)`.
73    ///
74    /// # Examples
75    ///
76    /// ```
77    /// use pyo3::{prelude::*, types::PyBytes};
78    ///
79    /// # fn main() -> PyResult<()> {
80    /// Python::with_gil(|py| -> PyResult<()> {
81    ///     let py_bytes = PyBytes::new_with(py, 10, |bytes: &mut [u8]| {
82    ///         bytes.copy_from_slice(b"Hello Rust");
83    ///         Ok(())
84    ///     })?;
85    ///     let bytes: &[u8] = py_bytes.extract()?;
86    ///     assert_eq!(bytes, b"Hello Rust");
87    ///     Ok(())
88    /// })
89    /// # }
90    /// ```
91    #[inline]
92    pub fn new_with<F>(py: Python<'_>, len: usize, init: F) -> PyResult<Bound<'_, PyBytes>>
93    where
94        F: FnOnce(&mut [u8]) -> PyResult<()>,
95    {
96        unsafe {
97            let pyptr = ffi::PyBytes_FromStringAndSize(std::ptr::null(), len as ffi::Py_ssize_t);
98            // Check for an allocation error and return it
99            let pybytes = pyptr.assume_owned_or_err(py)?.downcast_into_unchecked();
100            let buffer: *mut u8 = ffi::PyBytes_AsString(pyptr).cast();
101            debug_assert!(!buffer.is_null());
102            // Zero-initialise the uninitialised bytestring
103            std::ptr::write_bytes(buffer, 0u8, len);
104            // (Further) Initialise the bytestring in init
105            // If init returns an Err, pypybytearray will automatically deallocate the buffer
106            init(std::slice::from_raw_parts_mut(buffer, len)).map(|_| pybytes)
107        }
108    }
109
110    /// Creates a new Python byte string object from a raw pointer and length.
111    ///
112    /// Panics if out of memory.
113    ///
114    /// # Safety
115    ///
116    /// This function dereferences the raw pointer `ptr` as the
117    /// leading pointer of a slice of length `len`. [As with
118    /// `std::slice::from_raw_parts`, this is
119    /// unsafe](https://doc.rust-lang.org/std/slice/fn.from_raw_parts.html#safety).
120    pub unsafe fn from_ptr(py: Python<'_>, ptr: *const u8, len: usize) -> Bound<'_, PyBytes> {
121        unsafe {
122            ffi::PyBytes_FromStringAndSize(ptr.cast(), len as isize)
123                .assume_owned(py)
124                .downcast_into_unchecked()
125        }
126    }
127}
128
129/// Implementation of functionality for [`PyBytes`].
130///
131/// These methods are defined for the `Bound<'py, PyBytes>` smart pointer, so to use method call
132/// syntax these methods are separated into a trait, because stable Rust does not yet support
133/// `arbitrary_self_types`.
134#[doc(alias = "PyBytes")]
135pub trait PyBytesMethods<'py>: crate::sealed::Sealed {
136    /// Gets the Python string as a byte slice.
137    fn as_bytes(&self) -> &[u8];
138}
139
140impl<'py> PyBytesMethods<'py> for Bound<'py, PyBytes> {
141    #[inline]
142    fn as_bytes(&self) -> &[u8] {
143        self.as_borrowed().as_bytes()
144    }
145}
146
147impl<'a> Borrowed<'a, '_, PyBytes> {
148    /// Gets the Python string as a byte slice.
149    #[allow(clippy::wrong_self_convention)]
150    pub(crate) fn as_bytes(self) -> &'a [u8] {
151        unsafe {
152            let buffer = ffi::PyBytes_AsString(self.as_ptr()) as *const u8;
153            let length = ffi::PyBytes_Size(self.as_ptr()) as usize;
154            debug_assert!(!buffer.is_null());
155            std::slice::from_raw_parts(buffer, length)
156        }
157    }
158}
159
160impl Py<PyBytes> {
161    /// Gets the Python bytes as a byte slice. Because Python bytes are
162    /// immutable, the result may be used for as long as the reference to
163    /// `self` is held, including when the GIL is released.
164    pub fn as_bytes<'a>(&'a self, py: Python<'_>) -> &'a [u8] {
165        self.bind_borrowed(py).as_bytes()
166    }
167}
168
169/// This is the same way [Vec] is indexed.
170impl<I: SliceIndex<[u8]>> Index<I> for Bound<'_, PyBytes> {
171    type Output = I::Output;
172
173    fn index(&self, index: I) -> &Self::Output {
174        &self.as_bytes()[index]
175    }
176}
177
178/// Compares whether the Python bytes object is equal to the [u8].
179///
180/// In some cases Python equality might be more appropriate; see the note on [`PyBytes`].
181impl PartialEq<[u8]> for Bound<'_, PyBytes> {
182    #[inline]
183    fn eq(&self, other: &[u8]) -> bool {
184        self.as_borrowed() == *other
185    }
186}
187
188/// Compares whether the Python bytes object is equal to the [u8].
189///
190/// In some cases Python equality might be more appropriate; see the note on [`PyBytes`].
191impl PartialEq<&'_ [u8]> for Bound<'_, PyBytes> {
192    #[inline]
193    fn eq(&self, other: &&[u8]) -> bool {
194        self.as_borrowed() == **other
195    }
196}
197
198/// Compares whether the Python bytes object is equal to the [u8].
199///
200/// In some cases Python equality might be more appropriate; see the note on [`PyBytes`].
201impl PartialEq<Bound<'_, PyBytes>> for [u8] {
202    #[inline]
203    fn eq(&self, other: &Bound<'_, PyBytes>) -> bool {
204        *self == other.as_borrowed()
205    }
206}
207
208/// Compares whether the Python bytes object is equal to the [u8].
209///
210/// In some cases Python equality might be more appropriate; see the note on [`PyBytes`].
211impl PartialEq<&'_ Bound<'_, PyBytes>> for [u8] {
212    #[inline]
213    fn eq(&self, other: &&Bound<'_, PyBytes>) -> bool {
214        *self == other.as_borrowed()
215    }
216}
217
218/// Compares whether the Python bytes object is equal to the [u8].
219///
220/// In some cases Python equality might be more appropriate; see the note on [`PyBytes`].
221impl PartialEq<Bound<'_, PyBytes>> for &'_ [u8] {
222    #[inline]
223    fn eq(&self, other: &Bound<'_, PyBytes>) -> bool {
224        **self == other.as_borrowed()
225    }
226}
227
228/// Compares whether the Python bytes object is equal to the [u8].
229///
230/// In some cases Python equality might be more appropriate; see the note on [`PyBytes`].
231impl PartialEq<[u8]> for &'_ Bound<'_, PyBytes> {
232    #[inline]
233    fn eq(&self, other: &[u8]) -> bool {
234        self.as_borrowed() == other
235    }
236}
237
238/// Compares whether the Python bytes object is equal to the [u8].
239///
240/// In some cases Python equality might be more appropriate; see the note on [`PyBytes`].
241impl PartialEq<[u8]> for Borrowed<'_, '_, PyBytes> {
242    #[inline]
243    fn eq(&self, other: &[u8]) -> bool {
244        self.as_bytes() == other
245    }
246}
247
248/// Compares whether the Python bytes object is equal to the [u8].
249///
250/// In some cases Python equality might be more appropriate; see the note on [`PyBytes`].
251impl PartialEq<&[u8]> for Borrowed<'_, '_, PyBytes> {
252    #[inline]
253    fn eq(&self, other: &&[u8]) -> bool {
254        *self == **other
255    }
256}
257
258/// Compares whether the Python bytes object is equal to the [u8].
259///
260/// In some cases Python equality might be more appropriate; see the note on [`PyBytes`].
261impl PartialEq<Borrowed<'_, '_, PyBytes>> for [u8] {
262    #[inline]
263    fn eq(&self, other: &Borrowed<'_, '_, PyBytes>) -> bool {
264        other == self
265    }
266}
267
268/// Compares whether the Python bytes object is equal to the [u8].
269///
270/// In some cases Python equality might be more appropriate; see the note on [`PyBytes`].
271impl PartialEq<Borrowed<'_, '_, PyBytes>> for &'_ [u8] {
272    #[inline]
273    fn eq(&self, other: &Borrowed<'_, '_, PyBytes>) -> bool {
274        other == self
275    }
276}
277
278#[cfg(test)]
279mod tests {
280    use super::*;
281
282    #[test]
283    fn test_bytes_index() {
284        Python::with_gil(|py| {
285            let bytes = PyBytes::new(py, b"Hello World");
286            assert_eq!(bytes[1], b'e');
287        });
288    }
289
290    #[test]
291    fn test_bound_bytes_index() {
292        Python::with_gil(|py| {
293            let bytes = PyBytes::new(py, b"Hello World");
294            assert_eq!(bytes[1], b'e');
295
296            let bytes = &bytes;
297            assert_eq!(bytes[1], b'e');
298        });
299    }
300
301    #[test]
302    fn test_bytes_new_with() -> super::PyResult<()> {
303        Python::with_gil(|py| -> super::PyResult<()> {
304            let py_bytes = PyBytes::new_with(py, 10, |b: &mut [u8]| {
305                b.copy_from_slice(b"Hello Rust");
306                Ok(())
307            })?;
308            let bytes: &[u8] = py_bytes.extract()?;
309            assert_eq!(bytes, b"Hello Rust");
310            Ok(())
311        })
312    }
313
314    #[test]
315    fn test_bytes_new_with_zero_initialised() -> super::PyResult<()> {
316        Python::with_gil(|py| -> super::PyResult<()> {
317            let py_bytes = PyBytes::new_with(py, 10, |_b: &mut [u8]| Ok(()))?;
318            let bytes: &[u8] = py_bytes.extract()?;
319            assert_eq!(bytes, &[0; 10]);
320            Ok(())
321        })
322    }
323
324    #[test]
325    fn test_bytes_new_with_error() {
326        use crate::exceptions::PyValueError;
327        Python::with_gil(|py| {
328            let py_bytes_result = PyBytes::new_with(py, 10, |_b: &mut [u8]| {
329                Err(PyValueError::new_err("Hello Crustaceans!"))
330            });
331            assert!(py_bytes_result.is_err());
332            assert!(py_bytes_result
333                .err()
334                .unwrap()
335                .is_instance_of::<PyValueError>(py));
336        });
337    }
338
339    #[test]
340    fn test_comparisons() {
341        Python::with_gil(|py| {
342            let b = b"hello, world".as_slice();
343            let py_bytes = PyBytes::new(py, b);
344
345            assert_eq!(py_bytes, b"hello, world".as_slice());
346
347            assert_eq!(py_bytes, b);
348            assert_eq!(&py_bytes, b);
349            assert_eq!(b, py_bytes);
350            assert_eq!(b, &py_bytes);
351
352            assert_eq!(py_bytes, *b);
353            assert_eq!(&py_bytes, *b);
354            assert_eq!(*b, py_bytes);
355            assert_eq!(*b, &py_bytes);
356
357            let py_string = py_bytes.as_borrowed();
358
359            assert_eq!(py_string, b);
360            assert_eq!(&py_string, b);
361            assert_eq!(b, py_string);
362            assert_eq!(b, &py_string);
363
364            assert_eq!(py_string, *b);
365            assert_eq!(*b, py_string);
366        })
367    }
368}
⚠️ Internal Docs ⚠️ Not Public API 👉 Official Docs Here