pyo3/types/bytes.rs
1use crate::ffi_ptr_ext::FfiPtrExt;
2use crate::instance::{Borrowed, Bound};
3use crate::types::any::PyAnyMethods;
4use crate::{ffi, Py, PyAny, PyResult, Python};
5use std::ops::Index;
6use std::slice::SliceIndex;
7use std::str;
8
9/// Represents a Python `bytes` object.
10///
11/// This type is immutable.
12///
13/// Values of this type are accessed via PyO3's smart pointers, e.g. as
14/// [`Py<PyBytes>`][crate::Py] or [`Bound<'py, PyBytes>`][Bound].
15///
16/// For APIs available on `bytes` objects, see the [`PyBytesMethods`] trait which is implemented for
17/// [`Bound<'py, PyBytes>`][Bound].
18///
19/// # Equality
20///
21/// For convenience, [`Bound<'py, PyBytes>`][Bound] implements [`PartialEq<[u8]>`][PartialEq] to allow comparing the
22/// data in the Python bytes to a Rust `[u8]` byte slice.
23///
24/// This is not always the most appropriate way to compare Python bytes, as Python bytes subclasses
25/// may have different equality semantics. In situations where subclasses overriding equality might be
26/// relevant, use [`PyAnyMethods::eq`], at cost of the additional overhead of a Python method call.
27///
28/// ```rust
29/// # use pyo3::prelude::*;
30/// use pyo3::types::PyBytes;
31///
32/// # Python::with_gil(|py| {
33/// let py_bytes = PyBytes::new(py, b"foo".as_slice());
34/// // via PartialEq<[u8]>
35/// assert_eq!(py_bytes, b"foo".as_slice());
36///
37/// // via Python equality
38/// let other = PyBytes::new(py, b"foo".as_slice());
39/// assert!(py_bytes.as_any().eq(other).unwrap());
40///
41/// // Note that `eq` will convert its argument to Python using `IntoPyObject`.
42/// // Byte collections are specialized, so that the following slice will indeed
43/// // convert into a `bytes` object and not a `list`:
44/// assert!(py_bytes.as_any().eq(b"foo".as_slice()).unwrap());
45/// # });
46/// ```
47#[repr(transparent)]
48pub struct PyBytes(PyAny);
49
50pyobject_native_type_core!(PyBytes, pyobject_native_static_type_object!(ffi::PyBytes_Type), #checkfunction=ffi::PyBytes_Check);
51
52impl PyBytes {
53 /// Creates a new Python bytestring object.
54 /// The bytestring is initialized by copying the data from the `&[u8]`.
55 ///
56 /// Panics if out of memory.
57 pub fn new<'p>(py: Python<'p>, s: &[u8]) -> Bound<'p, PyBytes> {
58 let ptr = s.as_ptr().cast();
59 let len = s.len() as ffi::Py_ssize_t;
60 unsafe {
61 ffi::PyBytes_FromStringAndSize(ptr, len)
62 .assume_owned(py)
63 .downcast_into_unchecked()
64 }
65 }
66
67 /// Creates a new Python `bytes` object with an `init` closure to write its contents.
68 /// Before calling `init` the bytes' contents are zero-initialised.
69 /// * If Python raises a MemoryError on the allocation, `new_with` will return
70 /// it inside `Err`.
71 /// * If `init` returns `Err(e)`, `new_with` will return `Err(e)`.
72 /// * If `init` returns `Ok(())`, `new_with` will return `Ok(&PyBytes)`.
73 ///
74 /// # Examples
75 ///
76 /// ```
77 /// use pyo3::{prelude::*, types::PyBytes};
78 ///
79 /// # fn main() -> PyResult<()> {
80 /// Python::with_gil(|py| -> PyResult<()> {
81 /// let py_bytes = PyBytes::new_with(py, 10, |bytes: &mut [u8]| {
82 /// bytes.copy_from_slice(b"Hello Rust");
83 /// Ok(())
84 /// })?;
85 /// let bytes: &[u8] = py_bytes.extract()?;
86 /// assert_eq!(bytes, b"Hello Rust");
87 /// Ok(())
88 /// })
89 /// # }
90 /// ```
91 #[inline]
92 pub fn new_with<F>(py: Python<'_>, len: usize, init: F) -> PyResult<Bound<'_, PyBytes>>
93 where
94 F: FnOnce(&mut [u8]) -> PyResult<()>,
95 {
96 unsafe {
97 let pyptr = ffi::PyBytes_FromStringAndSize(std::ptr::null(), len as ffi::Py_ssize_t);
98 // Check for an allocation error and return it
99 let pybytes = pyptr.assume_owned_or_err(py)?.downcast_into_unchecked();
100 let buffer: *mut u8 = ffi::PyBytes_AsString(pyptr).cast();
101 debug_assert!(!buffer.is_null());
102 // Zero-initialise the uninitialised bytestring
103 std::ptr::write_bytes(buffer, 0u8, len);
104 // (Further) Initialise the bytestring in init
105 // If init returns an Err, pypybytearray will automatically deallocate the buffer
106 init(std::slice::from_raw_parts_mut(buffer, len)).map(|_| pybytes)
107 }
108 }
109
110 /// Creates a new Python byte string object from a raw pointer and length.
111 ///
112 /// Panics if out of memory.
113 ///
114 /// # Safety
115 ///
116 /// This function dereferences the raw pointer `ptr` as the
117 /// leading pointer of a slice of length `len`. [As with
118 /// `std::slice::from_raw_parts`, this is
119 /// unsafe](https://doc.rust-lang.org/std/slice/fn.from_raw_parts.html#safety).
120 pub unsafe fn from_ptr(py: Python<'_>, ptr: *const u8, len: usize) -> Bound<'_, PyBytes> {
121 unsafe {
122 ffi::PyBytes_FromStringAndSize(ptr.cast(), len as isize)
123 .assume_owned(py)
124 .downcast_into_unchecked()
125 }
126 }
127}
128
129/// Implementation of functionality for [`PyBytes`].
130///
131/// These methods are defined for the `Bound<'py, PyBytes>` smart pointer, so to use method call
132/// syntax these methods are separated into a trait, because stable Rust does not yet support
133/// `arbitrary_self_types`.
134#[doc(alias = "PyBytes")]
135pub trait PyBytesMethods<'py>: crate::sealed::Sealed {
136 /// Gets the Python string as a byte slice.
137 fn as_bytes(&self) -> &[u8];
138}
139
140impl<'py> PyBytesMethods<'py> for Bound<'py, PyBytes> {
141 #[inline]
142 fn as_bytes(&self) -> &[u8] {
143 self.as_borrowed().as_bytes()
144 }
145}
146
147impl<'a> Borrowed<'a, '_, PyBytes> {
148 /// Gets the Python string as a byte slice.
149 #[allow(clippy::wrong_self_convention)]
150 pub(crate) fn as_bytes(self) -> &'a [u8] {
151 unsafe {
152 let buffer = ffi::PyBytes_AsString(self.as_ptr()) as *const u8;
153 let length = ffi::PyBytes_Size(self.as_ptr()) as usize;
154 debug_assert!(!buffer.is_null());
155 std::slice::from_raw_parts(buffer, length)
156 }
157 }
158}
159
160impl Py<PyBytes> {
161 /// Gets the Python bytes as a byte slice. Because Python bytes are
162 /// immutable, the result may be used for as long as the reference to
163 /// `self` is held, including when the GIL is released.
164 pub fn as_bytes<'a>(&'a self, py: Python<'_>) -> &'a [u8] {
165 self.bind_borrowed(py).as_bytes()
166 }
167}
168
169/// This is the same way [Vec] is indexed.
170impl<I: SliceIndex<[u8]>> Index<I> for Bound<'_, PyBytes> {
171 type Output = I::Output;
172
173 fn index(&self, index: I) -> &Self::Output {
174 &self.as_bytes()[index]
175 }
176}
177
178/// Compares whether the Python bytes object is equal to the [u8].
179///
180/// In some cases Python equality might be more appropriate; see the note on [`PyBytes`].
181impl PartialEq<[u8]> for Bound<'_, PyBytes> {
182 #[inline]
183 fn eq(&self, other: &[u8]) -> bool {
184 self.as_borrowed() == *other
185 }
186}
187
188/// Compares whether the Python bytes object is equal to the [u8].
189///
190/// In some cases Python equality might be more appropriate; see the note on [`PyBytes`].
191impl PartialEq<&'_ [u8]> for Bound<'_, PyBytes> {
192 #[inline]
193 fn eq(&self, other: &&[u8]) -> bool {
194 self.as_borrowed() == **other
195 }
196}
197
198/// Compares whether the Python bytes object is equal to the [u8].
199///
200/// In some cases Python equality might be more appropriate; see the note on [`PyBytes`].
201impl PartialEq<Bound<'_, PyBytes>> for [u8] {
202 #[inline]
203 fn eq(&self, other: &Bound<'_, PyBytes>) -> bool {
204 *self == other.as_borrowed()
205 }
206}
207
208/// Compares whether the Python bytes object is equal to the [u8].
209///
210/// In some cases Python equality might be more appropriate; see the note on [`PyBytes`].
211impl PartialEq<&'_ Bound<'_, PyBytes>> for [u8] {
212 #[inline]
213 fn eq(&self, other: &&Bound<'_, PyBytes>) -> bool {
214 *self == other.as_borrowed()
215 }
216}
217
218/// Compares whether the Python bytes object is equal to the [u8].
219///
220/// In some cases Python equality might be more appropriate; see the note on [`PyBytes`].
221impl PartialEq<Bound<'_, PyBytes>> for &'_ [u8] {
222 #[inline]
223 fn eq(&self, other: &Bound<'_, PyBytes>) -> bool {
224 **self == other.as_borrowed()
225 }
226}
227
228/// Compares whether the Python bytes object is equal to the [u8].
229///
230/// In some cases Python equality might be more appropriate; see the note on [`PyBytes`].
231impl PartialEq<[u8]> for &'_ Bound<'_, PyBytes> {
232 #[inline]
233 fn eq(&self, other: &[u8]) -> bool {
234 self.as_borrowed() == other
235 }
236}
237
238/// Compares whether the Python bytes object is equal to the [u8].
239///
240/// In some cases Python equality might be more appropriate; see the note on [`PyBytes`].
241impl PartialEq<[u8]> for Borrowed<'_, '_, PyBytes> {
242 #[inline]
243 fn eq(&self, other: &[u8]) -> bool {
244 self.as_bytes() == other
245 }
246}
247
248/// Compares whether the Python bytes object is equal to the [u8].
249///
250/// In some cases Python equality might be more appropriate; see the note on [`PyBytes`].
251impl PartialEq<&[u8]> for Borrowed<'_, '_, PyBytes> {
252 #[inline]
253 fn eq(&self, other: &&[u8]) -> bool {
254 *self == **other
255 }
256}
257
258/// Compares whether the Python bytes object is equal to the [u8].
259///
260/// In some cases Python equality might be more appropriate; see the note on [`PyBytes`].
261impl PartialEq<Borrowed<'_, '_, PyBytes>> for [u8] {
262 #[inline]
263 fn eq(&self, other: &Borrowed<'_, '_, PyBytes>) -> bool {
264 other == self
265 }
266}
267
268/// Compares whether the Python bytes object is equal to the [u8].
269///
270/// In some cases Python equality might be more appropriate; see the note on [`PyBytes`].
271impl PartialEq<Borrowed<'_, '_, PyBytes>> for &'_ [u8] {
272 #[inline]
273 fn eq(&self, other: &Borrowed<'_, '_, PyBytes>) -> bool {
274 other == self
275 }
276}
277
278#[cfg(test)]
279mod tests {
280 use super::*;
281
282 #[test]
283 fn test_bytes_index() {
284 Python::with_gil(|py| {
285 let bytes = PyBytes::new(py, b"Hello World");
286 assert_eq!(bytes[1], b'e');
287 });
288 }
289
290 #[test]
291 fn test_bound_bytes_index() {
292 Python::with_gil(|py| {
293 let bytes = PyBytes::new(py, b"Hello World");
294 assert_eq!(bytes[1], b'e');
295
296 let bytes = &bytes;
297 assert_eq!(bytes[1], b'e');
298 });
299 }
300
301 #[test]
302 fn test_bytes_new_with() -> super::PyResult<()> {
303 Python::with_gil(|py| -> super::PyResult<()> {
304 let py_bytes = PyBytes::new_with(py, 10, |b: &mut [u8]| {
305 b.copy_from_slice(b"Hello Rust");
306 Ok(())
307 })?;
308 let bytes: &[u8] = py_bytes.extract()?;
309 assert_eq!(bytes, b"Hello Rust");
310 Ok(())
311 })
312 }
313
314 #[test]
315 fn test_bytes_new_with_zero_initialised() -> super::PyResult<()> {
316 Python::with_gil(|py| -> super::PyResult<()> {
317 let py_bytes = PyBytes::new_with(py, 10, |_b: &mut [u8]| Ok(()))?;
318 let bytes: &[u8] = py_bytes.extract()?;
319 assert_eq!(bytes, &[0; 10]);
320 Ok(())
321 })
322 }
323
324 #[test]
325 fn test_bytes_new_with_error() {
326 use crate::exceptions::PyValueError;
327 Python::with_gil(|py| {
328 let py_bytes_result = PyBytes::new_with(py, 10, |_b: &mut [u8]| {
329 Err(PyValueError::new_err("Hello Crustaceans!"))
330 });
331 assert!(py_bytes_result.is_err());
332 assert!(py_bytes_result
333 .err()
334 .unwrap()
335 .is_instance_of::<PyValueError>(py));
336 });
337 }
338
339 #[test]
340 fn test_comparisons() {
341 Python::with_gil(|py| {
342 let b = b"hello, world".as_slice();
343 let py_bytes = PyBytes::new(py, b);
344
345 assert_eq!(py_bytes, b"hello, world".as_slice());
346
347 assert_eq!(py_bytes, b);
348 assert_eq!(&py_bytes, b);
349 assert_eq!(b, py_bytes);
350 assert_eq!(b, &py_bytes);
351
352 assert_eq!(py_bytes, *b);
353 assert_eq!(&py_bytes, *b);
354 assert_eq!(*b, py_bytes);
355 assert_eq!(*b, &py_bytes);
356
357 let py_string = py_bytes.as_borrowed();
358
359 assert_eq!(py_string, b);
360 assert_eq!(&py_string, b);
361 assert_eq!(b, py_string);
362 assert_eq!(b, &py_string);
363
364 assert_eq!(py_string, *b);
365 assert_eq!(*b, py_string);
366 })
367 }
368}