From cc3800cbae5588d19106655f23c8000db5b86349 Mon Sep 17 00:00:00 2001 From: Miles Granger Date: Thu, 29 Feb 2024 22:16:11 +0100 Subject: [PATCH 1/3] Add pyo3 build config --- Cargo.lock | 1 + cramjam-python/Cargo.toml | 3 +++ cramjam-python/build.rs | 3 +++ 3 files changed, 7 insertions(+) create mode 100644 cramjam-python/build.rs diff --git a/Cargo.lock b/Cargo.lock index f86bf36b..5b7a5e65 100644 --- a/Cargo.lock +++ b/Cargo.lock @@ -304,6 +304,7 @@ version = "2.8.1" dependencies = [ "libcramjam 0.2.0 (registry+https://github.com/rust-lang/crates.io-index)", "pyo3", + "pyo3-build-config", ] [[package]] diff --git a/cramjam-python/Cargo.toml b/cramjam-python/Cargo.toml index 20a72b72..c9e4cd79 100644 --- a/cramjam-python/Cargo.toml +++ b/cramjam-python/Cargo.toml @@ -20,3 +20,6 @@ extension-module = ["pyo3/extension-module"] [dependencies] pyo3 = { version = "^0.20", default-features = false, features = ["macros"] } libcramjam = "0.2.0" + +[build-dependencies] +pyo3-build-config = "^0.20" diff --git a/cramjam-python/build.rs b/cramjam-python/build.rs new file mode 100644 index 00000000..0475124b --- /dev/null +++ b/cramjam-python/build.rs @@ -0,0 +1,3 @@ +fn main() { + pyo3_build_config::use_pyo3_cfgs(); +} From a477ed325f818204b3b5c1a81fe42614a46f1f61 Mon Sep 17 00:00:00 2001 From: Miles Granger Date: Fri, 1 Mar 2024 07:40:08 +0100 Subject: [PATCH 2/3] Kinda working, kinda not [skip ci] --- cramjam-python/src/io.rs | 47 ++++++++++++++++++++++++++++++++-------- 1 file changed, 38 insertions(+), 9 deletions(-) diff --git a/cramjam-python/src/io.rs b/cramjam-python/src/io.rs index d9561204..123aaa5e 100644 --- a/cramjam-python/src/io.rs +++ b/cramjam-python/src/io.rs @@ -244,19 +244,48 @@ impl<'py> FromPyObject<'py> for PythonBuffer { } } +#[cfg(not(PyPy))] +fn make_py_buffer(obj: &PyAny) -> PyResult { + let mut buf = mem::MaybeUninit::uninit(); + let rc = unsafe { ffi::PyObject_GetBuffer(obj.as_ptr(), buf.as_mut_ptr(), ffi::PyBUF_CONTIG_RO) }; + if rc != 0 { + return Err(exceptions::PyBufferError::new_err( + "Failed to get buffer, is it C contiguous, and shape is not null?", + )); + } + let buf = unsafe { mem::MaybeUninit::::assume_init(buf) }; + Ok(buf) +} + +#[cfg(PyPy)] +fn make_py_buffer(obj: &PyAny) -> PyResult { + let is_memview = unsafe { ffi::PyMemoryView_Check(obj.as_ptr()) } == 1; + + let mut object = Python::with_gil(|py| obj.to_object(py)); + + if !is_memview { + let ptr = unsafe { ffi::PyMemoryView_FromObject(obj.as_ptr()) }; + Python::with_gil(|py| { + object = unsafe { PyObject::from_owned_ptr(py, ptr) }; + }) + } + let mut buf = mem::MaybeUninit::uninit(); + let rc = unsafe { ffi::PyObject_GetBuffer(object.as_ptr(), buf.as_mut_ptr(), ffi::PyBUF_CONTIG_RO) }; + if rc != 0 { + return Err(exceptions::PyBufferError::new_err( + "Failed to get buffer, is it C contiguous, and shape is not null?", + )); + } + let buf = unsafe { mem::MaybeUninit::::assume_init(buf) }; + Ok(buf) +} + impl<'py> TryFrom<&'py PyAny> for PythonBuffer { type Error = PyErr; fn try_from(obj: &'py PyAny) -> Result { - let mut buf = Box::new(mem::MaybeUninit::uninit()); - let rc = unsafe { ffi::PyObject_GetBuffer(obj.as_ptr(), buf.as_mut_ptr(), ffi::PyBUF_CONTIG_RO) }; - if rc != 0 { - return Err(exceptions::PyBufferError::new_err( - "Failed to get buffer, is it C contiguous, and shape is not null?", - )); - } - let buf = Box::new(unsafe { mem::MaybeUninit::::assume_init(*buf) }); + let py_buffer = make_py_buffer(obj)?; let buf = Self { - inner: std::pin::Pin::from(buf), + inner: std::pin::Pin::from(Box::new(py_buffer)), pos: 0, }; // sanity checks From 51e0988cf27d89a7c52cbcbb0917bb1b842f214a Mon Sep 17 00:00:00 2001 From: Miles Granger Date: Fri, 1 Mar 2024 10:20:31 +0100 Subject: [PATCH 3/3] Trying doing things the right way, CPython happy, PyPy sad [skip ci] --- cramjam-python/src/io.rs | 65 +++++++++++------------------------- cramjam-python/src/lib.rs | 16 ++++----- cramjam-python/src/lz4.rs | 4 +-- cramjam-python/src/snappy.rs | 4 +-- 4 files changed, 32 insertions(+), 57 deletions(-) diff --git a/cramjam-python/src/io.rs b/cramjam-python/src/io.rs index 123aaa5e..992e66d0 100644 --- a/cramjam-python/src/io.rs +++ b/cramjam-python/src/io.rs @@ -18,7 +18,7 @@ use std::path::PathBuf; pub(crate) trait AsBytes { fn as_bytes(&self) -> &[u8]; - fn as_bytes_mut(&mut self) -> &mut [u8]; + fn as_bytes_mut(&mut self) -> PyResult<&mut [u8]>; } /// A native Rust file-like object. Reading and writing takes place @@ -49,7 +49,7 @@ impl AsBytes for RustyFile { entire file into memory; consider using cramjam.Buffer" ) } - fn as_bytes_mut(&mut self) -> &mut [u8] { + fn as_bytes_mut(&mut self) -> PyResult<&mut [u8]> { unimplemented!( "Converting a File to bytes is not supported, as it'd require reading the \ entire file into memory; consider using cramjam.Buffer" @@ -194,7 +194,7 @@ impl PythonBuffer { } /// Is the Python buffer readonly pub fn readonly(&self) -> bool { - self.inner.readonly != 0 + self.inner.readonly == 1 } /// Get the underlying buffer as a slice of bytes pub fn as_slice(&self) -> &[u8] { @@ -202,13 +202,16 @@ impl PythonBuffer { } /// Get the underlying buffer as a mutable slice of bytes pub fn as_slice_mut(&mut self) -> PyResult<&mut [u8]> { - // TODO: For v3 release, add self.readonly check; bytes is readonly but - // v1 and v2 releases have not treated it as such. + if self.readonly() { + let repr = Python::with_gil(|py| unsafe { PyObject::from_borrowed_ptr(py, self.inner.obj) }.to_string()); + let msg = format!("The output buffer '{}' is readonly, refusing to overwrite.", repr); + return Err(pyo3::exceptions::PyTypeError::new_err(msg)); + } Ok(unsafe { std::slice::from_raw_parts_mut(self.buf_ptr() as *mut u8, self.len_bytes()) }) } /// If underlying buffer is c_contiguous pub fn is_c_contiguous(&self) -> bool { - unsafe { ffi::PyBuffer_IsContiguous(&*self.inner as *const ffi::Py_buffer, b'C' as std::os::raw::c_char) != 0 } + unsafe { ffi::PyBuffer_IsContiguous(&*self.inner as *const ffi::Py_buffer, b'C' as std::os::raw::c_char) == 1 } } /// Dimensions for buffer pub fn dimensions(&self) -> usize { @@ -244,46 +247,17 @@ impl<'py> FromPyObject<'py> for PythonBuffer { } } -#[cfg(not(PyPy))] -fn make_py_buffer(obj: &PyAny) -> PyResult { - let mut buf = mem::MaybeUninit::uninit(); - let rc = unsafe { ffi::PyObject_GetBuffer(obj.as_ptr(), buf.as_mut_ptr(), ffi::PyBUF_CONTIG_RO) }; - if rc != 0 { - return Err(exceptions::PyBufferError::new_err( - "Failed to get buffer, is it C contiguous, and shape is not null?", - )); - } - let buf = unsafe { mem::MaybeUninit::::assume_init(buf) }; - Ok(buf) -} - -#[cfg(PyPy)] -fn make_py_buffer(obj: &PyAny) -> PyResult { - let is_memview = unsafe { ffi::PyMemoryView_Check(obj.as_ptr()) } == 1; - - let mut object = Python::with_gil(|py| obj.to_object(py)); - - if !is_memview { - let ptr = unsafe { ffi::PyMemoryView_FromObject(obj.as_ptr()) }; - Python::with_gil(|py| { - object = unsafe { PyObject::from_owned_ptr(py, ptr) }; - }) - } - let mut buf = mem::MaybeUninit::uninit(); - let rc = unsafe { ffi::PyObject_GetBuffer(object.as_ptr(), buf.as_mut_ptr(), ffi::PyBUF_CONTIG_RO) }; - if rc != 0 { - return Err(exceptions::PyBufferError::new_err( - "Failed to get buffer, is it C contiguous, and shape is not null?", - )); - } - let buf = unsafe { mem::MaybeUninit::::assume_init(buf) }; - Ok(buf) -} - impl<'py> TryFrom<&'py PyAny> for PythonBuffer { type Error = PyErr; fn try_from(obj: &'py PyAny) -> Result { - let py_buffer = make_py_buffer(obj)?; + let mut buf = mem::MaybeUninit::uninit(); + let rc = unsafe { ffi::PyObject_GetBuffer(obj.as_ptr(), buf.as_mut_ptr(), ffi::PyBUF_CONTIG_RO) }; + if rc != 0 { + return Err(exceptions::PyBufferError::new_err( + "Failed to get buffer, is it C contiguous, and shape is not null?", + )); + } + let py_buffer = unsafe { mem::MaybeUninit::::assume_init(buf) }; let buf = Self { inner: std::pin::Pin::from(Box::new(py_buffer)), pos: 0, @@ -357,8 +331,9 @@ impl AsBytes for RustyBuffer { fn as_bytes(&self) -> &[u8] { self.inner.get_ref().as_slice() } - fn as_bytes_mut(&mut self) -> &mut [u8] { - self.inner.get_mut().as_mut_slice() + fn as_bytes_mut(&mut self) -> PyResult<&mut [u8]> { + let slice = self.inner.get_mut().as_mut_slice(); + Ok(slice) } } diff --git a/cramjam-python/src/lib.rs b/cramjam-python/src/lib.rs index c494db86..f5fea3ba 100644 --- a/cramjam-python/src/lib.rs +++ b/cramjam-python/src/lib.rs @@ -101,18 +101,18 @@ impl<'a> AsBytes for BytesType<'a> { } } } - fn as_bytes_mut(&mut self) -> &mut [u8] { + fn as_bytes_mut(&mut self) -> PyResult<&mut [u8]> { match self { BytesType::RustyBuffer(b) => { let mut py_ref = b.borrow_mut(); - let bytes = py_ref.as_bytes_mut(); - unsafe { std::slice::from_raw_parts_mut(bytes.as_mut_ptr(), bytes.len()) } + let bytes = py_ref.as_bytes_mut()?; + Ok(unsafe { std::slice::from_raw_parts_mut(bytes.as_mut_ptr(), bytes.len()) }) } - BytesType::PyBuffer(b) => b.as_slice_mut().unwrap(), + BytesType::PyBuffer(b) => b.as_slice_mut(), BytesType::RustyFile(b) => { let mut py_ref = b.borrow_mut(); - let bytes = py_ref.as_bytes_mut(); - unsafe { std::slice::from_raw_parts_mut(bytes.as_mut_ptr(), bytes.len()) } + let bytes = py_ref.as_bytes_mut()?; + Ok(unsafe { std::slice::from_raw_parts_mut(bytes.as_mut_ptr(), bytes.len()) }) } } } @@ -212,7 +212,7 @@ macro_rules! generic { }) }, _ => { - let bytes_out = $output.as_bytes_mut(); + let bytes_out = $output.as_bytes_mut()?; $py.allow_threads(|| { $op(f_in, &mut Cursor::new(bytes_out) $(, $level)? ) }) @@ -237,7 +237,7 @@ macro_rules! generic { }) }, _ => { - let bytes_out = $output.as_bytes_mut(); + let bytes_out = $output.as_bytes_mut()?; $py.allow_threads(|| { $op(bytes_in, &mut Cursor::new(bytes_out) $(, $level)?) }) diff --git a/cramjam-python/src/lz4.rs b/cramjam-python/src/lz4.rs index 016c4470..c7894a00 100644 --- a/cramjam-python/src/lz4.rs +++ b/cramjam-python/src/lz4.rs @@ -146,7 +146,7 @@ pub fn compress_block( #[pyfunction] pub fn decompress_block_into(py: Python, input: BytesType, mut output: BytesType) -> PyResult { let bytes = input.as_bytes(); - let out_bytes = output.as_bytes_mut(); + let out_bytes = output.as_bytes_mut()?; py.allow_threads(|| libcramjam::lz4::block::decompress_into(bytes, out_bytes, Some(true))) .map_err(DecompressionError::from_err) .map(|v| v as _) @@ -180,7 +180,7 @@ pub fn compress_block_into( store_size: Option, ) -> PyResult { let bytes = data.as_bytes(); - let out_bytes = output.as_bytes_mut(); + let out_bytes = output.as_bytes_mut()?; py.allow_threads(|| { libcramjam::lz4::block::compress_into(bytes, out_bytes, compression.map(|v| v as _), acceleration, store_size) }) diff --git a/cramjam-python/src/snappy.rs b/cramjam-python/src/snappy.rs index 1cd9ed83..9133c7af 100644 --- a/cramjam-python/src/snappy.rs +++ b/cramjam-python/src/snappy.rs @@ -100,7 +100,7 @@ pub fn decompress_into(py: Python, input: BytesType, mut output: BytesType) -> P #[pyfunction] pub fn compress_raw_into(py: Python, input: BytesType, mut output: BytesType) -> PyResult { let bytes_in = input.as_bytes(); - let bytes_out = output.as_bytes_mut(); + let bytes_out = output.as_bytes_mut()?; py.allow_threads(|| libcramjam::snappy::raw::compress(bytes_in, bytes_out)) .map_err(CompressionError::from_err) } @@ -109,7 +109,7 @@ pub fn compress_raw_into(py: Python, input: BytesType, mut output: BytesType) -> #[pyfunction] pub fn decompress_raw_into(py: Python, input: BytesType, mut output: BytesType) -> PyResult { let bytes_in = input.as_bytes(); - let bytes_out = output.as_bytes_mut(); + let bytes_out = output.as_bytes_mut()?; py.allow_threads(|| libcramjam::snappy::raw::decompress(bytes_in, bytes_out)) .map_err(DecompressionError::from_err) }