Skip to content

Commit 36d01fb

Browse files
committed
Revert "Enhance ArrowArrayStream handling by adding ARROW_STREAM_NAME and improving memory management in drop_stream function"
This reverts commit cd99b1d.
1 parent cd99b1d commit 36d01fb

1 file changed

Lines changed: 13 additions & 25 deletions

File tree

src/dataframe.rs

Lines changed: 13 additions & 25 deletions
Original file line numberDiff line numberDiff line change
@@ -23,7 +23,7 @@ use arrow::array::{new_null_array, RecordBatch, RecordBatchReader};
2323
use arrow::compute::can_cast_types;
2424
use arrow::error::ArrowError;
2525
use arrow::ffi::FFI_ArrowSchema;
26-
use arrow::ffi_stream::{FFI_ArrowArrayStream, ARROW_STREAM_NAME};
26+
use arrow::ffi_stream::FFI_ArrowArrayStream;
2727
use arrow::pyarrow::FromPyArrow;
2828
use datafusion::arrow::datatypes::{Schema, SchemaRef};
2929
use datafusion::arrow::pyarrow::{PyArrowType, ToPyArrow};
@@ -39,7 +39,6 @@ use datafusion::prelude::*;
3939
use datafusion_ffi::table_provider::FFI_TableProvider;
4040
use futures::{StreamExt, TryStreamExt};
4141
use pyo3::exceptions::PyValueError;
42-
use pyo3::ffi;
4342
use pyo3::prelude::*;
4443
use pyo3::pybacked::PyBackedStr;
4544
use pyo3::types::{PyCapsule, PyList, PyTuple, PyTupleMethods};
@@ -59,17 +58,6 @@ use crate::{
5958
expr::{sort_expr::PySortExpr, PyExpr},
6059
};
6160

62-
unsafe extern "C" fn drop_stream(capsule: *mut ffi::PyObject) {
63-
if capsule.is_null() {
64-
return;
65-
}
66-
let name = CString::new(ARROW_STREAM_NAME).unwrap();
67-
let stream_ptr = ffi::PyCapsule_GetPointer(capsule, name.as_ptr()) as *mut FFI_ArrowArrayStream;
68-
if !stream_ptr.is_null() {
69-
drop(Box::from_raw(stream_ptr));
70-
}
71-
}
72-
7361
// https://github.com/apache/datafusion-python/pull/1016#discussion_r1983239116
7462
// - we have not decided on the table_provider approach yet
7563
// this is an interim implementation
@@ -970,20 +958,20 @@ impl PyDataFrame {
970958
!stream_ptr.is_null(),
971959
"ArrowArrayStream pointer should never be null"
972960
);
973-
let stream_name = CString::new(ARROW_STREAM_NAME).unwrap();
974-
let capsule = unsafe {
975-
ffi::PyCapsule_New(
976-
stream_ptr as *mut c_void,
977-
stream_name.as_ptr(),
978-
Some(drop_stream),
961+
let stream_capsule_name = CString::new("arrow_array_stream").unwrap();
962+
unsafe {
963+
PyCapsule::new_bound_with_destructor(
964+
py,
965+
stream_ptr,
966+
Some(stream_capsule_name),
967+
|ptr: *mut FFI_ArrowArrayStream, _| {
968+
if !ptr.is_null() {
969+
unsafe { Box::from_raw(ptr) };
970+
}
971+
},
979972
)
980-
};
981-
if capsule.is_null() {
982-
unsafe { drop(Box::from_raw(stream_ptr)) };
983-
Err(PyErr::fetch(py).into())
984-
} else {
985-
Ok(unsafe { Bound::from_owned_ptr(py, capsule) })
986973
}
974+
.map_err(PyDataFusionError::from)
987975
}
988976

989977
fn execute_stream(&self, py: Python) -> PyDataFusionResult<PyRecordBatchStream> {

0 commit comments

Comments
 (0)