Skip to content

Commit

Permalink
clarify & document memory ownership of passed arrow C FFI structs
Browse files Browse the repository at this point in the history
  • Loading branch information
Wumpf committed Nov 20, 2023
1 parent 324c3e6 commit ca6a0cf
Show file tree
Hide file tree
Showing 5 changed files with 38 additions and 23 deletions.
40 changes: 23 additions & 17 deletions crates/rerun_c/src/lib.rs
Original file line number Diff line number Diff line change
Expand Up @@ -123,7 +123,7 @@ pub struct CDataRow {
pub entity_path: CStringView,
pub num_instances: u32,
pub num_data_cells: u32,
pub data_cells: *const CDataCell,
pub data_cells: *mut CDataCell,
}

#[repr(u32)]
Expand Down Expand Up @@ -559,58 +559,64 @@ pub extern "C" fn rr_recording_stream_reset_time(stream: CRecordingStream) {

#[allow(unsafe_code)]
#[allow(clippy::result_large_err)]
#[allow(clippy::needless_pass_by_value)] // Conceptually we're consuming the data_row, as we take ownership of data it points to.
fn rr_log_impl(
stream: CRecordingStream,
data_row: *const CDataRow,
data_row: CDataRow,
inject_time: bool,
) -> Result<(), CError> {
let stream = recording_stream(stream)?;

let data_row = ptr::try_ptr_as_ref(data_row, "data_row")?;

let CDataRow {
entity_path,
num_instances,
num_data_cells,
data_cells,
} = *data_row;
} = data_row;

let entity_path = entity_path.as_str("entity_path")?;
let entity_path = EntityPath::parse_forgiving(entity_path);

let num_data_cells = num_data_cells as usize;
re_log::debug!(
"rerun_log {entity_path:?}, num_instances: {num_instances}, num_data_cells: {num_data_cells}",
);

let mut cells = re_log_types::DataCellVec::default();
cells.reserve(num_data_cells as usize);
cells.reserve(num_data_cells);

let data_cells = unsafe { std::slice::from_raw_parts(data_cells, num_data_cells as usize) };
let data_cells = unsafe { std::slice::from_raw_parts_mut(data_cells, num_data_cells) };

for data_cell in data_cells {
// Arrow2 implements drop for ArrowArray and ArrowSchema.
//
// Therefore, for things to work correctly we have to take ownership of the data cell!
// The C interface is documented to take ownership of the data cell - the user should NOT call `release`.
// This makes sense because from here on out we want to manage the lifetime of the underlying schema and array data:
// the schema won't survive a loop iteration since it's reference passed for import, whereas the ArrowArray lives
// on a longer within the resulting arrow::Array.
let CDataCell {
component_name,
array,
schema,
} = &data_cell;
} = unsafe { std::ptr::read(data_cell) };

// It would be nice to now mark the data_cell as "consumed" by setting the original release method to nullptr.
// This would signifies to the calling code that the data_cell is no longer owned.
// However, Arrow2 doesn't allow us to access the the fields of the ArrowArray and ArrowSchema structs.

let component_name = component_name.as_str("data_cells[i].component_name")?;
let component_name = ComponentName::from(component_name);

let field = unsafe { arrow2::ffi::import_field_from_c(schema) }.map_err(|err| {
let field = unsafe { arrow2::ffi::import_field_from_c(&schema) }.map_err(|err| {
CError::new(
CErrorCode::ArrowFfiSchemaImportError,
&format!("Failed to import ffi schema: {err}"),
)
})?;

// We need to copy the array since `import_array_from_c` takes ownership of the array.
// Since we don't touch the original afterwards anymore and array doesn't have a drop implementation,
// it should be safe to do so.
let ffi_array: arrow2::ffi::ArrowArray = unsafe { std::mem::transmute_copy(array) };

let values = unsafe { arrow2::ffi::import_array_from_c(ffi_array, field.data_type) }
.map_err(|err| {
let values =
unsafe { arrow2::ffi::import_array_from_c(array, field.data_type) }.map_err(|err| {
CError::new(
CErrorCode::ArrowFfiArrayImportError,
&format!("Failed to import ffi array: {err}"),
Expand Down Expand Up @@ -650,7 +656,7 @@ fn rr_log_impl(
#[no_mangle]
pub unsafe extern "C" fn rr_recording_stream_log(
stream: CRecordingStream,
data_row: *const CDataRow,
data_row: CDataRow,
inject_time: bool,
error: *mut CError,
) {
Expand Down
8 changes: 6 additions & 2 deletions crates/rerun_c/src/rerun.h
Original file line number Diff line number Diff line change
Expand Up @@ -159,7 +159,7 @@ typedef struct {
uint32_t num_data_cells;

/// One for each component.
const rr_data_cell* data_cells;
rr_data_cell* data_cells;
} rr_data_row;

/// Error codes returned by the Rerun C SDK as part of `rr_error`.
Expand Down Expand Up @@ -360,8 +360,12 @@ extern void rr_recording_stream_reset_time(rr_recording_stream stream);
///
/// If `inject_time` is set to `true`, the row's timestamp data will be
/// overridden using the recording streams internal clock.
///
/// Takes ownership of the passed data cells and will release underlying
/// arrow data once it is no longer needed.
/// Any pointers passed via `rr_string` can be safely freed after this call.
extern void rr_recording_stream_log(
rr_recording_stream stream, const rr_data_row* data_row, bool inject_time, rr_error* error
rr_recording_stream stream, rr_data_row data_row, bool inject_time, rr_error* error
);

// ----------------------------------------------------------------------------
Expand Down
8 changes: 6 additions & 2 deletions rerun_cpp/src/rerun/c/rerun.h

Some generated files are not rendered by default. Learn more about how customized files appear on GitHub.

2 changes: 1 addition & 1 deletion rerun_cpp/src/rerun/data_cell.hpp
Original file line number Diff line number Diff line change
Expand Up @@ -35,7 +35,7 @@ namespace rerun {

/// To rerun C API data cell.
///
/// Only valid as long as the C++ data cell is alive.
/// The resulting `rr_data_cell` keeps the `arrow::Array` alive until it is released.
Error to_c_ffi_struct(rr_data_cell& out_cell) const;
};
} // namespace rerun
3 changes: 2 additions & 1 deletion rerun_cpp/src/rerun/recording_stream.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -236,7 +236,8 @@ namespace rerun {
c_data_row.data_cells = c_data_cells.data();

rr_error status = {};
rr_recording_stream_log(_id, &c_data_row, inject_time, &status);
rr_recording_stream_log(_id, c_data_row, inject_time, &status);

return status;
}
} // namespace rerun

0 comments on commit ca6a0cf

Please sign in to comment.