Skip to content

Commit

Permalink
Introduce DeserializableComponent trait and high-level `query_lates…
Browse files Browse the repository at this point in the history
…t` (#1417)

* introduce DeserializableComponent

* turn query_transform into a generic query_latest

* use DeserializableComponent everywhere it makes sense

* use SerializableComponent everywhere it makes sense

* self review

* addressed PR comments
  • Loading branch information
teh-cmc authored Feb 27, 2023
1 parent 34123fb commit c31906a
Show file tree
Hide file tree
Showing 11 changed files with 100 additions and 107 deletions.
36 changes: 21 additions & 15 deletions crates/re_data_store/src/entity_properties.rs
Original file line number Diff line number Diff line change
@@ -1,7 +1,7 @@
use re_arrow_store::LatestAtQuery;
use re_log_types::{
external::arrow2_convert::deserialize::arrow_array_deserialize_iterator, msg_bundle::Component,
EntityPath, Transform,
external::arrow2_convert::deserialize::arrow_array_deserialize_iterator,
msg_bundle::DeserializableComponent, EntityPath,
};

use crate::log_db::EntityDb;
Expand Down Expand Up @@ -38,6 +38,10 @@ pub struct EntityProperties {
pub visible: bool,
pub visible_history: ExtraQueryHistory,
pub interactive: bool,

/// Distance of the projection plane.
///
/// Only applies to pinhole cameras when in a spatial view, using 3D navigation.
pinhole_image_plane_distance: Option<ordered_float::NotNan<f32>>,
}

Expand Down Expand Up @@ -114,37 +118,39 @@ impl ExtraQueryHistory {

// ----------------------------------------------------------------------------

/// Get the latest value of the transform
/// Get the latest value for a given [`re_log_types::msg_bundle::Component`].
///
/// We first look for the transform in the classic storage system since that's
/// what most users are still using. If we don't find the transform there, then
/// we check to see if it exists in the arrow storage.
pub fn query_transform(
/// This assumes that the row we get from the store only contains a single instance for this
/// component; it will log a warning otherwise.
pub fn query_latest_single<C: DeserializableComponent>(
entity_db: &EntityDb,
entity_path: &EntityPath,
query: &LatestAtQuery,
) -> Option<Transform> {
) -> Option<C>
where
for<'b> &'b C::ArrayType: IntoIterator,
{
crate::profile_function!();

// Although it would be nice to use the `re_query` helpers for this, we would need to move
// this out of re_data_store to avoid a circular dep. Since we don't need to do a join for
// transforms this is easy enough.
// single components this is easy enough.
let data_store = &entity_db.data_store;

let components = [Transform::name()];
let components = [C::name()];

let row_indices = data_store.latest_at(query, entity_path, Transform::name(), &components)?;
let row_indices = data_store.latest_at(query, entity_path, C::name(), &components)?;

let results = data_store.get(&components, &row_indices);
let arr = results.get(0)?.as_ref()?.as_ref();

let mut iter = arrow_array_deserialize_iterator::<Transform>(arr).ok()?;
let mut iter = arrow_array_deserialize_iterator::<C>(arr).ok()?;

let transform = iter.next();
let component = iter.next();

if iter.next().is_some() {
re_log::warn_once!("Unexpected batch for Transform at: {}", entity_path);
re_log::warn_once!("Unexpected batch for {} at: {}", C::name(), entity_path);
}

transform
component
}
34 changes: 31 additions & 3 deletions crates/re_log_types/src/msg_bundle.rs
Original file line number Diff line number Diff line change
Expand Up @@ -27,6 +27,7 @@ use arrow2::{
offset::Offsets,
};
use arrow2_convert::{
deserialize::{ArrowArray, ArrowDeserialize},
field::ArrowField,
serialize::{ArrowSerialize, TryIntoArrow},
};
Expand Down Expand Up @@ -88,9 +89,8 @@ pub trait Component: ArrowField {
}
}

/// A trait to identify any [`Component`] that is ready to be collected and subsequently serialized
/// into an Arrow payload.
pub trait SerializableComponent
/// A [`Component`] that fulfils all the conditions required to be serialized as an Arrow payload.
pub trait SerializableComponent<ArrowFieldType = Self>
where
Self: Component + ArrowSerialize + ArrowField<Type = Self> + 'static,
{
Expand All @@ -101,6 +101,34 @@ impl<C> SerializableComponent for C where
{
}

/// A [`Component`] that fulfils all the conditions required to be deserialized from an Arrow
/// payload.
///
/// Note that due to the use of HRTBs in `arrow2_convert` traits, you will still need an extra HRTB
/// clause when marking a type as `DeserializableComponent`:
/// ```ignore
/// where
/// T: SerializableComponent,
/// for<'a> &'a T::ArrayType: IntoIterator,
/// ```
pub trait DeserializableComponent<ArrowFieldType = Self>
where
Self: Component,
Self: ArrowDeserialize + ArrowField<Type = ArrowFieldType> + 'static,
Self::ArrayType: ArrowArray,
for<'b> &'b Self::ArrayType: IntoIterator,
{
}

impl<C> DeserializableComponent for C
where
C: Component,
C: ArrowDeserialize + ArrowField<Type = C> + 'static,
C::ArrayType: ArrowArray,
for<'b> &'b C::ArrayType: IntoIterator,
{
}

/// A [`ComponentBundle`] holds an Arrow component column, and its field name.
///
/// A [`ComponentBundle`] can be created from a collection of any element that implements the
Expand Down
51 changes: 16 additions & 35 deletions crates/re_query/src/dataframe_util.rs
Original file line number Diff line number Diff line change
Expand Up @@ -7,12 +7,8 @@ use polars_core::prelude::*;
use re_arrow_store::ArrayExt;
use re_log_types::{
component_types::InstanceKey,
external::arrow2_convert::{
deserialize::{arrow_array_deserialize_iterator, ArrowArray, ArrowDeserialize},
field::ArrowField,
serialize::ArrowSerialize,
},
msg_bundle::Component,
external::arrow2_convert::deserialize::arrow_array_deserialize_iterator,
msg_bundle::{Component, DeserializableComponent, SerializableComponent},
};

use crate::{
Expand Down Expand Up @@ -55,10 +51,10 @@ fn fix_polars_nulls<C: Component>(array: &dyn Array) -> Box<dyn Array> {
}

/// Iterator for a single column in a dataframe as the rust-native Component type
pub fn iter_column<'a, C: Component>(df: &'a DataFrame) -> impl Iterator<Item = Option<C>> + 'a
pub fn iter_column<'a, C: DeserializableComponent>(
df: &'a DataFrame,
) -> impl Iterator<Item = Option<C>> + 'a
where
C: ArrowDeserialize + ArrowField<Type = C> + 'static,
C::ArrayType: ArrowArray,
for<'b> &'b C::ArrayType: IntoIterator,
{
let res = match df.column(C::name().as_str()) {
Expand All @@ -74,11 +70,7 @@ where
res.into_iter()
}

pub fn df_builder1<C0>(c0: &Vec<Option<C0>>) -> crate::Result<DataFrame>
where
C0: Component + 'static,
Option<C0>: ArrowSerialize + ArrowField<Type = Option<C0>>,
{
pub fn df_builder1<C0: SerializableComponent>(c0: &Vec<Option<C0>>) -> crate::Result<DataFrame> {
use arrow2::array::MutableArray;
use re_log_types::external::arrow2_convert::serialize::arrow_serialize_to_mutable_array;

Expand All @@ -92,10 +84,8 @@ where

pub fn df_builder2<C0, C1>(c0: &Vec<Option<C0>>, c1: &Vec<Option<C1>>) -> crate::Result<DataFrame>
where
C0: Component + 'static,
Option<C0>: ArrowSerialize + ArrowField<Type = Option<C0>>,
C1: Component + 'static,
Option<C1>: ArrowSerialize + ArrowField<Type = Option<C1>>,
C0: SerializableComponent,
C1: SerializableComponent,
{
use arrow2::array::MutableArray;
use re_log_types::external::arrow2_convert::serialize::arrow_serialize_to_mutable_array;
Expand All @@ -117,12 +107,9 @@ pub fn df_builder3<C0, C1, C2>(
c2: &Vec<Option<C2>>,
) -> crate::Result<DataFrame>
where
C0: Component + 'static,
Option<C0>: ArrowSerialize + ArrowField<Type = Option<C0>>,
C1: Component + 'static,
Option<C1>: ArrowSerialize + ArrowField<Type = Option<C1>>,
C2: Component + 'static,
Option<C2>: ArrowSerialize + ArrowField<Type = Option<C2>>,
C0: SerializableComponent,
C1: SerializableComponent,
C2: SerializableComponent,
{
use arrow2::array::MutableArray;
use re_log_types::external::arrow2_convert::serialize::arrow_serialize_to_mutable_array;
Expand All @@ -142,12 +129,10 @@ where
}

impl ComponentWithInstances {
pub fn as_df<C0>(&self) -> crate::Result<DataFrame>
pub fn as_df<C0: SerializableComponent + DeserializableComponent>(
&self,
) -> crate::Result<DataFrame>
where
C0: Component,
Option<C0>: ArrowSerialize + ArrowField<Type = Option<C0>>,
C0: ArrowDeserialize + ArrowField<Type = C0> + 'static,
C0::ArrayType: ArrowArray,
for<'a> &'a C0::ArrayType: IntoIterator,
{
if C0::name() != self.name {
Expand All @@ -169,8 +154,7 @@ impl ComponentWithInstances {

impl<Primary> EntityView<Primary>
where
Primary: Component + ArrowSerialize + ArrowDeserialize + ArrowField<Type = Primary> + 'static,
Primary::ArrayType: ArrowArray,
Primary: SerializableComponent + DeserializableComponent,
for<'a> &'a Primary::ArrayType: IntoIterator,
{
pub fn as_df1(&self) -> crate::Result<DataFrame> {
Expand All @@ -184,10 +168,7 @@ where

pub fn as_df2<C1>(&self) -> crate::Result<DataFrame>
where
C1: Clone + Component,
Option<C1>: ArrowSerialize + ArrowField<Type = Option<C1>>,
C1: ArrowDeserialize + ArrowField<Type = C1> + 'static,
C1::ArrayType: ArrowArray,
C1: SerializableComponent + DeserializableComponent + Clone,
for<'a> &'a C1::ArrayType: IntoIterator,
{
let instance_keys = self.primary.iter_instance_keys()?.map(Some).collect_vec();
Expand Down
32 changes: 10 additions & 22 deletions crates/re_query/src/entity_view.rs
Original file line number Diff line number Diff line change
Expand Up @@ -6,11 +6,9 @@ use re_format::arrow;
use re_log_types::{
component_types::InstanceKey,
external::arrow2_convert::{
deserialize::{arrow_array_deserialize_iterator, ArrowArray, ArrowDeserialize},
field::ArrowField,
serialize::ArrowSerialize,
deserialize::arrow_array_deserialize_iterator, field::ArrowField, serialize::ArrowSerialize,
},
msg_bundle::Component,
msg_bundle::{Component, DeserializableComponent, SerializableComponent},
ComponentName,
};

Expand Down Expand Up @@ -58,10 +56,10 @@ impl ComponentWithInstances {
}

/// Iterate over the values and convert them to a native `Component`
pub fn iter_values<C: Component>(&self) -> crate::Result<impl Iterator<Item = Option<C>> + '_>
pub fn iter_values<C: DeserializableComponent>(
&self,
) -> crate::Result<impl Iterator<Item = Option<C>> + '_>
where
C: ArrowDeserialize + ArrowField<Type = C> + 'static,
C::ArrayType: ArrowArray,
for<'a> &'a C::ArrayType: IntoIterator,
{
if C::name() != self.name {
Expand All @@ -77,10 +75,8 @@ impl ComponentWithInstances {
}

/// Look up the value that corresponds to a given `InstanceKey` and convert to `Component`
pub fn lookup<C: Component>(&self, instance_key: &InstanceKey) -> crate::Result<C>
pub fn lookup<C: DeserializableComponent>(&self, instance_key: &InstanceKey) -> crate::Result<C>
where
C: ArrowDeserialize + ArrowField<Type = C> + 'static,
C::ArrayType: ArrowArray,
for<'a> &'a C::ArrayType: IntoIterator,
{
if C::name() != self.name {
Expand Down Expand Up @@ -132,14 +128,10 @@ impl ComponentWithInstances {
}

/// Produce a `ComponentWithInstances` from native component types
pub fn from_native<C>(
pub fn from_native<C: SerializableComponent>(
instance_keys: Option<&Vec<InstanceKey>>,
values: &Vec<C>,
) -> crate::Result<ComponentWithInstances>
where
C: Component + 'static,
C: ArrowSerialize + ArrowField<Type = C>,
{
) -> crate::Result<ComponentWithInstances> {
use re_log_types::external::arrow2_convert::serialize::arrow_serialize_to_mutable_array;

let instance_keys = if let Some(keys) = instance_keys {
Expand Down Expand Up @@ -296,10 +288,8 @@ where
}
}

impl<Primary> EntityView<Primary>
impl<Primary: SerializableComponent + DeserializableComponent> EntityView<Primary>
where
Primary: Component + ArrowSerialize + ArrowDeserialize + ArrowField<Type = Primary> + 'static,
Primary::ArrayType: ArrowArray,
for<'a> &'a Primary::ArrayType: IntoIterator,
{
/// Iterate over the instance keys
Expand Down Expand Up @@ -332,12 +322,10 @@ where
/// Iterate over the values of a `Component`.
///
/// Always produces an iterator of length `self.primary.len()`
pub fn iter_component<C: Component>(
pub fn iter_component<C: DeserializableComponent + Clone>(
&self,
) -> crate::Result<impl Iterator<Item = Option<C>> + '_>
where
C: Clone + ArrowDeserialize + ArrowField<Type = C> + 'static,
C::ArrayType: ArrowArray,
for<'b> &'b C::ArrayType: IntoIterator,
{
let component = self.components.get(&C::name());
Expand Down
14 changes: 3 additions & 11 deletions crates/re_query/src/visit.rs
Original file line number Diff line number Diff line change
Expand Up @@ -44,12 +44,7 @@
use re_log_types::{
component_types::InstanceKey,
external::arrow2_convert::{
deserialize::{ArrowArray, ArrowDeserialize},
field::ArrowField,
serialize::ArrowSerialize,
},
msg_bundle::Component,
msg_bundle::{Component, DeserializableComponent, SerializableComponent},
};

use crate::EntityView;
Expand All @@ -72,8 +67,7 @@ macro_rules! create_visitor {

) -> crate::Result<()>
where $(
$CC: Clone + ArrowDeserialize + ArrowField<Type = $CC> + 'static,
$CC::ArrayType: ArrowArray,
$CC: Clone + DeserializableComponent,
for<'a> &'a $CC::ArrayType: IntoIterator,
)*
{
Expand All @@ -98,10 +92,8 @@ macro_rules! create_visitor {
);
}

impl<Primary> EntityView<Primary>
impl<Primary: SerializableComponent + DeserializableComponent> EntityView<Primary>
where
Primary: Component + ArrowSerialize + ArrowDeserialize + ArrowField<Type = Primary> + 'static,
Primary::ArrayType: ArrowArray,
for<'a> &'a Primary::ArrayType: IntoIterator,
{
create_visitor! {visit1; ;}
Expand Down
7 changes: 4 additions & 3 deletions crates/re_viewer/src/misc/space_info.rs
Original file line number Diff line number Diff line change
Expand Up @@ -3,7 +3,7 @@ use std::collections::BTreeMap;
use nohash_hasher::IntSet;

use re_arrow_store::{LatestAtQuery, TimeInt, Timeline};
use re_data_store::{log_db::EntityDb, query_transform, EntityPath, EntityTree};
use re_data_store::{log_db::EntityDb, query_latest_single, EntityPath, EntityTree};
use re_log_types::{Transform, ViewCoordinates};
use re_query::query_entity_with_primary;

Expand Down Expand Up @@ -112,7 +112,8 @@ impl SpaceInfoCollection {
tree: &EntityTree,
query: &LatestAtQuery,
) {
if let Some(transform) = query_transform(entity_db, &tree.path, query) {
if let Some(transform) = query_latest_single::<Transform>(entity_db, &tree.path, query)
{
// A set transform (likely non-identity) - create a new space.
parent_space
.child_spaces
Expand Down Expand Up @@ -156,7 +157,7 @@ impl SpaceInfoCollection {
let mut spaces_info = Self::default();

// Start at the root. The root is always part of the collection!
if query_transform(entity_db, &EntityPath::root(), &query).is_some() {
if query_latest_single::<Transform>(entity_db, &EntityPath::root(), &query).is_some() {
re_log::warn_once!("The root entity has a 'transform' component! This will have no effect. Did you mean to apply the transform elsewhere?");
}
let mut root_space_info = SpaceInfo::new(EntityPath::root());
Expand Down
Loading

1 comment on commit c31906a

@github-actions
Copy link

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

Rust Benchmark

Benchmark suite Current: c31906a Previous: 34123fb Ratio
datastore/insert/batch/rects/insert 553475 ns/iter (± 2321) 549163 ns/iter (± 2031) 1.01
datastore/latest_at/batch/rects/query 1849 ns/iter (± 45) 1846 ns/iter (± 7) 1.00
datastore/latest_at/missing_components/primary 357 ns/iter (± 0) 355 ns/iter (± 0) 1.01
datastore/latest_at/missing_components/secondaries 438 ns/iter (± 1) 423 ns/iter (± 3) 1.04
datastore/range/batch/rects/query 153348 ns/iter (± 109) 152640 ns/iter (± 555) 1.00
mono_points_arrow/generate_message_bundles 47887125 ns/iter (± 966688) 49140283 ns/iter (± 1710411) 0.97
mono_points_arrow/generate_messages 126221483 ns/iter (± 1199828) 138227626 ns/iter (± 8448348) 0.91
mono_points_arrow/encode_log_msg 160135846 ns/iter (± 1922368) 164924427 ns/iter (± 2386829) 0.97
mono_points_arrow/encode_total 332667330 ns/iter (± 2479116) 355860002 ns/iter (± 2427617) 0.93
mono_points_arrow/decode_log_msg 178838297 ns/iter (± 1315718) 186595401 ns/iter (± 1287110) 0.96
mono_points_arrow/decode_message_bundles 65131150 ns/iter (± 802289) 74760592 ns/iter (± 1537929) 0.87
mono_points_arrow/decode_total 241253413 ns/iter (± 1814790) 256120396 ns/iter (± 2077994) 0.94
batch_points_arrow/generate_message_bundles 334076 ns/iter (± 509) 332919 ns/iter (± 2119) 1.00
batch_points_arrow/generate_messages 6141 ns/iter (± 13) 6210 ns/iter (± 53) 0.99
batch_points_arrow/encode_log_msg 366232 ns/iter (± 2426) 370721 ns/iter (± 1954) 0.99
batch_points_arrow/encode_total 732741 ns/iter (± 2727) 726085 ns/iter (± 3905) 1.01
batch_points_arrow/decode_log_msg 349966 ns/iter (± 1421) 347020 ns/iter (± 1289) 1.01
batch_points_arrow/decode_message_bundles 1987 ns/iter (± 2) 1985 ns/iter (± 15) 1.00
batch_points_arrow/decode_total 354712 ns/iter (± 1035) 356050 ns/iter (± 1457) 1.00
arrow_mono_points/insert 6199287558 ns/iter (± 26669187) 7141936290 ns/iter (± 18219870) 0.87
arrow_mono_points/query 1747844 ns/iter (± 13148) 1763477 ns/iter (± 12201) 0.99
arrow_batch_points/insert 2724636 ns/iter (± 54017) 2705162 ns/iter (± 21006) 1.01
arrow_batch_points/query 17375 ns/iter (± 79) 17519 ns/iter (± 139) 0.99
tuid/Tuid::random 34 ns/iter (± 0) 34 ns/iter (± 0) 1

This comment was automatically generated by workflow using github-action-benchmark.

Please sign in to comment.