From d0a177363e8f550c352efce118139c9abb53dce0 Mon Sep 17 00:00:00 2001
From: Aykut Bozkurt
Date: Mon, 23 Sep 2024 13:01:41 +0300
Subject: [PATCH] Adds crunchy_map type conversion from/to Arrow

---
Reviewer notes (free-form text after the `---` marker; not part of the commit
message and not part of the diff):

* src/type_compat/map.rs keeps a process-global `CRUNCHY_MAP_CONTEXT` that
  `reset_crunchy_map_context()` rebuilds; `is_crunchy_map_type()` and
  `CrunchyMap::type_oid()` panic via `expect` if it was never initialized.
* `is_crunchy_map_type()` records the matched type oid in the context, and
  `CrunchyMap::type_oid()` returns that recorded oid, so `type_oid()` is only
  usable after a successful `is_crunchy_map_type()` call.
* `CrunchyMap` wraps a `pgrx::Array` of heap tuples; conversion to and from a
  datum delegates to the array's own `IntoDatum`/`FromDatum` impls.
* NOTE(review): `GetSysCacheOid` is called with the `TYPEOID` cache and the
  extension schema oid as a second key -- confirm that this lookup really
  restricts the match to types in that schema.
* NOTE(review): `get_crunchy_map_context()` hands out `&'static mut` references
  to a `static mut` -- confirm no two such references are ever live at once.

 src/type_compat.rs     |   1 +
 src/type_compat/map.rs | 169 +++++++++++++++++++++++++++++++++++++++++
 2 files changed, 170 insertions(+)
 create mode 100644 src/type_compat/map.rs

diff --git a/src/type_compat.rs b/src/type_compat.rs
index 5d1ba00..061f992 100644
--- a/src/type_compat.rs
+++ b/src/type_compat.rs
@@ -1,2 +1,3 @@
 pub(crate) mod geometry;
+pub(crate) mod map;
 pub(crate) mod pg_arrow_type_conversions;
diff --git a/src/type_compat/map.rs b/src/type_compat/map.rs
new file mode 100644
index 0000000..6fb5f15
--- /dev/null
+++ b/src/type_compat/map.rs
@@ -0,0 +1,169 @@
+use once_cell::sync::OnceCell;
+use pgrx::{
+    datum::UnboxDatum,
+    pg_sys::{
+        self, get_extension_oid, get_extension_schema, Anum_pg_type_oid, AsPgCStr, GetSysCacheOid,
+        InvalidOid, Oid, SysCacheIdentifier::TYPEOID,
+    },
+    prelude::PgHeapTuple,
+    AllocatedByRust, FromDatum, IntoDatum,
+};
+
+use crate::pgrx_utils::is_domain_of_array_type;
+
+// we need to reset the crunchy_map context at each copy start
+static mut CRUNCHY_MAP_CONTEXT: OnceCell<CrunchyMapContext> = OnceCell::new();
+
+fn get_crunchy_map_context() -> &'static mut CrunchyMapContext {
+    unsafe {
+        CRUNCHY_MAP_CONTEXT
+            .get_mut()
+            .expect("crunchy_map context is not initialized")
+    }
+}
+
+pub(crate) fn reset_crunchy_map_context() {
+    unsafe { CRUNCHY_MAP_CONTEXT.take() };
+
+    unsafe {
+        CRUNCHY_MAP_CONTEXT
+            .set(CrunchyMapContext::new())
+            .expect("failed to reset crunchy_map context")
+    };
+}
+
+pub(crate) fn is_crunchy_map_type(typoid: Oid) -> bool {
+    let crunchy_map_context = get_crunchy_map_context();
+
+    if crunchy_map_context.crunchy_map_ext_schema_oid.is_none() {
+        return false;
+    }
+
+    // crunchy map is a domain type over array of key-value pairs
+    if !is_domain_of_array_type(typoid) {
+        return false;
+    }
+
+    let crunchy_map_ext_schema_oid = crunchy_map_context
+        .crunchy_map_ext_schema_oid
+        .expect("expected crunchy_map is created");
+
+    let found_typoid = unsafe {
+        GetSysCacheOid(
+            TYPEOID as _,
+            Anum_pg_type_oid as _,
+            typoid.into_datum().unwrap(),
+            crunchy_map_ext_schema_oid.into_datum().unwrap(),
+            pg_sys::Datum::from(0),
+            pg_sys::Datum::from(0),
+        )
+    };
+
+    let is_crunchy_map = found_typoid != InvalidOid;
+
+    if is_crunchy_map {
+        crunchy_map_context
+            .per_crunchy_map_context
+            .set_current_crunchy_map_typoid(typoid);
+    }
+
+    is_crunchy_map
+}
+
+#[derive(Debug, PartialEq, Clone)]
+struct CrunchyMapPerTypeContext {
+    current_crunchy_map_typoid: Option<Oid>,
+}
+
+impl CrunchyMapPerTypeContext {
+    fn set_current_crunchy_map_typoid(&mut self, typoid: Oid) {
+        self.current_crunchy_map_typoid = Some(typoid);
+    }
+}
+
+#[derive(Debug, PartialEq, Clone)]
+struct CrunchyMapContext {
+    crunchy_map_ext_oid: Option<Oid>,
+    crunchy_map_ext_schema_oid: Option<Oid>,
+    per_crunchy_map_context: CrunchyMapPerTypeContext,
+}
+
+impl CrunchyMapContext {
+    fn new() -> Self {
+        let crunchy_map_ext_oid = unsafe { get_extension_oid("crunchy_map".as_pg_cstr(), true) };
+        let crunchy_map_ext_oid = if crunchy_map_ext_oid == InvalidOid {
+            None
+        } else {
+            Some(crunchy_map_ext_oid)
+        };
+
+        let crunchy_map_ext_schema_oid = crunchy_map_ext_oid
+            .map(|crunchy_map_ext_oid| unsafe { get_extension_schema(crunchy_map_ext_oid) });
+
+        Self {
+            crunchy_map_ext_oid,
+            crunchy_map_ext_schema_oid,
+            per_crunchy_map_context: CrunchyMapPerTypeContext {
+                current_crunchy_map_typoid: None,
+            },
+        }
+    }
+}
+
+// crunchy_map is a domain type over array of key-value pairs
+pub(crate) struct CrunchyMap<'a> {
+    pub(crate) entries: pgrx::Array<'a, PgHeapTuple<'a, AllocatedByRust>>,
+}
+
+impl IntoDatum for CrunchyMap<'_> {
+    fn into_datum(self) -> Option<pg_sys::Datum> {
+        // since the map is stored as an array of tuples, we can simply convert the array to a datum
+        self.entries.into_datum()
+    }
+
+    fn type_oid() -> pg_sys::Oid {
+        get_crunchy_map_context()
+            .per_crunchy_map_context
+            .current_crunchy_map_typoid
+            .expect("crunchy_map type context is not initialized")
+    }
+}
+
+impl FromDatum for CrunchyMap<'_> {
+    unsafe fn from_polymorphic_datum(
+        datum: pg_sys::Datum,
+        is_null: bool,
+        _typoid: pg_sys::Oid,
+    ) -> Option<Self>
+    where
+        Self: Sized,
+    {
+        if is_null {
+            None
+        } else {
+            let is_null = false;
+            let entries = pgrx::Array::<PgHeapTuple<AllocatedByRust>>::from_datum(datum, is_null)
+                .expect("cannot convert datum to crunchy_map entries");
+
+            Some(CrunchyMap { entries })
+        }
+    }
+}
+
+unsafe impl<'a> UnboxDatum for CrunchyMap<'a> {
+    type As<'src> = Self
+    where
+        Self: 'src;
+
+    unsafe fn unbox<'src>(datum: pgrx::datum::Datum<'src>) -> Self::As<'src>
+    where
+        Self: 'src,
+    {
+        let is_null = false;
+        let entries =
+            pgrx::Array::<PgHeapTuple<AllocatedByRust>>::from_datum(datum.sans_lifetime(), is_null)
+                .expect("cannot convert datum to crunchy_map entries");
+
+        CrunchyMap { entries }
+    }
+}