From e26633793303c1ac865dc57c6d371c0e3e2fd518 Mon Sep 17 00:00:00 2001 From: Manish Goregaokar Date: Tue, 10 Sep 2024 07:34:55 -0700 Subject: [PATCH] Add a Format parameter to MultiFieldsULE, add Index8 format (#5522) --- utils/zerovec/derive/src/make_varule.rs | 6 ++-- utils/zerovec/src/lib.rs | 2 +- utils/zerovec/src/ule/multi.rs | 5 ++-- utils/zerovec/src/varzerovec/components.rs | 35 ++++++++++++++++++++++ utils/zerovec/src/varzerovec/mod.rs | 2 +- utils/zerovec/src/varzerovec/owned.rs | 5 +--- 6 files changed, 45 insertions(+), 10 deletions(-) diff --git a/utils/zerovec/derive/src/make_varule.rs b/utils/zerovec/derive/src/make_varule.rs index 36a6f6e7a9e..597140d32cf 100644 --- a/utils/zerovec/derive/src/make_varule.rs +++ b/utils/zerovec/derive/src/make_varule.rs @@ -522,7 +522,8 @@ impl<'a> UnsizedFields<'a> { quote!( let lengths = [#(#lengths),*]; - let mut multi = zerovec::ule::MultiFieldsULE::new_from_lengths_partially_initialized(&lengths, #out); + // Todo: index type should be settable by attribute + let mut multi = zerovec::ule::MultiFieldsULE::::new_from_lengths_partially_initialized(&lengths, #out); unsafe { #(#writers;)* } @@ -539,7 +540,8 @@ impl<'a> UnsizedFields<'a> { for field in self.fields.iter() { lengths.push(field.encode_func(quote!(encode_var_ule_len), quote!())); } - quote!(zerovec::ule::MultiFieldsULE::compute_encoded_len_for(&[#(#lengths),*])) + // Todo: index type should be settable by attribute + quote!(zerovec::ule::MultiFieldsULE::::compute_encoded_len_for(&[#(#lengths),*])) } } diff --git a/utils/zerovec/src/lib.rs b/utils/zerovec/src/lib.rs index 4f54d9fbc7b..214039a1faf 100644 --- a/utils/zerovec/src/lib.rs +++ b/utils/zerovec/src/lib.rs @@ -293,7 +293,7 @@ pub mod vecs { #[doc(no_inline)] pub use crate::varzerovec::{VarZeroSlice, VarZeroVec}; - pub use crate::varzerovec::{Index16, Index32, VarZeroVecFormat, VarZeroVecOwned}; + pub use crate::varzerovec::{Index16, Index32, Index8, VarZeroVecFormat, VarZeroVecOwned}; pub use crate::flexzerovec::{FlexZeroSlice, FlexZeroVec, FlexZeroVecOwned}; } diff --git a/utils/zerovec/src/ule/multi.rs b/utils/zerovec/src/ule/multi.rs index d5ae94ba7f9..9cdb226488d 100644 --- a/utils/zerovec/src/ule/multi.rs +++ b/utils/zerovec/src/ule/multi.rs @@ -4,6 +4,7 @@ use super::*; use crate::varzerovec::Index32; +use crate::vecs::VarZeroVecFormat; use crate::VarZeroSlice; use core::mem; @@ -17,9 +18,9 @@ use core::mem; /// Internally, it is represented by a VarZeroSlice. #[derive(PartialEq, Eq, Debug)] #[repr(transparent)] -pub struct MultiFieldsULE(VarZeroSlice<[u8], Index32>); +pub struct MultiFieldsULE(VarZeroSlice<[u8], Format>); -impl MultiFieldsULE { +impl MultiFieldsULE { /// Compute the amount of bytes needed to support elements with lengths `lengths` #[inline] pub fn compute_encoded_len_for(lengths: &[usize]) -> usize { diff --git a/utils/zerovec/src/varzerovec/components.rs b/utils/zerovec/src/varzerovec/components.rs index 6bc3af8965b..8a06c304f3d 100644 --- a/utils/zerovec/src/varzerovec/components.rs +++ b/utils/zerovec/src/varzerovec/components.rs @@ -30,6 +30,9 @@ pub(super) const MAX_INDEX: usize = u32::MAX as usize; /// and all of its associated items are hidden from the docs. #[allow(clippy::missing_safety_doc)] // no safety section for you, don't implement this trait period pub unsafe trait VarZeroVecFormat: 'static + Sized { + /// The error to show when unable to construct a vec + #[doc(hidden)] + const TOO_LARGE_ERROR: &'static str; #[doc(hidden)] const INDEX_WIDTH: usize; #[doc(hidden)] @@ -50,6 +53,14 @@ pub unsafe trait VarZeroVecFormat: 'static + Sized { fn rawbytes_from_byte_slice_unchecked_mut(bytes: &mut [u8]) -> &mut [Self::RawBytes]; } +/// This is a [`VarZeroVecFormat`] that stores u8s in the index array. +/// Will have a smaller data size, but it's *extremely* likely for larger arrays +/// to be unrepresentable (and error on construction). Should probably be used +/// for known-small arrays, where all but the last field are known-small. +#[derive(Copy, Clone, Debug, Hash, PartialEq, Eq, PartialOrd, Ord)] +#[allow(clippy::exhaustive_structs)] // marker +pub struct Index8; + /// This is a [`VarZeroVecFormat`] that stores u16s in the index array. /// Will have a smaller data size, but it's more likely for larger arrays /// to be unrepresentable (and error on construction) @@ -66,7 +77,29 @@ pub struct Index16; #[allow(clippy::exhaustive_structs)] // marker pub struct Index32; +unsafe impl VarZeroVecFormat for Index8 { + const TOO_LARGE_ERROR: &'static str = "Attempted to build VarZeroVec out of elements that \ + cumulatively are larger than a u8 in size"; + const INDEX_WIDTH: usize = 1; + const MAX_VALUE: u32 = u8::MAX as u32; + type RawBytes = u8; + #[inline] + fn rawbytes_to_usize(raw: Self::RawBytes) -> usize { + raw as usize + } + #[inline] + fn usize_to_rawbytes(u: usize) -> Self::RawBytes { + u as u8 + } + #[inline] + fn rawbytes_from_byte_slice_unchecked_mut(bytes: &mut [u8]) -> &mut [Self::RawBytes] { + bytes + } +} + unsafe impl VarZeroVecFormat for Index16 { + const TOO_LARGE_ERROR: &'static str = "Attempted to build VarZeroVec out of elements that \ + cumulatively are larger than a u16 in size"; const INDEX_WIDTH: usize = 2; const MAX_VALUE: u32 = u16::MAX as u32; type RawBytes = RawBytesULE<2>; @@ -85,6 +118,8 @@ unsafe impl VarZeroVecFormat for Index16 { } unsafe impl VarZeroVecFormat for Index32 { + const TOO_LARGE_ERROR: &'static str = "Attempted to build VarZeroVec out of elements that \ + cumulatively are larger than a u32 in size"; const INDEX_WIDTH: usize = 4; const MAX_VALUE: u32 = u32::MAX; type RawBytes = RawBytesULE<4>; diff --git a/utils/zerovec/src/varzerovec/mod.rs b/utils/zerovec/src/varzerovec/mod.rs index 97049e32e23..662f0e91df0 100644 --- a/utils/zerovec/src/varzerovec/mod.rs +++ b/utils/zerovec/src/varzerovec/mod.rs @@ -22,7 +22,7 @@ pub use crate::{VarZeroSlice, VarZeroVec}; #[doc(hidden)] pub use components::VarZeroVecComponents; -pub use components::{Index16, Index32, VarZeroVecFormat}; +pub use components::{Index16, Index32, Index8, VarZeroVecFormat}; pub use owned::VarZeroVecOwned; diff --git a/utils/zerovec/src/varzerovec/owned.rs b/utils/zerovec/src/varzerovec/owned.rs index c5556315fbd..2998f4410ed 100644 --- a/utils/zerovec/src/varzerovec/owned.rs +++ b/utils/zerovec/src/varzerovec/owned.rs @@ -91,10 +91,7 @@ impl VarZeroVecOwned { marker: PhantomData, // TODO(#1410): Rethink length errors in VZV. entire_slice: components::get_serializable_bytes_non_empty::(elements) - .ok_or( - "Attempted to build VarZeroVec out of elements that \ - cumulatively are larger than a u32 in size", - )?, + .ok_or(F::TOO_LARGE_ERROR)?, } }) }