zerovec/ule/custom.rs
1// This file is part of ICU4X. For terms of use, please see the file
2// called LICENSE at the top level of the ICU4X source tree
3// (online at: https://github.com/unicode-org/icu4x/blob/main/LICENSE ).
4
5//! Documentation on implementing custom VarULE types.
6//!
7//! This module contains documentation for defining custom VarULE types,
8//! especially those using complex custom dynamically sized types.
9//!
10//! In *most cases* you should be able to create custom VarULE types using
11//! [`#[make_varule]`](crate::make_ule).
12//!
13//! # Example
14//!
15//! For example, if your regular stack type is:
16//!
17//! ```rust
18//! use zerofrom::ZeroFrom;
19//! use zerovec::ule::*;
20//! use zerovec::ZeroVec;
21//!
22//! #[derive(serde::Serialize, serde::Deserialize)]
23//! struct Foo<'a> {
24//! field1: char,
25//! field2: u32,
26//! #[serde(borrow)]
27//! field3: ZeroVec<'a, u32>,
28//! }
29//! ```
30//!
31//! then the ULE type will be implemented as follows. Ideally, you should have
32//! `EncodeAsVarULE` and `ZeroFrom` implementations on `Foo` pertaining to `FooULE`,
33//! as well as a `Serialize` impl on `FooULE` and a `Deserialize` impl on `Box<FooULE>`
34//! to enable human-readable serialization and deserialization.
35//!
36//! ```rust
37//! use zerovec::{ZeroVec, VarZeroVec, ZeroSlice};
38//! use zerovec::ule::*;
39//! use zerofrom::ZeroFrom;
40//! use core::mem;
41//!
42//! # #[derive(serde::Serialize, serde::Deserialize)]
43//! # struct Foo<'a> {
44//! # field1: char,
45//! # field2: u32,
46//! # #[serde(borrow)]
47//! # field3: ZeroVec<'a, u32>
48//! # }
49//!
50//! // Must be repr(C, packed) for safety of VarULE!
51//! // Must also only contain ULE types
52//! #[repr(C, packed)]
53//! struct FooULE {
54//! field1: <char as AsULE>::ULE,
55//! field2: <u32 as AsULE>::ULE,
56//! field3: ZeroSlice<u32>,
57//! }
58//!
59//! // Safety (based on the safety checklist on the VarULE trait):
60//! // 1. FooULE does not include any uninitialized or padding bytes. (achieved by `#[repr(C, packed)]` on
61//! // a struct with only ULE fields)
62//! // 2. FooULE is aligned to 1 byte. (achieved by `#[repr(C, packed)]` on
63//! // a struct with only ULE fields)
64//! // 3. The impl of `validate_byte_slice()` returns an error if any byte is not valid.
65//! // 4. The impl of `validate_byte_slice()` returns an error if the slice cannot be used in its entirety
66//! // 5. The impl of `from_byte_slice_unchecked()` returns a reference to the same data.
67//! // 6. The other VarULE methods use the default impl.
68//! // 7. FooULE byte equality is semantic equality
69//! unsafe impl VarULE for FooULE {
70//! fn validate_byte_slice(bytes: &[u8]) -> Result<(), ZeroVecError> {
71//! // validate each field
72//! <char as AsULE>::ULE::validate_byte_slice(&bytes[0..3]).map_err(|_| ZeroVecError::parse::<Self>())?;
73//! <u32 as AsULE>::ULE::validate_byte_slice(&bytes[3..7]).map_err(|_| ZeroVecError::parse::<Self>())?;
74//! let _ = ZeroVec::<u32>::parse_byte_slice(&bytes[7..]).map_err(|_| ZeroVecError::parse::<Self>())?;
75//! Ok(())
76//! }
77//! unsafe fn from_byte_slice_unchecked(bytes: &[u8]) -> &Self {
78//! let ptr = bytes.as_ptr();
79//! let len = bytes.len();
80//! // subtract the length of the char and u32 to get the length of the array
81//! let len_new = (len - 7) / 4;
82//! // it's hard constructing custom DSTs, we fake a pointer/length construction
83//! // eventually we can use the Pointer::Metadata APIs when they stabilize
84//! let fake_slice = core::ptr::slice_from_raw_parts(ptr as *const <u32 as AsULE>::ULE, len_new);
85//! &*(fake_slice as *const Self)
86//! }
87//! }
88//!
89//! unsafe impl EncodeAsVarULE<FooULE> for Foo<'_> {
90//! fn encode_var_ule_as_slices<R>(&self, cb: impl FnOnce(&[&[u8]]) -> R) -> R {
91//! // take each field, convert to ULE byte slices, and pass them through
92//! cb(&[<char as AsULE>::ULE::as_byte_slice(&[self.field1.to_unaligned()]),
93//! <u32 as AsULE>::ULE::as_byte_slice(&[self.field2.to_unaligned()]),
94//! // the ZeroVec is already in the correct slice format
95//! self.field3.as_bytes()])
96//! }
97//! }
98//!
99//! impl<'a> ZeroFrom<'a, FooULE> for Foo<'a> {
100//! fn zero_from(other: &'a FooULE) -> Self {
101//! Self {
102//! field1: AsULE::from_unaligned(other.field1),
103//! field2: AsULE::from_unaligned(other.field2),
104//! field3: ZeroFrom::zero_from(&other.field3),
105//! }
106//! }
107//! }
108//!
109//!
110//! impl serde::Serialize for FooULE
111//! {
112//! fn serialize<S>(&self, serializer: S) -> Result<S::Ok, S::Error>
113//! where
114//! S: serde::Serializer,
115//! {
116//! Foo::zero_from(self).serialize(serializer)
117//! }
118//! }
119//!
120//! impl<'de> serde::Deserialize<'de> for Box<FooULE>
121//! {
122//! fn deserialize<D>(deserializer: D) -> Result<Self, D::Error>
123//! where
124//! D: serde::Deserializer<'de>,
125//! {
126//! let mut foo = Foo::deserialize(deserializer)?;
127//! Ok(encode_varule_to_box(&foo))
128//! }
129//! }
130//!
131//! fn main() {
132//! let mut foos = [Foo {field1: 'u', field2: 983, field3: ZeroVec::alloc_from_slice(&[1212,2309,500,7000])},
133//! Foo {field1: 'l', field2: 1010, field3: ZeroVec::alloc_from_slice(&[1932, 0, 8888, 91237])}];
134//!
135//! let vzv = VarZeroVec::<_>::from(&foos);
136//!
137//! assert_eq!(char::from_unaligned(vzv.get(0).unwrap().field1), 'u');
138//! assert_eq!(u32::from_unaligned(vzv.get(0).unwrap().field2), 983);
139//! assert_eq!(&vzv.get(0).unwrap().field3, &[1212,2309,500,7000][..]);
140//!
141//! assert_eq!(char::from_unaligned(vzv.get(1).unwrap().field1), 'l');
142//! assert_eq!(u32::from_unaligned(vzv.get(1).unwrap().field2), 1010);
143//! assert_eq!(&vzv.get(1).unwrap().field3, &[1932, 0, 8888, 91237][..]);
144//! }
145//! ```