1// This file is part of ICU4X. For terms of use, please see the file
2// called LICENSE at the top level of the ICU4X source tree
3// (online at: https://github.com/unicode-org/icu4x/blob/main/LICENSE ).
45// Provider structs must be stable
6#![allow(clippy::exhaustive_structs, clippy::exhaustive_enums)]
78//! 🚧 \[Unstable\] Data provider struct definitions for this ICU4X component.
9//!
10//! <div class="stab unstable">
11//! 🚧 This code is considered unstable; it may change at any time, in breaking or non-breaking ways,
12//! including in SemVer minor releases. While the serde representation of data structs is guaranteed
13//! to be stable, their Rust representation might not be. Use with caution.
14//! </div>
15//!
16//! Read more about data providers: [`icu_provider`]
1718mod canonicalizer;
19pub use canonicalizer::*;
20use icu_locid::subtags::Language;
21mod directionality;
22pub use directionality::*;
23mod expander;
24pub use expander::*;
25mod fallback;
26pub use fallback::*;
2728#[cfg(feature = "compiled_data")]
29#[derive(Debug)]
30/// Baked data
31///
32/// <div class="stab unstable">
33/// 🚧 This code is considered unstable; it may change at any time, in breaking or non-breaking ways,
34/// including in SemVer minor releases. In particular, the `DataProvider` implementations are only
35/// guaranteed to match with this version's `*_unstable` providers. Use with caution.
36/// </div>
37pub struct Baked;
3839#[cfg(feature = "compiled_data")]
40const _: () = {
41pub mod icu {
42pub use crate as locid_transform;
43pub use icu_locid as locid;
44 }
45icu_locid_transform_data::make_provider!(Baked);
46icu_locid_transform_data::impl_fallback_likelysubtags_v1!(Baked);
47icu_locid_transform_data::impl_fallback_parents_v1!(Baked);
48icu_locid_transform_data::impl_fallback_supplement_co_v1!(Baked);
49icu_locid_transform_data::impl_locid_transform_aliases_v2!(Baked);
50icu_locid_transform_data::impl_locid_transform_likelysubtags_ext_v1!(Baked);
51icu_locid_transform_data::impl_locid_transform_likelysubtags_l_v1!(Baked);
52icu_locid_transform_data::impl_locid_transform_likelysubtags_sr_v1!(Baked);
53icu_locid_transform_data::impl_locid_transform_script_dir_v1!(Baked);
54};
5556#[cfg(feature = "datagen")]
57use icu_provider::prelude::*;
5859#[cfg(feature = "datagen")]
60/// The latest minimum set of keys required by this component.
61pub const KEYS: &[DataKey] = &[
62 AliasesV2Marker::KEY,
63 CollationFallbackSupplementV1Marker::KEY,
64 LikelySubtagsExtendedV1Marker::KEY,
65 LikelySubtagsForLanguageV1Marker::KEY,
66 LikelySubtagsForScriptRegionV1Marker::KEY,
67 LocaleFallbackLikelySubtagsV1Marker::KEY,
68 LocaleFallbackParentsV1Marker::KEY,
69 ScriptDirectionV1Marker::KEY,
70];
7172use alloc::borrow::Cow;
73use tinystr::{TinyAsciiStr, UnvalidatedTinyAsciiStr};
7475// We use raw TinyAsciiStrs for map keys, as we then don't have to
76// validate them as subtags on deserialization. Map lookup can be
77// done even if they are not valid tags (an invalid key will just
78// become inaccessible).
79type UnvalidatedLanguage = UnvalidatedTinyAsciiStr<3>;
80type UnvalidatedScript = UnvalidatedTinyAsciiStr<4>;
81type UnvalidatedRegion = UnvalidatedTinyAsciiStr<3>;
82type UnvalidatedVariant = UnvalidatedTinyAsciiStr<8>;
83type UnvalidatedSubdivision = UnvalidatedTinyAsciiStr<7>;
84type SemivalidatedSubdivision = TinyAsciiStr<7>;
8586// LanguageIdentifier doesn't have an AsULE implementation, so we have
87// to store strs and parse when needed.
88type UnvalidatedLanguageIdentifier = str;
89type UnvalidatedLanguageIdentifierPair = StrStrPairVarULE;
90type UnvalidatedLanguageVariantsPair = LanguageStrStrPairVarULE;
9192#[zerovec::make_varule(StrStrPairVarULE)]
93#[zerovec::derive(Debug)]
94#[derive(Clone, PartialEq, Eq, PartialOrd, Ord, Debug)]
95#[cfg_attr(
96 feature = "serde",
97 derive(serde::Deserialize),
98 zerovec::derive(Deserialize)
99)]
100#[cfg_attr(
101 feature = "datagen",
102 derive(serde::Serialize, databake::Bake),
103 zerovec::derive(Serialize),
104 databake(path = icu_locid_transform::provider),
105)]
106/// A pair of strings with a EncodeAsVarULE implementation.
107///
108/// <div class="stab unstable">
109/// 🚧 This code is considered unstable; it may change at any time, in breaking or non-breaking ways,
110/// including in SemVer minor releases. While the serde representation of data structs is guaranteed
111/// to be stable, their Rust representation might not be. Use with caution.
112/// </div>
113pub struct StrStrPair<'a>(
114#[cfg_attr(feature = "serde", serde(borrow))] pub Cow<'a, str>,
115#[cfg_attr(feature = "serde", serde(borrow))] pub Cow<'a, str>,
116);
117118#[zerovec::make_varule(LanguageStrStrPairVarULE)]
119#[zerovec::derive(Debug)]
120#[derive(Clone, PartialEq, Eq, PartialOrd, Ord, Debug)]
121#[cfg_attr(
122 feature = "serde",
123 derive(serde::Deserialize),
124 zerovec::derive(Deserialize)
125)]
126#[cfg_attr(
127 feature = "datagen",
128 derive(serde::Serialize, databake::Bake),
129 zerovec::derive(Serialize),
130 databake(path = icu_locid_transform::provider),
131)]
132/// A triplet of strings with a EncodeAsVarULE implementation.
133pub struct LanguageStrStrPair<'a>(
134pub Language,
135#[cfg_attr(feature = "serde", serde(borrow))] pub Cow<'a, str>,
136#[cfg_attr(feature = "serde", serde(borrow))] pub Cow<'a, str>,
137);