lib.rs source code [crates/unic_langid/src/lib.rs]

1	//! `unic-langid` is a core API for parsing, manipulating, and serializing Unicode Language
2	//! Identifiers.
3	//!
4	//! The crate provides algorithms for parsing a string into a well-formed language identifier
5	//! as defined by [`UTS #35: Unicode LDML 3.1 Unicode Language Identifier`].
6	//!
7	//! # Examples
8	//!
9	//! ```
10	//! use unic_langid::LanguageIdentifier;
11	//! use unic_langid::subtags::{Language, Script, Region};
12	//!
13	//! let mut li: LanguageIdentifier = "en-US".parse()
14	//! .expect("Parsing failed.");
15	//!
16	//! let lang: Language = "en".parse().expect("Parsing failed.");
17	//! let region: Region = "US".parse().expect("Parsing failed.");
18	//! assert_eq!(li.language, lang);
19	//! assert_eq!(li.script, None);
20	//! assert_eq!(li.region, Some(region));
21	//! assert_eq!(li.variants().len(), 0);
22	//!
23	//! let region: Region = "GB".parse().expect("Parsing failed.");
24	//! li.region = Some(region);
25	//!
26	//! assert_eq!(li.to_string(), "en-GB");
27	//! ```
28	//!
29	//! For more details, see [`LanguageIdentifier`].
30	//!
31	//! # Optional features
32	//!
33	//! ## `langid!`, `langids!`, and `langid_slice!` macros
34	//!
35	//! If `feature = "macros"` is selected, the crate provides a procedural macro
36	//! which allows constructing well-formed language identifiers at build time, with zero cost at runtime.
37	//!
38	//! ``` ignore
39	//! use unic_langid::{langid, langid_slice, langids, lang, region, script, variant, LanguageIdentifier};
40	//! use unic_langid::subtags::{Language, Script, Region, Variant};
41	//! use std::str::FromStr;
42	//!
43	//! let es_ar = langid!("es-AR");
44	//! let en_us = langid!("en-US");
45	//!
46	//! assert_eq!(&es_ar.to_string(), "es-AR");
47	//! assert_eq!(&en_us.to_string(), "en-US");
48	//!
49	//! let lang_ids = langids!("es-AR", "en-US", "de");
50	//!
51	//! assert_eq!(lang_ids[0], "es-AR");
52	//! assert_eq!(lang_ids[1], "en-US");
53	//! assert_eq!(lang_ids[2], "de");
54	//!
55	//! const LANGUAGES: &[LanguageIdentifier] = langid_slice!["en-GB", "fr"];
56	//!
57	//! assert_eq!(lang!("pl"), "pl");
58	//! assert_eq!(lang!("pl"), Language::from_str("pl").unwrap());
59	//!
60	//! assert_eq!(script!("latn"), "Latn");
61	//! assert_eq!(script!("latn"), Script::from_str("Latn").unwrap());
62	//!
63	//! assert_eq!(region!("us"), "US");
64	//! assert_eq!(region!("us"), Region::from_str("us").unwrap());
65	//!
66	//! assert_eq!(variant!("macos"), "macos");
67	//! assert_eq!(variant!("macos"), Variant::from_str("macos").unwrap());
68	//! ```
69	//!
70	//! The macros produce instances of `LanguageIdentifier` the same way as parsing from `&str` does,
71	//! but since the parsing is performed at build time, it doesn't need a `Result`.
72	//!
73	//! At the moment `langid!` can also be used for const variables, but only if no variants are used.
74	//!
75	//! The macros are optional to reduce the dependency chain and compilation time of `unic-langid`.
76	//!
77	//! ## Likely Subtags
78	//!
79	//! If `feature = "likelysubtags"` is selected, the `LanguageIdentifier` gains two more methods:
80	//!
81	//! * `add_likely_subtags`
82	//! * `remove_likely_subtags`
83	//!
84	//! Both of them operate in place updating the existing `LanguageIdentifier` by either extending
85	//! subtags to most likely values, or removing the subtags that are not needed.
86	//!
87	//! Both methods return a `bool` that indicates if the identifier has been modified.
88	//!
89	//! ``` ignore
90	//! use unic_langid::LanguageIdentifier;
91	//!
92	//! let mut li: LanguageIdentifier = "fr-FR".parse()
93	//! .expect("Parsing failed.");
94	//!
95	//! assert_eq!(li.add_likely_subtags(), true);
96	//! assert_eq!(li, "fr-Latn-FR");
97	//!
98	//! assert_eq!(li.remove_likely_subtags(), true);
99	//! assert_eq!(li, "fr");
100	//! ```
101	//!
102	//! The feature is optional because it increases the binary size of the library by including
103	//! a data table for CLDR likelySubtags.
104	//!
105	//! [`UTS #35: Unicode LDML 3.1 Unicode Language Identifier`]: https://unicode.org/reports/tr35/tr35.html#Unicode_language_identifier
106	//! [`LanguageIdentifier`]: ./struct.LanguageIdentifier.html
107
108	pub use unic_langid_impl::*;
109
110	#[cfg(feature = "unic-langid-macros")]
111	pub use unic_langid_macros::{lang, langid, region, script, variant};
112
/// Builds a `Vec` of language identifiers from a comma-separated list of tags.
///
/// Every argument is forwarded unchanged to `langid!`, and the resulting
/// values are collected with `vec!`. The list may be empty and may end with
/// a trailing comma.
///
/// Only available when the `unic-langid-macros` feature is enabled.
///
/// # Examples
///
/// ``` ignore
/// use unic_langid::langids;
///
/// let lang_ids = langids!("es-AR", "en-US", "de");
/// assert_eq!(lang_ids.len(), 3);
/// ```
#[cfg(feature = "unic-langid-macros")]
#[macro_export]
macro_rules! langids {
    // No tags at all: an empty vector.
    () => {
        vec![]
    };
    // One or more tags, optionally followed by a single trailing comma.
    ( $($tag:expr),+ $(,)? ) => {
        vec![$( $crate::langid!($tag) ),+]
    };
}
/// Builds a borrowed array (`&[...]`) of language identifiers from a
/// comma-separated list of tags.
///
/// Every argument is forwarded unchanged to `langid!`, and the resulting
/// values are placed in an array literal that is then borrowed. The list may
/// be empty and may end with a trailing comma.
///
/// Only available when the `unic-langid-macros` feature is enabled.
///
/// # Examples
///
/// ``` ignore
/// use unic_langid::{langid_slice, LanguageIdentifier};
///
/// const LANGUAGES: &[LanguageIdentifier] = langid_slice!["en-GB", "fr"];
/// ```
#[cfg(feature = "unic-langid-macros")]
#[macro_export]
macro_rules! langid_slice {
    // No tags at all: a reference to an empty array.
    () => {
        &[]
    };
    // One or more tags, optionally followed by a single trailing comma.
    ( $($tag:expr),+ $(,)? ) => {
        &[$( $crate::langid!($tag) ),+]
    };
}
137