pub struct LanguageIdentifier {
pub language: Language,
pub script: Option<Script>,
pub region: Option<Region>,
pub variants: Variants,
}Expand description
A core struct representing a Unicode BCP47 Language Identifier.
§Examples
use icu::locid::{
langid,
subtags::{language, region},
};
let li = langid!("en-US");
assert_eq!(li.language, language!("en"));
assert_eq!(li.script, None);
assert_eq!(li.region, Some(region!("US")));
assert_eq!(li.variants.len(), 0);§Parsing
Unicode recognizes three levels of standard conformance for any language identifier:
- well-formed - syntactically correct
- valid - well-formed and only uses registered language, region, script and variant subtags…
- canonical - valid and no deprecated codes or structure.
At the moment parsing normalizes a well-formed language identifier converting
_ separators to - and adjusting casing to conform to the Unicode standard.
Any bogus subtags will cause the parsing to fail with an error. No subtag validation is performed.
§Examples
use icu::locid::{
langid,
subtags::{language, region, script, variant},
};
let li = langid!("eN_latn_Us-Valencia");
assert_eq!(li.language, language!("en"));
assert_eq!(li.script, Some(script!("Latn")));
assert_eq!(li.region, Some(region!("US")));
assert_eq!(li.variants.get(0), Some(&variant!("valencia")));Fields§
§language: LanguageLanguage subtag of the language identifier.
script: Option<Script>Script subtag of the language identifier.
region: Option<Region>Region subtag of the language identifier.
variants: VariantsVariant subtags of the language identifier.
Implementations§
Source§impl LanguageIdentifier
impl LanguageIdentifier
Sourcepub fn try_from_bytes(v: &[u8]) -> Result<Self, ParserError>
pub fn try_from_bytes(v: &[u8]) -> Result<Self, ParserError>
A constructor which takes a utf8 slice, parses it and
produces a well-formed LanguageIdentifier.
§Examples
use icu::locid::LanguageIdentifier;
LanguageIdentifier::try_from_bytes(b"en-US").expect("Parsing failed");Sourcepub fn try_from_locale_bytes(v: &[u8]) -> Result<Self, ParserError>
pub fn try_from_locale_bytes(v: &[u8]) -> Result<Self, ParserError>
A constructor which takes a utf8 slice which may contain extension keys,
parses it and produces a well-formed LanguageIdentifier.
§Examples
use icu::locid::{langid, LanguageIdentifier};
let li = LanguageIdentifier::try_from_locale_bytes(b"en-US-x-posix")
.expect("Parsing failed.");
assert_eq!(li, langid!("en-US"));This method should be used for input that may be a locale identifier. All extensions will be lost.
Sourcepub fn canonicalize<S: AsRef<[u8]>>(input: S) -> Result<String, ParserError>
pub fn canonicalize<S: AsRef<[u8]>>(input: S) -> Result<String, ParserError>
This is a best-effort operation that performs all available levels of canonicalization.
At the moment the operation will normalize casing and the separator, but in the future it may also validate and update from deprecated subtags to canonical ones.
§Examples
use icu::locid::LanguageIdentifier;
assert_eq!(
LanguageIdentifier::canonicalize("pL_latn_pl").as_deref(),
Ok("pl-Latn-PL")
);Sourcepub fn strict_cmp(&self, other: &[u8]) -> Ordering
pub fn strict_cmp(&self, other: &[u8]) -> Ordering
Compare this LanguageIdentifier with BCP-47 bytes.
The return value is equivalent to what would happen if you first converted this
LanguageIdentifier to a BCP-47 string and then performed a byte comparison.
This function is case-sensitive and results in a total order, so it is appropriate for
binary search. The only argument producing Ordering::Equal is self.to_string().
§Examples
use icu::locid::LanguageIdentifier;
use std::cmp::Ordering;
let bcp47_strings: &[&str] = &[
"pl-Latn-PL",
"und",
"und-Adlm",
"und-GB",
"und-ZA",
"und-fonipa",
"zh",
];
for ab in bcp47_strings.windows(2) {
let a = ab[0];
let b = ab[1];
assert!(a.cmp(b) == Ordering::Less);
let a_langid = a.parse::<LanguageIdentifier>().unwrap();
assert!(a_langid.strict_cmp(a.as_bytes()) == Ordering::Equal);
assert!(a_langid.strict_cmp(b.as_bytes()) == Ordering::Less);
}Sourcepub fn total_cmp(&self, other: &Self) -> Ordering
pub fn total_cmp(&self, other: &Self) -> Ordering
Compare this LanguageIdentifier with another LanguageIdentifier field-by-field.
The result is a total ordering sufficient for use in a BTreeMap.
Unlike Self::strict_cmp, this function’s ordering may not equal string ordering.
Sourcepub fn strict_cmp_iter<'l, I>(&self, subtags: I) -> SubtagOrderingResult<I>
👎Deprecated since 1.5.0: if you need this, please file an issue
pub fn strict_cmp_iter<'l, I>(&self, subtags: I) -> SubtagOrderingResult<I>
Compare this LanguageIdentifier with an iterator of BCP-47 subtags.
This function has the same equality semantics as LanguageIdentifier::strict_cmp. It is intended as
a more modular version that allows multiple subtag iterators to be chained together.
For an additional example, see SubtagOrderingResult.
§Examples
use icu::locid::LanguageIdentifier;
use std::cmp::Ordering;
let subtags: &[&[u8]] = &[b"ca", b"ES", b"valencia"];
let loc = "ca-ES-valencia".parse::<LanguageIdentifier>().unwrap();
assert_eq!(
Ordering::Equal,
loc.strict_cmp_iter(subtags.iter().copied()).end()
);
let loc = "ca-ES".parse::<LanguageIdentifier>().unwrap();
assert_eq!(
Ordering::Less,
loc.strict_cmp_iter(subtags.iter().copied()).end()
);
let loc = "ca-ZA".parse::<LanguageIdentifier>().unwrap();
assert_eq!(
Ordering::Greater,
loc.strict_cmp_iter(subtags.iter().copied()).end()
);Sourcepub fn normalizing_eq(&self, other: &str) -> bool
pub fn normalizing_eq(&self, other: &str) -> bool
Compare this LanguageIdentifier with a potentially unnormalized BCP-47 string.
The return value is equivalent to what would happen if you first parsed the
BCP-47 string to a LanguageIdentifier and then performed a structural comparison.
§Examples
use icu::locid::LanguageIdentifier;
let bcp47_strings: &[&str] = &[
"pl-LaTn-pL",
"uNd",
"UnD-adlm",
"uNd-GB",
"UND-FONIPA",
"ZH",
];
for a in bcp47_strings {
assert!(a.parse::<LanguageIdentifier>().unwrap().normalizing_eq(a));
}Trait Implementations§
Source§impl AsMut<LanguageIdentifier> for LanguageIdentifier
impl AsMut<LanguageIdentifier> for LanguageIdentifier
Source§impl AsMut<LanguageIdentifier> for Locale
impl AsMut<LanguageIdentifier> for Locale
Source§fn as_mut(&mut self) -> &mut LanguageIdentifier
fn as_mut(&mut self) -> &mut LanguageIdentifier
Source§impl AsRef<LanguageIdentifier> for LanguageIdentifier
impl AsRef<LanguageIdentifier> for LanguageIdentifier
Source§impl AsRef<LanguageIdentifier> for Locale
impl AsRef<LanguageIdentifier> for Locale
Source§fn as_ref(&self) -> &LanguageIdentifier
fn as_ref(&self) -> &LanguageIdentifier
Source§impl Clone for LanguageIdentifier
impl Clone for LanguageIdentifier
Source§fn clone(&self) -> LanguageIdentifier
fn clone(&self) -> LanguageIdentifier
1.0.0 · Source§fn clone_from(&mut self, source: &Self)
fn clone_from(&mut self, source: &Self)
source. Read moreSource§impl Debug for LanguageIdentifier
impl Debug for LanguageIdentifier
Source§impl Default for LanguageIdentifier
impl Default for LanguageIdentifier
Source§fn default() -> LanguageIdentifier
fn default() -> LanguageIdentifier
Source§impl Display for LanguageIdentifier
impl Display for LanguageIdentifier
This trait is implemented for compatibility with fmt!.
To create a string, Writeable::write_to_string is usually more efficient.
Source§impl From<&LanguageIdentifier> for (Language, Option<Script>, Option<Region>)
impl From<&LanguageIdentifier> for (Language, Option<Script>, Option<Region>)
Convert from a LanguageIdentifier to an LSR tuple.
§Examples
use icu::locid::{
langid,
subtags::{language, region, script},
};
let lid = langid!("en-Latn-US");
let (lang, script, region) = (&lid).into();
assert_eq!(lang, language!("en"));
assert_eq!(script, Some(script!("Latn")));
assert_eq!(region, Some(region!("US")));Source§fn from(langid: &LanguageIdentifier) -> Self
fn from(langid: &LanguageIdentifier) -> Self
Source§impl From<(Language, Option<Script>, Option<Region>)> for LanguageIdentifier
impl From<(Language, Option<Script>, Option<Region>)> for LanguageIdentifier
Convert from an LSR tuple to a LanguageIdentifier.
§Examples
use icu::locid::{
langid,
subtags::{language, region, script},
LanguageIdentifier,
};
let lang = language!("en");
let script = script!("Latn");
let region = region!("US");
assert_eq!(
LanguageIdentifier::from((lang, Some(script), Some(region))),
langid!("en-Latn-US")
);Source§impl From<Language> for LanguageIdentifier
impl From<Language> for LanguageIdentifier
§Examples
use icu::locid::{langid, subtags::language, LanguageIdentifier};
assert_eq!(LanguageIdentifier::from(language!("en")), langid!("en"));Source§impl From<LanguageIdentifier> for Locale
impl From<LanguageIdentifier> for Locale
Source§fn from(id: LanguageIdentifier) -> Self
fn from(id: LanguageIdentifier) -> Self
Source§impl From<Locale> for LanguageIdentifier
impl From<Locale> for LanguageIdentifier
Source§impl From<Option<Region>> for LanguageIdentifier
impl From<Option<Region>> for LanguageIdentifier
§Examples
use icu::locid::{langid, subtags::region, LanguageIdentifier};
assert_eq!(
LanguageIdentifier::from(Some(region!("US"))),
langid!("und-US")
);Source§impl From<Option<Script>> for LanguageIdentifier
impl From<Option<Script>> for LanguageIdentifier
§Examples
use icu::locid::{langid, subtags::script, LanguageIdentifier};
assert_eq!(
LanguageIdentifier::from(Some(script!("latn"))),
langid!("und-Latn")
);Source§impl FromStr for LanguageIdentifier
impl FromStr for LanguageIdentifier
Source§impl Hash for LanguageIdentifier
impl Hash for LanguageIdentifier
Source§impl PartialEq for LanguageIdentifier
impl PartialEq for LanguageIdentifier
Source§impl Writeable for LanguageIdentifier
impl Writeable for LanguageIdentifier
Source§fn write_to<W: Write + ?Sized>(&self, sink: &mut W) -> Result
fn write_to<W: Write + ?Sized>(&self, sink: &mut W) -> Result
write_to_parts, and discards any
Part annotations.Source§fn writeable_length_hint(&self) -> LengthHint
fn writeable_length_hint(&self) -> LengthHint
Source§fn write_to_string(&self) -> Cow<'_, str>
fn write_to_string(&self) -> Cow<'_, str>
String with the data from this Writeable. Like ToString,
but smaller and faster. Read moreSource§fn write_to_parts<S>(&self, sink: &mut S) -> Result<(), Error>where
S: PartsWrite + ?Sized,
fn write_to_parts<S>(&self, sink: &mut S) -> Result<(), Error>where
S: PartsWrite + ?Sized,
Part annotations to the given sink. Errors from the
sink are bubbled up. The default implementation delegates to write_to,
and doesn’t produce any Part annotations.