summaryrefslogtreecommitdiffstats
path: root/third_party/rust/tinystr/src/tinystr16.rs
diff options
context:
space:
mode:
Diffstat (limited to 'third_party/rust/tinystr/src/tinystr16.rs')
-rw-r--r--third_party/rust/tinystr/src/tinystr16.rs321
1 files changed, 321 insertions, 0 deletions
diff --git a/third_party/rust/tinystr/src/tinystr16.rs b/third_party/rust/tinystr/src/tinystr16.rs
new file mode 100644
index 0000000000..c089516419
--- /dev/null
+++ b/third_party/rust/tinystr/src/tinystr16.rs
@@ -0,0 +1,321 @@
+use std::cmp::Ordering;
+use std::convert::Into;
+use std::fmt;
+use std::num::NonZeroU128;
+use std::ops::Deref;
+use std::ptr::copy_nonoverlapping;
+use std::str::FromStr;
+
+use crate::Error;
+
+/// A tiny string that is from 1 to 16 non-NUL ASCII characters.
+///
+/// # Examples
+///
+/// ```
+/// use tinystr::TinyStr16;
+///
+/// let s1: TinyStr16 = "Metamorphosis".parse()
+/// .expect("Failed to parse.");
+///
+/// assert_eq!(s1, "Metamorphosis");
+/// assert!(s1.is_ascii_alphabetic());
+/// ```
+#[derive(Copy, Clone, PartialEq, Eq, Hash)]
+pub struct TinyStr16(NonZeroU128);
+
+impl TinyStr16 {
+ /// Creates a TinyStr16 from a byte slice.
+ ///
+ /// # Examples
+ ///
+ /// ```
+ /// use tinystr::TinyStr16;
+ ///
+ /// let s1 = TinyStr16::from_bytes("Testing".as_bytes())
+ /// .expect("Failed to parse.");
+ ///
+ /// assert_eq!(s1, "Testing");
+ /// ```
+ #[inline(always)]
+ pub fn from_bytes(bytes: &[u8]) -> Result<Self, Error> {
+ let len = bytes.len();
+ if len < 1 || len > 16 {
+ return Err(Error::InvalidSize);
+ }
+ unsafe {
+ let mut word: u128 = 0;
+ copy_nonoverlapping(bytes.as_ptr(), &mut word as *mut u128 as *mut u8, len);
+ let mask = 0x80808080_80808080_80808080_80808080u128 >> (8 * (16 - len));
+ // TODO: could do this with #cfg(target_endian), but this is clearer and
+ // more confidence-inspiring.
+ let mask = u128::from_le(mask);
+ if (word & mask) != 0 {
+ return Err(Error::NonAscii);
+ }
+ if ((mask - word) & mask) != 0 {
+ return Err(Error::InvalidNull);
+ }
+ Ok(Self(NonZeroU128::new_unchecked(word)))
+ }
+ }
+
+ /// An unsafe constructor intended for cases where the consumer
+ /// guarantees that the input is a little endian integer which
+ /// is a correct representation of a `TinyStr16` string.
+ ///
+ /// # Examples
+ ///
+ /// ```
+ /// use tinystr::TinyStr16;
+ ///
+ /// let s1: TinyStr16 = "Metamorphosis".parse()
+ /// .expect("Failed to parse.");
+ ///
+ /// let num: u128 = s1.into();
+ ///
+ /// let s2 = unsafe { TinyStr16::new_unchecked(num) };
+ ///
+ /// assert_eq!(s1, s2);
+ /// assert_eq!(s2.as_str(), "Metamorphosis");
+ /// ```
+ #[inline(always)]
+ pub const unsafe fn new_unchecked(text: u128) -> Self {
+ Self(NonZeroU128::new_unchecked(u128::from_le(text)))
+ }
+
+ /// Extracts a string slice containing the entire `TinyStr16`.
+ ///
+ /// # Examples
+ ///
+ /// ```
+ /// use tinystr::TinyStr16;
+ ///
+ /// let s1: TinyStr16 = "Metamorphosis".parse()
+ /// .expect("Failed to parse.");
+ ///
+ /// assert_eq!(s1.as_str(), "Metamorphosis");
+ /// ```
+ #[inline(always)]
+ pub fn as_str(&self) -> &str {
+ self.deref()
+ }
+
+ /// Checks if the value is composed of ASCII alphabetic characters:
+ ///
+ /// * U+0041 'A' ..= U+005A 'Z', or
+ /// * U+0061 'a' ..= U+007A 'z'.
+ ///
+ /// # Examples
+ ///
+ /// ```
+ /// use tinystr::TinyStr16;
+ ///
+ /// let s1: TinyStr16 = "Metamorphosis".parse()
+ /// .expect("Failed to parse.");
+ /// let s2: TinyStr16 = "Met3mo4pho!is".parse()
+ /// .expect("Failed to parse.");
+ ///
+ /// assert!(s1.is_ascii_alphabetic());
+ /// assert!(!s2.is_ascii_alphabetic());
+ /// ```
+ pub fn is_ascii_alphabetic(self) -> bool {
+ let word = self.0.get();
+ let mask =
+ (word + 0x7f7f7f7f_7f7f7f7f_7f7f7f7f_7f7f7f7f) & 0x80808080_80808080_80808080_80808080;
+ let lower = word | 0x20202020_20202020_20202020_20202020;
+ let alpha = !(lower + 0x1f1f1f1f_1f1f1f1f_1f1f1f1f_1f1f1f1f)
+ | (lower + 0x05050505_05050505_05050505_05050505);
+ (alpha & mask) == 0
+ }
+
+ /// Checks if the value is composed of ASCII alphanumeric characters:
+ ///
+ /// * U+0041 'A' ..= U+005A 'Z', or
+ /// * U+0061 'a' ..= U+007A 'z', or
+ /// * U+0030 '0' ..= U+0039 '9'.
+ ///
+ /// # Examples
+ ///
+ /// ```
+ /// use tinystr::TinyStr16;
+ ///
+ /// let s1: TinyStr16 = "A15bingA1".parse()
+ /// .expect("Failed to parse.");
+ /// let s2: TinyStr16 = "[3@w00Fs1".parse()
+ /// .expect("Failed to parse.");
+ ///
+ /// assert!(s1.is_ascii_alphanumeric());
+ /// assert!(!s2.is_ascii_alphanumeric());
+ /// ```
+ pub fn is_ascii_alphanumeric(self) -> bool {
+ let word = self.0.get();
+ let mask =
+ (word + 0x7f7f7f7f_7f7f7f7f_7f7f7f7f_7f7f7f7f) & 0x80808080_80808080_80808080_80808080;
+ let numeric = !(word + 0x50505050_50505050_50505050_50505050)
+ | (word + 0x46464646_46464646_46464646_46464646);
+ let lower = word | 0x20202020_20202020_20202020_20202020;
+ let alpha = !(lower + 0x1f1f1f1f_1f1f1f1f_1f1f1f1f_1f1f1f1f)
+ | (lower + 0x05050505_05050505_05050505_05050505);
+ (alpha & numeric & mask) == 0
+ }
+
+ /// Checks if the value is composed of ASCII decimal digits:
+ ///
+ /// * U+0030 '0' ..= U+0039 '9'.
+ ///
+ /// # Examples
+ ///
+ /// ```
+ /// use tinystr::TinyStr16;
+ ///
+ /// let s1: TinyStr16 = "31212314141".parse()
+ /// .expect("Failed to parse.");
+ /// let s2: TinyStr16 = "3d3d3d3d".parse()
+ /// .expect("Failed to parse.");
+ ///
+ /// assert!(s1.is_ascii_numeric());
+ /// assert!(!s2.is_ascii_numeric());
+ /// ```
+ pub fn is_ascii_numeric(self) -> bool {
+ let word = self.0.get();
+ let mask =
+ (word + 0x7f7f7f7f_7f7f7f7f_7f7f7f7f_7f7f7f7f) & 0x80808080_80808080_80808080_80808080;
+ let numeric = !(word + 0x50505050_50505050_50505050_50505050)
+ | (word + 0x46464646_46464646_46464646_46464646);
+ (numeric & mask) == 0
+ }
+
+ /// Converts this type to its ASCII lower case equivalent in-place.
+ ///
+ /// ASCII letters 'A' to 'Z' are mapped to 'a' to 'z', other characters are unchanged.
+ ///
+ /// # Examples
+ ///
+ /// ```
+ /// use tinystr::TinyStr16;
+ ///
+ /// let s1: TinyStr16 = "MeTAmOrpHo3sis".parse()
+ /// .expect("Failed to parse.");
+ ///
+ /// assert_eq!(s1.to_ascii_lowercase(), "metamorpho3sis");
+ /// ```
+ pub fn to_ascii_lowercase(self) -> Self {
+ let word = self.0.get();
+ let result = word
+ | (((word + 0x3f3f3f3f_3f3f3f3f_3f3f3f3f_3f3f3f3f)
+ & !(word + 0x25252525_25252525_25252525_25252525)
+ & 0x80808080_80808080_80808080_80808080)
+ >> 2);
+ unsafe { Self(NonZeroU128::new_unchecked(result)) }
+ }
+
+ /// Converts this type to its ASCII title case equivalent in-place.
+ ///
+ /// First character, if is an ASCII letter 'a' to 'z' is mapped to 'A' to 'Z',
+ /// other characters are unchanged.
+ ///
+ /// # Examples
+ ///
+ /// ```
+ /// use tinystr::TinyStr16;
+ ///
+ /// let s1: TinyStr16 = "metamorphosis".parse()
+ /// .expect("Failed to parse.");
+ ///
+ /// assert_eq!(s1.to_ascii_titlecase(), "Metamorphosis");
+ /// ```
+ pub fn to_ascii_titlecase(self) -> Self {
+ let word = self.0.get().to_le();
+ let mask = ((word + 0x3f3f3f3f_3f3f3f3f_3f3f3f3f_3f3f3f1f)
+ & !(word + 0x25252525_25252525_25252525_25252505)
+ & 0x80808080_80808080_80808080_80808080)
+ >> 2;
+ let result = (word | mask) & !(0x20 & mask);
+ unsafe { Self(NonZeroU128::new_unchecked(u128::from_le(result))) }
+ }
+
+ /// Converts this type to its ASCII upper case equivalent in-place.
+ ///
+ /// ASCII letters 'a' to 'z' are mapped to 'A' to 'Z', other characters are unchanged.
+ ///
+ /// # Examples
+ ///
+ /// ```
+ /// use tinystr::TinyStr16;
+ ///
+ /// let s1: TinyStr16 = "Met3amorphosis".parse()
+ /// .expect("Failed to parse.");
+ ///
+ /// assert_eq!(s1.to_ascii_uppercase(), "MET3AMORPHOSIS");
+ /// ```
+ pub fn to_ascii_uppercase(self) -> Self {
+ let word = self.0.get();
+ let result = word
+ & !(((word + 0x1f1f1f1f_1f1f1f1f_1f1f1f1f_1f1f1f1f)
+ & !(word + 0x05050505_05050505_05050505_05050505)
+ & 0x80808080_80808080_80808080_80808080)
+ >> 2);
+ unsafe { Self(NonZeroU128::new_unchecked(result)) }
+ }
+}
+
+impl fmt::Display for TinyStr16 {
+ fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result {
+ write!(f, "{}", self.deref())
+ }
+}
+
+impl fmt::Debug for TinyStr16 {
+ fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result {
+ write!(f, "{:?}", self.deref())
+ }
+}
+
+impl Deref for TinyStr16 {
+ type Target = str;
+
+ #[inline(always)]
+ fn deref(&self) -> &str {
+ // Again, could use #cfg to hand-roll a big-endian implementation.
+ let word = self.0.get().to_le();
+ let len = (16 - word.leading_zeros() / 8) as usize;
+ unsafe {
+ let slice = core::slice::from_raw_parts(&self.0 as *const _ as *const u8, len);
+ std::str::from_utf8_unchecked(slice)
+ }
+ }
+}
+
+impl PartialEq<&str> for TinyStr16 {
+ fn eq(&self, other: &&str) -> bool {
+ self.deref() == *other
+ }
+}
+
+impl PartialOrd for TinyStr16 {
+ fn partial_cmp(&self, other: &Self) -> Option<Ordering> {
+ Some(self.cmp(other))
+ }
+}
+
+impl Ord for TinyStr16 {
+ fn cmp(&self, other: &Self) -> Ordering {
+ self.0.get().to_be().cmp(&other.0.get().to_be())
+ }
+}
+
+impl FromStr for TinyStr16 {
+ type Err = Error;
+
+ #[inline(always)]
+ fn from_str(text: &str) -> Result<Self, Self::Err> {
+ Self::from_bytes(text.as_bytes())
+ }
+}
+
+impl Into<u128> for TinyStr16 {
+ fn into(self) -> u128 {
+ self.0.get().to_le()
+ }
+}