summaryrefslogtreecommitdiffstats
path: root/third_party/rust/unicode-width/src/tests.rs
diff options
context:
space:
mode:
Diffstat (limited to 'third_party/rust/unicode-width/src/tests.rs')
-rw-r--r--third_party/rust/unicode-width/src/tests.rs191
1 files changed, 191 insertions, 0 deletions
diff --git a/third_party/rust/unicode-width/src/tests.rs b/third_party/rust/unicode-width/src/tests.rs
new file mode 100644
index 0000000000..e49b1bfbec
--- /dev/null
+++ b/third_party/rust/unicode-width/src/tests.rs
@@ -0,0 +1,191 @@
+// Copyright 2012-2015 The Rust Project Developers. See the COPYRIGHT
+// file at the top-level directory of this distribution and at
+// http://rust-lang.org/COPYRIGHT.
+//
+// Licensed under the Apache License, Version 2.0 <LICENSE-APACHE or
+// http://www.apache.org/licenses/LICENSE-2.0> or the MIT license
+// <LICENSE-MIT or http://opensource.org/licenses/MIT>, at your
+// option. This file may not be copied, modified, or distributed
+// except according to those terms.
+
+#[cfg(feature = "bench")]
+use std::iter;
+#[cfg(feature = "bench")]
+use test::{self, Bencher};
+#[cfg(feature = "bench")]
+use super::{UnicodeWidthChar, UnicodeWidthStr};
+
+use std::prelude::v1::*;
+
+#[cfg(feature = "bench")]
+#[bench]
+fn cargo(b: &mut Bencher) {
+ let string = iter::repeat('a').take(4096).collect::<String>();
+
+ b.iter(|| {
+ for c in string.chars() {
+ test::black_box(UnicodeWidthChar::width(c));
+ }
+ });
+}
+
+#[cfg(feature = "bench")]
+#[bench]
+#[allow(deprecated)]
+fn stdlib(b: &mut Bencher) {
+ let string = iter::repeat('a').take(4096).collect::<String>();
+
+ b.iter(|| {
+ for c in string.chars() {
+ test::black_box(c.width());
+ }
+ });
+}
+
+#[cfg(feature = "bench")]
+#[bench]
+fn simple_if(b: &mut Bencher) {
+ let string = iter::repeat('a').take(4096).collect::<String>();
+
+ b.iter(|| {
+ for c in string.chars() {
+ test::black_box(simple_width_if(c));
+ }
+ });
+}
+
+#[cfg(feature = "bench")]
+#[bench]
+fn simple_match(b: &mut Bencher) {
+ let string = iter::repeat('a').take(4096).collect::<String>();
+
+ b.iter(|| {
+ for c in string.chars() {
+ test::black_box(simple_width_match(c));
+ }
+ });
+}
+
+#[cfg(feature = "bench")]
+#[inline]
+fn simple_width_if(c: char) -> Option<usize> {
+ let cu = c as u32;
+ if cu < 127 {
+ if cu > 31 {
+ Some(1)
+ } else if cu == 0 {
+ Some(0)
+ } else {
+ None
+ }
+ } else {
+ UnicodeWidthChar::width(c)
+ }
+}
+
+#[cfg(feature = "bench")]
+#[inline]
+fn simple_width_match(c: char) -> Option<usize> {
+ match c as u32 {
+ cu if cu == 0 => Some(0),
+ cu if cu < 0x20 => None,
+ cu if cu < 0x7f => Some(1),
+ _ => UnicodeWidthChar::width(c)
+ }
+}
+#[cfg(all(feature = "bench", not(feature = "no_std")))]
+#[bench]
+fn enwik8(b: &mut Bencher) {
+ // To benchmark, download & unzip `enwik8` from https://data.deepai.org/enwik8.zip
+ let data_path = "bench_data/enwik8";
+ let string = std::fs::read_to_string(data_path).unwrap_or_default();
+ b.iter(|| test::black_box(UnicodeWidthStr::width(string.as_str())));
+}
+#[cfg(all(feature = "bench", not(feature = "no_std")))]
+#[bench]
+fn jawiki(b: &mut Bencher) {
+ // To benchmark, download & extract `jawiki-20220501-pages-articles-multistream-index.txt` from
+ // https://dumps.wikimedia.org/jawiki/20220501/jawiki-20220501-pages-articles-multistream-index.txt.bz2
+ let data_path = "bench_data/jawiki-20220501-pages-articles-multistream-index.txt";
+ let string = std::fs::read_to_string(data_path).unwrap_or_default();
+ b.iter(|| test::black_box(UnicodeWidthStr::width(string.as_str())));
+}
+#[test]
+fn test_str() {
+ use super::UnicodeWidthStr;
+
+ assert_eq!(UnicodeWidthStr::width("hello"), 10);
+ assert_eq!("hello".width_cjk(), 10);
+ assert_eq!(UnicodeWidthStr::width("\0\0\0\x01\x01"), 0);
+ assert_eq!("\0\0\0\x01\x01".width_cjk(), 0);
+ assert_eq!(UnicodeWidthStr::width(""), 0);
+ assert_eq!("".width_cjk(), 0);
+ assert_eq!(UnicodeWidthStr::width("\u{2081}\u{2082}\u{2083}\u{2084}"), 4);
+ assert_eq!("\u{2081}\u{2082}\u{2083}\u{2084}".width_cjk(), 8);
+}
+
+#[test]
+fn test_emoji() {
+ // Example from the README.
+ use super::UnicodeWidthStr;
+
+ assert_eq!(UnicodeWidthStr::width("👩"), 2); // Woman
+ assert_eq!(UnicodeWidthStr::width("🔬"), 2); // Microscope
+ assert_eq!(UnicodeWidthStr::width("👩‍🔬"), 4); // Woman scientist
+}
+
+#[test]
+fn test_char() {
+ use super::UnicodeWidthChar;
+ #[cfg(feature = "no_std")]
+ use core::option::Option::{Some, None};
+
+ assert_eq!(UnicodeWidthChar::width('h'), Some(2));
+ assert_eq!('h'.width_cjk(), Some(2));
+ assert_eq!(UnicodeWidthChar::width('\x00'), Some(0));
+ assert_eq!('\x00'.width_cjk(), Some(0));
+ assert_eq!(UnicodeWidthChar::width('\x01'), None);
+ assert_eq!('\x01'.width_cjk(), None);
+ assert_eq!(UnicodeWidthChar::width('\u{2081}'), Some(1));
+ assert_eq!('\u{2081}'.width_cjk(), Some(2));
+}
+
+#[test]
+fn test_char2() {
+ use super::UnicodeWidthChar;
+ #[cfg(feature = "no_std")]
+ use core::option::Option::{Some, None};
+
+ assert_eq!(UnicodeWidthChar::width('\x00'),Some(0));
+ assert_eq!('\x00'.width_cjk(),Some(0));
+
+ assert_eq!(UnicodeWidthChar::width('\x0A'),None);
+ assert_eq!('\x0A'.width_cjk(),None);
+
+ assert_eq!(UnicodeWidthChar::width('w'),Some(1));
+ assert_eq!('w'.width_cjk(),Some(1));
+
+ assert_eq!(UnicodeWidthChar::width('h'),Some(2));
+ assert_eq!('h'.width_cjk(),Some(2));
+
+ assert_eq!(UnicodeWidthChar::width('\u{AD}'),Some(1));
+ assert_eq!('\u{AD}'.width_cjk(),Some(1));
+
+ assert_eq!(UnicodeWidthChar::width('\u{1160}'),Some(0));
+ assert_eq!('\u{1160}'.width_cjk(),Some(0));
+
+ assert_eq!(UnicodeWidthChar::width('\u{a1}'),Some(1));
+ assert_eq!('\u{a1}'.width_cjk(),Some(2));
+
+ assert_eq!(UnicodeWidthChar::width('\u{300}'),Some(0));
+ assert_eq!('\u{300}'.width_cjk(),Some(0));
+}
+
+#[test]
+fn unicode_12() {
+ use super::UnicodeWidthChar;
+ #[cfg(feature = "no_std")]
+ use core::option::Option::{Some, None};
+
+ assert_eq!(UnicodeWidthChar::width('\u{1F971}'), Some(2));
+}