diff options
author | Daniel Baumann <daniel.baumann@progress-linux.org> | 2024-04-19 00:47:55 +0000 |
---|---|---|
committer | Daniel Baumann <daniel.baumann@progress-linux.org> | 2024-04-19 00:47:55 +0000 |
commit | 26a029d407be480d791972afb5975cf62c9360a6 (patch) | |
tree | f435a8308119effd964b339f76abb83a57c29483 /intl/bidi/rust/unicode-bidi-ffi | |
parent | Initial commit. (diff) | |
download | firefox-26a029d407be480d791972afb5975cf62c9360a6.tar.xz firefox-26a029d407be480d791972afb5975cf62c9360a6.zip |
Adding upstream version 124.0.1.upstream/124.0.1
Signed-off-by: Daniel Baumann <daniel.baumann@progress-linux.org>
Diffstat (limited to 'intl/bidi/rust/unicode-bidi-ffi')
-rw-r--r-- | intl/bidi/rust/unicode-bidi-ffi/Cargo.toml | 10 | ||||
-rw-r--r-- | intl/bidi/rust/unicode-bidi-ffi/cbindgen.toml | 15 | ||||
-rw-r--r-- | intl/bidi/rust/unicode-bidi-ffi/src/lib.rs | 176 |
3 files changed, 201 insertions, 0 deletions
diff --git a/intl/bidi/rust/unicode-bidi-ffi/Cargo.toml b/intl/bidi/rust/unicode-bidi-ffi/Cargo.toml new file mode 100644 index 0000000000..9c39fc07e1 --- /dev/null +++ b/intl/bidi/rust/unicode-bidi-ffi/Cargo.toml @@ -0,0 +1,10 @@ +[package] +name = "unicode-bidi-ffi" +version = "0.1.0" +license = "MPL-2.0" +authors = ["Jonathan Kew <jkew@mozilla.com>"] +edition = "2021" + +[dependencies] +unicode-bidi = "0.3.14" +icu_properties = { version = "1.4.0", features = ["bidi"] } diff --git a/intl/bidi/rust/unicode-bidi-ffi/cbindgen.toml b/intl/bidi/rust/unicode-bidi-ffi/cbindgen.toml new file mode 100644 index 0000000000..a345d2b46a --- /dev/null +++ b/intl/bidi/rust/unicode-bidi-ffi/cbindgen.toml @@ -0,0 +1,15 @@ +header = """/* This Source Code Form is subject to the terms of the Mozilla Public + * License, v. 2.0. If a copy of the MPL was not distributed with this + * file, You can obtain one at http://mozilla.org/MPL/2.0/. */""" +autogen_warning = """/* DO NOT MODIFY THIS MANUALLY! This file was generated using cbindgen. See RunCbindgen.py */ +""" +include_version = true +braces = "SameLine" +line_length = 100 +tab_width = 2 +language = "C++" +namespaces = ["mozilla", "intl", "ffi"] + +[parse] +parse_deps = true +include = ["unicode-bidi"] diff --git a/intl/bidi/rust/unicode-bidi-ffi/src/lib.rs b/intl/bidi/rust/unicode-bidi-ffi/src/lib.rs new file mode 100644 index 0000000000..6dd2117b8b --- /dev/null +++ b/intl/bidi/rust/unicode-bidi-ffi/src/lib.rs @@ -0,0 +1,176 @@ +/* This Source Code Form is subject to the terms of the Mozilla Public + * License, v. 2.0. If a copy of the MPL was not distributed with this file, + * You can obtain one at http://mozilla.org/MPL/2.0/. */ + +use icu_properties::bidi::BidiClassAdapter; +use icu_properties::maps; + +use unicode_bidi::level::Level; +use unicode_bidi::utf16; +use unicode_bidi::Direction; + +use core::ops::Range; +use core::slice; + +/// LevelRun type to be returned to C++. +/// 32-bit indexes (rather than usize) are sufficient here because Gecko works +/// with 32-bit indexes when collecting the text buffer for a paragraph. +#[repr(C)] +pub struct LevelRun { + start: u32, + length: u32, + level: u8, +} + +/// Bidi object to be exposed to Gecko via FFI. +pub struct UnicodeBidi<'a> { + paragraph_info: utf16::ParagraphBidiInfo<'a>, + resolved: Option<(Vec<Level>, Vec<Range<usize>>)>, +} + +impl UnicodeBidi<'_> { + /// Create a new UnicodeBidi object representing the given text. This creates + /// the unicode-bidi ParagraphBidiInfo struct, and will cache the resolved + /// levels and visual-runs array once created. + /// The caller is responsible to ensure the text buffer remains valid + /// as long as the UnicodeBidi object exists. + fn new<'a>(text: *const u16, length: usize, level: u8) -> Box<Self> { + let text = unsafe { slice::from_raw_parts(text, length) }; + let level = if let Ok(level) = Level::new(level) { + Some(level) + } else { + None + }; + let adapter = BidiClassAdapter::new(maps::bidi_class()); + Box::new(UnicodeBidi { + paragraph_info: utf16::ParagraphBidiInfo::<'a>::new_with_data_source( + &adapter, text, level, + ), + resolved: None, + }) + } + + #[inline] + fn resolved(&mut self) -> &(Vec<Level>, Vec<Range<usize>>) { + if self.resolved.is_none() { + let len = self.paragraph_info.text.len(); + self.resolved = Some(self.paragraph_info.visual_runs(0..len)); + } + &self.resolved.as_ref().unwrap() + } +} + +/// Create a new UnicodeBidi object for the given text. +/// NOTE that the text buffer must remain valid for the lifetime of this object! +#[no_mangle] +pub extern "C" fn bidi_new<'a>(text: *const u16, length: usize, level: u8) -> *mut UnicodeBidi<'a> { + Box::into_raw(UnicodeBidi::<'a>::new(text, length, level)) +} + +/// Destroy the Bidi object. +#[no_mangle] +pub extern "C" fn bidi_destroy(bidi: *mut UnicodeBidi) { + if bidi.is_null() { + return; + } + let _ = unsafe { Box::from_raw(bidi) }; +} + +/// Get the length of the text covered by the Bidi object. +#[no_mangle] +pub extern "C" fn bidi_get_length(bidi: *const UnicodeBidi) -> i32 { + let bidi = unsafe { &(*bidi) }; + bidi.paragraph_info.text.len().try_into().unwrap() +} + +/// Get the paragraph direction: LTR=1, RTL=-1, mixed=0. +#[no_mangle] +pub extern "C" fn bidi_get_direction(bidi: *const UnicodeBidi) -> i8 { + let bidi = unsafe { &(*bidi) }; + match bidi.paragraph_info.direction() { + Direction::Mixed => 0, + Direction::Ltr => 1, + Direction::Rtl => -1, + } +} + +/// Get the paragraph level. +#[no_mangle] +pub extern "C" fn bidi_get_paragraph_level(bidi: *const UnicodeBidi) -> u8 { + let bidi = unsafe { &(*bidi) }; + bidi.paragraph_info.paragraph_level.into() +} + +/// Get the number of runs present. +#[no_mangle] +pub extern "C" fn bidi_count_runs(bidi: *mut UnicodeBidi) -> i32 { + let bidi = unsafe { &mut (*bidi) }; + if bidi.paragraph_info.text.is_empty() { + return 0; + } + bidi.resolved().1.len().try_into().unwrap() +} + +/// Get a pointer to the Levels array. The resulting pointer is valid only as long as +/// the UnicodeBidi object exists! +#[no_mangle] +pub extern "C" fn bidi_get_levels(bidi: *mut UnicodeBidi) -> *const Level { + let bidi = unsafe { &mut (*bidi) }; + bidi.resolved().0.as_ptr() +} + +/// Get the extent of the run at the given index in the visual runs array. +/// This would panic!() if run_index is out of range (see bidi_count_runs), +/// or if the run's start or length exceeds u32::MAX (which cannot happen +/// because Gecko can't create such a huge text buffer). +#[no_mangle] +pub extern "C" fn bidi_get_visual_run(bidi: *mut UnicodeBidi, run_index: u32) -> LevelRun { + let bidi = unsafe { &mut (*bidi) }; + let level_runs = &bidi.resolved().1; + let start = level_runs[run_index as usize].start; + let length = level_runs[run_index as usize].end - start; + LevelRun { + start: start.try_into().unwrap(), + length: length.try_into().unwrap(), + level: bidi.resolved().0[start].into(), + } +} + +/// Return index map showing the result of reordering using the given levels array. +/// (This is a generic helper that does not use a UnicodeBidi object, it just takes an +/// arbitrary array of levels.) +#[no_mangle] +pub extern "C" fn bidi_reorder_visual(levels: *const u8, length: usize, index_map: *mut i32) { + let levels = unsafe { slice::from_raw_parts(levels as *const Level, length) }; + let result = unsafe { slice::from_raw_parts_mut(index_map, length) }; + let reordered = utf16::BidiInfo::reorder_visual(levels); + for i in 0..length { + result[i] = reordered[i].try_into().unwrap(); + } +} + +/// Get the base direction for the given text, returning 1 for LTR, -1 for RTL, +/// and 0 for neutral. If first_paragraph is true, only the first paragraph will be considered; +/// if false, subsequent paragraphs may be considered until a non-neutral character is found. +#[no_mangle] +pub extern "C" fn bidi_get_base_direction( + text: *const u16, + length: usize, + first_paragraph: bool, +) -> i8 { + let text = unsafe { slice::from_raw_parts(text, length) }; + let adapter = BidiClassAdapter::new(maps::bidi_class()); + if first_paragraph { + match unicode_bidi::get_base_direction_with_data_source(&adapter, text) { + Direction::Mixed => 0, + Direction::Ltr => 1, + Direction::Rtl => -1, + } + } else { + match unicode_bidi::get_base_direction_full_with_data_source(&adapter, text) { + Direction::Mixed => 0, + Direction::Ltr => 1, + Direction::Rtl => -1, + } + } +} |