/* This Source Code Form is subject to the terms of the Mozilla Public * License, v. 2.0. If a copy of the MPL was not distributed with this file, * You can obtain one at http://mozilla.org/MPL/2.0/. */ use icu_properties::CodePointMapData; use unicode_bidi::level::Level; use unicode_bidi::utf16; use unicode_bidi::Direction; use core::ops::Range; use core::slice; /// LevelRun type to be returned to C++. /// 32-bit indexes (rather than usize) are sufficient here because Gecko works /// with 32-bit indexes when collecting the text buffer for a paragraph. #[repr(C)] pub struct LevelRun { start: u32, length: u32, level: u8, } /// Bidi object to be exposed to Gecko via FFI. pub struct UnicodeBidi<'a> { paragraph_info: utf16::ParagraphBidiInfo<'a>, resolved: Option<(Vec, Vec>)>, } impl UnicodeBidi<'_> { /// Create a new UnicodeBidi object representing the given text. This creates /// the unicode-bidi ParagraphBidiInfo struct, and will cache the resolved /// levels and visual-runs array once created. /// The caller is responsible to ensure the text buffer remains valid /// as long as the UnicodeBidi object exists. fn new<'a>(text: *const u16, length: usize, level: u8) -> Box { let text = unsafe { slice::from_raw_parts(text, length) }; let level = if let Ok(level) = Level::new(level) { Some(level) } else { None }; let adapter = CodePointMapData::::new(); Box::new(UnicodeBidi { paragraph_info: utf16::ParagraphBidiInfo::new_with_data_source(&adapter, text, level), resolved: None, }) } #[inline] fn resolved(&mut self) -> &(Vec, Vec>) { if self.resolved.is_none() { let len = self.paragraph_info.text.len(); self.resolved = Some(self.paragraph_info.visual_runs(0..len)); } self.resolved.as_ref().unwrap() } } /// Create a new UnicodeBidi object for the given text. /// NOTE that the text buffer must remain valid for the lifetime of this object! #[no_mangle] pub extern "C" fn bidi_new<'a>(text: *const u16, length: usize, level: u8) -> *mut UnicodeBidi<'a> { Box::into_raw(UnicodeBidi::<'a>::new(text, length, level)) } /// Destroy the Bidi object. #[no_mangle] pub extern "C" fn bidi_destroy(bidi: *mut UnicodeBidi) { if bidi.is_null() { return; } let _ = unsafe { Box::from_raw(bidi) }; } /// Get the length of the text covered by the Bidi object. #[no_mangle] pub extern "C" fn bidi_get_length(bidi: &UnicodeBidi) -> i32 { bidi.paragraph_info.text.len().try_into().unwrap() } /// Get the paragraph direction: LTR=1, RTL=-1, mixed=0. #[no_mangle] pub extern "C" fn bidi_get_direction(bidi: &UnicodeBidi) -> i8 { match bidi.paragraph_info.direction() { Direction::Mixed => 0, Direction::Ltr => 1, Direction::Rtl => -1, } } /// Get the paragraph level. #[no_mangle] pub extern "C" fn bidi_get_paragraph_level(bidi: &UnicodeBidi) -> u8 { bidi.paragraph_info.paragraph_level.into() } /// Get the number of runs present. #[no_mangle] pub extern "C" fn bidi_count_runs(bidi: &mut UnicodeBidi) -> i32 { if bidi.paragraph_info.text.is_empty() { return 0; } bidi.resolved().1.len().try_into().unwrap() } /// Get a pointer to the Levels array. The resulting pointer is valid only as long as /// the UnicodeBidi object exists! #[no_mangle] pub extern "C" fn bidi_get_levels(bidi: &mut UnicodeBidi) -> *const Level { bidi.resolved().0.as_ptr() } /// Get the extent of the run at the given index in the visual runs array. /// This would panic!() if run_index is out of range (see bidi_count_runs), /// or if the run's start or length exceeds u32::MAX (which cannot happen /// because Gecko can't create such a huge text buffer). #[no_mangle] pub extern "C" fn bidi_get_visual_run(bidi: &mut UnicodeBidi, run_index: u32) -> LevelRun { let level_runs = &bidi.resolved().1; let start = level_runs[run_index as usize].start; let length = level_runs[run_index as usize].end - start; LevelRun { start: start.try_into().unwrap(), length: length.try_into().unwrap(), level: bidi.resolved().0[start].into(), } } /// Return index map showing the result of reordering using the given levels array. /// (This is a generic helper that does not use a UnicodeBidi object, it just takes an /// arbitrary array of levels.) #[no_mangle] pub extern "C" fn bidi_reorder_visual(levels: *const u8, length: usize, index_map: *mut i32) { let levels = unsafe { slice::from_raw_parts(levels as *const Level, length) }; let result = unsafe { slice::from_raw_parts_mut(index_map, length) }; let reordered = utf16::BidiInfo::reorder_visual(levels); for i in 0..length { result[i] = reordered[i].try_into().unwrap(); } } /// Get the base direction for the given text, returning 1 for LTR, -1 for RTL, /// and 0 for neutral. If first_paragraph is true, only the first paragraph will be considered; /// if false, subsequent paragraphs may be considered until a non-neutral character is found. #[no_mangle] pub extern "C" fn bidi_get_base_direction( text: *const u16, length: usize, first_paragraph: bool, ) -> i8 { let text = unsafe { slice::from_raw_parts(text, length) }; let adapter = CodePointMapData::::new(); let direction = if first_paragraph { unicode_bidi::get_base_direction_with_data_source(&adapter, text) } else { unicode_bidi::get_base_direction_full_with_data_source(&adapter, text) }; match direction { Direction::Mixed => 0, Direction::Ltr => 1, Direction::Rtl => -1, } }