// generated by diplomat-tool
import { DataError } from "./DataError.mjs";
import { DataProvider } from "./DataProvider.mjs";
import { Locale } from "./Locale.mjs";
import { SentenceBreakIteratorUtf16 } from "./SentenceBreakIteratorUtf16.mjs";
import wasm from "./diplomat-wasm.mjs";
import * as diplomatRuntime from "./diplomat-runtime.mjs";

// Calls the native destructor for an owned pointer once the JS wrapper that
// registered it has been garbage collected.
const SentenceSegmenter_box_destroy_registry = new FinalizationRegistry((ptr) => {
    wasm.icu4x_SentenceSegmenter_destroy_mv1(ptr);
});

/**
 * An ICU4X sentence-break segmenter, capable of finding sentence breakpoints in strings.
 *
 * See the [Rust documentation for `SentenceSegmenter`](https://docs.rs/icu/2.1.1/icu/segmenter/struct.SentenceSegmenter.html) for more information.
 */
export class SentenceSegmenter {
    // Internal ptr reference:
    #ptr = null;

    // Lifetimes are only to keep dependencies alive.
    // Since JS won't garbage collect until there are no incoming edges.
    #selfEdge = [];

    /**
     * Shared initialisation used by every construction path.
     *
     * @param {symbol} symbol - Must be `diplomatRuntime.internalConstructor`; anything else is rejected.
     * @param {number} ptr - Pointer value returned by the wasm module for this object.
     * @param {Array} selfEdge - Objects this instance borrows from; empty when the pointer is owned.
     * @returns {SentenceSegmenter|undefined} `this` on success, `undefined` when `symbol` is rejected.
     */
    #internalConstructor(symbol, ptr, selfEdge) {
        if (symbol !== diplomatRuntime.internalConstructor) {
            console.error("SentenceSegmenter is an Opaque type. You cannot call its constructor.");
            return;
        }
        this.#ptr = ptr;
        this.#selfEdge = selfEdge;

        // Are we being borrowed? If not, we can register.
        if (this.#selfEdge.length === 0) {
            SentenceSegmenter_box_destroy_registry.register(this, this.#ptr);
        }

        return this;
    }

    /** @internal */
    get ffiValue() {
        return this.#ptr;
    }

    /**
     * Construct a {@link SentenceSegmenter} using compiled data. This does not assume any content locale.
     *
     * See the [Rust documentation for `new`](https://docs.rs/icu/2.1.1/icu/segmenter/struct.SentenceSegmenter.html#method.new) for more information.
     *
     * @returns {SentenceSegmenter} A new segmenter wrapping the pointer returned by wasm.
     */
    #defaultConstructor() {
        const result = wasm.icu4x_SentenceSegmenter_create_mv1();
        return new SentenceSegmenter(diplomatRuntime.internalConstructor, result, []);
    }

    /**
     * Construct a {@link SentenceSegmenter} for content known to be of a given locale, using compiled data.
     *
     * @param {Locale} locale - Content locale; its `ffiValue` is passed to wasm.
     * @returns {SentenceSegmenter} The newly created segmenter.
     * @throws {Error} With message `DataError.<value>` and a `DataError` as `cause` when the
     *     receive buffer's result flag is not set.
     */
    static createWithContentLocale(locale) {
        const diplomatReceive = new diplomatRuntime.DiplomatReceiveBuf(wasm, 5, 4, true);

        try {
            // The call lives inside the `try` so the receive buffer is freed even when
            // reading `locale.ffiValue` or the wasm call itself throws.
            wasm.icu4x_SentenceSegmenter_create_with_content_locale_mv1(diplomatReceive.buffer, locale.ffiValue);

            if (!diplomatReceive.resultFlag) {
                const cause = new DataError(diplomatRuntime.internalConstructor, diplomatRuntime.enumDiscriminant(wasm, diplomatReceive.buffer));
                throw new globalThis.Error('DataError.' + cause.value, { cause });
            }
            return new SentenceSegmenter(diplomatRuntime.internalConstructor, diplomatRuntime.ptrRead(wasm, diplomatReceive.buffer), []);
        } finally {
            diplomatReceive.free();
        }
    }

    /**
     * Construct a {@link SentenceSegmenter} for content known to be of a given locale, using a particular data source.
     *
     * @param {DataProvider} provider - Data source; its `ffiValue` is passed to wasm.
     * @param {Locale} locale - Content locale; its `ffiValue` is passed to wasm.
     * @returns {SentenceSegmenter} The newly created segmenter.
     * @throws {Error} With message `DataError.<value>` and a `DataError` as `cause` when the
     *     receive buffer's result flag is not set.
     */
    static createWithContentLocaleAndProvider(provider, locale) {
        const diplomatReceive = new diplomatRuntime.DiplomatReceiveBuf(wasm, 5, 4, true);

        try {
            // The call lives inside the `try` so the receive buffer is freed even when
            // reading an argument's `ffiValue` or the wasm call itself throws.
            wasm.icu4x_SentenceSegmenter_create_with_content_locale_and_provider_mv1(diplomatReceive.buffer, provider.ffiValue, locale.ffiValue);

            if (!diplomatReceive.resultFlag) {
                const cause = new DataError(diplomatRuntime.internalConstructor, diplomatRuntime.enumDiscriminant(wasm, diplomatReceive.buffer));
                throw new globalThis.Error('DataError.' + cause.value, { cause });
            }
            return new SentenceSegmenter(diplomatRuntime.internalConstructor, diplomatRuntime.ptrRead(wasm, diplomatReceive.buffer), []);
        } finally {
            diplomatReceive.free();
        }
    }

    /**
     * Segments a string.
     *
     * Ill-formed input is treated as if errors had been replaced with REPLACEMENT CHARACTERs according
     * to the WHATWG Encoding Standard.
     *
     * See the [Rust documentation for `segment_utf16`](https://docs.rs/icu/2.1.1/icu/segmenter/struct.SentenceSegmenterBorrowed.html#method.segment_utf16) for more information.
     *
     * @param {string} input - Text to segment; it is copied into a UTF-16 slice for the wasm call.
     * @returns {SentenceBreakIteratorUtf16} Iterator that keeps this segmenter and the input slice
     *     alive through its lifetime edges.
     */
    segment(input) {
        const functionGarbageCollectorGrip = new diplomatRuntime.GarbageCollectorGrip();
        const inputSlice = functionGarbageCollectorGrip.alloc(diplomatRuntime.DiplomatBuf.sliceWrapper(wasm, diplomatRuntime.DiplomatBuf.str16(wasm, input)));

        // This lifetime edge depends on lifetimes 'a
        const aEdges = [this, inputSlice];

        try {
            // The call lives inside the `try` so the grip is always released, even when
            // the wasm call throws.
            const result = wasm.icu4x_SentenceSegmenter_segment_utf16_mv1(this.ffiValue, inputSlice.ptr);
            return new SentenceBreakIteratorUtf16(diplomatRuntime.internalConstructor, result, [], aEdges);
        } finally {
            functionGarbageCollectorGrip.releaseToGarbageCollector();
        }
    }

    /**
     * Construct a {@link SentenceSegmenter} using compiled data. This does not assume any content locale.
     *
     * See the [Rust documentation for `new`](https://docs.rs/icu/2.1.1/icu/segmenter/struct.SentenceSegmenter.html#method.new) for more information.
     */
    constructor(...args) {
        const [marker] = args;

        if (marker === diplomatRuntime.exposeConstructor) {
            // Drop the expose marker; the remaining arguments are (symbol, ptr, selfEdge).
            return this.#internalConstructor(...args.slice(1));
        }
        if (marker === diplomatRuntime.internalConstructor) {
            return this.#internalConstructor(...args);
        }
        return this.#defaultConstructor(...args);
    }
}