SentenceSegmenter.d.ts (1519B)
// generated by diplomat-tool
// NOTE(review): `DataError` and `codepoint` are imported below but are not
// referenced by any declaration visible in this file.
import type { DataError } from "./DataError"
import type { DataProvider } from "./DataProvider"
import type { Locale } from "./Locale"
import type { SentenceBreakIteratorUtf16 } from "./SentenceBreakIteratorUtf16"
import type { pointer, codepoint } from "./diplomat-runtime.d.ts";


/**
 * An ICU4X sentence-break segmenter, capable of finding sentence breakpoints in strings.
 *
 * Instances are obtained from the static factories
 * {@link SentenceSegmenter.createWithContentLocale} and
 * {@link SentenceSegmenter.createWithContentLocaleAndProvider}, or from the
 * zero-argument constructor. Call {@link SentenceSegmenter.segment} to obtain
 * a break iterator over a string.
 *
 * See the [Rust documentation for `SentenceSegmenter`](https://docs.rs/icu/latest/icu/segmenter/struct.SentenceSegmenter.html) for more information.
 */


export class SentenceSegmenter {
    /**
     * Handle of type `pointer` (declared in `diplomat-runtime`).
     *
     * NOTE(review): presumably the raw FFI pointer to the underlying native
     * object, intended for the generated bindings rather than application
     * code — confirm against the diplomat runtime.
     */
    get ffiValue(): pointer;


    /**
     * Construct a [`SentenceSegmenter`] for content known to be of a given locale, using compiled data.
     *
     * @param locale - The locale of the content that will be segmented.
     * @returns A new `SentenceSegmenter`.
     *
     * NOTE(review): `DataError` is imported by this file but appears in no
     * signature; presumably this factory throws it when data loading fails —
     * confirm against the generated implementation.
     */
    static createWithContentLocale(locale: Locale): SentenceSegmenter;

    /**
     * Construct a [`SentenceSegmenter`] for content known to be of a given locale, using a particular data source.
     *
     * @param provider - The data source to use.
     * @param locale - The locale of the content that will be segmented.
     * @returns A new `SentenceSegmenter`.
     *
     * NOTE(review): `DataError` is imported by this file but appears in no
     * signature; presumably this factory throws it when the provider cannot
     * supply the required data — confirm against the generated implementation.
     */
    static createWithContentLocaleAndProvider(provider: DataProvider, locale: Locale): SentenceSegmenter;

    /**
     * Segments a string.
     *
     * Ill-formed input is treated as if errors had been replaced with REPLACEMENT CHARACTERs according
     * to the WHATWG Encoding Standard.
     *
     * See the [Rust documentation for `segment_utf16`](https://docs.rs/icu/latest/icu/segmenter/struct.SentenceSegmenterBorrowed.html#method.segment_utf16) for more information.
     *
     * @param input - The string to segment.
     * @returns A `SentenceBreakIteratorUtf16` over `input`.
     */
    segment(input: string): SentenceBreakIteratorUtf16;

    /**
     * Zero-argument constructor.
     *
     * NOTE(review): undocumented in the generated output; presumably builds a
     * segmenter from compiled data without assuming a content locale —
     * confirm against the Rust `SentenceSegmenter` constructors.
     */
    constructor();
}