tor-browser

The Tor Browser
git clone https://git.dasho.dev/tor-browser.git
Log | Files | Refs | README | LICENSE

SentenceSegmenter.d.ts (1519B)


      1 // generated by diplomat-tool
      2 import type { DataError } from "./DataError"
      3 import type { DataProvider } from "./DataProvider"
      4 import type { Locale } from "./Locale"
      5 import type { SentenceBreakIteratorUtf16 } from "./SentenceBreakIteratorUtf16"
      6 import type { pointer, codepoint } from "./diplomat-runtime.d.ts";
      7 
      8 
      9 /**
     10 * An ICU4X sentence-break segmenter, capable of finding sentence breakpoints in strings.
     11 *
     12 * See the [Rust documentation for `SentenceSegmenter`](https://docs.rs/icu/latest/icu/segmenter/struct.SentenceSegmenter.html) for more information.
     13 */
     14 
     15 
     16 export class SentenceSegmenter {
     17    get ffiValue(): pointer;
     18 
     19 
     20    /**
     21     * Construct a [`SentenceSegmenter`] for content known to be of a given locale, using compiled data.
     22     */
     23    static createWithContentLocale(locale: Locale): SentenceSegmenter;
     24 
     25    /**
     26     * Construct a [`SentenceSegmenter`]  for content known to be of a given locale, using a particular data source.
     27     */
     28    static createWithContentLocaleAndProvider(provider: DataProvider, locale: Locale): SentenceSegmenter;
     29 
     30    /**
     31     * Segments a string.
     32     *
     33     * Ill-formed input is treated as if errors had been replaced with REPLACEMENT CHARACTERs according
     34     * to the WHATWG Encoding Standard.
     35     *
     36     * See the [Rust documentation for `segment_utf16`](https://docs.rs/icu/latest/icu/segmenter/struct.SentenceSegmenterBorrowed.html#method.segment_utf16) for more information.
     37     */
     38    segment(input: string): SentenceBreakIteratorUtf16;
     39 
     40    constructor();
     41 }