// generated by diplomat-tool
import type { DataError } from "./DataError"
import type { DataProvider } from "./DataProvider"
import type { Locale } from "./Locale"
import type { WordBreakIteratorUtf16 } from "./WordBreakIteratorUtf16"
import type { pointer, codepoint } from "./diplomat-runtime.d.ts";

/**
 * An ICU4X word-break segmenter, capable of finding word breakpoints in strings.
 *
 * See the [Rust documentation for `WordSegmenter`](https://docs.rs/icu/latest/icu/segmenter/struct.WordSegmenter.html) for more information.
 *
 * This is a type declaration only: no member has a body here, and no
 * constructor is declared. The static `create*` methods are the declared ways
 * to obtain an instance. They come in three families (`Auto`, `Lstm`,
 * `Dictionary`), each with the same three variants: no arguments, a content
 * `Locale`, or a `DataProvider` plus a content `Locale`.
 *
 * NOTE(review): `DataError` is imported by this file but appears in no
 * signature. Presumably some factories can throw it (e.g. the ones that load
 * data through a provider); confirm against the implementation before
 * documenting `@throws` on individual methods.
 */
export declare class WordSegmenter {
    /**
     * The `pointer` value (type from `diplomat-runtime`) associated with this
     * object. Read-only: only a getter is declared.
     *
     * NOTE(review): presumably the handle of the underlying native object,
     * judging by the name; confirm against the implementation.
     */
    get ffiValue(): pointer;

    /**
     * Creates a segmenter using the "auto" configuration.
     *
     * NOTE(review): the model selection behind "auto" is not visible in this
     * declaration; see the linked Rust documentation.
     *
     * @returns A new `WordSegmenter`.
     */
    static createAuto(): WordSegmenter;

    /**
     * Creates a segmenter using the "auto" configuration for a content locale.
     *
     * @param locale - The content locale to build the segmenter for.
     * @returns A new `WordSegmenter`.
     */
    static createAutoWithContentLocale(locale: Locale): WordSegmenter;

    /**
     * Creates a segmenter using the "auto" configuration for a content locale,
     * taking a caller-supplied data provider.
     *
     * @param provider - The data provider passed to the factory.
     * @param locale - The content locale to build the segmenter for.
     * @returns A new `WordSegmenter`.
     */
    static createAutoWithContentLocaleAndProvider(provider: DataProvider, locale: Locale): WordSegmenter;

    /**
     * Creates a segmenter using the "LSTM" configuration.
     *
     * NOTE(review): which scripts/languages this configuration covers is not
     * visible in this declaration; see the linked Rust documentation.
     *
     * @returns A new `WordSegmenter`.
     */
    static createLstm(): WordSegmenter;

    /**
     * Creates a segmenter using the "LSTM" configuration for a content locale.
     *
     * @param locale - The content locale to build the segmenter for.
     * @returns A new `WordSegmenter`.
     */
    static createLstmWithContentLocale(locale: Locale): WordSegmenter;

    /**
     * Creates a segmenter using the "LSTM" configuration for a content locale,
     * taking a caller-supplied data provider.
     *
     * @param provider - The data provider passed to the factory.
     * @param locale - The content locale to build the segmenter for.
     * @returns A new `WordSegmenter`.
     */
    static createLstmWithContentLocaleAndProvider(provider: DataProvider, locale: Locale): WordSegmenter;

    /**
     * Creates a segmenter using the "dictionary" configuration.
     *
     * NOTE(review): which scripts/languages this configuration covers is not
     * visible in this declaration; see the linked Rust documentation.
     *
     * @returns A new `WordSegmenter`.
     */
    static createDictionary(): WordSegmenter;

    /**
     * Creates a segmenter using the "dictionary" configuration for a content
     * locale.
     *
     * @param locale - The content locale to build the segmenter for.
     * @returns A new `WordSegmenter`.
     */
    static createDictionaryWithContentLocale(locale: Locale): WordSegmenter;

    /**
     * Creates a segmenter using the "dictionary" configuration for a content
     * locale, taking a caller-supplied data provider.
     *
     * @param provider - The data provider passed to the factory.
     * @param locale - The content locale to build the segmenter for.
     * @returns A new `WordSegmenter`.
     */
    static createDictionaryWithContentLocaleAndProvider(provider: DataProvider, locale: Locale): WordSegmenter;

    /**
     * Segments a string and returns an iterator over the result.
     *
     * NOTE(review): the return type name suggests breakpoints are reported as
     * UTF-16 code unit offsets into `input`; confirm against
     * `WordBreakIteratorUtf16`.
     *
     * @param input - The text to segment.
     * @returns A `WordBreakIteratorUtf16` for `input`.
     */
    segment(input: string): WordBreakIteratorUtf16;
}