pub struct ICU4XLineSegmenter(LineSegmenter);
Expand description
An ICU4X line-break segmenter, capable of finding breakpoints in strings.
Tuple Fields§
§0: LineSegmenter
Implementations§
Source§impl ICU4XLineSegmenter
 
impl ICU4XLineSegmenter
Sourcepub fn create_auto(
    provider: &ICU4XDataProvider,
) -> Result<Box<ICU4XLineSegmenter>, ICU4XError>
 
pub fn create_auto( provider: &ICU4XDataProvider, ) -> Result<Box<ICU4XLineSegmenter>, ICU4XError>
Construct an ICU4XLineSegmenter with default options. It automatically loads the best
available payload data for Burmese, Khmer, Lao, and Thai.
Sourcepub fn create_lstm(
    provider: &ICU4XDataProvider,
) -> Result<Box<ICU4XLineSegmenter>, ICU4XError>
 
pub fn create_lstm( provider: &ICU4XDataProvider, ) -> Result<Box<ICU4XLineSegmenter>, ICU4XError>
Construct an ICU4XLineSegmenter with default options and LSTM payload data for
Burmese, Khmer, Lao, and Thai.
Sourcepub fn create_dictionary(
    provider: &ICU4XDataProvider,
) -> Result<Box<ICU4XLineSegmenter>, ICU4XError>
 
pub fn create_dictionary( provider: &ICU4XDataProvider, ) -> Result<Box<ICU4XLineSegmenter>, ICU4XError>
Construct an ICU4XLineSegmenter with default options and dictionary payload data for
Burmese, Khmer, Lao, and Thai.
Sourcepub fn create_auto_with_options_v1(
    provider: &ICU4XDataProvider,
    options: ICU4XLineBreakOptionsV1,
) -> Result<Box<ICU4XLineSegmenter>, ICU4XError>
 
pub fn create_auto_with_options_v1( provider: &ICU4XDataProvider, options: ICU4XLineBreakOptionsV1, ) -> Result<Box<ICU4XLineSegmenter>, ICU4XError>
Construct an ICU4XLineSegmenter with custom options. It automatically loads the best
available payload data for Burmese, Khmer, Lao, and Thai.
Sourcepub fn create_lstm_with_options_v1(
    provider: &ICU4XDataProvider,
    options: ICU4XLineBreakOptionsV1,
) -> Result<Box<ICU4XLineSegmenter>, ICU4XError>
 
pub fn create_lstm_with_options_v1( provider: &ICU4XDataProvider, options: ICU4XLineBreakOptionsV1, ) -> Result<Box<ICU4XLineSegmenter>, ICU4XError>
Construct an ICU4XLineSegmenter with custom options and LSTM payload data for
Burmese, Khmer, Lao, and Thai.
Sourcepub fn create_dictionary_with_options_v1(
    provider: &ICU4XDataProvider,
    options: ICU4XLineBreakOptionsV1,
) -> Result<Box<ICU4XLineSegmenter>, ICU4XError>
 
pub fn create_dictionary_with_options_v1( provider: &ICU4XDataProvider, options: ICU4XLineBreakOptionsV1, ) -> Result<Box<ICU4XLineSegmenter>, ICU4XError>
Construct an ICU4XLineSegmenter with custom options and dictionary payload data for
Burmese, Khmer, Lao, and Thai.
Sourcepub fn segment_utf8<'a>(
    &'a self,
    input: &'a DiplomatStr,
) -> Box<ICU4XLineBreakIteratorUtf8<'a>>
 
pub fn segment_utf8<'a>( &'a self, input: &'a DiplomatStr, ) -> Box<ICU4XLineBreakIteratorUtf8<'a>>
Segments a string.
Ill-formed input is treated as if errors had been replaced with REPLACEMENT CHARACTERs according to the WHATWG Encoding Standard.
Sourcepub fn segment_utf16<'a>(
    &'a self,
    input: &'a DiplomatStr16,
) -> Box<ICU4XLineBreakIteratorUtf16<'a>>
 
pub fn segment_utf16<'a>( &'a self, input: &'a DiplomatStr16, ) -> Box<ICU4XLineBreakIteratorUtf16<'a>>
Segments a string.
Ill-formed input is treated as if errors had been replaced with REPLACEMENT CHARACTERs according to the WHATWG Encoding Standard.
Sourcepub fn segment_latin1<'a>(
    &'a self,
    input: &'a [u8],
) -> Box<ICU4XLineBreakIteratorLatin1<'a>>
 
pub fn segment_latin1<'a>( &'a self, input: &'a [u8], ) -> Box<ICU4XLineBreakIteratorLatin1<'a>>
Segments a Latin-1 string.