ICU4X
International Components for Unicode
Loading...
Searching...
No Matches
icu4x::LineSegmenter Class Reference

#include <LineSegmenter.d.hpp>

Public Member Functions

std::unique_ptr< icu4x::LineBreakIteratorUtf8 > segment (std::string_view input) const
 
std::unique_ptr< icu4x::LineBreakIteratorUtf16 > segment16 (std::u16string_view input) const
 
std::unique_ptr< icu4x::LineBreakIteratorLatin1 > segment_latin1 (diplomat::span< const uint8_t > input) const
 

Static Public Member Functions

static std::unique_ptr< icu4x::LineSegmenter > create_auto ()
 
static std::unique_ptr< icu4x::LineSegmenter > create_lstm ()
 
static std::unique_ptr< icu4x::LineSegmenter > create_dictionary ()
 
static std::unique_ptr< icu4x::LineSegmenter > create_auto_with_options_v2 (const icu4x::Locale *content_locale, icu4x::LineBreakOptionsV2 options)
 
static diplomat::result< std::unique_ptr< icu4x::LineSegmenter >, icu4x::DataError > create_auto_with_options_v2_and_provider (const icu4x::DataProvider &provider, const icu4x::Locale *content_locale, icu4x::LineBreakOptionsV2 options)
 
static std::unique_ptr< icu4x::LineSegmenter > create_lstm_with_options_v2 (const icu4x::Locale *content_locale, icu4x::LineBreakOptionsV2 options)
 
static diplomat::result< std::unique_ptr< icu4x::LineSegmenter >, icu4x::DataError > create_lstm_with_options_v2_and_provider (const icu4x::DataProvider &provider, const icu4x::Locale *content_locale, icu4x::LineBreakOptionsV2 options)
 
static std::unique_ptr< icu4x::LineSegmenter > create_dictionary_with_options_v2 (const icu4x::Locale *content_locale, icu4x::LineBreakOptionsV2 options)
 
static diplomat::result< std::unique_ptr< icu4x::LineSegmenter >, icu4x::DataError > create_dictionary_with_options_v2_and_provider (const icu4x::DataProvider &provider, const icu4x::Locale *content_locale, icu4x::LineBreakOptionsV2 options)
 
static void operator delete (void *ptr)
 

Detailed Description

An ICU4X line-break segmenter, capable of finding breakpoints in strings.

See the Rust documentation for LineSegmenter for more information.

Member Function Documentation

◆ create_auto()

std::unique_ptr< icu4x::LineSegmenter > icu4x::LineSegmenter::create_auto ( )
inline static

Construct a LineSegmenter with default options (no locale-based tailoring) using compiled data. It automatically loads the best available payload data for Burmese, Khmer, Lao, and Thai.

See the Rust documentation for new_auto for more information.

◆ create_auto_with_options_v2()

std::unique_ptr< icu4x::LineSegmenter > icu4x::LineSegmenter::create_auto_with_options_v2 ( const icu4x::Locale * content_locale,
icu4x::LineBreakOptionsV2 options )
inline static

Construct a LineSegmenter with custom options using compiled data. It automatically loads the best available payload data for Burmese, Khmer, Lao, and Thai.

See the Rust documentation for new_auto for more information.

◆ create_auto_with_options_v2_and_provider()

diplomat::result< std::unique_ptr< icu4x::LineSegmenter >, icu4x::DataError > icu4x::LineSegmenter::create_auto_with_options_v2_and_provider ( const icu4x::DataProvider & provider,
const icu4x::Locale * content_locale,
icu4x::LineBreakOptionsV2 options )
inline static

Construct a LineSegmenter with custom options. It automatically loads the best available payload data for Burmese, Khmer, Lao, and Thai, using a particular data source.

See the Rust documentation for new_auto for more information.

◆ create_dictionary()

std::unique_ptr< icu4x::LineSegmenter > icu4x::LineSegmenter::create_dictionary ( )
inline static

Construct a LineSegmenter with default options (no locale-based tailoring) and dictionary payload data for Burmese, Khmer, Lao, and Thai, using compiled data.

See the Rust documentation for new_dictionary for more information.

◆ create_dictionary_with_options_v2()

std::unique_ptr< icu4x::LineSegmenter > icu4x::LineSegmenter::create_dictionary_with_options_v2 ( const icu4x::Locale * content_locale,
icu4x::LineBreakOptionsV2 options )
inline static

Construct a LineSegmenter with custom options and dictionary payload data for Burmese, Khmer, Lao, and Thai, using compiled data.

See the Rust documentation for new_dictionary for more information.

◆ create_dictionary_with_options_v2_and_provider()

diplomat::result< std::unique_ptr< icu4x::LineSegmenter >, icu4x::DataError > icu4x::LineSegmenter::create_dictionary_with_options_v2_and_provider ( const icu4x::DataProvider & provider,
const icu4x::Locale * content_locale,
icu4x::LineBreakOptionsV2 options )
inline static

Construct a LineSegmenter with custom options and dictionary payload data for Burmese, Khmer, Lao, and Thai, using a particular data source.

See the Rust documentation for new_dictionary for more information.

◆ create_lstm()

std::unique_ptr< icu4x::LineSegmenter > icu4x::LineSegmenter::create_lstm ( )
inline static

Construct a LineSegmenter with default options (no locale-based tailoring) and LSTM payload data for Burmese, Khmer, Lao, and Thai, using compiled data.

See the Rust documentation for new_lstm for more information.

◆ create_lstm_with_options_v2()

std::unique_ptr< icu4x::LineSegmenter > icu4x::LineSegmenter::create_lstm_with_options_v2 ( const icu4x::Locale * content_locale,
icu4x::LineBreakOptionsV2 options )
inline static

Construct a LineSegmenter with custom options and LSTM payload data for Burmese, Khmer, Lao, and Thai, using compiled data.

See the Rust documentation for new_lstm for more information.

◆ create_lstm_with_options_v2_and_provider()

diplomat::result< std::unique_ptr< icu4x::LineSegmenter >, icu4x::DataError > icu4x::LineSegmenter::create_lstm_with_options_v2_and_provider ( const icu4x::DataProvider & provider,
const icu4x::Locale * content_locale,
icu4x::LineBreakOptionsV2 options )
inline static

Construct a LineSegmenter with custom options and LSTM payload data for Burmese, Khmer, Lao, and Thai, using a particular data source.

See the Rust documentation for new_lstm for more information.

◆ operator delete()

void icu4x::LineSegmenter::operator delete ( void * ptr)
inline static

◆ segment()

std::unique_ptr< icu4x::LineBreakIteratorUtf8 > icu4x::LineSegmenter::segment ( std::string_view input) const
inline

Segments a string.

Ill-formed input is treated as if errors had been replaced with REPLACEMENT CHARACTERs according to the WHATWG Encoding Standard.

See the Rust documentation for segment_utf8 for more information.

◆ segment16()

std::unique_ptr< icu4x::LineBreakIteratorUtf16 > icu4x::LineSegmenter::segment16 ( std::u16string_view input) const
inline

Segments a string.

Ill-formed input is treated as if errors had been replaced with REPLACEMENT CHARACTERs according to the WHATWG Encoding Standard.

See the Rust documentation for segment_utf16 for more information.

◆ segment_latin1()

std::unique_ptr< icu4x::LineBreakIteratorLatin1 > icu4x::LineSegmenter::segment_latin1 ( diplomat::span< const uint8_t > input) const
inline

Segments a Latin-1 string.

See the Rust documentation for segment_latin1 for more information.


The documentation for this class was generated from the following files: