# icu_segmenter 2.1.2
#
# Unicode line breaking and text segmentation algorithms for text boundaries analysis
# Documentation
# Explicitly declared benchmark target (automatic bench discovery is turned
# off in [package]). `harness = false` disables the built-in libtest harness,
# so benches/bench.rs has to provide its own entry point.
[[bench]]
name = "bench"
path = "benches/bench.rs"
harness = false

# Runtime dependencies. Every entry opts out of the dependency's default
# features; entries marked `optional = true` are only compiled when a feature
# in the [features] table enables them.
# The sibling icu_* component crates are pinned with tilde requirements
# ("~2.1.1"), while icu_provider uses a plain (caret) requirement.
[dependencies]
core_maths = { version = "0.1.0", default-features = false, optional = true }
databake = { version = "0.2.0", default-features = false, features = ["derive"], optional = true }
icu_collections = { version = "~2.1.1", default-features = false }
icu_locale = { version = "~2.1.1", default-features = false, optional = true }
icu_provider = { version = "2.1.1", default-features = false }
icu_segmenter_data = { version = "~2.1.1", default-features = false, optional = true }
potential_utf = { version = "0.1.3", default-features = false, features = ["alloc", "zerovec"] }
serde = { version = "1.0.220", default-features = false, features = ["derive", "alloc"], optional = true }
utf8_iter = { version = "1.0.2", default-features = false }
zerovec = { version = "0.11.3", default-features = false, features = ["alloc", "yoke"] }

# Dependencies used only by tests, examples and benchmarks on every target.
# (criterion is declared separately under a target-specific table.)
[dev-dependencies]
icu_locale_core = { version = "2.1.1", default-features = false }
itertools = { version = "0.14.0" }
ndarray = { version = "0.16.0" }
serde = { version = "1.0.220", default-features = false, features = ["derive"] }
serde_json = { version = "1.0.45" }

[features]
# Enabled unless the consumer passes `default-features = false`.
default = ["compiled_data", "auto"]

# `auto` is an alias layer over `lstm`, which pulls in the optional
# `core_maths` dependency.
auto = ["lstm"]
lstm = ["dep:core_maths"]

# Pulls in the optional data crate and icu_locale. The `?` form only forwards
# `compiled_data` to icu_locale when that dependency is enabled.
compiled_data = [
    "dep:icu_segmenter_data",
    "dep:icu_locale",
    "icu_locale?/compiled_data",
    "icu_provider/baked",
]

# Enables the optional serde dependency and forwards `serde` to the
# dependencies listed here.
serde = [
    "dep:serde",
    "potential_utf/serde",
    "zerovec/serde",
    "icu_collections/serde",
    "icu_provider/serde",
]

# Builds on `serde`, adds the optional databake dependency, and forwards
# `databake` / `export` to the dependencies listed here.
datagen = [
    "serde",
    "dep:databake",
    "potential_utf/databake",
    "zerovec/databake",
    "icu_collections/databake",
    "icu_provider/export",
]

# Library target, declared explicitly because `autolib = false` in [package].
# `bench = false` keeps the library itself from being built as a benchmark
# target.
[lib]
name = "icu_segmenter"
path = "src/lib.rs"
bench = false

[package]
name = "icu_segmenter"
version = "2.1.2"
authors = ["The ICU4X Project Developers"]
categories = ["internationalization"]
edition = "2021"
homepage = "https://icu4x.unicode.org"
license = "Unicode-3.0"
readme = "README.md"
repository = "https://github.com/unicode-org/icu4x"
rust-version = "1.83"
# Automatic target discovery is disabled across the board; the lib, bench and
# test targets are the ones declared explicitly in this manifest.
autobenches = false
autobins = false
autoexamples = false
autolib = false
autotests = false
# No build script is run for this package.
build = false
# Files shipped in the published package.
# NOTE(review): "build.rs" is listed here although `build = false` above;
# confirm whether the entry is still needed.
include = [
    "data/**/*",
    "src/**/*",
    "examples/**/*",
    "benches/**/*",
    "tests/**/*",
    "Cargo.toml",
    "LICENSE",
    "README.md",
    "build.rs",
]
description = "Unicode line breaking and text segmentation algorithms for text boundaries analysis"

# docs.rs builds the documentation with every feature enabled.
[package.metadata.docs.rs]
all-features = true

# criterion is a dev-dependency on every target except wasm32.
[target.'cfg(not(target_arch = "wasm32"))'.dev-dependencies]
criterion = { version = "0.5.0" }

# Integration test targets. They are listed explicitly because
# `autotests = false` in [package] turns off automatic discovery of tests/.

# Multi-file test target rooted at tests/cnn/main.rs.
[[test]]
name = "cnn"
path = "tests/cnn/main.rs"
# Empty list: this target is not gated on any feature.
required-features = []

# Only built when the `auto` feature is enabled.
[[test]]
name = "complex_word"
path = "tests/complex_word.rs"
required-features = ["auto"]

[[test]]
name = "css_line_break"
path = "tests/css_line_break.rs"

[[test]]
name = "css_word_break"
path = "tests/css_word_break.rs"

[[test]]
name = "locale"
path = "tests/locale.rs"

[[test]]
name = "spec_test"
path = "tests/spec_test.rs"

[[test]]
name = "word_rule_status"
path = "tests/word_rule_status.rs"