# bpe-tokenizer 0.1.2
#
# A BPE Tokenizer library.

# Crates available to the build script. All three are optional and carry
# the same names and versions as the optional entries under [dependencies].
[build-dependencies]
bincode = { version = "1.3.3", optional = true }
lz4_flex = { version = "0.11.3", optional = true }
serde = { version = "1.0.210", optional = true }

# Library dependencies. bincode, lz4_flex and serde are optional and are
# only compiled in when a feature enables them; thiserror and
# unicode-segmentation are always required.
[dependencies]
bincode = { version = "1.3.3", optional = true }
lz4_flex = { version = "0.11.3", optional = true }
serde = { version = "1.0.210", optional = true }
thiserror = "1.0.64"
unicode-segmentation = "1.12.0"

# Every feature below enables the same three optional dependencies.
# No `default` feature is listed here, so each must be requested explicitly.
# NOTE(review): the names suggest each one selects a differently sized
# bundled vocabulary; confirm against build.rs.
[features]
default-large = [
    "bincode",
    "lz4_flex",
    "serde",
]
default-medium = [
    "bincode",
    "lz4_flex",
    "serde",
]
default-small = [
    "bincode",
    "lz4_flex",
    "serde",
]

# Library target. The crate is imported as `bpe_tokenizer` (underscore),
# while the package name uses a hyphen.
[lib]
path = "src/lib.rs"
name = "bpe_tokenizer"

[package]
name = "bpe-tokenizer"
version = "0.1.2"
authors = ["Stephen Waits <steve@waits.net>"]
# Automatic target discovery is switched off for benches, binaries,
# examples and tests; only explicitly declared targets are built.
autobenches = false
autobins = false
autoexamples = false
autotests = false
build = "build.rs"
categories = ["algorithms", "text-processing"]
documentation = "https://docs.rs/bpe-tokenizer/"
edition = "2021"
# Keep this vocabulary file out of the packaged crate.
exclude = ["vocab/multi.wiki.bpe.vs1000000.vocab"]
homepage = "https://github.com/swaits/bpe-tokenizer/"
keywords = ["byte", "pair", "encoding", "bpe", "tokenizer"]
license-file = "LICENSE"
readme = "README.md"
repository = "https://github.com/swaits/bpe-tokenizer/"
# Minimum supported Rust toolchain.
rust-version = "1.64"
description = "A BPE Tokenizer library."

# docs.rs builds the documentation with every feature enabled.
[package.metadata.docs.rs]
all-features = true

# Development builds: light optimization, with full debug info and
# integer-overflow checks kept on.
[profile.dev]
opt-level = 1
debug = 2
overflow-checks = true

# Release builds: maximum optimization, no debug info, symbols stripped.
# Cargo only applies profile settings from the workspace root manifest, so
# these take effect when building this crate directly.
[profile.release]
# Optimization
opt-level = 3
lto = "thin"
codegen-units = 1
# Runtime checks and panic strategy
overflow-checks = false
panic = "abort"
# Debug information
debug = 0
strip = "symbols"