1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
//! Bundled tokenizer, small JSON configs, and the chat template, embedded at
//! compile time when the `bundled` feature is enabled. ONNX model files are
//! NOT bundled: the vision_encoder (~86 MB) and decoder (~350 MB) cannot fit
//! under crates.io's 10 MB crate size limit, so users must supply the ONNX
//! directory separately.
//!
//! Total bundled size budget: <10 MB (crates.io hard limit). The actual
//! payload is ~4.5 MB, almost all of which is `tokenizer.json`.
/// Raw bytes of the bundled `tokenizer.json` (~4.5 MB), embedded into the
/// binary at compile time via `include_bytes!`.
///
/// This is the LFM2.5-VL-450M tokenizer: Qwen2-style, with a
/// 151 665-token vocabulary.
///
/// Consumed at runtime by [`crate::engine::Engine::from_onnx_dir`] via
/// `write_bundled_tokenizer()`.
// NOTE(review): the type after `&` and the `include_bytes!` argument are
// missing in this view; presumably `&[u8]` and the asset path — confirm.
pub const TOKENIZER_JSON: & = include_bytes!;
/// Raw bytes of the bundled `tokenizer_config.json`, embedded at compile
/// time via `include_bytes!`.
///
/// Exposed for downstream users that inspect model metadata at runtime. The
/// contents are the unparsed file bytes; decoding them is up to the caller.
// NOTE(review): the type after `&` and the `include_bytes!` argument are
// missing in this view; presumably `&[u8]` and the asset path — confirm.
pub const TOKENIZER_CONFIG_JSON: & = include_bytes!;
/// Raw bytes of the bundled `preprocessor_config.json`, embedded at compile
/// time via `include_bytes!`.
///
/// Exposed for downstream users that inspect model metadata at runtime. The
/// contents are the unparsed file bytes; decoding them is up to the caller.
// NOTE(review): the type after `&` and the `include_bytes!` argument are
// missing in this view; presumably `&[u8]` and the asset path — confirm.
pub const PREPROCESSOR_CONFIG_JSON: & =
include_bytes!;
/// Raw bytes of the bundled `processor_config.json`, embedded at compile
/// time via `include_bytes!`.
///
/// Exposed for downstream users that inspect model metadata at runtime. The
/// contents are the unparsed file bytes; decoding them is up to the caller.
// NOTE(review): the type after `&` and the `include_bytes!` argument are
// missing in this view; presumably `&[u8]` and the asset path — confirm.
pub const PROCESSOR_CONFIG_JSON: & = include_bytes!;
/// Raw bytes of the bundled `generation_config.json`, embedded at compile
/// time via `include_bytes!`.
///
/// Exposed for downstream users that inspect model metadata at runtime. The
/// contents are the unparsed file bytes; decoding them is up to the caller.
// NOTE(review): the type after `&` and the `include_bytes!` argument are
// missing in this view; presumably `&[u8]` and the asset path — confirm.
pub const GENERATION_CONFIG_JSON: & = include_bytes!;
/// Raw bytes of the bundled `config.json`, embedded at compile time via
/// `include_bytes!`.
///
/// Exposed for downstream users that inspect model metadata at runtime. The
/// contents are the unparsed file bytes; decoding them is up to the caller.
// NOTE(review): the type after `&` and the `include_bytes!` argument are
// missing in this view; presumably `&[u8]` and the asset path — confirm.
pub const CONFIG_JSON: & = include_bytes!;
/// Raw bytes of the bundled `chat_template.jinja`, embedded at compile time
/// via `include_bytes!`.
///
/// Used only by `from_dir`'s strict prompt-contract drift check, which
/// compares these bytes for exact equality against the chat template
/// shipped in a model directory. Without that check, a directory carrying a
/// different chat template would be accepted while the engine still renders
/// with the bundled jinja, producing silent prompt-envelope drift.
///
/// This constant is not the template used for rendering; the actual runtime
/// template is `chat_template::BUNDLED_CHAT_TEMPLATE_JINJA`.
// NOTE(review): the type after `&` and the `include_bytes!` argument are
// missing in this view; presumably `&[u8]` and the asset path — confirm.
pub const CHAT_TEMPLATE_JINJA: & = include_bytes!;