provable_contracts/schema/kind.rs
1//! Contract kinds — declare which validation rules apply to a YAML file.
2
3use serde::{Deserialize, Serialize};
4
5/// The kind of contract artifact. Determines which validation rules apply.
6///
7/// - `Kernel` (default): a mathematical kernel contract — the provability
8/// invariant applies (must have `proof_obligations`, `falsification_tests`,
9/// `kani_harnesses`).
10/// - `Registry`: a data registry (lookup tables, enum definitions, config
11/// bounds) — exempt from provability, validated for `metadata` + entries.
12/// - `ModelFamily`: architecture metadata (`HuggingFace` family descriptors,
13/// size variants, vendor) — exempt from provability, validated for
14/// `metadata` fields. Custom top-level fields are preserved but not
15/// enforced by the kernel schema.
16/// - `ModelFamilyVariant`: a concrete size variant of a model family
17/// (e.g. Llama 370M sovereign). Freezes hyperparameters (vocab, hidden
18/// dim, layer count) and delta-dispatches invariants from the parent
19/// family. Exempt from provability.
20/// - `Tokenizer`: a concrete tokenizer contract — vocab bounds, required
21/// special tokens, round-trip gate, normalization form. Exempt from
22/// provability (gates are byte-exact tests, not Kani harnesses).
23/// - `TrainingLoop`: a training-loop contract — loss schedule, optimizer
24/// config, gradient-clipping policy, checkpoint cadence. Exempt from
25/// provability; validated for `metadata` + schedule fields.
26/// - `PretrainingCorpus`: a pretraining-corpus contract — dataset source,
27/// license, total-bytes bound, shard layout. Exempt from provability.
28/// - `TrainingPreconditionGate`: a hard precondition gate that must be
29/// satisfied before training starts (e.g. Chinchilla compute-optimal
30/// token/parameter ratio, GPU memory floor, dataset checksum). Exempt
31/// from provability; validated for `metadata` + gate-formula fields.
32/// - `CorpusAssembly`: a multi-source corpus assembly pipeline contract —
33/// declares input shards, dedup strategy, license-merge policy, and
34/// output manifest. Exempt from provability.
35/// - `Pattern`: a cross-cutting verification pattern (threading safety,
36/// async safety, compute parity) that applies across multiple kernels.
37/// Exempt from the kernel provability invariant but still validated for
38/// metadata and any proof/falsification data present.
39/// - `Schema`: a generic reference/schema document — exempt from provability,
40/// validated only for `metadata.id`, `metadata.version`, `metadata.description`,
41/// and `metadata.references`.
42#[derive(
43 Debug, Clone, Copy, Default, PartialEq, Eq, PartialOrd, Ord, Hash, Serialize, Deserialize,
44)]
45#[serde(rename_all = "kebab-case")]
46pub enum ContractKind {
47 #[default]
48 Kernel,
49 Registry,
50 ModelFamily,
51 ModelFamilyVariant,
52 Tokenizer,
53 TrainingLoop,
54 PretrainingCorpus,
55 TrainingPreconditionGate,
56 CorpusAssembly,
57 Pattern,
58 Schema,
59}
60
61impl std::fmt::Display for ContractKind {
62 fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
63 let s = match self {
64 Self::Kernel => "kernel",
65 Self::Registry => "registry",
66 Self::ModelFamily => "model-family",
67 Self::ModelFamilyVariant => "model-family-variant",
68 Self::Tokenizer => "tokenizer",
69 Self::TrainingLoop => "training-loop",
70 Self::PretrainingCorpus => "pretraining-corpus",
71 Self::TrainingPreconditionGate => "training-precondition-gate",
72 Self::CorpusAssembly => "corpus-assembly",
73 Self::Pattern => "pattern",
74 Self::Schema => "schema",
75 };
76 write!(f, "{s}")
77 }
78}