Skip to main content

provable_contracts/schema/
kind.rs

1//! Contract kinds — declare which validation rules apply to a YAML file.
2
3use serde::{Deserialize, Serialize};
4
5/// The kind of contract artifact. Determines which validation rules apply.
6///
7/// - `Kernel` (default): a mathematical kernel contract — the provability
8///   invariant applies (must have `proof_obligations`, `falsification_tests`,
9///   `kani_harnesses`).
10/// - `Registry`: a data registry (lookup tables, enum definitions, config
11///   bounds) — exempt from provability, validated for `metadata` + entries.
12/// - `ModelFamily`: architecture metadata (`HuggingFace` family descriptors,
13///   size variants, vendor) — exempt from provability, validated for
14///   `metadata` fields. Custom top-level fields are preserved but not
15///   enforced by the kernel schema.
16/// - `ModelFamilyVariant`: a concrete size variant of a model family
17///   (e.g. Llama 370M sovereign). Freezes hyperparameters (vocab, hidden
18///   dim, layer count) and delta-dispatches invariants from the parent
19///   family. Exempt from provability.
20/// - `Tokenizer`: a concrete tokenizer contract — vocab bounds, required
21///   special tokens, round-trip gate, normalization form. Exempt from
22///   provability (gates are byte-exact tests, not Kani harnesses).
23/// - `TrainingLoop`: a training-loop contract — loss schedule, optimizer
24///   config, gradient-clipping policy, checkpoint cadence. Exempt from
25///   provability; validated for `metadata` + schedule fields.
26/// - `PretrainingCorpus`: a pretraining-corpus contract — dataset source,
27///   license, total-bytes bound, shard layout. Exempt from provability.
28/// - `TrainingPreconditionGate`: a hard precondition gate that must be
29///   satisfied before training starts (e.g. Chinchilla compute-optimal
30///   token/parameter ratio, GPU memory floor, dataset checksum). Exempt
31///   from provability; validated for `metadata` + gate-formula fields.
32/// - `CorpusAssembly`: a multi-source corpus assembly pipeline contract —
33///   declares input shards, dedup strategy, license-merge policy, and
34///   output manifest. Exempt from provability.
35/// - `Pattern`: a cross-cutting verification pattern (threading safety,
36///   async safety, compute parity) that applies across multiple kernels.
37///   Exempt from the kernel provability invariant but still validated for
38///   metadata and any proof/falsification data present.
39/// - `Schema`: a generic reference/schema document — exempt from provability,
40///   validated only for `metadata.id`, `metadata.version`, `metadata.description`,
41///   and `metadata.references`.
42#[derive(
43    Debug, Clone, Copy, Default, PartialEq, Eq, PartialOrd, Ord, Hash, Serialize, Deserialize,
44)]
45#[serde(rename_all = "kebab-case")]
46pub enum ContractKind {
47    #[default]
48    Kernel,
49    Registry,
50    ModelFamily,
51    ModelFamilyVariant,
52    Tokenizer,
53    TrainingLoop,
54    PretrainingCorpus,
55    TrainingPreconditionGate,
56    CorpusAssembly,
57    Pattern,
58    Schema,
59}
60
61impl std::fmt::Display for ContractKind {
62    fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
63        let s = match self {
64            Self::Kernel => "kernel",
65            Self::Registry => "registry",
66            Self::ModelFamily => "model-family",
67            Self::ModelFamilyVariant => "model-family-variant",
68            Self::Tokenizer => "tokenizer",
69            Self::TrainingLoop => "training-loop",
70            Self::PretrainingCorpus => "pretraining-corpus",
71            Self::TrainingPreconditionGate => "training-precondition-gate",
72            Self::CorpusAssembly => "corpus-assembly",
73            Self::Pattern => "pattern",
74            Self::Schema => "schema",
75        };
76        write!(f, "{s}")
77    }
78}