bitrouter-attestation 1.0.0-alpha.17

Provider-agnostic confidential-inference verification (ConfidentialVerifier): client-side TEE attestation (L1) + exchange integrity (L1.5). First impl: NEAR AI Cloud.
Documentation
//! Normalized result types shared by every
//! [`ConfidentialVerifier`](crate::ConfidentialVerifier) impl.
//!
//! These mirror private-ai-gateway's `UpstreamVerifiedEvent` / `ChannelBinding`
//! normalization (`src/aci/receipt.rs`), but are produced **client-side** and
//! carry each provider's *native* integrity proof rather than a re-signed ACI
//! receipt. See the refactor spec §2.

/// The exact bytes of one request/response exchange to verify (L1.5).
///
/// Hashing is over these raw bytes verbatim — including any trailing newlines a
/// streamed response carries — because the TEE signs `sha256` of the same
/// bytes. Anything that re-serializes the body (e.g. NEAR's gateway) breaks the
/// match, so verifiable calls must use NEAR direct-completions (spec §3).
pub struct ExchangeInput<'a> {
    pub model: &'a str,
    /// Exact bytes the client sent.
    pub request_body: &'a [u8],
    /// Exact bytes the client received.
    pub response_body: &'a [u8],
    /// Chat id taken from the response body's `id` field; selects the signature.
    pub chat_id: &'a str,
    pub now_unix: u64,
}

/// The per-check breakdown of an attestation, mirroring private-ai-gateway's
/// `AciDcapVerifier` check set (`src/aci/verifier/dcap.rs`). Every field is
/// surfaced so a caller can see *why* a verdict is (un)verified, gateway-style.
#[derive(Debug, Clone, PartialEq, Eq, serde::Serialize, serde::Deserialize)]
pub struct AttestationChecks {
    /// NVIDIA NRAS verdict PASS, nonce echoed, EAT signature valid.
    pub gpu_nras_pass: bool,
    /// Intel signature + collateral + measurements (via `dcap-qvl`).
    pub dcap_quote_valid: bool,
    /// `report_data` embeds the attested signing key and the client nonce.
    pub report_data_binds_key_and_nonce: bool,
    /// `sha256(compose) == mr_config`.
    pub compose_matches_mr_config: bool,
    /// LOAD-BEARING (spec §1.5 cond. 1): `workload_id ∈ accepted_workload_ids`
    /// OR `image_digest ∈ accepted_image_digests`, under
    /// `accepted_kms_root_public_keys`. The policy fails to construct if
    /// unpinned; without this, every other check passes for an attacker-owned
    /// genuine TEE running a malicious model.
    pub policy_accepts: bool,
    /// TD debug-bit off.
    pub debug_disabled: bool,
    /// dstack RTMR3 / event-log replay, when the report carries an event log.
    pub event_log_rtmr_ok: Option<bool>,
    /// LOAD-BEARING (issue #567): the quote's firmware-measured base registers
    /// (`MRTD ‖ RTMR0 ‖ RTMR1 ‖ RTMR2`) match a pinned reference bundle. Those
    /// registers are set before the guest runs and cannot be forged on genuine
    /// TDX hardware, so without this gate a malicious base image could forge the
    /// guest-extended RTMR3 labels (`event_log_rtmr_ok`) and pass `policy_accepts`
    /// while running unauthorized code. `false` fail-closed when the quote never
    /// verified or its base registers aren't pinned.
    pub base_measurements_match: bool,
    /// The platform's Intel DCAP TCB status, surfaced as a claim (e.g.
    /// `"UpToDate"`, `"OutOfDate"`). `None` when no collateral verification
    /// produced one. The hard gate is [`Self::tcb_level_acceptable`].
    pub tcb_status: Option<String>,
    /// Whether [`Self::tcb_status`] meets the verifier's configured TCB floor
    /// (default: require `UpToDate`; advisories may be explicitly allow-listed).
    /// LOAD-BEARING: a signature-valid quote from a genuine TEE running
    /// **out-of-date** microcode passes every other DCAP check, so without this
    /// gate a known-vulnerable platform verifies. `false` fail-closed when the
    /// status is missing or below the floor.
    pub tcb_level_acceptable: bool,
}

impl AttestationChecks {
    /// All-false checks — the fail-closed default for a node whose evidence
    /// couldn't be gathered or fully evaluated.
    pub fn failed() -> Self {
        Self {
            gpu_nras_pass: false,
            dcap_quote_valid: false,
            report_data_binds_key_and_nonce: false,
            compose_matches_mr_config: false,
            policy_accepts: false,
            debug_disabled: false,
            event_log_rtmr_ok: None,
            base_measurements_match: false,
            tcb_status: None,
            tcb_level_acceptable: false,
        }
    }

    /// True iff every mandatory check passed. `tcb_status` is a surfaced claim,
    /// but `tcb_level_acceptable` (derived from it against the verifier's TCB
    /// floor) **is** a gate: a stale-but-signature-valid quote must not pass.
    /// `event_log_rtmr_ok` is **required** to be `Some(true)`: it is the anchor
    /// that binds the cloud-supplied `info` (and thus `policy_accepts`) to the
    /// genuine TEE measurement, so a `None` ("not checked") or `Some(false)`
    /// ("replay/binding failed") verdict must not pass. `base_measurements_match`
    /// is likewise a hard gate (issue #567): RTMR3 is only trustworthy once the
    /// firmware-measured base registers it sits above are pinned and matched.
    pub fn all_pass(&self) -> bool {
        self.gpu_nras_pass
            && self.dcap_quote_valid
            && self.report_data_binds_key_and_nonce
            && self.compose_matches_mr_config
            && self.policy_accepts
            && self.debug_disabled
            && self.event_log_rtmr_ok == Some(true)
            && self.base_measurements_match
            && self.tcb_level_acceptable
    }
}

/// L1 verdict: the model endpoint is genuine TEE hardware running the
/// *legitimate* (policy-pinned) model. Yields the attested signing identity set
/// that L1.5 binds a chat signature to.
#[derive(Debug, Clone, PartialEq, Eq, serde::Serialize, serde::Deserialize)]
pub struct AttestationVerdict {
    pub model: String,
    pub verified: bool,
    /// The attested signing addresses from `model_attestations[]` — a SET,
    /// because NEAR serves multi-node and caches per node. A chat signature is
    /// trusted iff it recovers to one of these AND `checks.policy_accepts`
    /// holds (spec §1.5 cond. 1 & 2).
    pub attested_addresses: Vec<String>,
    /// Honest trust-boundary label (gateway convention): `"near-ai-model"` when
    /// we verified the model quote directly; would be `"near-ai-gateway"` if we
    /// ever fell back to trusting NEAR's gateway (as `nearai.py` does).
    pub trust_boundary: String,
    pub nonce: String,
    pub checks: AttestationChecks,
    pub verified_at_unix: u64,
}

impl AttestationVerdict {
    /// A fully-failed, fail-closed verdict (spec §1.5 cond. 3) with every check
    /// false. Used when a fetch is withheld or a sub-check fails — never a
    /// silent pass.
    pub fn unverified(model: impl Into<String>, nonce: impl Into<String>, now_unix: u64) -> Self {
        Self {
            model: model.into(),
            verified: false,
            attested_addresses: Vec::new(),
            trust_boundary: String::new(),
            nonce: nonce.into(),
            checks: AttestationChecks::failed(),
            verified_at_unix: now_unix,
        }
    }
}

/// Each provider's *native* integrity proof — the portable artifact a third
/// party could re-check. Mirrors the gateway's evidence/`ChannelBinding`, but
/// kept provider-native rather than normalized to one receipt shape.
#[derive(Debug, Clone, PartialEq, Eq, serde::Serialize, serde::Deserialize)]
pub enum IntegrityProof {
    /// NEAR's per-chat signature over `{model}:{sha256(req)}:{sha256(resp)}`,
    /// EIP-191 ECDSA, recoverable to the attested signing address.
    NearChatSignature {
        text: String,
        signature: String,
        signing_address: String,
    },
    /// A real ACI gateway's signed receipt (future `AciGatewayVerifier`).
    AciReceipt {
        receipt: serde_json::Value,
        gateway_attestation: serde_json::Value,
    },
}

/// L1.5 result: a specific exchange provably ran in the attested TEE unmodified.
/// ← gateway's `UpstreamVerifiedEvent`, normalized and client-side.
#[derive(Debug, Clone, PartialEq, Eq, serde::Serialize, serde::Deserialize)]
pub struct VerifiedExchange {
    pub provider: String,
    pub model: String,
    /// `sha256(request_body)`, hex.
    pub request_hash: String,
    /// `sha256(response_body)`, hex.
    pub response_hash: String,
    pub attestation: AttestationVerdict,
    pub integrity: IntegrityProof,
    /// `attestation.verified && integrity holds && binds to attested key`.
    pub verified: bool,
}

/// Errors a [`ConfidentialVerifier`](crate::ConfidentialVerifier) can return.
/// Note that a *failed
/// verification* is not an error — it is a verdict with `verified=false`
/// (fail-closed). `VerifyError` is reserved for the verifier being unable to
/// even reach a verdict it can trust (misconfiguration, malformed input).
#[derive(Debug, thiserror::Error)]
pub enum VerifyError {
    /// A network fetch (report, signature, NRAS) failed.
    #[error("transport error fetching {what}: {source}")]
    Transport {
        what: &'static str,
        #[source]
        source: Box<dyn std::error::Error + Send + Sync>,
    },
    /// A wire payload could not be parsed into the expected shape.
    #[error("malformed {what}: {detail}")]
    Malformed { what: &'static str, detail: String },
    /// The DCAP policy was constructed without the mandatory pins (spec §1.5
    /// cond. 1). The verifier refuses to run unpinned.
    #[error("attestation policy misconfigured: {0}")]
    Policy(String),
    /// No verifier is registered for the requested provider.
    #[error("no confidential verifier registered for provider {0:?}")]
    UnknownProvider(String),
}