kanade_shared/manifest.rs
1use serde::{Deserialize, Serialize};
2
3use crate::ipc::jobs::JobCategory;
4use crate::wire::{RunAs, Shell, Staleness};
5
6/// YAML job manifest (= registered "what to run", v0.18.0+).
7///
8/// Owns only script-intrinsic fields. **Who** (`target`), **how to
9/// phase fanout** (`rollout`), and **when to stagger start**
10/// (`jitter`) all moved to the Schedule / exec request side — same
11/// script can now be fired against different targets / rollouts
12/// without copying the script body.
13///
14/// #492: these types are READ fleet-wide (agents decode them from
15/// BUCKET_JOBS / BUCKET_SCHEDULES and inside live Commands), so they
16/// must tolerate unknown fields — `deny_unknown_fields` here made a
17/// gradually-upgrading fleet's OLD agents reject the whole object
18/// the moment a newer backend added any field. Operator typo
19/// protection (the old reason for the attribute) lives at the WRITE
20/// boundaries instead: `kanade job/schedule create` and the backend
21/// POST extractor parse via [`crate::strict`], which rejects unknown
22/// keys with their full paths. The wire rule: new fields always get
23/// `#[serde(default)]` (+ `skip_serializing_if` while old readers
24/// may still be strict).
25#[derive(Serialize, Deserialize, schemars::JsonSchema, Debug, Clone)]
26pub struct Manifest {
27 pub id: String,
28 pub version: String,
29 #[serde(default)]
30 pub description: Option<String>,
31 pub execute: Execute,
32 #[serde(default)]
33 pub require_approval: bool,
34 /// Opt-in marker that this job produces a JSON inventory fact
35 /// payload on stdout. When present, the backend's results
36 /// projector parses `ExecResult.stdout` as JSON and upserts an
37 /// `inventory_facts` row keyed by `(pc_id, manifest.id)`. The
38 /// `display` sub-config drives the SPA's Inventory page render.
39 #[serde(default)]
40 pub inventory: Option<InventoryHint>,
41 /// Issue #246: opt-in marker that this job emits per-line
42 /// observability events on stdout (one JSON `ObsEvent` per
43 /// newline). When present, the agent — after the script exits
44 /// successfully — parses each non-empty stdout line as an
45 /// `ObsEvent`, publishes it on `obs.<pc_id>` via the
46 /// `obs_outbox`, and (intentionally) **omits the stdout from
47 /// the `ExecResult`** so the timeline data doesn't double up
48 /// in `execution_results.stdout` (which would multiply rows
49 /// by ~50/day/PC of noise).
50 ///
51 /// Distinct from `inventory:` (single JSON object → projector
52 /// upsert) — events are append-only timeline points consumed
53 /// by the dedicated `obs_events` table.
54 #[serde(default)]
55 pub emit: Option<EmitConfig>,
56 /// #290: opt-in marker that this job is an operator-defined
57 /// **health check** whose result feeds the Client App's Health
58 /// tab over KLP (`StateSnapshot.checks`). The script prints a
59 /// free-form JSON object on stdout (like any inventory job); the
60 /// agent reads the [`CheckHint::status_field`] value dynamically
61 /// into a [`crate::ipc::state::Check`] named `check.name`.
62 /// Cadence / windows / conditions come from
63 /// the job's Schedule (exactly like inventory) — there is
64 /// deliberately no interval here. **Composes with `inventory:`**:
65 /// the script's stdout is one JSON object, so a check can also
66 /// carry an `inventory:` block to project the rest of that object
67 /// (incl. `explode` sub-tables) for SPA fleet-querying. Only
68 /// `emit:` (NDJSON stdout) is incompatible.
69 #[serde(default)]
70 pub check: Option<CheckHint>,
71 /// v0.26: Layer 2 staleness policy (SPEC.md §2.6.2). Controls
72 /// what the agent does at fire time when it can't verify the
73 /// `script_current` / `script_status` KV values are fresh —
74 /// especially relevant for `runs_on: agent` schedules where
75 /// the agent may fire from cache while offline. Defaults to
76 /// `Staleness::Cached` (silently use cached values), which
77 /// matches every pre-v0.26 Manifest.
78 #[serde(default)]
79 pub staleness: Staleness,
80 /// #291: opt-in marker that this job is offered to **end users**
81 /// in the Client App's job tabs over KLP (`jobs.list` →
82 /// `jobs.execute`). Parallel to [`inventory`] / [`check`] /
83 /// [`emit`]: the block's mere presence is the opt-in, and it
84 /// groups the end-user presentation fields (name / category /
85 /// icon) that only make sense for a user-facing job. `None`
86 /// (the default) ⇒ an operator-only job — inventory, checks,
87 /// scheduled maintenance — that never surfaces in the catalog.
88 ///
89 /// The agent re-reads this at every `jobs.list` / `jobs.execute`
90 /// (SPEC §2.1), so removing the block takes a job out of a
91 /// running client on its next action.
92 ///
93 /// [`inventory`]: Manifest::inventory
94 /// [`check`]: Manifest::check
95 /// [`emit`]: Manifest::emit
96 #[serde(default, skip_serializing_if = "Option::is_none")]
97 pub client: Option<ClientHint>,
98}
99
100/// "Who + how + when-to-stagger" — the fanout-plan side of an exec.
101/// Used both as the POST `/api/exec/{job_id}` body and as the embedded
102/// `target` / `rollout` / `jitter` slot on [`Schedule`]. Centralising
103/// here keeps the validation + serialisation logic in one place.
104#[derive(Serialize, Deserialize, schemars::JsonSchema, Debug, Clone, Default)]
105pub struct FanoutPlan {
106 #[serde(default)]
107 pub target: Target,
108 /// Optional wave rollout — when present, the backend publishes
109 /// each wave's group subject on its own delay schedule instead
110 /// of fanning out the `target` block in one go. `target` then
111 /// only labels the deploy for the audit log.
112 #[serde(default, skip_serializing_if = "Option::is_none")]
113 pub rollout: Option<Rollout>,
114 /// Optional humantime jitter; agent uses it to randomise
115 /// execution start. Lives here (not on the script) so different
116 /// schedules / ad-hoc fires of the same job can pick different
117 /// stagger windows.
118 #[serde(default, skip_serializing_if = "Option::is_none")]
119 pub jitter: Option<String>,
120 /// Absolute time the scheduler stamps on each emitted Command
121 /// when this exec was driven by a [`Schedule`] with
122 /// `starting_deadline`. Agents receiving a Command after this
123 /// instant publish a synthetic skipped-result instead of
124 /// running the script. `None` (default) = no deadline / catch
125 /// up whenever delivered. Operators don't usually set this
126 /// directly — the scheduler computes it from `tick_at +
127 /// starting_deadline`.
128 #[serde(default, skip_serializing_if = "Option::is_none")]
129 pub deadline_at: Option<chrono::DateTime<chrono::Utc>>,
130}
131
132/// Manifest sub-section: how the SPA should render the inventory
133/// facts this job produces. Each field name (`field`) is a top-level
134/// key in the stdout JSON, e.g. `hostname`, `ram_gb`.
135///
136/// Two render modes:
137/// * `display` — vertical "field / value" per PC, used by the
138/// `/inventory?pc=<id>` detail view. ALL columns the operator
139/// wants visible on the detail page.
140/// * `summary` — horizontal table across the fleet (row = PC,
141/// column = field) on `/inventory`. Optional; when omitted the
142/// SPA falls back to `display`, but operators usually want a
143/// trimmer "hostname / OS / CPU / RAM" set for the fleet view.
144#[derive(Serialize, Deserialize, schemars::JsonSchema, Debug, Clone)]
145pub struct InventoryHint {
146 /// Detail-view columns, in order.
147 pub display: Vec<DisplayField>,
148 /// Optional fleet-list columns (row = PC). Defaults to `display`
149 /// when omitted, but operators usually pick a 3-5 column subset.
150 #[serde(default, skip_serializing_if = "Option::is_none")]
151 pub summary: Option<Vec<DisplayField>>,
152 /// v0.31 / #40: payload arrays that should be exploded into
153 /// per-element rows of a derived SQLite table. Lets operators
154 /// answer cross-PC questions ("which PCs still have Chrome <
155 /// 120?", "C: >90% full") with normal SQL filters + indexes
156 /// instead of grepping JSON. The projector creates the derived
157 /// table on register and replaces this PC's rows on each result
158 /// (DELETE WHERE pc_id=? AND job_id=? + bulk INSERT). See
159 /// [`ExplodeSpec`] for the per-spec schema.
160 #[serde(default, skip_serializing_if = "Option::is_none")]
161 pub explode: Option<Vec<ExplodeSpec>>,
162 /// v0.35 / #93: top-level scalar fields whose changes the
163 /// projector logs to `inventory_history` (one event per
164 /// changed field per scan). Pairs with `explode[].track_history`
165 /// — that covers array elements; this covers single-valued
166 /// fields like `ram_bytes` / `os_version` / `cpu_model` /
167 /// `os_build` that operators want to track for "did the RAM
168 /// get upgraded?" / "when did Win 11 land on this PC?" /
169 /// "BIOS / firmware bumped?" questions. Field name = `field_path`
170 /// in the history row, `identity_json` is NULL, `before_json`
171 /// / `after_json` each carry `{"value": <prior or new value>}`.
172 /// First-ever observation of a scalar (no prior facts row)
173 /// emits `added`; subsequent value changes emit `changed`. No
174 /// `removed` events — a scalar disappearing from the payload
175 /// is rare and the operator can still see the last value via
176 /// the `before_json` of the most recent change.
177 #[serde(default, skip_serializing_if = "Option::is_none")]
178 pub history_scalars: Option<Vec<String>>,
179}
180
181/// Manifest sub-section (#290): marks a job as an operator-defined
182/// **health check**. Parallel to [`InventoryHint`] / `EmitConfig`.
183/// The stdout contract is a free-form JSON object (same as any
184/// inventory job) from which the agent reads `status_field` /
185/// `detail_field` to build the KLP [`crate::ipc::state::Check`] shown
186/// on the Client App's Health tab.
187///
188/// There is deliberately **no timing field** — when / how often /
189/// in which window a check runs is driven by the job's Schedule,
190/// exactly like inventory jobs, so operators get the full `when:` /
191/// rollout / `runs_on` expressiveness for free.
192///
193/// A check's stdout is a **free-form inventory object** (arbitrary
194/// key/value pairs + arrays) — same as any inventory job — that also
195/// carries a status field. `check:` adds only the health semantics on
196/// top: which field is the ok/warn/fail/unknown status, an optional
197/// one-line summary field, and a remediation job. Everything else
198/// (rich per-PC detail, `explode` sub-tables like a software list) is
199/// driven by a co-present [`InventoryHint`] and rendered with the
200/// SAME display logic the SPA Inventory page uses — on the Client App
201/// too. This keeps checks maximally expressive without a bespoke
202/// payload type.
203#[derive(Serialize, Deserialize, schemars::JsonSchema, Debug, Clone)]
204pub struct CheckHint {
205 /// Stable check id → [`Check.name`](crate::ipc::state::Check),
206 /// the SPA/Client React key + analytics label. Unique within the
207 /// fleet's check set.
208 pub name: String,
209 /// Top-level stdout field whose string value
210 /// (`ok`/`warn`/`fail`/`unknown`) becomes the Health-tab light
211 /// ([`CheckStatus`](crate::ipc::state::CheckStatus)). Defaults to
212 /// `"status"`; a missing / unparseable value → `unknown`.
213 #[serde(default = "default_status_field")]
214 pub status_field: String,
215 /// Top-level stdout field used as the Health-tab row's one-line
216 /// summary. Defaults to `"detail"`; absent in the payload → no
217 /// detail line (the rich breakdown lives in the inventory view).
218 #[serde(default = "default_detail_field")]
219 pub detail_field: String,
220 /// Optional remediation job id →
221 /// [`Check.troubleshoot`](crate::ipc::state::Check). The Client
222 /// App shows a "修復する" button when present; that job must be
223 /// `user_invokable`.
224 #[serde(default, skip_serializing_if = "Option::is_none")]
225 pub troubleshoot: Option<String>,
226 /// #290 PR-E: when `true` (default), the backend also projects this
227 /// check's `status` / `detail` into the `check_status` table so the
228 /// operator SPA gets a fleet-wide compliance view for free — no
229 /// `inventory:` block needed. Set `fleet: false` for a client-only
230 /// check the operator doesn't want surfaced across the fleet.
231 #[serde(default = "default_fleet")]
232 pub fleet: bool,
233}
234
235fn default_status_field() -> String {
236 "status".to_string()
237}
238
239fn default_detail_field() -> String {
240 "detail".to_string()
241}
242
243fn default_fleet() -> bool {
244 true
245}
246
247/// Manifest sub-section (#291): marks a job as **user-invokable**
248/// from the Client App and carries how it presents to the end user.
249/// Parallel to [`InventoryHint`] / [`CheckHint`] / `EmitConfig` —
250/// the block's presence is the opt-in (no separate boolean), and its
251/// required fields (`name`, `category`) are enforced by serde at
252/// parse time, so a half-filled catalog entry fails
253/// `kanade job create` instead of rendering a nameless / tab-less row.
254///
255/// The agent maps this 1:1 into the KLP
256/// [`UserInvokableJob`](crate::ipc::jobs::UserInvokableJob) wire shape
257/// that `jobs.list` returns; the Client App renders one row per job in
258/// the tab named by `category`.
259#[derive(Serialize, Deserialize, schemars::JsonSchema, Debug, Clone)]
260pub struct ClientHint {
261 /// End-user-facing title for the job row. The operator-internal
262 /// `Manifest::id` slug is rarely what an end user should read, so
263 /// this is required (and validated non-empty by
264 /// [`Manifest::validate`]). Maps to `UserInvokableJob::display_name`.
265 pub name: String,
266 /// Optional one-line subtitle under `name` in the Client App.
267 /// Distinct from the operator-facing top-level
268 /// [`Manifest::description`] — this one is written for the end
269 /// user. Maps to `UserInvokableJob::display_description`.
270 #[serde(default, skip_serializing_if = "Option::is_none")]
271 pub description: Option<String>,
272 /// Which Client App tab the job lives in (`software_update` →
273 /// アップデート, `troubleshoot` → 困ったとき, `catalog` → software
274 /// catalog). Required — without it the agent can't place the job
275 /// in a tab.
276 pub category: JobCategory,
277 /// Optional icon hint for the job row — a lucide-react icon name
278 /// or a `data:` URL. `None` ⇒ the Client App falls back to the
279 /// category's default icon. Surfaced verbatim in
280 /// `jobs.list[].icon`.
281 #[serde(default, skip_serializing_if = "Option::is_none")]
282 pub icon: Option<String>,
283}
284
285/// Issue #246 — `emit:` manifest block for jobs whose stdout is
286/// NDJSON observability events (one `ObsEvent` per line). Parallel
287/// to `inventory:` but for the append-only timeline pipeline; see
288/// `Manifest::emit` for the full contract.
289#[derive(Serialize, Deserialize, schemars::JsonSchema, Debug, Clone)]
290pub struct EmitConfig {
291 /// What kind of payload the agent should expect on stdout. Only
292 /// `events` is defined today (parses each non-empty line as
293 /// `ObsEvent` and publishes on `obs.<pc_id>`); future variants
294 /// (e.g. metrics streams, structured trace events) plug in here.
295 #[serde(rename = "type")]
296 pub kind: EmitKind,
297 /// Operator hint for where the script keeps its own state — the
298 /// watermark file the PowerShell / sh body reads + writes
299 /// between runs so it only emits NEW events since the last
300 /// poll. The agent doesn't read this; it's documentation that
301 /// the SPA (and `kanade job edit`) can surface to operators
302 /// reviewing the manifest. Optional; the script is allowed to
303 /// keep state anywhere (registry, env, etc.) — the field's
304 /// presence makes the convention discoverable.
305 #[serde(default, skip_serializing_if = "Option::is_none")]
306 pub watermark_path: Option<String>,
307}
308
309/// `emit.type` enum. Lowercase serde so manifests read
310/// `type: events` rather than `Events`.
311#[derive(Serialize, Deserialize, schemars::JsonSchema, Debug, Clone, Copy, PartialEq, Eq)]
312#[serde(rename_all = "lowercase")]
313pub enum EmitKind {
314 /// Per-line `ObsEvent` JSON. Agent parses + publishes on
315 /// `obs.<pc_id>`, drops the stdout from the resulting
316 /// `ExecResult`.
317 Events,
318}
319
320/// v0.31 / #40: declarative "flatten this JSON array into a real
321/// SQLite table" spec on an inventory manifest. The projector
322/// creates the table on first registration (CREATE TABLE IF NOT
323/// EXISTS + indexes) and writes a row per element of
324/// `payload[field]` on every result, scoped by (pc_id, job_id) so
325/// each PC's rows replace cleanly without a per-PC schema.
326#[derive(Serialize, Deserialize, schemars::JsonSchema, Debug, Clone)]
327pub struct ExplodeSpec {
328 /// JSON array key under the payload to explode. E.g. `"apps"`
329 /// for `payload: { apps: [{...}, {...}] }`.
330 pub field: String,
331 /// Derived SQLite table name. Operators choose this — pick
332 /// something namespaced + stable (`inventory_sw_apps`, not
333 /// `apps`) so multiple inventory manifests don't collide on a
334 /// generic name.
335 pub table: String,
336 /// Element-level fields that uniquely identify a row inside one
337 /// PC's payload. The full PK is `(pc_id, job_id) + these
338 /// columns`. Required — operators must think about uniqueness
339 /// (e.g. `["name", "source"]` for installed apps because the
340 /// same name appears in multiple uninstall hives).
341 ///
342 /// v0.31 / #41: same tuple drives history identity. When
343 /// `track_history` is on, the projector serialises these
344 /// fields' values into `inventory_history.identity_json` for
345 /// every change event, so queries like "every PC that ever
346 /// installed Chrome (any source)" filter on identity_json
347 /// content without a per-manifest schema.
348 pub primary_key: Vec<String>,
349 /// Per-element fields that become columns in the derived table.
350 pub columns: Vec<ExplodeColumn>,
351 /// v0.31 / #41: when true (default false), the projector
352 /// diffs each PC's incoming payload against the prior rows
353 /// for the same (pc_id, job_id) BEFORE the DELETE-then-INSERT
354 /// replace, and writes added / removed / changed events into
355 /// `inventory_history`. Lets operators answer time-dimension
356 /// questions ("when did Chrome 120 first appear on PC X?",
357 /// "what's the Win 11 23H2 rollout curve") without storing
358 /// per-scan snapshots. Off by default so operators opt in
359 /// per-spec — history has a real storage cost on long-lived
360 /// deployments (mitigated by the 90-day default retention
361 /// sweeper, see `cleanup` module).
362 #[serde(default)]
363 pub track_history: bool,
364}
365
366/// One column in an [`ExplodeSpec`]'s derived table.
367#[derive(Serialize, Deserialize, schemars::JsonSchema, Debug, Clone)]
368pub struct ExplodeColumn {
369 /// JSON key under each array element. Becomes the column name
370 /// in the derived SQLite table — we don't rename.
371 pub field: String,
372 /// SQLite affinity: `"text"` (default), `"integer"`, `"real"`.
373 /// Storage maps directly via `sqlx::query.bind(...)`; type
374 /// mismatches at INSERT-time fail loudly rather than silently
375 /// dropping the row.
376 #[serde(default, skip_serializing_if = "Option::is_none")]
377 #[serde(rename = "type")]
378 pub kind: Option<String>,
379 /// When true, the projector creates a `CREATE INDEX` on this
380 /// column at table-creation time. Boost for the common-filter
381 /// columns (`name`, `version`) — operators mark them
382 /// explicitly, the projector won't guess.
383 #[serde(default)]
384 pub index: bool,
385}
386
387#[derive(Serialize, Deserialize, schemars::JsonSchema, Debug, Clone)]
388pub struct DisplayField {
389 /// Top-level key in the stdout JSON.
390 pub field: String,
391 /// Human-readable column header.
392 pub label: String,
393 /// Optional render hint — `"number"`, `"bytes"`, `"timestamp"`,
394 /// or `"table"` (#39). Defaults to plain text rendering on the
395 /// SPA side. `"table"` expects the field's value to be a JSON
396 /// array of objects and renders a nested sub-table on the
397 /// per-PC detail page using `columns` as the schema; the fleet
398 /// summary view falls back to showing the row count for
399 /// `"table"` cells so the wide list stays compact.
400 #[serde(default, skip_serializing_if = "Option::is_none")]
401 #[serde(rename = "type")]
402 pub kind: Option<String>,
403 /// v0.30 / #39: when `kind == "table"`, the SPA renders the
404 /// field's value (an array of objects like
405 /// `disks: [{ device_id, size_bytes, ... }]`) as a nested
406 /// sub-table using these columns. Each column is itself a
407 /// `DisplayField`, so the nested cells reuse the same render
408 /// hints (`bytes`, `number`, `timestamp`) — no parallel format
409 /// pipeline. Ignored for any other `kind`.
410 #[serde(default, skip_serializing_if = "Option::is_none")]
411 pub columns: Option<Vec<DisplayField>>,
412}
413
414#[derive(Serialize, Deserialize, schemars::JsonSchema, Debug, Clone)]
415pub struct Rollout {
416 #[serde(default)]
417 pub strategy: RolloutStrategy,
418 pub waves: Vec<Wave>,
419}
420
421#[derive(
422 Serialize, Deserialize, schemars::JsonSchema, Debug, Clone, Copy, PartialEq, Eq, Default,
423)]
424#[serde(rename_all = "lowercase")]
425pub enum RolloutStrategy {
426 #[default]
427 Wave,
428}
429
430#[derive(Serialize, Deserialize, schemars::JsonSchema, Debug, Clone)]
431pub struct Wave {
432 pub group: String,
433 /// humantime delay measured from the deploy's publish time. wave[0]
434 /// typically has "0s"; subsequent waves use minutes / hours.
435 pub delay: String,
436}
437
438#[derive(Serialize, Deserialize, schemars::JsonSchema, Debug, Clone, Default)]
439pub struct Target {
440 #[serde(default)]
441 pub groups: Vec<String>,
442 #[serde(default)]
443 pub pcs: Vec<String>,
444 #[serde(default)]
445 pub all: bool,
446}
447
448impl Target {
449 /// At least one of all / groups / pcs is set.
450 pub fn is_specified(&self) -> bool {
451 self.all || !self.groups.is_empty() || !self.pcs.is_empty()
452 }
453}
454
455#[derive(Serialize, Deserialize, schemars::JsonSchema, Debug, Clone)]
456pub struct Execute {
457 pub shell: ExecuteShell,
458 /// Inline script body. Mutually exclusive with [`script_file`]
459 /// and [`script_object`]; exactly one of the three must be set
460 /// (enforced by [`Execute::validate_script_source`] at the
461 /// write-side parse boundaries — `kanade job create` and
462 /// `POST /api/jobs`).
463 ///
464 /// Empty string is treated as **unset** so operators can swap
465 /// to a `script_file:` / `script_object:` alternative just by
466 /// commenting out the body, without having to also drop the
467 /// `script:` key entirely.
468 ///
469 /// [`script_file`]: Self::script_file
470 /// [`script_object`]: Self::script_object
471 #[serde(default, skip_serializing_if = "Option::is_none")]
472 pub script: Option<String>,
473 /// Repo-local file path resolved by the operator-side CLI at
474 /// `kanade job create` time. The CLI reads the file, slots its
475 /// contents into `script`, and clears this field before
476 /// POSTing — so the backend / agents never see `script_file`
477 /// in stored manifests. SPEC §2.4.1.
478 ///
479 /// Resolver lands in a follow-up PR
480 /// (yukimemi/kanade#210); today this field passes parse-time
481 /// validation but the operator-side CLI bails with "not yet
482 /// implemented" until the resolver ships, so manifests that
483 /// reach the backend with `script_file` set are treated as a
484 /// schema-bug.
485 #[serde(default, skip_serializing_if = "Option::is_none")]
486 pub script_file: Option<String>,
487 /// Object Store reference (`<name>/<version>`) into the
488 /// `scripts` bucket (`OBJECT_SCRIPTS`). Agents fetch the body
489 /// at Execute time via `/api/script-objects/{name}/{version}`
490 /// and cache it locally. SPEC §2.4.1.
491 ///
492 /// Resolver lands in the same follow-up PR as `script_file`;
493 /// today this field passes parse-time validation but the
494 /// backend / agent exec paths bail with "not yet implemented"
495 /// when they see it.
496 #[serde(default, skip_serializing_if = "Option::is_none")]
497 pub script_object: Option<String>,
498 /// humantime duration string (e.g. "30s", "10m"). Script-intrinsic
499 /// — represents how long this script reasonably takes to run.
500 pub timeout: String,
501 /// Token + session combination the agent uses to launch the
502 /// script (v0.21). Default = [`RunAs::System`] (Session 0,
503 /// LocalSystem privileges, no GUI) — matches pre-v0.21 behavior.
504 #[serde(default)]
505 pub run_as: RunAs,
506 /// Working directory for the spawned child (v0.21.1). When
507 /// unset, the child inherits the agent's cwd — on Windows that
508 /// means `%SystemRoot%\System32` for the prod service, which is
509 /// almost never what operators actually want. Use an absolute
510 /// path; relative paths are passed through to the OS verbatim.
511 /// `%PROGRAMDATA%` works for `run_as: system`; for `run_as: user`
512 /// you'd want `%USERPROFILE%` (but expansion happens in the
513 /// shell, so write `$env:USERPROFILE` for PowerShell, or set
514 /// it via teravars before `kanade job create`).
515 #[serde(default, skip_serializing_if = "Option::is_none")]
516 pub cwd: Option<String>,
517}
518
519impl Execute {
520 /// Treat an empty `script:` body as "intentionally unset". Operators
521 /// commenting out a block-scalar tend to leave the key behind, and
522 /// failing the validator on `script: ""` would surprise them.
523 fn has_inline_script(&self) -> bool {
524 matches!(&self.script, Some(s) if !s.is_empty())
525 }
526
527 /// Enforce that exactly one of `script` / `script_file` /
528 /// `script_object` is set. Called at the write-side parse
529 /// boundaries (CLI `kanade job create` + backend
530 /// `POST /api/jobs`) so ambiguous YAML is rejected before it
531 /// reaches the JOBS KV. Read paths (projector, agent
532 /// scheduler, list endpoints) skip this check — they only ever
533 /// see what the write path already validated.
534 pub fn validate_script_source(&self) -> Result<(), String> {
535 let inline = self.has_inline_script();
536 let file = self.script_file.is_some();
537 let obj = self.script_object.is_some();
538 let set = [inline, file, obj].into_iter().filter(|b| *b).count();
539 match set {
540 1 => Ok(()),
541 0 => Err("execute: one of `script`, `script_file`, `script_object` must be set".into()),
542 _ => Err(format!(
543 "execute: only one of `script` / `script_file` / `script_object` may be set \
544 (got script={inline}, script_file={file}, script_object={obj})"
545 )),
546 }
547 }
548}
549
550impl Manifest {
551 /// Cross-field semantic checks that don't fit into pure serde
552 /// derive. Currently delegates to
553 /// [`Execute::validate_script_source`] — see that method's
554 /// docs for the rationale on which call sites should run this.
555 pub fn validate(&self) -> Result<(), String> {
556 self.execute.validate_script_source()?;
557 // Stdout-format compatibility. `inventory:` and `check:` both
558 // consume the SAME single JSON object — they COMPOSE: a check
559 // can extract `status`/`detail` for the Health tab while the
560 // projector explodes the rest into SPA sub-tables. `emit:` is
561 // different — its stdout is NDJSON and the agent omits it from
562 // the result entirely — so it can't be paired with either.
563 if self.emit.is_some() && (self.inventory.is_some() || self.check.is_some()) {
564 return Err(
565 "`emit:` is incompatible with `inventory:` / `check:` — emit's stdout is NDJSON \
566 timeline events (and omitted from the result), while inventory/check read a \
567 single JSON object from stdout"
568 .to_string(),
569 );
570 }
571 // A check's `name` is the Health-tab row id (React key); the
572 // field names tell the agent where to read status/detail.
573 // An empty value is an invisible runtime bug, and the serde
574 // defaults don't guard an operator who writes `status_field:
575 // ""` explicitly — reject all three here.
576 if let Some(check) = &self.check {
577 for (label, value) in [
578 ("check.name", &check.name),
579 ("check.status_field", &check.status_field),
580 ("check.detail_field", &check.detail_field),
581 ] {
582 if value.trim().is_empty() {
583 return Err(format!("{label} must not be empty"));
584 }
585 }
586 // A present-but-blank `troubleshoot` is a broken
587 // remediation job id (the "修復する" button would target
588 // an empty manifest id) — reject it too.
589 if let Some(troubleshoot) = &check.troubleshoot {
590 if troubleshoot.trim().is_empty() {
591 return Err("check.troubleshoot must not be empty when set".to_string());
592 }
593 }
594 }
595 // #291: a `client:` job is rendered in the Client App's
596 // catalog (`jobs.list` → `jobs.execute`). serde already makes
597 // `name` + `category` required at parse time; the only gap is
598 // a present-but-blank `name`, which would render an empty row
599 // title — reject it like the other display-id fields.
600 if let Some(client) = &self.client {
601 if client.name.trim().is_empty() {
602 return Err("client.name must not be empty".to_string());
603 }
604 // Optional display fields, when present, must be
605 // meaningful: a blank `description` renders an empty
606 // subtitle and a blank `icon` is a dangling lucide name.
607 // Same present-but-blank guard the `check:` block applies
608 // to its optional `troubleshoot` id.
609 for (label, value) in [
610 ("client.description", &client.description),
611 ("client.icon", &client.icon),
612 ] {
613 if let Some(v) = value {
614 if v.trim().is_empty() {
615 return Err(format!("{label} must not be empty when set"));
616 }
617 }
618 }
619 }
620 Ok(())
621 }
622}
623
624#[derive(Serialize, Deserialize, schemars::JsonSchema, Debug, Clone, Copy, PartialEq, Eq)]
625#[serde(rename_all = "lowercase")]
626pub enum ExecuteShell {
627 Powershell,
628 Cmd,
629}
630
631impl From<ExecuteShell> for Shell {
632 fn from(s: ExecuteShell) -> Self {
633 match s {
634 ExecuteShell::Powershell => Shell::Powershell,
635 ExecuteShell::Cmd => Shell::Cmd,
636 }
637 }
638}
639
640#[cfg(test)]
641mod tests {
642 use super::*;
643
644 /// The example check-job + schedule YAMLs shipped under `configs/`
645 /// must stay valid as the schema evolves (#290 PR-C). `include_str!`
646 /// pins them at compile time so a breaking edit fails `cargo test`
647 /// rather than only `kanade job create` at deploy time.
648 #[test]
649 fn example_check_job_yamls_parse_and_validate() {
650 let jobs = [
651 (
652 "check-bitlocker",
653 include_str!("../../../configs/jobs/check-bitlocker.yaml"),
654 ),
655 (
656 "check-av-signature",
657 include_str!("../../../configs/jobs/check-av-signature.yaml"),
658 ),
659 (
660 "check-cert-expiry",
661 include_str!("../../../configs/jobs/check-cert-expiry.yaml"),
662 ),
663 ];
664 for (name, yaml) in jobs {
665 let m: Manifest =
666 serde_yaml::from_str(yaml).unwrap_or_else(|e| panic!("{name} parse: {e}"));
667 m.validate()
668 .unwrap_or_else(|e| panic!("{name} validate: {e}"));
669 let check = m
670 .check
671 .as_ref()
672 .unwrap_or_else(|| panic!("{name} must carry a check: hint"));
673 assert!(!check.name.trim().is_empty(), "{name} check.name empty");
674 // These three examples all read admin-only WMI namespaces,
675 // so they run_as system. NOTE: that's a property of these
676 // particular checks, NOT of the `check:` contract — a check
677 // probing user-session state could legitimately run_as user.
678 assert_eq!(
679 m.execute.run_as,
680 RunAs::System,
681 "{name} should run_as system"
682 );
683 }
684 }
685
686 /// The example user-invokable job YAMLs (#291) shipped under
687 /// `configs/jobs/` must stay valid as the `client:` schema
688 /// evolves. `include_str!` pins them at compile time so a breaking
689 /// edit fails `cargo test`, not `kanade job create` at deploy.
690 #[test]
691 fn example_client_job_yamls_parse_and_validate() {
692 let jobs = [
693 (
694 "fix-teams-cache",
695 JobCategory::Troubleshoot,
696 include_str!("../../../configs/jobs/fix-teams-cache.yaml"),
697 ),
698 (
699 "chrome-update",
700 JobCategory::SoftwareUpdate,
701 include_str!("../../../configs/jobs/chrome-update.yaml"),
702 ),
703 (
704 "install-slack",
705 JobCategory::Catalog,
706 include_str!("../../../configs/jobs/install-slack.yaml"),
707 ),
708 ];
709 for (id, category, yaml) in jobs {
710 let m: Manifest =
711 serde_yaml::from_str(yaml).unwrap_or_else(|e| panic!("{id} parse: {e}"));
712 m.validate()
713 .unwrap_or_else(|e| panic!("{id} validate: {e}"));
714 assert_eq!(m.id, id, "{id} id mismatch");
715 let client = m
716 .client
717 .as_ref()
718 .unwrap_or_else(|| panic!("{id} must carry a client: block"));
719 assert!(!client.name.trim().is_empty(), "{id} client.name empty");
720 assert_eq!(client.category, category, "{id} category");
721 }
722 }
723
724 #[test]
725 fn example_check_schedule_yamls_parse_and_validate() {
726 let schedules = [
727 (
728 "check-bitlocker",
729 include_str!("../../../configs/schedules/check-bitlocker.yaml"),
730 ),
731 (
732 "check-av-signature",
733 include_str!("../../../configs/schedules/check-av-signature.yaml"),
734 ),
735 (
736 "check-cert-expiry",
737 include_str!("../../../configs/schedules/check-cert-expiry.yaml"),
738 ),
739 ];
740 for (name, yaml) in schedules {
741 let s: Schedule =
742 serde_yaml::from_str(yaml).unwrap_or_else(|e| panic!("{name} schedule parse: {e}"));
743 s.validate()
744 .unwrap_or_else(|e| panic!("{name} schedule validate: {e}"));
745 assert_eq!(s.job_id, name, "{name} schedule must reference its job");
746 }
747 }
748
749 #[test]
750 fn target_is_specified_requires_at_least_one_field() {
751 let empty = Target::default();
752 assert!(!empty.is_specified());
753
754 let with_all = Target {
755 all: true,
756 ..Target::default()
757 };
758 assert!(with_all.is_specified());
759
760 let with_groups = Target {
761 groups: vec!["canary".into()],
762 ..Target::default()
763 };
764 assert!(with_groups.is_specified());
765
766 let with_pcs = Target {
767 pcs: vec!["pc-01".into()],
768 ..Target::default()
769 };
770 assert!(with_pcs.is_specified());
771 }
772
773 #[test]
774 fn manifest_deserialises_minimal_yaml() {
775 // Matches jobs/echo-test.yaml. v0.18: no target/rollout/jitter
776 // — those live on the schedule / exec request now.
777 let yaml = r#"
778id: echo-test
779version: 0.0.1
780execute:
781 shell: powershell
782 script: "echo 'kanade'"
783 timeout: 30s
784"#;
785 let m: Manifest = serde_yaml::from_str(yaml).expect("parse");
786 assert_eq!(m.id, "echo-test");
787 assert_eq!(m.version, "0.0.1");
788 assert!(matches!(m.execute.shell, ExecuteShell::Powershell));
789 assert_eq!(
790 m.execute.script.as_deref().map(str::trim),
791 Some("echo 'kanade'")
792 );
793 assert!(m.execute.script_file.is_none());
794 assert!(m.execute.script_object.is_none());
795 assert_eq!(m.execute.timeout, "30s");
796 assert!(!m.require_approval);
797 m.validate()
798 .expect("inline-script manifest passes validation");
799 }
800
801 #[test]
802 fn manifest_parses_check_job_and_validates() {
803 // An operator-defined health check (#290): a `check:` hint +
804 // a PowerShell script that prints {status, detail}.
805 let yaml = r#"
806id: check-bitlocker
807version: 0.1.0
808execute:
809 shell: powershell
810 run_as: system
811 timeout: 15s
812 script: |
813 [pscustomobject]@{ status = 'ok'; detail = 'all volumes protected' } | ConvertTo-Json -Compress
814check:
815 name: bitlocker
816 troubleshoot: fix-bitlocker
817"#;
818 let m: Manifest = serde_yaml::from_str(yaml).expect("parse");
819 let check = m.check.as_ref().expect("check hint present");
820 assert_eq!(check.name, "bitlocker");
821 assert_eq!(check.troubleshoot.as_deref(), Some("fix-bitlocker"));
822 // Field names default to the conventional "status" / "detail".
823 assert_eq!(check.status_field, "status");
824 assert_eq!(check.detail_field, "detail");
825 assert!(m.inventory.is_none() && m.emit.is_none());
826 m.validate().expect("check-only manifest passes validation");
827 }
828
829 #[test]
830 fn manifest_check_defaults_and_custom_fields() {
831 // Minimal: only `name`; status/detail fields default.
832 let m: Manifest = serde_yaml::from_str(
833 r#"
834id: check-disk
835version: 0.1.0
836execute:
837 shell: powershell
838 script: "[pscustomobject]@{ status = 'ok' } | ConvertTo-Json -Compress"
839 timeout: 10s
840check:
841 name: disk_free
842"#,
843 )
844 .expect("parse");
845 let c = m.check.as_ref().unwrap();
846 assert_eq!(c.name, "disk_free");
847 assert_eq!(c.status_field, "status");
848 assert_eq!(c.detail_field, "detail");
849 assert!(c.troubleshoot.is_none());
850 m.validate().expect("validates");
851
852 // The operator can point status/detail at any field of their
853 // free-form inventory object.
854 let m2: Manifest = serde_yaml::from_str(
855 r#"
856id: check-custom
857version: 0.1.0
858execute:
859 shell: powershell
860 script: "echo x"
861 timeout: 10s
862check:
863 name: patch_level
864 status_field: compliance
865 detail_field: summary
866"#,
867 )
868 .expect("parse");
869 let c2 = m2.check.as_ref().unwrap();
870 assert_eq!(c2.status_field, "compliance");
871 assert_eq!(c2.detail_field, "summary");
872 }
873
874 #[test]
875 fn manifest_allows_check_composed_with_inventory() {
876 // `check:` + `inventory:` COMPOSE on the same stdout object:
877 // status/detail → Health tab, the rest → SPA projection +
878 // explode sub-tables. Must pass validation.
879 let yaml = r#"
880id: check-bitlocker-detailed
881version: 0.1.0
882execute:
883 shell: powershell
884 script: "echo x"
885 timeout: 10s
886check:
887 name: bitlocker
888inventory:
889 display:
890 - { field: status, label: Status }
891"#;
892 let m: Manifest = serde_yaml::from_str(yaml).expect("parse");
893 assert!(m.check.is_some() && m.inventory.is_some());
894 m.validate().expect("check + inventory compose");
895 }
896
897 #[test]
898 fn manifest_rejects_check_combined_with_emit() {
899 // `emit:` stdout is NDJSON (and omitted from the result), so
900 // it can't pair with `check:` (which needs a single JSON
901 // object on stdout).
902 let yaml = r#"
903id: bad-mix
904version: 0.1.0
905execute:
906 shell: powershell
907 script: "echo x"
908 timeout: 10s
909check:
910 name: bitlocker
911emit:
912 type: events
913"#;
914 let m: Manifest = serde_yaml::from_str(yaml).expect("parse");
915 let err = m.validate().expect_err("emit + check must fail");
916 assert!(err.contains("incompatible"), "err: {err}");
917 }
918
919 #[test]
920 fn manifest_rejects_emit_combined_with_inventory() {
921 // The other half of the emit-incompatibility condition.
922 let yaml = r#"
923id: bad-mix-2
924version: 0.1.0
925execute:
926 shell: powershell
927 script: "echo x"
928 timeout: 10s
929emit:
930 type: events
931inventory:
932 display:
933 - { field: status, label: Status }
934"#;
935 let m: Manifest = serde_yaml::from_str(yaml).expect("parse");
936 let err = m.validate().expect_err("emit + inventory must fail");
937 assert!(err.contains("incompatible"), "err: {err}");
938 }
939
940 #[test]
941 fn manifest_rejects_empty_check_field_names() {
942 // Empty name / status_field / detail_field are invisible
943 // runtime bugs (empty React key, agent reads the wrong field)
944 // — reject them even though serde supplies non-empty defaults.
945 let base = |inner: &str| {
946 format!(
947 "id: c\nversion: 0.1.0\nexecute:\n shell: powershell\n script: \"echo x\"\n timeout: 10s\ncheck:\n{inner}"
948 )
949 };
950 for inner in [
951 " name: \"\"\n",
952 " name: ok\n status_field: \"\"\n",
953 " name: ok\n detail_field: \" \"\n",
954 // present-but-blank troubleshoot → broken remediation id.
955 " name: ok\n troubleshoot: \" \"\n",
956 ] {
957 let m: Manifest = serde_yaml::from_str(&base(inner)).expect("parse");
958 let err = m.validate().expect_err("empty field must fail");
959 assert!(err.contains("must not be empty"), "err: {err}");
960 }
961 }
962
963 #[test]
964 fn manifest_client_absent_by_default() {
965 // A plain operator job (the overwhelming majority) carries no
966 // `client:` block, so it never surfaces in the end-user
967 // catalog.
968 let yaml = r#"
969id: echo-test
970version: 0.0.1
971execute:
972 shell: powershell
973 script: "echo 'kanade'"
974 timeout: 30s
975"#;
976 let m: Manifest = serde_yaml::from_str(yaml).expect("parse");
977 assert!(m.client.is_none());
978 m.validate().expect("operator-only job validates");
979 }
980
981 #[test]
982 fn manifest_client_parses_and_validates() {
983 // The Client App "困ったとき" remediation job shape: a
984 // user-invokable troubleshoot job with the end-user fields the
985 // KLP `jobs.list` wire needs, grouped under `client:`.
986 let yaml = r#"
987id: fix-teams-cache
988version: 1.0.0
989execute:
990 shell: powershell
991 script: "echo clearing"
992 timeout: 60s
993client:
994 name: "Teams のキャッシュをクリア"
995 description: "Teams が重いときに試してください"
996 category: troubleshoot
997 icon: brush-cleaning
998"#;
999 let m: Manifest = serde_yaml::from_str(yaml).expect("parse");
1000 let c = m.client.as_ref().expect("client block present");
1001 assert_eq!(c.name, "Teams のキャッシュをクリア");
1002 assert_eq!(
1003 c.description.as_deref(),
1004 Some("Teams が重いときに試してください")
1005 );
1006 assert_eq!(c.category, JobCategory::Troubleshoot);
1007 assert_eq!(c.icon.as_deref(), Some("brush-cleaning"));
1008 m.validate().expect("user-invokable job validates");
1009 }
1010
1011 #[test]
1012 fn manifest_client_minimal_only_name_and_category() {
1013 // description + icon are optional; name + category are the
1014 // serde-required minimum.
1015 let yaml = r#"
1016id: install-slack
1017version: 1.0.0
1018execute:
1019 shell: powershell
1020 script: "echo install"
1021 timeout: 600s
1022client:
1023 name: Slack
1024 category: catalog
1025"#;
1026 let m: Manifest = serde_yaml::from_str(yaml).expect("parse");
1027 let c = m.client.as_ref().expect("client present");
1028 assert_eq!(c.category, JobCategory::Catalog);
1029 assert!(c.description.is_none() && c.icon.is_none());
1030 m.validate().expect("minimal client validates");
1031 }
1032
1033 #[test]
1034 fn manifest_client_rejects_blank_name() {
1035 // serde guarantees `name`/`category` are present; the one gap
1036 // is a present-but-blank name → empty catalog row title.
1037 let yaml = r#"
1038id: j
1039version: 1.0.0
1040execute:
1041 shell: powershell
1042 script: "echo x"
1043 timeout: 30s
1044client:
1045 name: " "
1046 category: catalog
1047"#;
1048 let m: Manifest = serde_yaml::from_str(yaml).expect("parse");
1049 let err = m.validate().expect_err("blank name must fail");
1050 assert!(err.contains("client.name"), "err: {err}");
1051 }
1052
1053 #[test]
1054 fn manifest_client_rejects_blank_optional_fields() {
1055 // description / icon are optional, but a present-but-blank
1056 // value is a bug (empty subtitle / dangling icon name) — reject
1057 // it, mirroring the check: block's troubleshoot guard.
1058 for (field, line) in [
1059 ("client.description", " description: \" \"\n"),
1060 ("client.icon", " icon: \"\"\n"),
1061 ] {
1062 let yaml = format!(
1063 "id: j\nversion: 1.0.0\nexecute:\n shell: powershell\n script: \"echo x\"\n timeout: 30s\nclient:\n name: A\n category: catalog\n{line}"
1064 );
1065 let m: Manifest = serde_yaml::from_str(&yaml).expect("parse");
1066 let err = m.validate().expect_err("blank optional field must fail");
1067 assert!(err.contains(field), "expected {field} in err: {err}");
1068 }
1069 }
1070
1071 #[test]
1072 fn manifest_client_requires_category_at_parse() {
1073 // A `client:` block missing `category` is a hard parse error
1074 // (serde required field) — no manual validate() needed.
1075 let yaml = r#"
1076id: j
1077version: 1.0.0
1078execute:
1079 shell: powershell
1080 script: "echo x"
1081 timeout: 30s
1082client:
1083 name: "A job"
1084"#;
1085 let r: Result<Manifest, _> = serde_yaml::from_str(yaml);
1086 assert!(
1087 r.is_err(),
1088 "missing category must be a parse error, got {r:?}"
1089 );
1090 }
1091
1092 #[test]
1093 fn manifest_client_rejects_unknown_field() {
1094 // #492: the strict create boundary catches a fat-fingered
1095 // `displayname:` (with its path) instead of silently
1096 // dropping it; the tolerant read path accepts it.
1097 let yaml = r#"
1098id: j
1099version: 1.0.0
1100execute:
1101 shell: powershell
1102 script: "echo x"
1103 timeout: 30s
1104client:
1105 name: "A job"
1106 category: catalog
1107 displayname: oops
1108"#;
1109 let r = crate::strict::from_yaml_str::<Manifest>(yaml);
1110 let err = r.expect_err("unknown client field must be rejected at the write boundary");
1111 // serde_ignored renders the Option layer as `?`:
1112 // `client.?.displayname`. Assert on the leaf key.
1113 assert!(err.contains("displayname"), "{err}");
1114 // The READ path tolerates the same payload (gradual-upgrade
1115 // contract: an old agent must accept a newer writer's field).
1116 let m: Manifest = serde_yaml::from_str(yaml).expect("tolerant read");
1117 assert_eq!(m.client.as_ref().map(|c| c.name.as_str()), Some("A job"));
1118 }
1119
1120 fn execute_with(
1121 script: Option<&str>,
1122 script_file: Option<&str>,
1123 script_object: Option<&str>,
1124 ) -> Execute {
1125 Execute {
1126 shell: ExecuteShell::Powershell,
1127 script: script.map(str::to_owned),
1128 script_file: script_file.map(str::to_owned),
1129 script_object: script_object.map(str::to_owned),
1130 timeout: "30s".into(),
1131 run_as: RunAs::default(),
1132 cwd: None,
1133 }
1134 }
1135
1136 #[test]
1137 fn validate_accepts_inline_script() {
1138 let e = execute_with(Some("echo hi"), None, None);
1139 assert!(e.validate_script_source().is_ok());
1140 }
1141
1142 #[test]
1143 fn validate_accepts_script_file_alone() {
1144 let e = execute_with(None, Some("scripts/cleanup.ps1"), None);
1145 assert!(e.validate_script_source().is_ok());
1146 }
1147
1148 #[test]
1149 fn validate_accepts_script_object_alone() {
1150 let e = execute_with(None, None, Some("cleanup/1.0.0"));
1151 assert!(e.validate_script_source().is_ok());
1152 }
1153
1154 #[test]
1155 fn validate_treats_empty_inline_script_as_unset() {
1156 // `script: ""` + `script_object` set is the natural shape
1157 // when an operator comments out the YAML block-scalar body
1158 // but leaves the key. Should pass.
1159 let e = execute_with(Some(""), None, Some("cleanup/1.0.0"));
1160 assert!(e.validate_script_source().is_ok());
1161 }
1162
1163 #[test]
1164 fn validate_rejects_zero_sources() {
1165 let e = execute_with(None, None, None);
1166 let err = e.validate_script_source().unwrap_err();
1167 assert!(err.contains("must be set"), "got: {err}");
1168 }
1169
1170 #[test]
1171 fn validate_rejects_empty_inline_only() {
1172 let e = execute_with(Some(""), None, None);
1173 let err = e.validate_script_source().unwrap_err();
1174 assert!(err.contains("must be set"), "got: {err}");
1175 }
1176
1177 #[test]
1178 fn validate_rejects_inline_plus_file() {
1179 let e = execute_with(Some("echo hi"), Some("scripts/cleanup.ps1"), None);
1180 let err = e.validate_script_source().unwrap_err();
1181 assert!(err.contains("only one of"), "got: {err}");
1182 }
1183
1184 #[test]
1185 fn validate_rejects_inline_plus_object() {
1186 let e = execute_with(Some("echo hi"), None, Some("cleanup/1.0.0"));
1187 let err = e.validate_script_source().unwrap_err();
1188 assert!(err.contains("only one of"), "got: {err}");
1189 }
1190
1191 #[test]
1192 fn validate_rejects_file_plus_object() {
1193 let e = execute_with(None, Some("scripts/cleanup.ps1"), Some("cleanup/1.0.0"));
1194 let err = e.validate_script_source().unwrap_err();
1195 assert!(err.contains("only one of"), "got: {err}");
1196 }
1197
1198 #[test]
1199 fn validate_rejects_all_three() {
1200 let e = execute_with(
1201 Some("echo hi"),
1202 Some("scripts/cleanup.ps1"),
1203 Some("cleanup/1.0.0"),
1204 );
1205 let err = e.validate_script_source().unwrap_err();
1206 assert!(err.contains("only one of"), "got: {err}");
1207 }
1208
1209 #[test]
1210 fn manifest_deserialises_script_object_yaml() {
1211 // SPEC §2.4.1 example shape with the Object Store
1212 // reference picked over inline.
1213 let yaml = r#"
1214id: cleanup-disk-temp
1215version: 1.0.1
1216execute:
1217 shell: powershell
1218 script_object: cleanup-disk-temp/1.0.1
1219 timeout: 600s
1220"#;
1221 let m: Manifest = serde_yaml::from_str(yaml).expect("parse");
1222 assert_eq!(
1223 m.execute.script_object.as_deref(),
1224 Some("cleanup-disk-temp/1.0.1")
1225 );
1226 assert!(m.execute.script.is_none());
1227 m.validate()
1228 .expect("script_object-only manifest passes validation");
1229 }
1230
1231 #[test]
1232 fn manifest_rejects_typo_in_script_field_name() {
1233 // #492: the strict create boundary catches `script_objectt`
1234 // and similar fat-fingers (with the full path) instead of
1235 // letting them silently fall through to "all three unset".
1236 let yaml = r#"
1237id: typo
1238version: 1.0.0
1239execute:
1240 shell: powershell
1241 script_objectt: oops
1242 timeout: 30s
1243"#;
1244 let err = crate::strict::from_yaml_str::<Manifest>(yaml)
1245 .expect_err("typo'd execute field must be rejected at the write boundary");
1246 assert!(err.contains("execute.script_objectt"), "{err}");
1247 }
1248
1249 #[test]
1250 fn schedule_carries_target_and_rollout() {
1251 let yaml = r#"
1252id: hourly-cleanup-canary
1253when:
1254 per_pc: { every: 1h }
1255job_id: cleanup
1256enabled: true
1257target:
1258 groups: [canary, wave1]
1259jitter: 30s
1260rollout:
1261 strategy: wave
1262 waves:
1263 - { group: canary, delay: 0s }
1264 - { group: wave1, delay: 5s }
1265"#;
1266 let s: Schedule = serde_yaml::from_str(yaml).expect("parse");
1267 assert_eq!(s.id, "hourly-cleanup-canary");
1268 assert_eq!(s.job_id, "cleanup");
1269 assert_eq!(s.plan.target.groups, vec!["canary", "wave1"]);
1270 assert_eq!(s.plan.jitter.as_deref(), Some("30s"));
1271 let rollout = s.plan.rollout.expect("rollout present");
1272 assert_eq!(rollout.waves.len(), 2);
1273 assert_eq!(rollout.waves[0].group, "canary");
1274 assert_eq!(rollout.waves[1].delay, "5s");
1275 assert_eq!(rollout.strategy, RolloutStrategy::Wave);
1276 }
1277
1278 #[test]
1279 fn schedule_minimal_target_all() {
1280 let yaml = r#"
1281id: kitting
1282when:
1283 per_pc: once
1284enabled: true
1285job_id: scheduled-echo
1286target: { all: true }
1287"#;
1288 let s: Schedule = serde_yaml::from_str(yaml).expect("parse");
1289 assert_eq!(s.id, "kitting");
1290 assert_eq!(s.when, When::PerPc(PerPolicy::Once(OnceLiteral::Once)));
1291 assert!(s.enabled);
1292 assert_eq!(s.job_id, "scheduled-echo");
1293 assert!(s.plan.target.all);
1294 assert!(s.plan.rollout.is_none());
1295 assert!(s.plan.jitter.is_none());
1296 assert!(s.active.is_empty());
1297 }
1298
1299 #[test]
1300 fn schedule_enabled_defaults_to_true() {
1301 let yaml = r#"
1302id: x
1303when:
1304 per_pc: once
1305job_id: y
1306target: { all: true }
1307"#;
1308 let s: Schedule = serde_yaml::from_str(yaml).expect("parse");
1309 assert!(s.enabled);
1310 }
1311
1312 // ---- `when` parsing (#418 Phase 1) ----
1313
1314 fn schedule_yaml_with(when_block: &str) -> String {
1315 format!(
1316 r#"
1317id: x
1318when:
1319{when_block}
1320job_id: y
1321target: {{ all: true }}
1322"#
1323 )
1324 }
1325
1326 #[test]
1327 fn when_per_pc_every_parses_unquoted_humantime() {
1328 // `6h` is digit-led but non-numeric → YAML string, same as
1329 // the old `cooldown: 6h` convention. No quotes needed.
1330 let s: Schedule =
1331 serde_yaml::from_str(&schedule_yaml_with(" per_pc: { every: 6h }")).expect("parse");
1332 assert_eq!(
1333 s.when,
1334 When::PerPc(PerPolicy::Every(EverySpec { every: "6h".into() }))
1335 );
1336 }
1337
1338 #[test]
1339 fn when_per_target_every_parses() {
1340 let s: Schedule = serde_yaml::from_str(&schedule_yaml_with(" per_target: { every: 24h }"))
1341 .expect("parse");
1342 assert_eq!(
1343 s.when,
1344 When::PerTarget(PerPolicy::Every(EverySpec {
1345 every: "24h".into()
1346 }))
1347 );
1348 }
1349
1350 #[test]
1351 fn when_per_target_once_parses() {
1352 // Falls out of the shared PerPolicy shape and decide_fire
1353 // already implements it ("any one pc succeeds → skip the
1354 // target forever"), so it is allowed, not rejected.
1355 let s: Schedule =
1356 serde_yaml::from_str(&schedule_yaml_with(" per_target: once")).expect("parse");
1357 assert_eq!(s.when, When::PerTarget(PerPolicy::Once(OnceLiteral::Once)));
1358 }
1359
1360 #[test]
1361 fn when_calendar_time_parses() {
1362 let s: Schedule = serde_yaml::from_str(&schedule_yaml_with(
1363 " calendar:\n at: \"09:00\"\n days: [mon-fri]",
1364 ))
1365 .expect("parse");
1366 match &s.when {
1367 When::Calendar(c) => {
1368 assert_eq!(c.at, "09:00");
1369 assert_eq!(c.days, vec!["mon-fri"]);
1370 }
1371 other => panic!("expected calendar, got {other:?}"),
1372 }
1373 }
1374
1375 #[test]
1376 fn when_calendar_days_default_empty() {
1377 let s: Schedule =
1378 serde_yaml::from_str(&schedule_yaml_with(" calendar:\n at: \"09:00\""))
1379 .expect("parse");
1380 match &s.when {
1381 When::Calendar(c) => assert!(c.days.is_empty(), "days defaults to empty (= daily)"),
1382 other => panic!("expected calendar, got {other:?}"),
1383 }
1384 }
1385
1386 #[test]
1387 fn when_calendar_datetime_parses_all_separators() {
1388 // one-shot: date+time in hyphen / ISO-T / slash forms
1389 for at in ["2026-06-10 09:00", "2026-06-10T09:00", "2026/06/10 09:00"] {
1390 let block = format!(" calendar:\n at: \"{at}\"");
1391 let s: Schedule = serde_yaml::from_str(&schedule_yaml_with(&block))
1392 .unwrap_or_else(|e| panic!("parse '{at}': {e}"));
1393 match &s.when {
1394 When::Calendar(c) => {
1395 use chrono::Datelike;
1396 let p = c.parse_at().expect("parse_at");
1397 let d = p.date.expect("datetime at carries a date");
1398 assert_eq!((d.year(), d.month(), d.day()), (2026, 6, 10), "for '{at}'");
1399 }
1400 other => panic!("expected calendar, got {other:?}"),
1401 }
1402 }
1403 }
1404
1405 #[test]
1406 fn when_rejects_bad_once_keyword() {
1407 // `onec` must be a parse error, not a silently-absorbed
1408 // string (OnceLiteral is a single-variant enum for exactly
1409 // this reason).
1410 let r: Result<Schedule, _> = serde_yaml::from_str(&schedule_yaml_with(" per_pc: onec"));
1411 assert!(r.is_err(), "expected parse error, got {r:?}");
1412 }
1413
1414 #[test]
1415 fn when_rejects_unknown_key_in_every() {
1416 // `{ evry: 6h }` still fails on the tolerant read path: the
1417 // required `every` key is missing, so no PerPolicy variant
1418 // matches (#492 removed deny_unknown_fields, but required
1419 // keys keep the untagged disambiguation honest).
1420 let r: Result<Schedule, _> =
1421 serde_yaml::from_str(&schedule_yaml_with(" per_pc: { evry: 6h }"));
1422 assert!(r.is_err(), "expected parse error, got {r:?}");
1423 }
1424
1425 #[test]
1426 fn when_rejects_unknown_variant() {
1427 let r: Result<Schedule, _> =
1428 serde_yaml::from_str(&schedule_yaml_with(" per_galaxy: once"));
1429 assert!(r.is_err(), "expected parse error, got {r:?}");
1430 }
1431
1432 #[test]
1433 fn when_rejects_old_top_level_cron_field() {
1434 // Pre-#418 shape: top-level `cron:` + no `when:`. Must fail
1435 // loudly (missing `when`), which is what turns stale KV
1436 // blobs into warn-skips after the upgrade.
1437 let yaml = r#"
1438id: x
1439cron: "* * * * * *"
1440job_id: y
1441target: { all: true }
1442"#;
1443 let r: Result<Schedule, _> = serde_yaml::from_str(yaml);
1444 assert!(r.is_err(), "expected parse error, got {r:?}");
1445 }
1446
1447 #[test]
1448 fn when_rejects_retired_cron_escape_hatch() {
1449 // #418 Phase 2 retired `when: { cron: "..." }`. A raw cron
1450 // is now an unknown variant → parse error (operators use the
1451 // calendar form instead).
1452 let r: Result<Schedule, _> =
1453 serde_yaml::from_str(&schedule_yaml_with(" cron: \"0 0 9 * * mon-fri\""));
1454 assert!(
1455 r.is_err(),
1456 "expected parse error for retired cron, got {r:?}"
1457 );
1458 }
1459
1460 #[test]
1461 fn when_round_trips_json_and_yaml() {
1462 // Round-trip through the full Schedule: that is the wire
1463 // unit for both stores (JSON catalog KV + YAML mirror), and
1464 // it exercises the singleton_map field attribute that keeps
1465 // serde_yaml on the map shape instead of `!per_pc` tags.
1466 for when in [
1467 When::PerPc(PerPolicy::Once(OnceLiteral::Once)),
1468 When::PerPc(PerPolicy::Every(EverySpec { every: "6h".into() })),
1469 When::PerTarget(PerPolicy::Once(OnceLiteral::Once)),
1470 When::PerTarget(PerPolicy::Every(EverySpec {
1471 every: "24h".into(),
1472 })),
1473 calendar("09:00", &["mon-fri"]),
1474 calendar("2026-06-10 09:00", &[]),
1475 When::On(vec![OnTrigger::Startup]),
1476 When::On(vec![OnTrigger::Startup, OnTrigger::Logon]),
1477 When::On(vec![OnTrigger::Lock, OnTrigger::Unlock]),
1478 When::On(vec![OnTrigger::NetworkChange]),
1479 ] {
1480 // Event triggers are agent-only; the rest validate on backend.
1481 let runs_on = if matches!(when, When::On(_)) {
1482 RunsOn::Agent
1483 } else {
1484 RunsOn::Backend
1485 };
1486 let s = schedule_with(when.clone(), runs_on);
1487
1488 let json = serde_json::to_string(&s).expect("json serialise");
1489 let back: Schedule = serde_json::from_str(&json).expect("json deserialise");
1490 assert_eq!(back.when, when, "json round-trip for {when}");
1491
1492 let yaml = serde_yaml::to_string(&s).expect("yaml serialise");
1493 assert!(
1494 !yaml.contains('!'),
1495 "yaml must use the map shape, not tags: {yaml}"
1496 );
1497 let back: Schedule = serde_yaml::from_str(&yaml).expect("yaml deserialise");
1498 assert_eq!(back.when, when, "yaml round-trip for {when}");
1499 }
1500 }
1501
1502 #[test]
1503 fn when_once_serialises_as_bare_keyword() {
1504 // The wire shape operators see in the YAML mirror must stay
1505 // the ergonomic `per_pc: once`, not a one-variant map.
1506 let json = serde_json::to_value(When::PerPc(PerPolicy::Once(OnceLiteral::Once)))
1507 .expect("serialise");
1508 assert_eq!(json, serde_json::json!({ "per_pc": "once" }));
1509 }
1510
1511 #[test]
1512 fn when_displays_operator_summary() {
1513 for (when, expected) in [
1514 (
1515 When::PerPc(PerPolicy::Once(OnceLiteral::Once)),
1516 "per_pc once",
1517 ),
1518 (
1519 When::PerPc(PerPolicy::Every(EverySpec { every: "6h".into() })),
1520 "per_pc every 6h",
1521 ),
1522 (
1523 When::PerTarget(PerPolicy::Every(EverySpec {
1524 every: "24h".into(),
1525 })),
1526 "per_target every 24h",
1527 ),
1528 (calendar("09:00", &["mon-fri"]), "at 09:00 [mon-fri]"),
1529 (calendar("2026-06-10 09:00", &[]), "at 2026-06-10 09:00"),
1530 (When::On(vec![OnTrigger::Startup]), "on [startup]"),
1531 (
1532 When::On(vec![OnTrigger::Startup, OnTrigger::Logon]),
1533 "on [startup,logon]",
1534 ),
1535 (
1536 When::On(vec![OnTrigger::Lock, OnTrigger::Unlock]),
1537 "on [lock,unlock]",
1538 ),
1539 (
1540 When::On(vec![OnTrigger::NetworkChange]),
1541 "on [network_change]",
1542 ),
1543 ] {
1544 assert_eq!(when.to_string(), expected);
1545 }
1546 }
1547
1548 // ---- lowering (#418: when → engine vocabulary) ----
1549
1550 fn schedule_with(when: When, runs_on: RunsOn) -> Schedule {
1551 Schedule {
1552 id: "x".into(),
1553 when,
1554 job_id: "y".into(),
1555 plan: FanoutPlan::default(),
1556 active: Active::default(),
1557 constraints: Constraints::default(),
1558 on_failure: OnFailure::default(),
1559 tz: ScheduleTz::default(),
1560 starting_deadline: None,
1561 runs_on,
1562 enabled: true,
1563 }
1564 }
1565
1566 fn calendar(at: &str, days: &[&str]) -> When {
1567 When::Calendar(CalendarSpec {
1568 at: at.into(),
1569 days: days.iter().map(|d| (*d).to_string()).collect(),
1570 })
1571 }
1572
1573 #[test]
1574 fn next_calendar_fire_returns_next_utc_occurrence() {
1575 use chrono::TimeZone;
1576 // Daily 09:00, evaluated in UTC. From 08:00 the same day, the
1577 // next strict occurrence is 09:00 that day.
1578 let mut s = schedule_with(calendar("09:00", &[]), RunsOn::Backend);
1579 s.tz = ScheduleTz::Utc;
1580 let now = chrono::Utc.with_ymd_and_hms(2026, 6, 9, 8, 0, 0).unwrap();
1581 let next = s.next_calendar_fire(now).expect("calendar has a next fire");
1582 assert_eq!(
1583 next,
1584 chrono::Utc.with_ymd_and_hms(2026, 6, 9, 9, 0, 0).unwrap()
1585 );
1586 }
1587
1588 #[test]
1589 fn next_calendar_fire_is_strictly_after_now() {
1590 use chrono::TimeZone;
1591 // Standing exactly on a fire instant must preview the *next*
1592 // one (inclusive = false), not the one firing right now.
1593 let mut s = schedule_with(calendar("09:00", &[]), RunsOn::Backend);
1594 s.tz = ScheduleTz::Utc;
1595 let on_fire = chrono::Utc.with_ymd_and_hms(2026, 6, 9, 9, 0, 0).unwrap();
1596 let next = s
1597 .next_calendar_fire(on_fire)
1598 .expect("calendar has a next fire");
1599 assert_eq!(
1600 next,
1601 chrono::Utc.with_ymd_and_hms(2026, 6, 10, 9, 0, 0).unwrap()
1602 );
1603 }
1604
1605 #[test]
1606 fn next_calendar_fire_none_for_reconcile_shapes() {
1607 // `per_pc` / `per_target` lower to the every-minute poll cron —
1608 // no discrete upcoming event to preview, so `None`.
1609 let now = chrono::Utc::now();
1610 for when in [
1611 When::PerPc(PerPolicy::Once(OnceLiteral::Once)),
1612 When::PerTarget(PerPolicy::Once(OnceLiteral::Once)),
1613 When::PerPc(PerPolicy::Every(EverySpec { every: "6h".into() })),
1614 When::PerTarget(PerPolicy::Every(EverySpec {
1615 every: "24h".into(),
1616 })),
1617 ] {
1618 let s = schedule_with(when, RunsOn::Backend);
1619 assert!(
1620 s.next_calendar_fire(now).is_none(),
1621 "reconcile shapes have no calendar fire",
1622 );
1623 }
1624 }
1625
1626 // ---- preview_fires (#418 dry-run / preview) ----
1627
1628 fn cal_utc(at: &str, days: &[&str]) -> Schedule {
1629 let mut s = schedule_with(calendar(at, days), RunsOn::Backend);
1630 s.tz = ScheduleTz::Utc; // host-independent assertions
1631 s
1632 }
1633
1634 #[test]
1635 fn preview_lists_next_calendar_occurrences() {
1636 use chrono::TimeZone;
1637 // Weekday 09:00, from Wed 2026-06-10 00:00 UTC: the next five
1638 // fires skip the weekend (Sat 13 / Sun 14).
1639 let s = cal_utc("09:00", &["mon-fri"]);
1640 let now = chrono::Utc.with_ymd_and_hms(2026, 6, 10, 0, 0, 0).unwrap();
1641 let got = s.preview_fires(now, 5);
1642 let want: Vec<_> = [
1643 (2026, 6, 10), // Wed
1644 (2026, 6, 11), // Thu
1645 (2026, 6, 12), // Fri
1646 (2026, 6, 15), // Mon (skips Sat 13 / Sun 14)
1647 (2026, 6, 16), // Tue
1648 ]
1649 .iter()
1650 .map(|(y, m, d)| chrono::Utc.with_ymd_and_hms(*y, *m, *d, 9, 0, 0).unwrap())
1651 .collect();
1652 assert_eq!(got, want);
1653 }
1654
1655 #[test]
1656 fn preview_handles_nth_and_last_weekday() {
1657 use chrono::TimeZone;
1658 let now = chrono::Utc.with_ymd_and_hms(2026, 6, 1, 0, 0, 0).unwrap();
1659 // 2nd Tuesday (Patch Tuesday): Jun 9, Jul 14 2026.
1660 let nth = cal_utc("09:00", &["tue#2"]).preview_fires(now, 2);
1661 assert_eq!(
1662 nth,
1663 vec![
1664 chrono::Utc.with_ymd_and_hms(2026, 6, 9, 9, 0, 0).unwrap(),
1665 chrono::Utc.with_ymd_and_hms(2026, 7, 14, 9, 0, 0).unwrap(),
1666 ]
1667 );
1668 // Last Friday of the month: Jun 26, Jul 31 2026.
1669 let last = cal_utc("22:00", &["friL"]).preview_fires(now, 2);
1670 assert_eq!(
1671 last,
1672 vec![
1673 chrono::Utc.with_ymd_and_hms(2026, 6, 26, 22, 0, 0).unwrap(),
1674 chrono::Utc.with_ymd_and_hms(2026, 7, 31, 22, 0, 0).unwrap(),
1675 ]
1676 );
1677 }
1678
1679 #[test]
1680 fn preview_is_empty_for_reconcile_and_zero_count() {
1681 let now = chrono::Utc::now();
1682 // reconcile shapes have no discrete fire times
1683 let recon = schedule_with(
1684 When::PerPc(PerPolicy::Every(EverySpec { every: "6h".into() })),
1685 RunsOn::Backend,
1686 );
1687 assert!(recon.preview_fires(now, 5).is_empty());
1688 // count == 0 yields nothing even for a calendar
1689 assert!(cal_utc("09:00", &[]).preview_fires(now, 0).is_empty());
1690 }
1691
1692 #[test]
1693 fn preview_skips_outside_active_window() {
1694 use chrono::TimeZone;
1695 // Daily 09:00, active only [2026-06-15, 2026-06-17). Occurrences
1696 // before `from` are skipped; `until` is exclusive, so 06-17's
1697 // fire is out — leaving exactly the 15th and 16th.
1698 let mut s = cal_utc("09:00", &[]);
1699 s.active = Active {
1700 from: Some("2026-06-15".into()),
1701 until: Some("2026-06-17".into()),
1702 };
1703 let now = chrono::Utc.with_ymd_and_hms(2026, 6, 10, 0, 0, 0).unwrap();
1704 let got = s.preview_fires(now, 5);
1705 assert_eq!(
1706 got,
1707 vec![
1708 chrono::Utc.with_ymd_and_hms(2026, 6, 15, 9, 0, 0).unwrap(),
1709 chrono::Utc.with_ymd_and_hms(2026, 6, 16, 9, 0, 0).unwrap(),
1710 ]
1711 );
1712 }
1713
1714 #[test]
1715 fn preview_empty_when_calendar_time_outside_window() {
1716 use chrono::TimeZone;
1717 // Fires at 09:00 but the maintenance window is overnight — it can
1718 // never run, so the preview is empty (matches
1719 // `calendar_outside_window`), and the scan still terminates.
1720 let mut s = cal_utc("09:00", &[]);
1721 s.constraints = Constraints {
1722 window: Some("22:00-05:00".into()),
1723 ..Constraints::default()
1724 };
1725 let now = chrono::Utc.with_ymd_and_hms(2026, 6, 10, 0, 0, 0).unwrap();
1726 assert!(s.preview_fires(now, 5).is_empty());
1727 // Every candidate tick is rejected, so this also exercises the
1728 // SCAN_CAP bound: a large `count` must still terminate (and
1729 // return empty) rather than spin (claude #578 review).
1730 assert!(s.preview_fires(now, 50).is_empty());
1731 }
1732
1733 #[test]
1734 fn preview_past_one_shot_is_empty() {
1735 use chrono::TimeZone;
1736 // A dated one-shot whose instant has passed never fires again.
1737 let s = cal_utc("2026-06-10 09:00", &[]);
1738 let now = chrono::Utc.with_ymd_and_hms(2026, 6, 11, 0, 0, 0).unwrap();
1739 assert!(s.preview_fires(now, 5).is_empty());
1740 // …but from before it, the single future fire shows up.
1741 let before = chrono::Utc.with_ymd_and_hms(2026, 6, 1, 0, 0, 0).unwrap();
1742 assert_eq!(
1743 s.preview_fires(before, 5),
1744 vec![chrono::Utc.with_ymd_and_hms(2026, 6, 10, 9, 0, 0).unwrap()]
1745 );
1746 }
1747
1748 #[test]
1749 fn lowering_matches_the_418_table() {
1750 let cases = [
1751 (
1752 When::PerPc(PerPolicy::Once(OnceLiteral::Once)),
1753 (POLL_CRON, ExecMode::OncePerPc, None),
1754 ),
1755 (
1756 When::PerPc(PerPolicy::Every(EverySpec { every: "6h".into() })),
1757 (POLL_CRON, ExecMode::OncePerPc, Some("6h")),
1758 ),
1759 (
1760 When::PerTarget(PerPolicy::Once(OnceLiteral::Once)),
1761 (POLL_CRON, ExecMode::OncePerTarget, None),
1762 ),
1763 (
1764 When::PerTarget(PerPolicy::Every(EverySpec {
1765 every: "24h".into(),
1766 })),
1767 (POLL_CRON, ExecMode::OncePerTarget, Some("24h")),
1768 ),
1769 // calendar repeating → 6-field cron
1770 (
1771 calendar("09:00", &["mon-fri"]),
1772 ("0 0 9 * * mon-fri", ExecMode::EveryTick, None),
1773 ),
1774 // calendar daily (no days) → DOW *
1775 (
1776 calendar("18:30", &[]),
1777 ("0 30 18 * * *", ExecMode::EveryTick, None),
1778 ),
1779 // calendar one-shot → 7-field year cron
1780 (
1781 calendar("2026-06-10 09:00", &[]),
1782 ("0 0 9 10 6 * 2026", ExecMode::EveryTick, None),
1783 ),
1784 ];
1785 for (when, (cron, mode, cooldown)) in cases {
1786 let l = schedule_with(when.clone(), RunsOn::Backend).lowered();
1787 assert_eq!(l.cron, cron, "cron for {when}");
1788 assert_eq!(l.mode, mode, "mode for {when}");
1789 assert_eq!(l.cooldown.as_deref(), cooldown, "cooldown for {when}");
1790 }
1791 }
1792
1793 #[test]
1794 fn lowered_carries_schedule_tz() {
1795 for (tz, want) in [
1796 (ScheduleTz::Local, ScheduleTz::Local),
1797 (ScheduleTz::Utc, ScheduleTz::Utc),
1798 ] {
1799 let mut s = schedule_with(calendar("09:00", &["mon-fri"]), RunsOn::Backend);
1800 s.tz = tz;
1801 assert_eq!(s.lowered().tz, want, "calendar carries tz");
1802 // reconcile shapes carry tz too (for the active-window check)
1803 let mut s = schedule_with(
1804 When::PerPc(PerPolicy::Once(OnceLiteral::Once)),
1805 RunsOn::Backend,
1806 );
1807 s.tz = tz;
1808 assert_eq!(s.lowered().tz, want, "reconcile carries tz");
1809 }
1810 }
1811
1812 #[test]
1813 fn poll_cron_is_accepted_by_the_engine_parser() {
1814 // POLL_CRON is system-generated — if the engine's parser
1815 // ever rejected it every reconcile schedule would die at
1816 // register time. Validate it with the same croner config
1817 // (Seconds::Required, dom_and_dow, year optional).
1818 croner::parser::CronParser::builder()
1819 .seconds(croner::parser::Seconds::Required)
1820 .dom_and_dow(true)
1821 .build()
1822 .parse(POLL_CRON)
1823 .expect("POLL_CRON must parse");
1824 }
1825
1826 // ---- Schedule::validate() (#418 decision F) ----
1827
1828 #[test]
1829 fn validate_accepts_reconcile_shapes() {
1830 for when in [
1831 When::PerPc(PerPolicy::Once(OnceLiteral::Once)),
1832 When::PerPc(PerPolicy::Every(EverySpec { every: "6h".into() })),
1833 When::PerTarget(PerPolicy::Once(OnceLiteral::Once)),
1834 When::PerTarget(PerPolicy::Every(EverySpec {
1835 every: "24h".into(),
1836 })),
1837 ] {
1838 schedule_with(when.clone(), RunsOn::Backend)
1839 .validate()
1840 .unwrap_or_else(|e| panic!("{when} should validate: {e}"));
1841 }
1842 }
1843
1844 #[test]
1845 fn validate_accepts_per_pc_on_agent() {
1846 schedule_with(
1847 When::PerPc(PerPolicy::Every(EverySpec { every: "1h".into() })),
1848 RunsOn::Agent,
1849 )
1850 .validate()
1851 .expect("per_pc + agent is the offline-inventory shape");
1852 }
1853
1854 // ---- #418 event triggers (when: { on }) ----
1855
1856 #[test]
1857 fn validate_accepts_event_on_agent() {
1858 for triggers in [
1859 vec![OnTrigger::Startup],
1860 vec![OnTrigger::Logon],
1861 vec![OnTrigger::Lock],
1862 vec![OnTrigger::Unlock],
1863 vec![OnTrigger::NetworkChange],
1864 vec![
1865 OnTrigger::Startup,
1866 OnTrigger::Logon,
1867 OnTrigger::Lock,
1868 OnTrigger::Unlock,
1869 OnTrigger::NetworkChange,
1870 ],
1871 ] {
1872 schedule_with(When::On(triggers), RunsOn::Agent)
1873 .validate()
1874 .expect("when.on is valid on runs_on: agent");
1875 }
1876 }
1877
1878 #[test]
1879 fn validate_rejects_event_on_backend() {
1880 let err = schedule_with(When::On(vec![OnTrigger::Startup]), RunsOn::Backend)
1881 .validate()
1882 .unwrap_err();
1883 assert!(err.contains("when.on"), "got: {err}");
1884 assert!(err.contains("runs_on: agent"), "got: {err}");
1885 }
1886
1887 #[test]
1888 fn validate_rejects_empty_event_list() {
1889 let err = schedule_with(When::On(vec![]), RunsOn::Agent)
1890 .validate()
1891 .unwrap_err();
1892 assert!(err.contains("when.on"), "got: {err}");
1893 assert!(err.contains("at least one"), "got: {err}");
1894 }
1895
1896 #[test]
1897 fn event_schedule_lowers_to_event_mode_and_is_event() {
1898 let s = schedule_with(When::On(vec![OnTrigger::Startup]), RunsOn::Agent);
1899 assert!(s.is_event());
1900 assert_eq!(s.lowered().mode, ExecMode::Event);
1901 assert_eq!(s.event_triggers(), &[OnTrigger::Startup]);
1902 // non-event schedules report no triggers.
1903 let cal = schedule_with(calendar("09:00", &[]), RunsOn::Backend);
1904 assert!(!cal.is_event());
1905 assert!(cal.event_triggers().is_empty());
1906 }
1907
1908 // ---- #418 constraints.require (env gates) ----
1909
1910 fn require_schedule(req: Require, runs_on: RunsOn) -> Schedule {
1911 let mut s = schedule_with(
1912 When::PerPc(PerPolicy::Every(EverySpec { every: "1m".into() })),
1913 runs_on,
1914 );
1915 s.constraints.require = Some(req);
1916 s
1917 }
1918
1919 #[test]
1920 fn require_met_combinations() {
1921 use std::time::Duration;
1922 let idle = |m: u64| Some(Duration::from_secs(m * 60));
1923 // Empty require — always met regardless of sensed state.
1924 assert!(require_met(&Require::default(), false, None, None));
1925 // ac_power: only on AC.
1926 let ac = Require {
1927 ac_power: true,
1928 ..Default::default()
1929 };
1930 assert!(!require_met(&ac, false, None, None));
1931 assert!(require_met(&ac, true, None, None));
1932 // idle: needs >= the configured min; None idle never satisfies.
1933 let idle10 = Require {
1934 idle: Some("10m".into()),
1935 ..Default::default()
1936 };
1937 assert!(!require_met(&idle10, true, None, None));
1938 assert!(!require_met(&idle10, true, idle(5), None));
1939 assert!(require_met(&idle10, true, idle(15), None));
1940 assert!(require_met(&idle10, true, idle(10), None)); // boundary inclusive
1941 // cpu_below: needs CPU strictly < threshold; None cpu never satisfies.
1942 let cpu20 = Require {
1943 cpu_below: Some(20.0),
1944 ..Default::default()
1945 };
1946 assert!(!require_met(&cpu20, true, None, None)); // no sample → fail-closed
1947 assert!(!require_met(&cpu20, true, None, Some(20.0))); // == threshold (not strictly below)
1948 assert!(!require_met(&cpu20, true, None, Some(55.0))); // busy
1949 assert!(require_met(&cpu20, true, None, Some(5.0))); // quiet
1950 // all three: AND.
1951 let all = Require {
1952 ac_power: true,
1953 idle: Some("10m".into()),
1954 cpu_below: Some(20.0),
1955 };
1956 assert!(!require_met(&all, false, idle(20), Some(5.0))); // on battery
1957 assert!(!require_met(&all, true, idle(1), Some(5.0))); // not idle enough
1958 assert!(!require_met(&all, true, idle(20), Some(50.0))); // busy
1959 assert!(require_met(&all, true, idle(20), Some(5.0)));
1960 // An unparseable idle is treated as no-requirement by require_met
1961 // (validate rejects it at create time, so this only guards a
1962 // hand-edited blob): ac still gates.
1963 let bad = Require {
1964 ac_power: true,
1965 idle: Some("garbage".into()),
1966 ..Default::default()
1967 };
1968 assert!(require_met(&bad, true, None, None));
1969 assert!(!require_met(&bad, false, None, None));
1970 }
1971
1972 #[test]
1973 fn validate_accepts_and_rejects_cpu_below() {
1974 // In-range accepted.
1975 require_schedule(
1976 Require {
1977 cpu_below: Some(20.0),
1978 ..Default::default()
1979 },
1980 RunsOn::Agent,
1981 )
1982 .validate()
1983 .expect("cpu_below 20 is valid");
1984 // Upper boundary: 100.0 is accepted (fires unless CPU is exactly
1985 // 100%). Pins the inclusive upper bound against a future c < 100.0.
1986 require_schedule(
1987 Require {
1988 cpu_below: Some(100.0),
1989 ..Default::default()
1990 },
1991 RunsOn::Agent,
1992 )
1993 .validate()
1994 .expect("cpu_below 100 is valid");
1995 // Out of range rejected (0 and >100).
1996 for bad in [0.0, -5.0, 100.1] {
1997 let err = require_schedule(
1998 Require {
1999 cpu_below: Some(bad),
2000 ..Default::default()
2001 },
2002 RunsOn::Agent,
2003 )
2004 .validate()
2005 .unwrap_err();
2006 assert!(
2007 err.contains("constraints.require.cpu_below"),
2008 "cpu_below {bad}: {err}"
2009 );
2010 }
2011 }
2012
2013 #[test]
2014 fn validate_accepts_require_on_agent() {
2015 require_schedule(
2016 Require {
2017 ac_power: true,
2018 idle: Some("10m".into()),
2019 cpu_below: Some(20.0),
2020 },
2021 RunsOn::Agent,
2022 )
2023 .validate()
2024 .expect("constraints.require is valid on runs_on: agent");
2025 }
2026
2027 #[test]
2028 fn validate_rejects_require_on_backend() {
2029 let err = require_schedule(
2030 Require {
2031 ac_power: true,
2032 ..Default::default()
2033 },
2034 RunsOn::Backend,
2035 )
2036 .validate()
2037 .unwrap_err();
2038 assert!(err.contains("constraints.require"), "got: {err}");
2039 assert!(err.contains("runs_on: agent"), "got: {err}");
2040
2041 // An idle-only require (ac_power: false) is also non-empty
2042 // (is_empty folds the fields) and must reject on backend too —
2043 // guards against a regression in Require::is_empty.
2044 let err = require_schedule(
2045 Require {
2046 idle: Some("10m".into()),
2047 ..Default::default()
2048 },
2049 RunsOn::Backend,
2050 )
2051 .validate()
2052 .unwrap_err();
2053 assert!(
2054 err.contains("constraints.require"),
2055 "idle-only on backend: {err}"
2056 );
2057 }
2058
2059 #[test]
2060 fn validate_rejects_bad_require_idle() {
2061 let err = require_schedule(
2062 Require {
2063 idle: Some("not-a-duration".into()),
2064 ..Default::default()
2065 },
2066 RunsOn::Agent,
2067 )
2068 .validate()
2069 .unwrap_err();
2070 assert!(err.contains("constraints.require.idle"), "got: {err}");
2071 }
2072
2073 #[test]
2074 fn require_round_trips_and_skips_empty() {
2075 // ac_power: false is skipped; an all-default require nested in
2076 // constraints is omitted (is_empty folds it in).
2077 let yaml = "id: s\nwhen: { per_pc: { every: 1m } }\njob_id: j\nruns_on: agent\n\
2078 constraints: { require: { ac_power: true, idle: 10m, cpu_below: 20 } }\n";
2079 let s: Schedule = serde_yaml::from_str(yaml).expect("parse");
2080 let req = s.constraints.require.as_ref().expect("require present");
2081 assert!(req.ac_power);
2082 assert_eq!(req.idle.as_deref(), Some("10m"));
2083 assert_eq!(req.cpu_below, Some(20.0));
2084 // Re-serialize: idle + cpu_below present, ac_power present (true).
2085 let back = serde_json::to_string(&s.constraints).unwrap();
2086 assert!(back.contains("\"idle\":\"10m\""), "got: {back}");
2087 assert!(back.contains("\"cpu_below\":20"), "got: {back}");
2088 // An empty require is omitted entirely by is_empty.
2089 let mut empty = s.clone();
2090 empty.constraints.require = Some(Require::default());
2091 assert!(empty.constraints.is_empty());
2092 }
2093
2094 #[test]
2095 fn validate_rejects_per_target_on_agent() {
2096 let err = schedule_with(
2097 When::PerTarget(PerPolicy::Every(EverySpec {
2098 every: "24h".into(),
2099 })),
2100 RunsOn::Agent,
2101 )
2102 .validate()
2103 .unwrap_err();
2104 assert!(err.contains("per_target"), "got: {err}");
2105 assert!(err.contains("runs_on: agent"), "got: {err}");
2106
2107 // per_target: once is also backend-only.
2108 let err = schedule_with(
2109 When::PerTarget(PerPolicy::Once(OnceLiteral::Once)),
2110 RunsOn::Agent,
2111 )
2112 .validate()
2113 .unwrap_err();
2114 assert!(err.contains("per_target"), "got (once): {err}");
2115 assert!(err.contains("runs_on: agent"), "got (once): {err}");
2116 }
2117
2118 #[test]
2119 fn validate_rejects_bad_every_duration() {
2120 let err = schedule_with(
2121 When::PerPc(PerPolicy::Every(EverySpec { every: "6x".into() })),
2122 RunsOn::Backend,
2123 )
2124 .validate()
2125 .unwrap_err();
2126 assert!(err.contains("when.every"), "got: {err}");
2127 }
2128
2129 #[test]
2130 fn validate_rejects_bad_jitter_and_starting_deadline() {
2131 let mut s = schedule_with(
2132 When::PerPc(PerPolicy::Once(OnceLiteral::Once)),
2133 RunsOn::Backend,
2134 );
2135 s.plan.jitter = Some("5x".into());
2136 let err = s.validate().unwrap_err();
2137 assert!(err.contains("jitter"), "got: {err}");
2138
2139 let mut s = schedule_with(
2140 When::PerPc(PerPolicy::Once(OnceLiteral::Once)),
2141 RunsOn::Backend,
2142 );
2143 s.starting_deadline = Some("soon".into());
2144 let err = s.validate().unwrap_err();
2145 assert!(err.contains("starting_deadline"), "got: {err}");
2146 }
2147
2148 #[test]
2149 fn validate_accepts_calendar_shapes() {
2150 for when in [
2151 calendar("09:00", &["mon-fri"]), // weekday morning
2152 calendar("00:00", &["sun"]), // weekly
2153 calendar("18:30", &[]), // daily
2154 calendar("2026-06-10 09:00", &[]), // one-shot
2155 calendar("2026/12/25 00:00", &[]), // one-shot, slash form
2156 ] {
2157 schedule_with(when.clone(), RunsOn::Backend)
2158 .validate()
2159 .unwrap_or_else(|e| panic!("{when} should validate: {e}"));
2160 }
2161 }
2162
2163 #[test]
2164 fn validate_rejects_bad_at() {
2165 for bad in ["25:00", "09:60", "9", "noon", "2026-13-01 09:00"] {
2166 let err = schedule_with(calendar(bad, &[]), RunsOn::Backend)
2167 .validate()
2168 .unwrap_err();
2169 assert!(err.contains("when.at"), "for '{bad}', got: {err}");
2170 }
2171 }
2172
2173 #[test]
2174 fn validate_rejects_datetime_at_with_days() {
2175 // A dated `at` is a one-shot — pairing it with days is a
2176 // contradiction (the date already pins the day).
2177 let err = schedule_with(calendar("2026-06-10 09:00", &["mon"]), RunsOn::Backend)
2178 .validate()
2179 .unwrap_err();
2180 assert!(
2181 err.contains("one-shot") && err.contains("days"),
2182 "got: {err}"
2183 );
2184 }
2185
2186 #[test]
2187 fn validate_rejects_bad_day_name() {
2188 // A garbage DOW token is caught by the days pre-flight and
2189 // reported against `when.days`, not the confusing
2190 // "when.at lowered to invalid cron" (claude #432 review).
2191 let err = schedule_with(calendar("09:00", &["funday"]), RunsOn::Backend)
2192 .validate()
2193 .unwrap_err();
2194 assert!(err.contains("when.days"), "got: {err}");
2195 assert!(err.contains("funday"), "names the bad token: {err}");
2196 // a degenerate range like `mon-` reports the whole token, not
2197 // a cryptic empty part (claude #432 follow-up)
2198 let err = schedule_with(calendar("09:00", &["mon-"]), RunsOn::Backend)
2199 .validate()
2200 .unwrap_err();
2201 assert!(err.contains("'mon-'"), "names the whole token: {err}");
2202 // valid names / ranges / numeric / * all pass
2203 for ok in [
2204 calendar("09:00", &["mon-fri"]),
2205 calendar("09:00", &["mon", "wed", "sun"]),
2206 calendar("09:00", &["1-5"]),
2207 ] {
2208 schedule_with(ok.clone(), RunsOn::Backend)
2209 .validate()
2210 .unwrap_or_else(|e| panic!("{ok} should validate: {e}"));
2211 }
2212 }
2213
2214 #[test]
2215 fn validate_accepts_nth_weekday() {
2216 // #418: nth-weekday (Patch Tuesday). validate() also lowers to
2217 // a cron and parses it with croner, so passing here proves the
2218 // whole chain — token → DOW field → engine-acceptable cron.
2219 for ok in [
2220 calendar("09:00", &["tue#2"]), // 2nd Tuesday
2221 calendar("09:00", &["fri#1"]), // 1st Friday
2222 calendar("03:00", &["sun#5"]), // 5th Sunday
2223 calendar("09:00", &["tue#2", "thu#2"]), // a list of nths
2224 calendar("09:00", &["2#2"]), // numeric DOW + ordinal
2225 // Case-insensitive both sides: validate lowercases, croner
2226 // upper-cases the whole pattern before aliasing (claude #547).
2227 calendar("09:00", &["TUE#2"]),
2228 ] {
2229 schedule_with(ok.clone(), RunsOn::Backend)
2230 .validate()
2231 .unwrap_or_else(|e| panic!("{ok} should validate: {e}"));
2232 }
2233 }
2234
2235 #[test]
2236 fn validate_rejects_bad_nth_weekday() {
2237 // ordinal out of 1..5, a range with #, and a bad day before #.
2238 for bad in ["tue#0", "tue#6", "tue#x", "mon-fri#2", "funday#2"] {
2239 let err = schedule_with(calendar("09:00", &[bad]), RunsOn::Backend)
2240 .validate()
2241 .unwrap_err();
2242 assert!(err.contains("when.days"), "for '{bad}', got: {err}");
2243 }
2244 }
2245
2246 #[test]
2247 fn validate_accepts_last_weekday() {
2248 // #418: last-weekday (`friL` = last Friday). Like the nth case,
2249 // validate() lowers to a cron and round-trips it through croner,
2250 // so passing proves token → DOW field → engine-acceptable cron
2251 // with the verified last-<dow>-of-month semantics.
2252 for ok in [
2253 calendar("09:00", &["friL"]), // last Friday
2254 calendar("03:00", &["sunL"]), // last Sunday
2255 calendar("22:00", &["5L"]), // numeric DOW + last
2256 calendar("00:00", &["0L"]), // numeric Sunday (0…
2257 calendar("00:00", &["7L"]), // …and its 7 alias)
2258 calendar("09:00", &["monL", "friL"]), // a list of last-weekdays
2259 // Case-insensitive both the weekday and the `L` suffix:
2260 // validate lowercases the day, croner upper-cases the whole
2261 // pattern before aliasing (claude #547).
2262 calendar("09:00", &["FRIL"]),
2263 calendar("09:00", &["fril"]),
2264 ] {
2265 schedule_with(ok.clone(), RunsOn::Backend)
2266 .validate()
2267 .unwrap_or_else(|e| panic!("{ok} should validate: {e}"));
2268 }
2269 }
2270
2271 #[test]
2272 fn validate_rejects_bad_last_weekday() {
2273 // bare `L` (no weekday — a footgun croner reads as Saturday), a
2274 // range with L, a bad day before L, and an internal space that
2275 // would otherwise leak a malformed cron downstream (gemini #560).
2276 for bad in ["L", "l", "mon-friL", "fundayL", "8L", "*L", "fri L"] {
2277 let err = schedule_with(calendar("09:00", &[bad]), RunsOn::Backend)
2278 .validate()
2279 .unwrap_err();
2280 assert!(err.contains("when.days"), "for '{bad}', got: {err}");
2281 }
2282 }
2283
2284 #[test]
2285 fn calendar_oneshot_instant_detects_past() {
2286 use chrono::TimeZone;
2287 // a dated `at` resolves to an absolute instant…
2288 let c = CalendarSpec {
2289 at: "2024-01-01 09:00".into(),
2290 days: vec![],
2291 };
2292 let t = c
2293 .oneshot_instant(ScheduleTz::Utc)
2294 .expect("one-shot instant");
2295 assert_eq!(
2296 t,
2297 chrono::Utc.with_ymd_and_hms(2024, 1, 1, 9, 0, 0).unwrap()
2298 );
2299 assert!(t < chrono::Utc::now(), "2024 is in the past");
2300 // …while a repeating (time-only) calendar has no instant
2301 let rep = CalendarSpec {
2302 at: "09:00".into(),
2303 days: vec!["mon-fri".into()],
2304 };
2305 assert!(rep.oneshot_instant(ScheduleTz::Utc).is_none());
2306 }
2307
2308 fn schedule_with_active(from: Option<&str>, until: Option<&str>) -> Schedule {
2309 let mut s = schedule_with(
2310 When::PerPc(PerPolicy::Once(OnceLiteral::Once)),
2311 RunsOn::Backend,
2312 );
2313 s.active = Active {
2314 from: from.map(str::to_owned),
2315 until: until.map(str::to_owned),
2316 };
2317 s
2318 }
2319
2320 #[test]
2321 fn validate_accepts_active_window() {
2322 schedule_with_active(Some("2026-07-01"), Some("2026-08-01T12:00:00+09:00"))
2323 .validate()
2324 .expect("date + rfc3339 bounds should validate");
2325 }
2326
2327 #[test]
2328 fn validate_rejects_unparseable_active_bound() {
2329 let err = schedule_with_active(Some("July 1st"), None)
2330 .validate()
2331 .unwrap_err();
2332 assert!(err.contains("active"), "got: {err}");
2333 }
2334
2335 #[test]
2336 fn validate_rejects_from_not_before_until() {
2337 let err = schedule_with_active(Some("2026-08-01"), Some("2026-07-01"))
2338 .validate()
2339 .unwrap_err();
2340 assert!(err.contains("strictly before"), "got: {err}");
2341
2342 let err = schedule_with_active(Some("2026-07-01"), Some("2026-07-01"))
2343 .validate()
2344 .unwrap_err();
2345 assert!(err.contains("strictly before"), "got: {err}");
2346 }
2347
2348 // ---- Active window semantics ----
2349
2350 #[test]
2351 fn active_window_is_half_open() {
2352 use chrono::TimeZone;
2353 let active = Active {
2354 from: Some("2026-07-01".into()),
2355 until: Some("2026-08-01".into()),
2356 };
2357 // UTC tz so the date bounds are UTC midnight.
2358 let at = |y, m, d, h| chrono::Utc.with_ymd_and_hms(y, m, d, h, 0, 0).unwrap();
2359 let c = |t| active.contains(t, ScheduleTz::Utc);
2360 assert!(!c(at(2026, 6, 30, 23)), "before from");
2361 assert!(c(at(2026, 7, 1, 0)), "at from (inclusive)");
2362 assert!(c(at(2026, 7, 15, 12)), "inside");
2363 assert!(!c(at(2026, 8, 1, 0)), "at until (exclusive)");
2364 assert!(!c(at(2026, 8, 2, 0)), "after until");
2365 }
2366
2367 #[test]
2368 fn active_empty_window_is_always_active() {
2369 assert!(Active::default().contains(chrono::Utc::now(), ScheduleTz::Local));
2370 }
2371
2372 #[test]
2373 fn active_rfc3339_bound_honours_offset_regardless_of_tz() {
2374 use chrono::TimeZone;
2375 let active = Active {
2376 from: Some("2026-07-01T09:00:00+09:00".into()),
2377 until: None,
2378 };
2379 // RFC3339 carries its own offset → tz arg is ignored.
2380 // 09:00 JST = 00:00 UTC.
2381 for tz in [ScheduleTz::Utc, ScheduleTz::Local] {
2382 assert!(
2383 !active.contains(
2384 chrono::Utc
2385 .with_ymd_and_hms(2026, 6, 30, 23, 59, 0)
2386 .unwrap(),
2387 tz
2388 )
2389 );
2390 assert!(active.contains(
2391 chrono::Utc.with_ymd_and_hms(2026, 7, 1, 0, 0, 0).unwrap(),
2392 tz
2393 ));
2394 }
2395 }
2396
2397 #[test]
2398 fn active_date_bound_respects_tz() {
2399 // A bare `YYYY-MM-DD` bound is midnight *in the schedule's
2400 // tz* (#418 Phase 2). The UTC interpretation is exact and
2401 // host-independent; assert that precisely.
2402 use chrono::TimeZone;
2403 let utc = Active::parse_bound("2026-07-01", ScheduleTz::Utc).expect("utc");
2404 assert_eq!(
2405 utc,
2406 chrono::Utc.with_ymd_and_hms(2026, 7, 1, 0, 0, 0).unwrap()
2407 );
2408
2409 // The local interpretation must equal what chrono::Local
2410 // computes for the same wall-clock midnight — proves the tz
2411 // path is wired to the host zone (the magnitude vs UTC is
2412 // host-dependent, so we compare against Local directly rather
2413 // than hard-coding the JST offset, keeping CI green on UTC
2414 // runners).
2415 let local = Active::parse_bound("2026-07-01", ScheduleTz::Local).expect("local");
2416 let want = chrono::Local
2417 .with_ymd_and_hms(2026, 7, 1, 0, 0, 0)
2418 .single()
2419 .expect("local midnight is unambiguous")
2420 .with_timezone(&chrono::Utc);
2421 assert_eq!(local, want, "date bound resolved in host-local tz");
2422 }
2423
2424 #[test]
2425 fn active_empty_is_skipped_when_serialising() {
2426 let s = schedule_with(
2427 When::PerPc(PerPolicy::Once(OnceLiteral::Once)),
2428 RunsOn::Backend,
2429 );
2430 let json = serde_json::to_value(&s).expect("serialise");
2431 assert!(
2432 json.get("active").is_none(),
2433 "empty active must not appear on the wire: {json}"
2434 );
2435 }
2436
2437 // ---- constraints.window (#418 Phase 3) ----
2438
2439 fn with_window(win: &str) -> Schedule {
2440 let mut s = schedule_with(
2441 When::PerPc(PerPolicy::Every(EverySpec { every: "6h".into() })),
2442 RunsOn::Backend,
2443 );
2444 s.constraints.window = Some(win.into());
2445 s
2446 }
2447
2448 #[test]
2449 fn constraints_window_parses_and_round_trips() {
2450 let yaml = r#"
2451id: x
2452when:
2453 per_pc: { every: 6h }
2454job_id: y
2455target: { all: true }
2456constraints:
2457 window: "22:00-05:00"
2458"#;
2459 let s: Schedule = serde_yaml::from_str(yaml).expect("parse");
2460 assert_eq!(s.constraints.window.as_deref(), Some("22:00-05:00"));
2461 let back: Schedule =
2462 serde_json::from_str(&serde_json::to_string(&s).expect("ser")).expect("de");
2463 assert_eq!(back.constraints.window.as_deref(), Some("22:00-05:00"));
2464 }
2465
2466 #[test]
2467 fn constraints_empty_is_skipped_when_serialising() {
2468 let s = schedule_with(
2469 When::PerPc(PerPolicy::Once(OnceLiteral::Once)),
2470 RunsOn::Backend,
2471 );
2472 let json = serde_json::to_value(&s).expect("serialise");
2473 assert!(
2474 json.get("constraints").is_none(),
2475 "empty constraints must not appear on the wire: {json}"
2476 );
2477 }
2478
2479 #[test]
2480 fn window_no_constraint_always_allows() {
2481 let c = Constraints::default();
2482 assert!(c.allows(chrono::Utc::now(), ScheduleTz::Local));
2483 }
2484
2485 #[test]
2486 fn window_same_day_is_half_open() {
2487 use chrono::TimeZone;
2488 let s = with_window("09:00-17:00");
2489 let at = |h, m| chrono::Utc.with_ymd_and_hms(2026, 6, 9, h, m, 0).unwrap();
2490 let a = |t| s.constraints.allows(t, ScheduleTz::Utc);
2491 assert!(!a(at(8, 59)), "before start");
2492 assert!(a(at(9, 0)), "at start (inclusive)");
2493 assert!(a(at(16, 59)), "inside");
2494 assert!(!a(at(17, 0)), "at end (exclusive)");
2495 assert!(!a(at(23, 0)), "after end");
2496 }
2497
2498 #[test]
2499 fn window_crossing_midnight() {
2500 use chrono::TimeZone;
2501 let s = with_window("22:00-05:00");
2502 let at = |h, m| chrono::Utc.with_ymd_and_hms(2026, 6, 9, h, m, 0).unwrap();
2503 let a = |t| s.constraints.allows(t, ScheduleTz::Utc);
2504 assert!(a(at(22, 0)), "at start tonight");
2505 assert!(a(at(23, 30)), "late tonight");
2506 assert!(a(at(3, 0)), "early tomorrow");
2507 assert!(!a(at(5, 0)), "at end (exclusive)");
2508 assert!(!a(at(12, 0)), "midday outside");
2509 assert!(!a(at(21, 59)), "just before start");
2510 }
2511
2512 #[test]
2513 fn window_respects_tz() {
2514 // The same instant is inside the window under one tz and may
2515 // be outside under another. Compare UTC vs Local via the
2516 // host's own offset (kept CI-green on UTC runners like the
2517 // active tz test does).
2518 use chrono::TimeZone;
2519 let s = with_window("09:00-17:00");
2520 let noon_utc = chrono::Utc.with_ymd_and_hms(2026, 6, 9, 12, 0, 0).unwrap();
2521 // Under UTC, 12:00 is inside 09:00-17:00.
2522 assert!(s.constraints.allows(noon_utc, ScheduleTz::Utc));
2523 // Under Local, the verdict tracks the host wall-clock time;
2524 // assert it matches a direct wall_time membership check.
2525 let local_t = noon_utc.with_timezone(&chrono::Local).time();
2526 let in_local = local_t >= chrono::NaiveTime::from_hms_opt(9, 0, 0).unwrap()
2527 && local_t < chrono::NaiveTime::from_hms_opt(17, 0, 0).unwrap();
2528 assert_eq!(s.constraints.allows(noon_utc, ScheduleTz::Local), in_local);
2529 }
2530
2531 #[test]
2532 fn validate_accepts_good_window() {
2533 for w in ["09:00-17:00", "22:00-05:00", "00:00-23:59"] {
2534 with_window(w)
2535 .validate()
2536 .unwrap_or_else(|e| panic!("'{w}' should validate: {e}"));
2537 }
2538 }
2539
2540 #[test]
2541 fn validate_rejects_bad_window() {
2542 for bad in ["9-5", "22:00", "22:00-22:00", "25:00-05:00", "09:00_17:00"] {
2543 let err = with_window(bad).validate().unwrap_err();
2544 assert!(
2545 err.contains("constraints.window"),
2546 "for '{bad}', got: {err}"
2547 );
2548 }
2549 }
2550
2551 // ---- constraints.skip_dates (#418 holiday exclusion) ----
2552
2553 fn with_skip_dates(dates: &[&str]) -> Schedule {
2554 let mut s = schedule_with(calendar("09:00", &[]), RunsOn::Backend);
2555 s.tz = ScheduleTz::Utc; // host-independent date assertions
2556 s.constraints.skip_dates = dates.iter().map(|d| (*d).to_string()).collect();
2557 s
2558 }
2559
2560 #[test]
2561 fn allows_blocks_listed_skip_date() {
2562 use chrono::TimeZone;
2563 let s = with_skip_dates(&["2026-06-10", "2026-12-25"]);
2564 // Any time on a listed date is blocked (whole day).
2565 let on = chrono::Utc.with_ymd_and_hms(2026, 6, 10, 9, 0, 0).unwrap();
2566 assert!(!s.constraints.allows(on, ScheduleTz::Utc));
2567 let on_midnight = chrono::Utc.with_ymd_and_hms(2026, 12, 25, 0, 0, 0).unwrap();
2568 assert!(!s.constraints.allows(on_midnight, ScheduleTz::Utc));
2569 // A date not in the list fires normally.
2570 let off = chrono::Utc.with_ymd_and_hms(2026, 6, 11, 9, 0, 0).unwrap();
2571 assert!(s.constraints.allows(off, ScheduleTz::Utc));
2572 }
2573
2574 #[test]
2575 fn allows_corrupt_skip_date_fails_closed() {
2576 use chrono::TimeZone;
2577 // A garbled entry (only reachable via hand-edited KV) blocks
2578 // rather than silently re-enabling fires — same posture as a
2579 // corrupt window.
2580 let s = with_skip_dates(&["not-a-date"]);
2581 let any = chrono::Utc.with_ymd_and_hms(2026, 6, 11, 9, 0, 0).unwrap();
2582 assert!(!s.constraints.allows(any, ScheduleTz::Utc));
2583 }
2584
2585 #[test]
2586 fn validate_accepts_good_skip_dates() {
2587 with_skip_dates(&["2026-01-01", "2026-12-25", "2027-05-03"])
2588 .validate()
2589 .expect("well-formed skip dates should validate");
2590 }
2591
2592 #[test]
2593 fn validate_rejects_bad_skip_date() {
2594 for bad in ["2026-13-01", "01-01-2026", "nope", "2026/01/01"] {
2595 let err = with_skip_dates(&[bad]).validate().unwrap_err();
2596 assert!(
2597 err.contains("constraints.skip_dates"),
2598 "for '{bad}', got: {err}"
2599 );
2600 }
2601 }
2602
2603 #[test]
2604 fn preview_skips_holidays() {
2605 use chrono::TimeZone;
2606 // Daily 09:00 with two of the next five days marked as holidays
2607 // — preview drops exactly those, since it gates on `allows`.
2608 let mut s = cal_utc("09:00", &[]);
2609 s.constraints.skip_dates = vec!["2026-06-11".into(), "2026-06-13".into()];
2610 let now = chrono::Utc.with_ymd_and_hms(2026, 6, 10, 0, 0, 0).unwrap();
2611 let got = s.preview_fires(now, 4);
2612 let want: Vec<_> = [
2613 (2026, 6, 10),
2614 (2026, 6, 12), // skips 06-11
2615 (2026, 6, 14), // skips 06-13
2616 (2026, 6, 15),
2617 ]
2618 .iter()
2619 .map(|(y, m, d)| chrono::Utc.with_ymd_and_hms(*y, *m, *d, 9, 0, 0).unwrap())
2620 .collect();
2621 assert_eq!(got, want);
2622 }
2623
2624 // ---- constraints.max_concurrent (#418) ----
2625
2626 fn with_max_concurrent(max: u32, runs_on: RunsOn) -> Schedule {
2627 let mut s = schedule_with(
2628 When::PerPc(PerPolicy::Every(EverySpec { every: "6h".into() })),
2629 runs_on,
2630 );
2631 s.constraints.max_concurrent = Some(max);
2632 s
2633 }
2634
2635 #[test]
2636 fn validate_accepts_backend_max_concurrent() {
2637 with_max_concurrent(5, RunsOn::Backend)
2638 .validate()
2639 .expect("backend max_concurrent should validate");
2640 }
2641
2642 #[test]
2643 fn validate_rejects_max_concurrent_on_agent() {
2644 // Decision E: a central running-instance cap needs a central
2645 // counter, which agents don't have.
2646 let err = with_max_concurrent(5, RunsOn::Agent)
2647 .validate()
2648 .unwrap_err();
2649 assert!(err.contains("constraints.max_concurrent"), "got: {err}");
2650 assert!(err.contains("runs_on: agent"), "got: {err}");
2651 }
2652
2653 #[test]
2654 fn validate_rejects_zero_max_concurrent() {
2655 let err = with_max_concurrent(0, RunsOn::Backend)
2656 .validate()
2657 .unwrap_err();
2658 assert!(err.contains("max_concurrent must be >= 1"), "got: {err}");
2659 }
2660
2661 #[test]
2662 fn max_concurrent_round_trips_and_skips_when_absent() {
2663 let s = with_max_concurrent(3, RunsOn::Backend);
2664 let json = serde_json::to_value(&s.constraints).expect("ser");
2665 assert_eq!(json.get("max_concurrent").and_then(|v| v.as_u64()), Some(3));
2666 // A schedule with no constraints omits the whole block.
2667 let bare = schedule_with(
2668 When::PerPc(PerPolicy::Once(OnceLiteral::Once)),
2669 RunsOn::Backend,
2670 );
2671 assert!(bare.constraints.is_empty());
2672 }
2673
2674 #[test]
2675 fn window_fail_closed_on_corrupt_blob() {
2676 // A malformed window (only reachable via a hand-edited KV
2677 // blob — validate() rejects it at create) must BLOCK, not
2678 // silently allow fires during a change-freeze (gemini #452).
2679 let s = with_window("22:00_05:00");
2680 assert!(
2681 !s.constraints.allows(chrono::Utc::now(), ScheduleTz::Utc),
2682 "corrupt window fails closed"
2683 );
2684 // …and the scheduler can surface why it's stuck.
2685 assert!(
2686 s.bad_window().is_some(),
2687 "bad_window reports the parse error"
2688 );
2689 assert!(with_window("22:00-05:00").bad_window().is_none());
2690 }
2691
2692 #[test]
2693 fn calendar_outside_window_is_flagged() {
2694 // at 09:00 can never fall in 22:00-05:00 → never fires.
2695 let mut s = schedule_with(calendar("09:00", &["mon-fri"]), RunsOn::Backend);
2696 s.constraints.window = Some("22:00-05:00".into());
2697 assert!(s.calendar_outside_window(), "09:00 is not in 22:00-05:00");
2698
2699 // at 23:00 IS inside the overnight window → fine.
2700 let mut s = schedule_with(calendar("23:00", &[]), RunsOn::Backend);
2701 s.constraints.window = Some("22:00-05:00".into());
2702 assert!(!s.calendar_outside_window(), "23:00 is in 22:00-05:00");
2703
2704 // reconcile shapes are never flagged (they poll every minute).
2705 let mut s = schedule_with(
2706 When::PerPc(PerPolicy::Every(EverySpec { every: "6h".into() })),
2707 RunsOn::Backend,
2708 );
2709 s.constraints.window = Some("22:00-05:00".into());
2710 assert!(!s.calendar_outside_window(), "reconcile is unaffected");
2711
2712 // no window → never flagged.
2713 let s = schedule_with(calendar("09:00", &[]), RunsOn::Backend);
2714 assert!(!s.calendar_outside_window());
2715 }
2716
2717 // ---- on_failure.retry (#418 Phase 4) ----
2718
2719 fn with_retry(max: u32, backoff: &str) -> Schedule {
2720 let mut s = schedule_with(
2721 When::PerPc(PerPolicy::Every(EverySpec { every: "6h".into() })),
2722 RunsOn::Backend,
2723 );
2724 s.on_failure.retry = Some(Retry {
2725 max,
2726 backoff: backoff.into(),
2727 });
2728 s
2729 }
2730
2731 #[test]
2732 fn on_failure_parses_and_round_trips() {
2733 let yaml = r#"
2734id: x
2735when:
2736 per_pc: { every: 6h }
2737job_id: y
2738target: { all: true }
2739on_failure:
2740 retry: { max: 3, backoff: 10m }
2741"#;
2742 let s: Schedule = serde_yaml::from_str(yaml).expect("parse");
2743 let r = s.on_failure.retry.as_ref().expect("retry present");
2744 assert_eq!(r.max, 3);
2745 assert_eq!(r.backoff, "10m");
2746 let back: Schedule =
2747 serde_json::from_str(&serde_json::to_string(&s).expect("ser")).expect("de");
2748 assert_eq!(back.on_failure, s.on_failure);
2749 }
2750
2751 #[test]
2752 fn on_failure_empty_is_skipped_when_serialising() {
2753 let s = schedule_with(
2754 When::PerPc(PerPolicy::Once(OnceLiteral::Once)),
2755 RunsOn::Backend,
2756 );
2757 let json = serde_json::to_value(&s).expect("serialise");
2758 assert!(
2759 json.get("on_failure").is_none(),
2760 "empty on_failure must not appear on the wire: {json}"
2761 );
2762 }
2763
2764 #[test]
2765 fn validate_accepts_good_retry() {
2766 for (max, backoff) in [(1, "30s"), (3, "10m"), (10, "1h")] {
2767 with_retry(max, backoff)
2768 .validate()
2769 .unwrap_or_else(|e| panic!("retry {{max:{max}, backoff:{backoff}}}: {e}"));
2770 }
2771 }
2772
2773 #[test]
2774 fn validate_rejects_bad_backoff() {
2775 let err = with_retry(3, "soon").validate().unwrap_err();
2776 assert!(err.contains("on_failure.retry.backoff"), "got: {err}");
2777 }
2778
2779 #[test]
2780 fn validate_rejects_sub_second_backoff() {
2781 // "500ms" parses as humantime but lowers to 0s on the wire —
2782 // reject it so the operator doesn't get a silent no-wait
2783 // (coderabbit #466).
2784 for bad in ["500ms", "0s", "999ms"] {
2785 let err = with_retry(3, bad).validate().unwrap_err();
2786 assert!(
2787 err.contains("on_failure.retry.backoff must be >= 1s"),
2788 "for '{bad}', got: {err}"
2789 );
2790 }
2791 }
2792
2793 #[test]
2794 fn validate_rejects_out_of_range_max() {
2795 for bad in [0u32, 11, 1000] {
2796 let err = with_retry(bad, "10m").validate().unwrap_err();
2797 assert!(
2798 err.contains("on_failure.retry.max"),
2799 "for max={bad}, got: {err}"
2800 );
2801 }
2802 }
2803
2804 #[test]
2805 fn lowered_retry_reduces_backoff_to_seconds() {
2806 let s = with_retry(3, "10m");
2807 let spec = s.on_failure.lowered_retry().expect("a retry policy");
2808 assert_eq!(spec.max, 3);
2809 assert_eq!(spec.backoff_secs, 600);
2810 }
2811
2812 #[test]
2813 fn lowered_retry_is_none_without_policy() {
2814 let s = schedule_with(
2815 When::PerPc(PerPolicy::Once(OnceLiteral::Once)),
2816 RunsOn::Backend,
2817 );
2818 assert!(s.on_failure.lowered_retry().is_none());
2819 }
2820
2821 // ---- global change-freeze (#418 Phase 5) ----
2822
2823 #[test]
2824 fn freeze_empty_window_is_always_active() {
2825 // The big-red-button shape: no bounds = frozen until cleared.
2826 let f = Freeze::default();
2827 assert!(f.is_active(chrono::Utc::now()));
2828 }
2829
2830 #[test]
2831 fn freeze_window_is_half_open() {
2832 use chrono::TimeZone;
2833 let f = Freeze {
2834 from: Some("2026-12-20T00:00:00+00:00".into()),
2835 until: Some("2027-01-05T00:00:00+00:00".into()),
2836 reason: Some("year-end".into()),
2837 tz: ScheduleTz::Utc,
2838 };
2839 let at = |y, mo, d| chrono::Utc.with_ymd_and_hms(y, mo, d, 0, 0, 0).unwrap();
2840 assert!(!f.is_active(at(2026, 12, 19)), "before from = not frozen");
2841 assert!(f.is_active(at(2026, 12, 20)), "from is inclusive");
2842 assert!(f.is_active(at(2026, 12, 31)), "inside window");
2843 assert!(!f.is_active(at(2027, 1, 5)), "until is exclusive");
2844 assert!(!f.is_active(at(2027, 1, 6)), "after until = not frozen");
2845 }
2846
2847 #[test]
2848 fn freeze_fails_closed_on_corrupt_bound() {
2849 // A freeze is a safety switch: an unparseable bound (only
2850 // reachable via a hand-edited KV blob) must read as FROZEN, not
2851 // "fire normally" (coderabbit #472) — the opposite of `active`,
2852 // which fail-opens.
2853 let f = Freeze {
2854 from: Some("not-a-date".into()),
2855 until: None,
2856 reason: None,
2857 tz: ScheduleTz::Utc,
2858 };
2859 assert!(f.is_active(chrono::Utc::now()), "corrupt bound → frozen");
2860 }
2861
2862 #[test]
2863 fn freeze_validate_accepts_good_bounds() {
2864 Freeze {
2865 from: Some("2026-12-20".into()),
2866 until: Some("2027-01-05T12:00:00+09:00".into()),
2867 reason: None,
2868 tz: ScheduleTz::Local,
2869 }
2870 .validate()
2871 .expect("date + rfc3339 bounds should validate");
2872 // Empty (indefinite) freeze is valid.
2873 Freeze::default().validate().expect("empty freeze is valid");
2874 }
2875
2876 #[test]
2877 fn freeze_validate_rejects_bad_bound_and_inverted_window() {
2878 let err = Freeze {
2879 from: Some("never".into()),
2880 ..Default::default()
2881 }
2882 .validate()
2883 .unwrap_err();
2884 assert!(err.contains("freeze:"), "got: {err}");
2885
2886 let inverted = Freeze {
2887 from: Some("2027-01-05".into()),
2888 until: Some("2026-12-20".into()),
2889 ..Default::default()
2890 }
2891 .validate()
2892 .unwrap_err();
2893 assert!(inverted.contains("freeze.from"), "got: {inverted}");
2894 }
2895
2896 #[test]
2897 fn freeze_round_trips_and_skips_empty_fields() {
2898 let f = Freeze {
2899 from: None,
2900 until: Some("2027-01-05".into()),
2901 reason: Some("INC-1234".into()),
2902 tz: ScheduleTz::Utc,
2903 };
2904 let json = serde_json::to_value(&f).expect("serialise");
2905 assert!(json.get("from").is_none(), "empty from omitted: {json}");
2906 let back: Freeze = serde_json::from_value(json).expect("round-trip");
2907 assert_eq!(back, f);
2908 }
2909
2910 #[test]
2911 fn shipped_schedule_configs_parse_and_validate() {
2912 // Every YAML under configs/schedules/ must parse with the
2913 // current Schedule serde AND pass validate() — keeps the
2914 // shipped examples from drifting out of sync with the model
2915 // (#418 removed back-compat, so drift = broken at create).
2916 let dir = std::path::Path::new(env!("CARGO_MANIFEST_DIR")).join("../../configs/schedules");
2917 let mut seen = 0;
2918 for entry in std::fs::read_dir(&dir).expect("read configs/schedules") {
2919 let path = entry.expect("dir entry").path();
2920 if path.extension().and_then(|e| e.to_str()) != Some("yaml") {
2921 continue;
2922 }
2923 let body = std::fs::read_to_string(&path).expect("read yaml");
2924 let s: Schedule = serde_yaml::from_str(&body)
2925 .unwrap_or_else(|e| panic!("{} failed to parse: {e}", path.display()));
2926 s.validate()
2927 .unwrap_or_else(|e| panic!("{} failed validate(): {e}", path.display()));
2928 seen += 1;
2929 }
2930 assert!(seen > 0, "no schedule YAMLs found in {}", dir.display());
2931 }
2932
2933 // ---- pre-existing enum wire formats (unchanged by #418) ----
2934
2935 #[test]
2936 fn exec_mode_serialises_snake_case() {
2937 for (mode, expected) in [
2938 (ExecMode::EveryTick, "every_tick"),
2939 (ExecMode::OncePerPc, "once_per_pc"),
2940 (ExecMode::OncePerTarget, "once_per_target"),
2941 ] {
2942 let s = serde_json::to_value(mode).expect("serialise");
2943 assert_eq!(s, serde_json::Value::String(expected.into()));
2944 let back: ExecMode = serde_json::from_value(serde_json::Value::String(expected.into()))
2945 .expect("deserialise");
2946 assert_eq!(back, mode, "round-trip for {expected}");
2947 }
2948 }
2949
2950 #[test]
2951 fn schedule_runs_on_defaults_to_backend() {
2952 let yaml = r#"
2953id: x
2954when:
2955 per_pc: once
2956job_id: y
2957target: { all: true }
2958"#;
2959 let s: Schedule = serde_yaml::from_str(yaml).expect("parse");
2960 assert_eq!(s.runs_on, RunsOn::Backend);
2961 }
2962
2963 #[test]
2964 fn schedule_runs_on_agent_parses() {
2965 let yaml = r#"
2966id: offline-inv
2967when:
2968 per_pc: { every: 1h }
2969job_id: inventory-hw
2970target: { all: true }
2971runs_on: agent
2972"#;
2973 let s: Schedule = serde_yaml::from_str(yaml).expect("parse");
2974 assert_eq!(s.runs_on, RunsOn::Agent);
2975 assert_eq!(s.lowered().mode, ExecMode::OncePerPc);
2976 }
2977
2978 #[test]
2979 fn runs_on_serialises_snake_case() {
2980 for (mode, expected) in [(RunsOn::Backend, "backend"), (RunsOn::Agent, "agent")] {
2981 let s = serde_json::to_value(mode).expect("serialise");
2982 assert_eq!(s, serde_json::Value::String(expected.into()));
2983 let back: RunsOn = serde_json::from_value(serde_json::Value::String(expected.into()))
2984 .expect("deserialise");
2985 assert_eq!(back, mode);
2986 }
2987 }
2988
2989 #[test]
2990 fn execute_shell_into_wire_shell() {
2991 assert_eq!(Shell::from(ExecuteShell::Powershell), Shell::Powershell);
2992 assert_eq!(Shell::from(ExecuteShell::Cmd), Shell::Cmd);
2993 }
2994
2995 #[test]
2996 fn manifest_staleness_defaults_to_cached() {
2997 let yaml = r#"
2998id: x
2999version: 1.0.0
3000execute:
3001 shell: powershell
3002 script: "echo"
3003 timeout: 1s
3004"#;
3005 let m: Manifest = serde_yaml::from_str(yaml).expect("parse");
3006 assert_eq!(m.staleness, Staleness::Cached);
3007 }
3008
3009 #[test]
3010 fn manifest_strict_staleness_parses() {
3011 let yaml = r#"
3012id: urgent-patch
3013version: 2.5.1
3014execute:
3015 shell: powershell
3016 script: Install-Hotfix
3017 timeout: 5m
3018staleness:
3019 mode: strict
3020 max_cache_age: 0s
3021"#;
3022 let m: Manifest = serde_yaml::from_str(yaml).expect("parse");
3023 match m.staleness {
3024 Staleness::Strict { max_cache_age } => assert_eq!(max_cache_age, "0s"),
3025 other => panic!("expected strict, got {other:?}"),
3026 }
3027 }
3028
3029 #[test]
3030 fn manifest_unchecked_staleness_parses() {
3031 let yaml = r#"
3032id: legacy
3033version: 0.1.0
3034execute:
3035 shell: cmd
3036 script: "echo"
3037 timeout: 1s
3038staleness:
3039 mode: unchecked
3040"#;
3041 let m: Manifest = serde_yaml::from_str(yaml).expect("parse");
3042 assert_eq!(m.staleness, Staleness::Unchecked);
3043 }
3044
3045 #[test]
3046 fn missing_required_field_errors() {
3047 // `id` missing.
3048 let yaml = r#"
3049version: 1.0.0
3050target: { all: true }
3051execute:
3052 shell: powershell
3053 script: "echo"
3054 timeout: 1s
3055"#;
3056 let r: Result<Manifest, _> = serde_yaml::from_str(yaml);
3057 assert!(r.is_err(), "expected error, got {:?}", r);
3058 }
3059
3060 #[test]
3061 fn display_field_table_kind_round_trips_with_nested_columns() {
3062 // #39: `type: table` + `columns:` on a DisplayField gets
3063 // round-tripped through serde so the SPA receives the
3064 // nested schema verbatim. Nested columns themselves are
3065 // DisplayFields so they can carry `type: bytes` /
3066 // `type: number` for cell formatting.
3067 let yaml = r#"
3068id: inv-hw
3069version: 1.0.0
3070execute:
3071 shell: powershell
3072 script: "echo"
3073 timeout: 60s
3074inventory:
3075 display:
3076 - field: hostname
3077 label: Hostname
3078 - field: disks
3079 label: Disks
3080 type: table
3081 columns:
3082 - field: device_id
3083 label: Drive
3084 - field: size_bytes
3085 label: Size
3086 type: bytes
3087 - field: free_bytes
3088 label: Free
3089 type: bytes
3090 - field: file_system
3091 label: FS
3092"#;
3093 let m: Manifest = serde_yaml::from_str(yaml).expect("parse");
3094 let inv = m.inventory.as_ref().expect("inventory hint");
3095 let disks = inv
3096 .display
3097 .iter()
3098 .find(|d| d.field == "disks")
3099 .expect("disks display row");
3100 assert_eq!(disks.kind.as_deref(), Some("table"));
3101 let cols = disks.columns.as_ref().expect("table needs columns");
3102 assert_eq!(cols.len(), 4);
3103 assert_eq!(cols[1].field, "size_bytes");
3104 assert_eq!(cols[1].kind.as_deref(), Some("bytes"));
3105 }
3106
3107 #[test]
3108 fn display_field_scalar_kind_keeps_columns_none() {
3109 // Defensive: when type is a scalar (`bytes` / `number` /
3110 // `timestamp`) the `columns` field stays None — the SPA
3111 // uses its presence as the "render nested table" signal,
3112 // so it must not leak in via serde defaults.
3113 let yaml = r#"
3114id: x
3115version: 1.0.0
3116execute:
3117 shell: powershell
3118 script: "echo"
3119 timeout: 5s
3120inventory:
3121 display:
3122 - { field: ram_bytes, label: RAM, type: bytes }
3123"#;
3124 let m: Manifest = serde_yaml::from_str(yaml).expect("parse");
3125 let inv = m.inventory.as_ref().unwrap();
3126 assert!(inv.display[0].columns.is_none());
3127 }
3128
3129 // ---- checked-in JSON Schema freshness (docs/schemas/) ----
3130
3131 /// The JSON Schemas under `docs/schemas/` must match what
3132 /// `schema_for!` produces today — a Cargo.lock-style freshness guard
3133 /// so a `Schedule` / `Manifest` field change can't silently drift
3134 /// the operator-facing schema. The SPA editor, the backend
3135 /// `/api/schemas/*` endpoints, and these files all read the same
3136 /// derived shape; this test fails CI if the checked-in copy lags.
3137 /// Regenerate with:
3138 /// `UPDATE_SCHEMAS=1 cargo test -p kanade-shared schema_files_are_current`
3139 #[test]
3140 fn schema_files_are_current() {
3141 assert_schema_file("schedule.schema.json", &schemars::schema_for!(Schedule));
3142 assert_schema_file("job.schema.json", &schemars::schema_for!(Manifest));
3143 }
3144
3145 fn assert_schema_file(name: &str, schema: &schemars::Schema) {
3146 let generated = serde_json::to_string_pretty(schema).expect("serialize schema") + "\n";
3147 let path = std::path::Path::new(env!("CARGO_MANIFEST_DIR"))
3148 .join("../../docs/schemas")
3149 .join(name);
3150 if std::env::var_os("UPDATE_SCHEMAS").is_some() {
3151 std::fs::create_dir_all(path.parent().unwrap()).expect("mkdir docs/schemas");
3152 std::fs::write(&path, &generated).unwrap_or_else(|e| panic!("write {path:?}: {e}"));
3153 return;
3154 }
3155 // Normalize CRLF→LF before comparing: `.gitattributes` already
3156 // pins these files to `eol=lf`, but a stray CRLF working-tree
3157 // copy (autocrlf, a tool rewrite) shouldn't turn a *content*-
3158 // freshness check into a confusing line-ending failure — that's
3159 // .gitattributes' job, not this test's (gemini #588).
3160 let on_disk = std::fs::read_to_string(&path)
3161 .unwrap_or_else(|e| {
3162 panic!(
3163 "read {path:?}: {e}\n\
3164 generate it with: UPDATE_SCHEMAS=1 cargo test -p kanade-shared schema_files_are_current"
3165 )
3166 })
3167 .replace("\r\n", "\n");
3168 assert_eq!(
3169 on_disk, generated,
3170 "{name} is stale — a Schedule/Manifest schema change isn't reflected in docs/schemas/. \
3171 Refresh with: UPDATE_SCHEMAS=1 cargo test -p kanade-shared schema_files_are_current"
3172 );
3173 }
3174}
3175
3176/// Periodic schedule (spec §2.4.3). v0.18.0 carries the fanout plan
3177/// (target + optional rollout + optional jitter) inline; the
3178/// referenced job (`job_id` → [`BUCKET_JOBS`]) supplies only the
3179/// script body. Two schedules of the same job can target different
3180/// groups on different cadences without copying the manifest.
3181///
3182/// #418 Phase 1: the cadence is the single [`When`] field. The old
3183/// `cron` × `mode` × `cooldown` × `auto_disable_when_done` quartet
3184/// is gone (no back-compat — pre-Phase-1 KV blobs fail to parse and
3185/// are warn-skipped; re-`schedule create` to upgrade them). The
3186/// engine underneath is unchanged: [`Schedule::lowered`] maps `when`
3187/// onto the same (cron, ExecMode, cooldown) trio the scheduler and
3188/// `decide_fire` always ran on.
3189#[derive(Serialize, Deserialize, schemars::JsonSchema, Debug, Clone)]
3190pub struct Schedule {
3191 pub id: String,
3192 /// When to fire — a reconcile cadence (`per_pc` / `per_target`)
3193 /// or a calendar time trigger (`at` / `days`). See [`When`].
3194 ///
3195 /// `singleton_map`: serde_yaml 0.9 renders externally-tagged
3196 /// enums as `!per_pc` YAML tags by default; this keeps the
3197 /// operator-facing map shape (`when: { per_pc: once }`). JSON
3198 /// output is identical either way, and the schemars schema
3199 /// (external tagging = oneOf of single-key objects) already
3200 /// matches the singleton-map wire shape.
3201 #[serde(with = "serde_yaml::with::singleton_map")]
3202 #[schemars(with = "When")]
3203 pub when: When,
3204 /// Key into [`crate::kv::BUCKET_JOBS`]. Must equal a registered
3205 /// Manifest's `id`.
3206 pub job_id: String,
3207 /// Who + how-to-phase + when-to-stagger. The Manifest doesn't
3208 /// carry these any more — same job + different fanout = different
3209 /// schedule.
3210 #[serde(flatten)]
3211 pub plan: FanoutPlan,
3212 /// Optional validity window. Outside `[from, until)` the
3213 /// schedule is dormant — still registered, still visible, but
3214 /// every tick is skipped (deleted ≠ dormant: a campaign that
3215 /// ended stays inspectable and can be re-armed by editing the
3216 /// window). Checked at tick time on both the backend scheduler
3217 /// and the agent's local scheduler.
3218 #[serde(default, skip_serializing_if = "Active::is_empty")]
3219 pub active: Active,
3220 /// #418 operational constraints gating *when within an active
3221 /// period* a fire may happen: a maintenance `window`, a fleet
3222 /// `max_concurrent` cap, and `skip_dates` (holiday exclusion). The
3223 /// wall-clock ones are evaluated in the schedule's `tz`; future
3224 /// `require` (env gates) lands in the same namespace. Checked at
3225 /// tick time on both schedulers (and surfaced by `preview`).
3226 #[serde(default, skip_serializing_if = "Constraints::is_empty")]
3227 pub constraints: Constraints,
3228 /// #418 Phase 4: what to do after a fire's script comes back
3229 /// failed. Currently just `retry` (fixed-backoff in-process
3230 /// re-run); future `notify` / `disable` join the same namespace.
3231 /// Applied fire-side in `handle_command` (the retry policy is
3232 /// lowered onto every Command this schedule produces), so it
3233 /// covers both `runs_on` locations.
3234 #[serde(default, skip_serializing_if = "OnFailure::is_empty")]
3235 pub on_failure: OnFailure,
3236 /// #418 Phase 2: the timezone this schedule's wall-clock fields
3237 /// are evaluated in — both the calendar `at` firing time AND the
3238 /// `active.{from,until}` window bounds. `local` (default) = the
3239 /// running host's TZ (the agent's for `runs_on: agent`, the
3240 /// backend server's otherwise); `utc` for TZ-independent
3241 /// schedules. Reconcile shapes (`per_pc`/`per_target`) ignore it
3242 /// for firing (poll cron runs every minute regardless) but still
3243 /// honor it for the `active` window.
3244 #[serde(default)]
3245 pub tz: ScheduleTz,
3246 /// v0.22: optional humantime window after a cron tick during
3247 /// which the Command is still considered "live". The scheduler
3248 /// computes `tick_at + starting_deadline` and stamps it onto
3249 /// each Command as `deadline_at`; agents skip Commands they
3250 /// receive after that absolute time. `None` (default) = no
3251 /// deadline, meaning a Command queued in the broker / stream
3252 /// during agent downtime runs whenever the agent reconnects —
3253 /// good for kitting / inventory / cleanup. Set this for
3254 /// time-of-day notifications, lunch reminders, etc., where
3255 /// "fire 3 hours late" would be wrong.
3256 #[serde(default, skip_serializing_if = "Option::is_none")]
3257 pub starting_deadline: Option<String>,
3258 /// v0.23: where does the cron tick happen? `Backend` (default,
3259 /// historical) = backend's scheduler fires Commands via NATS;
3260 /// agents passively receive. `Agent` = each targeted agent runs
3261 /// its own internal cron and fires locally, so the schedule
3262 /// keeps ticking even when the broker is unreachable (laptop on
3263 /// the train, broker maintenance window, full WAN outage). The
3264 /// two locations are mutually exclusive — when `Agent`, the
3265 /// backend scheduler stays out and just keeps the definition in
3266 /// KV for agents to read.
3267 #[serde(default)]
3268 pub runs_on: RunsOn,
3269 #[serde(default = "default_true")]
3270 pub enabled: bool,
3271}
3272
3273/// v0.23 — where the cron tick fires from.
3274#[derive(
3275 Serialize, Deserialize, schemars::JsonSchema, Debug, Clone, Copy, PartialEq, Eq, Default,
3276)]
3277#[serde(rename_all = "snake_case")]
3278pub enum RunsOn {
3279 /// Backend's central scheduler ticks and publishes Commands to
3280 /// NATS. Historical default, what every pre-v0.23 schedule
3281 /// uses. Agent offline ⇒ Command queued in STREAM_EXEC; agent
3282 /// reconnects ⇒ catch-up via [`command_replay`](crate)
3283 /// (see kanade-agent's command_replay module).
3284 #[default]
3285 Backend,
3286 /// Each targeted agent runs the cron tick locally. Survives
3287 /// broker / WAN outages. Best for laptops / mobile devices that
3288 /// roam off the corporate network. Agent must be online for the
3289 /// initial schedule + job-catalog pull, but once cached the
3290 /// agent fires the script standalone.
3291 Agent,
3292}
3293
3294/// Per-pc/per-target dedup semantics for a [`Schedule`] (v0.19).
3295#[derive(
3296 Serialize, Deserialize, schemars::JsonSchema, Debug, Clone, Copy, PartialEq, Eq, Default,
3297)]
3298#[serde(rename_all = "snake_case")]
3299pub enum ExecMode {
3300 /// Fire on every cron tick at the whole target. Historical
3301 /// (pre-v0.19) behavior; no dedup.
3302 #[default]
3303 EveryTick,
3304 /// Fire at each pc until that pc succeeds; then skip it until
3305 /// the optional cooldown elapses (or forever if no cooldown).
3306 /// Use for kitting / first-boot / per-pc compliance checks.
3307 OncePerPc,
3308 /// Fire at the whole target until **any** pc succeeds; then
3309 /// skip the whole target until the optional cooldown elapses
3310 /// (or forever if no cooldown). Use for "one delegate is
3311 /// enough" tasks like license check-in.
3312 OncePerTarget,
3313 /// #418 OS-native event trigger (`when: { on: [...] }`). There is
3314 /// no cron — the agent fires it from an OS event source (boot /
3315 /// session-change), not a tick — so the scheduler skips
3316 /// `tokio-cron` registration for it. Each event occurrence fires
3317 /// once, gated by the standard freeze / active / window /
3318 /// skip_dates checks.
3319 Event,
3320}
3321
3322/// #418 Phase 1 — the single "when does this fire" axis.
3323///
3324/// Replaces the old `cron` + `mode` + `cooldown` trio whose
3325/// interactions were implicit (cron doubled as both a real
3326/// time-of-day trigger and a reconcile poll period; contradictory
3327/// combinations silently no-opped). Two shapes:
3328///
3329/// * **reconcile** (`per_pc` / `per_target`) — desired-state: "each
3330/// pc (or one delegate) should have run this within `every`".
3331/// The poll period is system-generated ([`POLL_CRON`], every
3332/// minute) and no longer the operator's concern.
3333/// * **calendar** (`{ at, days }`) — a wall-clock time trigger
3334/// (#418 Phase 2, replacing the old raw-cron escape hatch). Fires
3335/// the whole target at the given time, no dedup. `at: "09:00"` +
3336/// `days` repeats; `at: "2026-06-10 09:00"` (a date+time) fires
3337/// exactly once. Evaluated in the schedule's top-level `tz`.
3338#[derive(Serialize, Deserialize, schemars::JsonSchema, Debug, Clone, PartialEq, Eq)]
3339#[serde(rename_all = "snake_case")]
3340pub enum When {
3341 /// Fire at each targeted pc: `once` (kitting — succeed once,
3342 /// skip forever, forever catching brand-new / re-imaged pcs)
3343 /// or `{ every: <humantime> }` (patrol — re-arm per pc after
3344 /// the interval).
3345 PerPc(PerPolicy),
3346 /// Fire until **any** one pc of the target succeeds, then skip
3347 /// the whole target (`once`) or re-arm after `every`. Needs
3348 /// fleet-wide completion data, so it is backend-only —
3349 /// `runs_on: agent` + `per_target` is rejected by
3350 /// [`Schedule::validate`].
3351 PerTarget(PerPolicy),
3352 /// Calendar time trigger: `{ at: "09:00", days: [mon-fri] }`
3353 /// (repeating) or `{ at: "2026-06-10 09:00" }` (one-shot). Fires
3354 /// the whole target at that wall-clock time in the schedule's
3355 /// `tz` — no dedup, no cooldown.
3356 Calendar(CalendarSpec),
3357 /// #418 OS-native event trigger: `when: { on: [startup, logon] }`.
3358 /// Fires when the agent observes the listed OS event(s) rather than
3359 /// on a clock — there is no cron. `runs_on: agent` only (the agent
3360 /// owns the event source); [`Schedule::validate`] rejects it on
3361 /// `backend` and rejects an empty list. Each event occurrence fires
3362 /// once, gated by the same freeze / active / `constraints.window` /
3363 /// `skip_dates` checks as the cron path. `startup` fires once per OS
3364 /// boot (deduped via the host boot time); a `starting_deadline`, if
3365 /// set, limits it to "agent came up within that long after boot".
3366 On(Vec<OnTrigger>),
3367}
3368
3369/// An OS event the agent can fire a schedule on (#418 `when: { on }`).
3370#[derive(Serialize, Deserialize, schemars::JsonSchema, Debug, Clone, Copy, PartialEq, Eq, Hash)]
3371#[serde(rename_all = "snake_case")]
3372pub enum OnTrigger {
3373 /// Once per OS boot (the agent's first run for that boot). Catches
3374 /// freshly-imaged / reinstalled hosts at their next startup.
3375 Startup,
3376 /// On an interactive-session user logon — console, RDP, or
3377 /// auto-logon (Windows `WTS_SESSION_LOGON`). Does not fire for
3378 /// service / network / batch logons (no interactive session).
3379 Logon,
3380 /// When the workstation is locked (Win+L / idle lock; Windows
3381 /// `WTS_SESSION_LOCK`). Use for step-away compliance / cleanup.
3382 Lock,
3383 /// When the workstation is unlocked — the user returns to a locked
3384 /// session (Windows `WTS_SESSION_UNLOCK`). Use to re-check
3385 /// compliance / refresh state when work resumes.
3386 Unlock,
3387 /// When the host's network changes — IP address table change on
3388 /// connect / disconnect / DHCP renew / VPN / Wi-Fi roam (Windows
3389 /// `NotifyAddrChange`). Debounced agent-side (a burst of changes
3390 /// from one transition fires once after the network settles), so
3391 /// use it for "re-check connectivity / re-register on network move"
3392 /// rather than expecting one fire per raw adapter event.
3393 ///
3394 /// IPv4 only: `NotifyAddrChange` watches the IPv4 address table, so a
3395 /// transition that touches only IPv6 addresses won't fire. In practice
3396 /// dual-stack networks change both tables together, but a pure-IPv6
3397 /// move (e.g. an IPv6-only Wi-Fi roam) is not detected.
3398 NetworkChange,
3399}
3400
3401/// Calendar time trigger (#418 Phase 2). `at` is either a time of
3402/// day (`"HH:MM"`, repeating — combine with `days`) or a full
3403/// date+time (`"YYYY-MM-DD HH:MM"`, a one-shot that fires once and
3404/// never again). Evaluated in the schedule's top-level `tz`.
3405#[derive(Serialize, Deserialize, schemars::JsonSchema, Debug, Clone, PartialEq, Eq)]
3406pub struct CalendarSpec {
3407 /// `"HH:MM"` (24h) for a repeating trigger, or
3408 /// `"YYYY-MM-DD HH:MM"` (hyphen / slash / `T` separators all
3409 /// accepted) for a one-shot. Parsed lazily —
3410 /// [`Schedule::validate`] rejects garbage at create time.
3411 pub at: String,
3412 /// Day-of-week filter for a time-of-day `at`: `["mon-fri"]`,
3413 /// `["mon","wed","fri"]`, … (passed verbatim to the cron DOW
3414 /// field, so ranges and names both work). An **nth-weekday**
3415 /// `["tue#2"]` fires only on the 2nd Tuesday of each month
3416 /// ("Patch Tuesday"); the ordinal is `1..5`. A **last-weekday**
3417 /// `["friL"]` fires only on the last Friday of each month (handy
3418 /// for monthly maintenance). Empty = every day. Must be empty
3419 /// when `at` carries a date (the date already pins the day).
3420 #[serde(default, skip_serializing_if = "Vec::is_empty")]
3421 pub days: Vec<String>,
3422}
3423
3424/// Parsed `CalendarSpec.at`: the wall-clock minute/hour, plus the
3425/// date for a one-shot (`None` = repeating time-of-day).
3426struct ParsedAt {
3427 minute: u32,
3428 hour: u32,
3429 date: Option<chrono::NaiveDate>,
3430}
3431
3432impl CalendarSpec {
3433 /// Parse `at`: a date+time (`YYYY-MM-DD HH:MM`, hyphen / slash /
3434 /// `T` separators) is a one-shot; a bare `HH:MM` is repeating.
3435 fn parse_at(&self) -> Result<ParsedAt, String> {
3436 use chrono::Timelike;
3437 let s = self.at.trim();
3438 for fmt in ["%Y-%m-%d %H:%M", "%Y-%m-%dT%H:%M", "%Y/%m/%d %H:%M"] {
3439 if let Ok(dt) = chrono::NaiveDateTime::parse_from_str(s, fmt) {
3440 return Ok(ParsedAt {
3441 minute: dt.minute(),
3442 hour: dt.hour(),
3443 date: Some(dt.date()),
3444 });
3445 }
3446 }
3447 if let Ok(t) = chrono::NaiveTime::parse_from_str(s, "%H:%M") {
3448 return Ok(ParsedAt {
3449 minute: t.minute(),
3450 hour: t.hour(),
3451 date: None,
3452 });
3453 }
3454 Err(format!(
3455 "when.at: unparseable '{}' (want HH:MM or YYYY-MM-DD HH:MM)",
3456 self.at
3457 ))
3458 }
3459
3460 /// Pre-flight check on the `days` tokens so a bad day name gives
3461 /// a `when.days:`-scoped error instead of croner's confusing
3462 /// "when.at lowered to invalid cron" (claude #432 review). Each
3463 /// token is a day name (`mon`..`sun`), a numeric DOW (`0`..`7`),
3464 /// `*`, a `-` range of those, an **nth-weekday** like `tue#2`
3465 /// (2nd Tuesday of the month — "Patch Tuesday"), or a
3466 /// **last-weekday** like `friL` (last Friday of the month).
3467 fn validate_days(&self) -> Result<(), String> {
3468 const NAMES: [&str; 7] = ["mon", "tue", "wed", "thu", "fri", "sat", "sun"];
3469 let is_day = |p: &str| NAMES.contains(&p) || p.parse::<u8>().is_ok_and(|n| n <= 7);
3470 for tok in &self.days {
3471 // Report the whole token on a malformed range like `mon-`
3472 // (which would otherwise split to a cryptic empty part —
3473 // claude #432 follow-up).
3474 let invalid = |reason: &str| {
3475 Err(format!(
3476 "when.days: invalid day token '{tok}' ({reason}; \
3477 want mon..sun, 0-7, a range like mon-fri, an nth-weekday \
3478 like tue#2, a last-weekday like friL, or *)"
3479 ))
3480 };
3481 // #418: nth-weekday suffix (`tue#2` = 2nd Tuesday). Croner
3482 // accepts `<dow>#<n>` (n = 1..5) in the DOW field, and
3483 // `to_cron` passes the token through verbatim, so the
3484 // engine fires only on that occurrence. It's a single
3485 // weekday + ordinal — not combinable with a range.
3486 if let Some((day_part, nth_part)) = tok.split_once('#') {
3487 // Normalize once and use `d` consistently (gemini #547);
3488 // the outer `invalid` already echoes the raw `tok`.
3489 let d = day_part.trim().to_ascii_lowercase();
3490 if d.contains('-') || !is_day(&d) {
3491 return invalid("the part before # must be a single weekday");
3492 }
3493 match nth_part.trim().parse::<u8>() {
3494 Ok(n) if (1..=5).contains(&n) => {}
3495 _ => return invalid("the # ordinal must be 1..5 (e.g. tue#2 = 2nd Tuesday)"),
3496 }
3497 continue;
3498 }
3499 // #418: last-weekday suffix (`friL` = last Friday of the
3500 // month — the monthly-maintenance sibling of Patch Tuesday).
3501 // Croner accepts `<dow>L` in the DOW field with verified
3502 // last-<dow>-of-month semantics, and `to_cron` passes it
3503 // through verbatim. A single weekday + `L` — bare `L` and
3504 // ranges are rejected (croner would read bare `L` as
3505 // Saturday, which is a confusing footgun).
3506 if let Some(day_part) = tok.strip_suffix(['L', 'l']) {
3507 // No `.trim()`: a cron DOW token can't carry internal
3508 // whitespace, so `"fri L"` must be *rejected* here (its
3509 // strip leaves `"fri "`, and `is_day` catches the space)
3510 // rather than trimmed into a clean `"fri"` that then
3511 // produces a malformed `fri L` cron downstream and a
3512 // confusing croner error (gemini #560).
3513 let d = day_part.to_ascii_lowercase();
3514 if d.is_empty() {
3515 return invalid("`L` (last-weekday) needs a weekday before it, e.g. friL");
3516 }
3517 if d.contains('-') || !is_day(&d) {
3518 return invalid(
3519 "the part before L must be a single weekday (e.g. friL = last Friday)",
3520 );
3521 }
3522 continue;
3523 }
3524 for part in tok.split('-') {
3525 let p = part.trim().to_ascii_lowercase();
3526 if p.is_empty() {
3527 return invalid("empty range bound");
3528 }
3529 if p != "*" && !is_day(&p) {
3530 return invalid(&format!("'{part}' is not a day"));
3531 }
3532 }
3533 }
3534 Ok(())
3535 }
3536
3537 /// For a one-shot (`at` carries a date), the absolute instant it
3538 /// fires in `tz`. `None` for a repeating calendar. Used to warn
3539 /// about a one-shot whose date is already in the past (it would
3540 /// never fire).
3541 pub fn oneshot_instant(&self, tz: ScheduleTz) -> Option<chrono::DateTime<chrono::Utc>> {
3542 let p = self.parse_at().ok()?;
3543 let date = p.date?;
3544 let naive = date.and_hms_opt(p.hour, p.minute, 0)?;
3545 tz.naive_to_utc(naive)
3546 }
3547
3548 /// The wall-clock time-of-day this calendar fires at (`None` if
3549 /// `at` is unparseable — validate() guards that). Used to detect
3550 /// a calendar whose fire time can never fall inside its
3551 /// `constraints.window` (claude #452 review).
3552 pub fn fire_time(&self) -> Option<chrono::NaiveTime> {
3553 let p = self.parse_at().ok()?;
3554 chrono::NaiveTime::from_hms_opt(p.hour, p.minute, 0)
3555 }
3556
3557 /// Lower to the cron string the scheduler engine runs. Repeating
3558 /// → 6-field `0 {min} {hour} * * {dow}`; one-shot → 7-field
3559 /// `0 {min} {hour} {day} {month} * {year}` (a past year never
3560 /// fires — that's what makes it one-shot).
3561 fn to_cron(&self) -> Result<String, String> {
3562 use chrono::Datelike;
3563 let ParsedAt { minute, hour, date } = self.parse_at()?;
3564 match date {
3565 Some(d) => {
3566 if !self.days.is_empty() {
3567 return Err(
3568 "when.at with a date is a one-shot and cannot be combined with days".into(),
3569 );
3570 }
3571 Ok(format!(
3572 "0 {minute} {hour} {} {} * {}",
3573 d.day(),
3574 d.month(),
3575 d.year()
3576 ))
3577 }
3578 None => {
3579 let dow = if self.days.is_empty() {
3580 "*".to_string()
3581 } else {
3582 self.validate_days()?;
3583 self.days.join(",")
3584 };
3585 Ok(format!("0 {minute} {hour} * * {dow}"))
3586 }
3587 }
3588 }
3589}
3590
3591/// The timezone a schedule's wall-clock fields (`when.at`,
3592/// `active.{from,until}`) are evaluated in (#418 Phase 2).
3593#[derive(
3594 Serialize, Deserialize, schemars::JsonSchema, Debug, Clone, Copy, PartialEq, Eq, Default,
3595)]
3596#[serde(rename_all = "snake_case")]
3597pub enum ScheduleTz {
3598 /// The running host's local timezone — the agent's for
3599 /// `runs_on: agent`, the backend server's otherwise. Default.
3600 #[default]
3601 Local,
3602 /// UTC — for timezone-independent schedules.
3603 Utc,
3604}
3605
3606impl ScheduleTz {
3607 /// Interpret a naive (zoneless) datetime as being in this tz and
3608 /// convert to UTC. On a DST *fold* (the local time occurs twice
3609 /// when clocks go back) we pick `.earliest()` rather than
3610 /// rejecting it; `None` is reserved for a true DST *gap* (a local
3611 /// time that never exists). `Utc` is fixed-offset so neither ever
3612 /// happens; `Local` is whatever timezone the running host is set
3613 /// to and *can* hit a gap/fold on any DST-observing host — not
3614 /// just the JST we run today (gemini + claude #432 review).
3615 fn naive_to_utc(self, naive: chrono::NaiveDateTime) -> Option<chrono::DateTime<chrono::Utc>> {
3616 use chrono::TimeZone;
3617 match self {
3618 ScheduleTz::Utc => Some(chrono::DateTime::from_naive_utc_and_offset(
3619 naive,
3620 chrono::Utc,
3621 )),
3622 ScheduleTz::Local => chrono::Local
3623 .from_local_datetime(&naive)
3624 .earliest()
3625 .map(|dt| dt.with_timezone(&chrono::Utc)),
3626 }
3627 }
3628
3629 /// The wall-clock time-of-day `now` reads as in this tz — used by
3630 /// [`Constraints::allows`] to test a maintenance window
3631 /// (#418 Phase 3). `Utc` is the naive UTC time; `Local` is the
3632 /// running host's local time.
3633 fn wall_time(self, now: chrono::DateTime<chrono::Utc>) -> chrono::NaiveTime {
3634 match self {
3635 ScheduleTz::Utc => now.time(),
3636 ScheduleTz::Local => now.with_timezone(&chrono::Local).time(),
3637 }
3638 }
3639
3640 /// The wall-clock *date* `now` reads as in this tz — used by
3641 /// [`Constraints::allows`] to test `skip_dates` (#418 holiday
3642 /// exclusion). Same tz semantics as [`Self::wall_time`].
3643 fn wall_date(self, now: chrono::DateTime<chrono::Utc>) -> chrono::NaiveDate {
3644 match self {
3645 ScheduleTz::Utc => now.date_naive(),
3646 ScheduleTz::Local => now.with_timezone(&chrono::Local).date_naive(),
3647 }
3648 }
3649
3650 /// Stable lowercase wire/display label (`local` / `utc`) — matches
3651 /// the serde `snake_case` representation. Used for the preview
3652 /// response's `tz` field so the JSON shape isn't coupled to the
3653 /// `Debug` repr (claude #578 review).
3654 pub fn as_str(self) -> &'static str {
3655 match self {
3656 ScheduleTz::Local => "local",
3657 ScheduleTz::Utc => "utc",
3658 }
3659 }
3660}
3661
3662impl std::fmt::Display for ScheduleTz {
3663 fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
3664 f.write_str(self.as_str())
3665 }
3666}
3667
3668/// `once` vs `{ every: <humantime> }` — shared by `per_pc` /
3669/// `per_target`. Untagged so the YAML stays the bare keyword or a
3670/// one-key map, nothing more ceremonial.
3671#[derive(Serialize, Deserialize, schemars::JsonSchema, Debug, Clone, PartialEq, Eq)]
3672#[serde(untagged)]
3673pub enum PerPolicy {
3674 /// The bare string `once`: succeed once, then skip permanently
3675 /// (cooldown = infinity).
3676 Once(OnceLiteral),
3677 /// Re-arm after the humantime interval, e.g. `{ every: 6h }`.
3678 Every(EverySpec),
3679}
3680
3681/// Single-variant enum so serde accepts exactly the string `once`
3682/// (a free-form `String` would swallow typos like `onec`).
3683#[derive(Serialize, Deserialize, schemars::JsonSchema, Debug, Clone, Copy, PartialEq, Eq)]
3684#[serde(rename_all = "snake_case")]
3685pub enum OnceLiteral {
3686 Once,
3687}
3688
3689/// `{ every: <humantime> }`. Standalone struct (not an inline
3690/// struct variant). `{ evry: 6h }` still fails to parse (the
3691/// required `every` key is missing), and the create boundaries
3692/// reject the unknown `evry` via [`crate::strict`] with its path —
3693/// while agents reading a future writer's extra fields tolerate
3694/// them (#492).
3695#[derive(Serialize, Deserialize, schemars::JsonSchema, Debug, Clone, PartialEq, Eq)]
3696pub struct EverySpec {
3697 /// Humantime interval (`10m`, `6h`, `1d`...). Parsed lazily —
3698 /// [`Schedule::validate`] rejects garbage at create time.
3699 pub every: String,
3700}
3701
3702impl PerPolicy {
3703 /// The cooldown this policy lowers to: `once` = `None`
3704 /// (permanent skip), `every` = the interval.
3705 fn cooldown(&self) -> Option<String> {
3706 match self {
3707 PerPolicy::Once(_) => None,
3708 PerPolicy::Every(EverySpec { every }) => Some(every.clone()),
3709 }
3710 }
3711}
3712
3713impl std::fmt::Display for When {
3714 /// Operator-facing one-liner (`per_pc once` / `per_pc every 6h`
3715 /// / `at 09:00 [mon-fri]` / `at 2026-06-10 09:00`) for log
3716 /// lines, audit payloads and the API's `ScheduleSummary`.
3717 fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
3718 let policy = |p: &PerPolicy| match p {
3719 PerPolicy::Once(_) => "once".to_string(),
3720 PerPolicy::Every(EverySpec { every }) => format!("every {every}"),
3721 };
3722 match self {
3723 When::PerPc(p) => write!(f, "per_pc {}", policy(p)),
3724 When::PerTarget(p) => write!(f, "per_target {}", policy(p)),
3725 When::Calendar(c) if c.days.is_empty() => write!(f, "at {}", c.at),
3726 When::Calendar(c) => write!(f, "at {} [{}]", c.at, c.days.join(",")),
3727 When::On(triggers) => {
3728 let names: Vec<&str> = triggers.iter().map(|t| t.as_str()).collect();
3729 write!(f, "on [{}]", names.join(","))
3730 }
3731 }
3732 }
3733}
3734
3735impl OnTrigger {
3736 /// Lowercase wire/display label (matches the serde `snake_case`).
3737 pub fn as_str(self) -> &'static str {
3738 match self {
3739 OnTrigger::Startup => "startup",
3740 OnTrigger::Logon => "logon",
3741 OnTrigger::Lock => "lock",
3742 OnTrigger::Unlock => "unlock",
3743 OnTrigger::NetworkChange => "network_change",
3744 }
3745 }
3746}
3747
3748/// Optional validity window for a [`Schedule`] (#418 decision G).
3749/// Half-open `[from, until)`; either bound may be omitted. Bounds
3750/// are `YYYY-MM-DD` (= that day's 00:00 in the schedule's `tz`) or
3751/// full RFC3339 (offset is honored as-is, `tz` ignored). Kept as
3752/// strings so the JSON Schema the SPA editor consumes stays two
3753/// plain string fields, mirroring `jitter` / `starting_deadline`.
3754///
3755/// #418 Phase 2: bounds are evaluated in the schedule's top-level
3756/// `tz` (was UTC-only in Phase 1) so `tz: local` makes both the
3757/// calendar `at` AND the `active` window local — one consistent
3758/// timezone per schedule.
3759#[derive(Serialize, Deserialize, schemars::JsonSchema, Debug, Clone, Default, PartialEq, Eq)]
3760pub struct Active {
3761 /// Dormant before this instant.
3762 #[serde(default, skip_serializing_if = "Option::is_none")]
3763 pub from: Option<String>,
3764 /// Dormant from this instant on (exclusive).
3765 #[serde(default, skip_serializing_if = "Option::is_none")]
3766 pub until: Option<String>,
3767}
3768
3769impl Active {
3770 /// `skip_serializing_if` helper — an empty window means "always
3771 /// active" and is omitted from the wire format entirely.
3772 pub fn is_empty(&self) -> bool {
3773 self.from.is_none() && self.until.is_none()
3774 }
3775
3776 /// Parse one bound: RFC3339 first (offset honored, `tz`
3777 /// ignored), then bare `YYYY-MM-DD` (00:00 in `tz`).
3778 pub fn parse_bound(s: &str, tz: ScheduleTz) -> Result<chrono::DateTime<chrono::Utc>, String> {
3779 if let Ok(dt) = chrono::DateTime::parse_from_rfc3339(s) {
3780 return Ok(dt.with_timezone(&chrono::Utc));
3781 }
3782 if let Ok(d) = chrono::NaiveDate::parse_from_str(s, "%Y-%m-%d") {
3783 let midnight = d.and_hms_opt(0, 0, 0).expect("00:00:00 is always valid");
3784 return tz.naive_to_utc(midnight).ok_or_else(|| {
3785 format!("active: bound '{s}' falls in a DST gap for the schedule's tz")
3786 });
3787 }
3788 Err(format!(
3789 "active: unparseable bound '{s}' (want YYYY-MM-DD or RFC3339)"
3790 ))
3791 }
3792
3793 /// Is `now` inside the window? Unparseable bounds are treated
3794 /// as absent here (fail-open) — [`Schedule::validate`] is the
3795 /// place that rejects them loudly; this runs on every tick and
3796 /// must never panic on a stale KV blob.
3797 pub fn contains(&self, now: chrono::DateTime<chrono::Utc>, tz: ScheduleTz) -> bool {
3798 let bound = |s: &Option<String>| s.as_deref().and_then(|s| Self::parse_bound(s, tz).ok());
3799 if bound(&self.from).is_some_and(|from| now < from) {
3800 return false;
3801 }
3802 if bound(&self.until).is_some_and(|until| now >= until) {
3803 return false;
3804 }
3805 true
3806 }
3807}
3808
3809/// Host-environment gate (#418 `constraints.require`). Fire only when
3810/// the target host is in the required state. Sensed **in-process by the
3811/// agent** (Win32), so it is `runs_on: agent` only — the backend cannot
3812/// read a target host's power/idle state ([`Schedule::validate`]
3813/// rejects it on `runs_on: backend`, symmetric with `when: { on }`).
3814///
3815/// Evaluated at fire time as a skip-this-tick gate (NOT in
3816/// [`Constraints::allows`], which stays pure for `preview`): a reconcile
3817/// cadence re-checks every minute (so it effectively defers until the
3818/// state is met — the intended pairing); a `calendar` fire that lands
3819/// while the state is unmet is simply missed, same as `window`. It is
3820/// therefore a *runtime* gate and does not appear in `preview`.
3821// No `Eq`: `cpu_below: Option<f64>` is only `PartialEq` (f64 is not Eq).
3822#[derive(Serialize, Deserialize, schemars::JsonSchema, Debug, Clone, Default, PartialEq)]
3823pub struct Require {
3824 /// Fire only while on **AC power** (skip on battery). Reads
3825 /// `GetSystemPowerStatus`; an unknown/unreadable status is treated
3826 /// as not-on-AC (fail-closed — a restrictive gate must not fire
3827 /// when it can't confirm the condition). `false` (default) = no
3828 /// power requirement.
3829 #[serde(default, skip_serializing_if = "std::ops::Not::not")]
3830 pub ac_power: bool,
3831 /// Fire only when the active console session has had **no keyboard /
3832 /// mouse input for at least this long** (humantime, e.g. `"10m"`) —
3833 /// "don't run while the user is actively working". Input-based
3834 /// (simpler than Task Scheduler's CPU/disk-aware idle). A
3835 /// headless / disconnected console (no interactive user) trivially
3836 /// satisfies it. `None` (default) = no idle requirement. Parsed
3837 /// lazily; [`Schedule::validate`] rejects garbage at create time.
3838 #[serde(default, skip_serializing_if = "Option::is_none")]
3839 pub idle: Option<String>,
3840 /// Fire only when the **whole-machine CPU usage is below this
3841 /// percent** (0–100; e.g. `20.0` = "system CPU < 20%") — "don't run
3842 /// while the box is busy". Reuses the agent's `host_perf` system CPU%
3843 /// sample (`sysinfo` mean over cores), so the reading is up to one
3844 /// `host_perf` cadence old (default 60s) — fine as a "generally
3845 /// busy?" proxy, and more accurate than a fresh one-shot read (CPU%
3846 /// needs two samples). An unavailable sample (host_perf not warmed
3847 /// up yet, or stale) is treated as "not below" (fail-closed — a
3848 /// restrictive gate must not fire when it can't confirm). `None`
3849 /// (default) = no CPU requirement. [`Schedule::validate`] rejects an
3850 /// out-of-range value at create time.
3851 #[serde(default, skip_serializing_if = "Option::is_none")]
3852 pub cpu_below: Option<f64>,
3853}
3854
3855impl Require {
3856 /// `skip_serializing_if` helper for an embedded empty `require`.
3857 pub fn is_empty(&self) -> bool {
3858 !self.ac_power && self.idle.is_none() && self.cpu_below.is_none()
3859 }
3860
3861 /// Parsed minimum-idle duration (`None` = no idle requirement, or an
3862 /// unparseable value — `validate` rejects the latter at create time).
3863 pub fn min_idle(&self) -> Option<std::time::Duration> {
3864 self.idle
3865 .as_deref()
3866 .and_then(|s| humantime::parse_duration(s.trim()).ok())
3867 }
3868
3869 /// First unparseable field for create-time rejection (mirrors
3870 /// [`Constraints::bad_skip_date`]).
3871 pub fn bad_idle(&self) -> Option<String> {
3872 self.idle.as_deref().and_then(|s| {
3873 humantime::parse_duration(s.trim())
3874 .err()
3875 .map(|e| format!("constraints.require.idle: invalid duration '{s}': {e}"))
3876 })
3877 }
3878}
3879
3880/// Pure env-gate decision (#418 `constraints.require`). The Win32
3881/// sensing lives in the agent (`kanade-agent::env_gate`); this is the
3882/// testable core, fed the already-sensed host state. Deliberately a
3883/// free fn (not folded into [`Constraints::allows`]) so `allows` stays
3884/// pure and `preview` never evaluates a runtime gate.
3885///
3886/// `ac_online` = is the host on AC power. `idle` = how long the console
3887/// has been idle (`None` = couldn't determine → an idle requirement is
3888/// treated as unmet). `cpu_pct` = whole-machine CPU usage 0–100 (`None`
3889/// = no sample yet → a `cpu_below` requirement is treated as unmet).
3890pub fn require_met(
3891 req: &Require,
3892 ac_online: bool,
3893 idle: Option<std::time::Duration>,
3894 cpu_pct: Option<f64>,
3895) -> bool {
3896 if req.ac_power && !ac_online {
3897 return false;
3898 }
3899 if let Some(min) = req.min_idle() {
3900 match idle {
3901 Some(d) if d >= min => {}
3902 _ => return false,
3903 }
3904 }
3905 if let Some(max) = req.cpu_below {
3906 match cpu_pct {
3907 Some(p) if p < max => {}
3908 _ => return false,
3909 }
3910 }
3911 true
3912}
3913
3914/// [`Active`] decides *over what date range* a schedule is live,
3915/// `Constraints` decides *when, within an active period,* a fire is
3916/// allowed: `window` (a maintenance time-of-day window),
3917/// `max_concurrent` (a fleet-wide running-instance cap), `skip_dates`
3918/// (holiday exclusion) and `require` (host-environment gates, agent-only
3919/// — see [`Require`]).
3920// No `Eq`: contains `require: Option<Require>` which holds an f64.
3921#[derive(Serialize, Deserialize, schemars::JsonSchema, Debug, Clone, Default, PartialEq)]
3922pub struct Constraints {
3923 /// `"HH:MM-HH:MM"` wall-clock window (evaluated in the schedule's
3924 /// `tz`). Fires outside it are skipped — mainly for reconcile
3925 /// cadences ("patrol every 6h, but only fire overnight") and
3926 /// daytime change-freezes. `start > end` crosses midnight
3927 /// (`"22:00-05:00"` = 22:00 through 05:00 next morning). Parsed
3928 /// lazily; [`Schedule::validate`] rejects garbage at create time.
3929 #[serde(default, skip_serializing_if = "Option::is_none")]
3930 pub window: Option<String>,
3931 /// Fleet-wide cap on how many instances of this schedule's job may
3932 /// run **at the same time** (#418 "同時実行ハード上限"). The
3933 /// backend scheduler counts the job's still-in-flight runs
3934 /// (`execution_results.finished_at IS NULL`) each tick and only
3935 /// dispatches to as many remaining pcs as there are free slots —
3936 /// a rolling window that refills as runs complete. Useful for
3937 /// disk/CPU/network-heavy jobs you don't want hammering the whole
3938 /// fleet at once.
3939 ///
3940 /// **Backend-only** (it needs a central counter): combining it
3941 /// with `runs_on: agent` is rejected by [`Schedule::validate`]
3942 /// (#418 decision E — "中央上限には中央が要る"). Most meaningful
3943 /// for `per_pc` reconcile cadences, where the poll re-ticks and
3944 /// refills slots. `None` (default) = no cap.
3945 #[serde(default, skip_serializing_if = "Option::is_none")]
3946 pub max_concurrent: Option<u32>,
3947 /// Calendar dates the schedule must **not** fire on — holidays,
3948 /// blackout days, one-off freeze dates (#418 "祝日除外"). Each is
3949 /// `YYYY-MM-DD`, evaluated as a wall-clock date in the schedule's
3950 /// `tz`. Applies to every `when` shape (a reconcile cadence skips
3951 /// the whole day; a calendar fire landing on the date is
3952 /// suppressed) and is honored by both the live scheduler and
3953 /// `preview`, since both gate on [`Constraints::allows`]. Empty
3954 /// (default) = no skips. Operator-supplied: there is no built-in
3955 /// holiday calendar — list the dates you care about. Parsed lazily;
3956 /// [`Schedule::validate`] rejects a malformed date at create time.
3957 #[serde(default, skip_serializing_if = "Vec::is_empty")]
3958 pub skip_dates: Vec<String>,
3959 /// Host-environment gate (#418): fire only when the target host is
3960 /// in the required state (on AC power, idle). Agent-sensed at fire
3961 /// time, `runs_on: agent` only. See [`Require`]. `None` (default) =
3962 /// no environment requirement.
3963 #[serde(default, skip_serializing_if = "Option::is_none")]
3964 pub require: Option<Require>,
3965}
3966
3967impl Constraints {
3968 /// `skip_serializing_if` helper — empty constraints are omitted
3969 /// from the wire format entirely.
3970 pub fn is_empty(&self) -> bool {
3971 self.window.is_none()
3972 && self.max_concurrent.is_none()
3973 && self.skip_dates.is_empty()
3974 && self.require.as_ref().is_none_or(Require::is_empty)
3975 }
3976
3977 /// The first unparseable `skip_dates` entry, if any — the
3978 /// scheduler logs it at register time so a fail-closed
3979 /// (never-firing) schedule from a hand-edited KV blob is
3980 /// diagnosable, mirroring [`Schedule::bad_window`].
3981 pub fn bad_skip_date(&self) -> Option<String> {
3982 self.skip_dates.iter().find_map(|s| {
3983 chrono::NaiveDate::parse_from_str(s.trim(), "%Y-%m-%d")
3984 .err()
3985 .map(|e| format!("constraints.skip_dates: invalid date '{s}': {e}"))
3986 })
3987 }
3988
3989 /// Parse `"HH:MM-HH:MM"` into `(start, end)`. Equal bounds are an
3990 /// error (a zero-width or all-day window is ambiguous — write no
3991 /// window for "always").
3992 pub fn parse_window(s: &str) -> Result<(chrono::NaiveTime, chrono::NaiveTime), String> {
3993 let (a, b) = s
3994 .split_once('-')
3995 .ok_or_else(|| format!("constraints.window: '{s}' must be 'HH:MM-HH:MM'"))?;
3996 let parse = |part: &str| {
3997 chrono::NaiveTime::parse_from_str(part.trim(), "%H:%M")
3998 .map_err(|e| format!("constraints.window: invalid time '{}': {e}", part.trim()))
3999 };
4000 let (start, end) = (parse(a)?, parse(b)?);
4001 if start == end {
4002 return Err(format!(
4003 "constraints.window: start and end are equal ('{s}'); omit window for 'always'"
4004 ));
4005 }
4006 Ok((start, end))
4007 }
4008
4009 /// Is a fire allowed at `now` (evaluated in `tz`)? No window =
4010 /// always allowed. Half-open `[start, end)`; `start > end`
4011 /// crosses midnight.
4012 ///
4013 /// **Fail-closed** on an unparseable window (returns `false`,
4014 /// gemini #452 review): a window is a *restrictive* constraint
4015 /// (change-freeze / overnight-only), so a corrupt one must NOT
4016 /// silently allow fires during the restricted hours. Bad windows
4017 /// are rejected at create time by [`Schedule::validate`]; this
4018 /// only bites a hand-edited KV blob, where blocking is the safe
4019 /// direction. The scheduler warns at register time
4020 /// ([`Schedule::bad_window`]) so a stuck schedule is diagnosable.
4021 /// The tick path never panics regardless.
4022 pub fn allows(&self, now: chrono::DateTime<chrono::Utc>, tz: ScheduleTz) -> bool {
4023 // #418 holiday / blackout dates: never fire on a listed wall
4024 // date (in `tz`). Checked before the window since a skipped day
4025 // overrides any within-window allowance. Fail-closed on a
4026 // corrupt entry (same posture as `window`): a skip date is a
4027 // *restrictive* constraint, so a garbled one must not silently
4028 // re-enable fires — it blocks until fixed (`validate` rejects it
4029 // at create time; `bad_skip_date` lets the scheduler warn).
4030 if !self.skip_dates.is_empty() {
4031 let today = tz.wall_date(now);
4032 let blocked = self.skip_dates.iter().any(|s| {
4033 match chrono::NaiveDate::parse_from_str(s.trim(), "%Y-%m-%d") {
4034 Ok(d) => d == today,
4035 Err(_) => true, // corrupt entry → fail-closed (block)
4036 }
4037 });
4038 if blocked {
4039 return false;
4040 }
4041 }
4042 match self.window.as_deref() {
4043 // No window → always allowed.
4044 None => true,
4045 // Window set: membership, or fail-closed if unparseable
4046 // (`window_contains` returns None for a corrupt window).
4047 Some(_) => self.window_contains(tz.wall_time(now)).unwrap_or(false),
4048 }
4049 }
4050
4051 /// Membership of a wall-clock time-of-day in the window. `None`
4052 /// when there is no window or it's unparseable (callers decide
4053 /// the failure direction). `start > end` crosses midnight.
4054 fn window_contains(&self, t: chrono::NaiveTime) -> Option<bool> {
4055 let (start, end) = Self::parse_window(self.window.as_deref()?).ok()?;
4056 Some(if start <= end {
4057 start <= t && t < end
4058 } else {
4059 t >= start || t < end
4060 })
4061 }
4062}
4063
4064/// What to do when a fire's script fails (#418 Phase 4 — the "高"
4065/// retry/backoff gap). Where [`Constraints`] gates *whether* a fire
4066/// happens, `OnFailure` decides what happens *after* one ran and
4067/// came back bad. Only `retry` so far; future `notify` / `disable`
4068/// would join the same namespace.
4069#[derive(Serialize, Deserialize, schemars::JsonSchema, Debug, Clone, Default, PartialEq, Eq)]
4070pub struct OnFailure {
4071 /// Re-run the script in-process when it exits non-zero (or times
4072 /// out), up to a cap, with a fixed backoff between attempts.
4073 /// `None` (default) = no retry: a failed run is published as-is
4074 /// and (for reconcile cadences) simply re-fires on the next poll
4075 /// tick. See [`Retry`].
4076 #[serde(default, skip_serializing_if = "Option::is_none")]
4077 pub retry: Option<Retry>,
4078}
4079
4080impl OnFailure {
4081 /// `skip_serializing_if` helper — an empty policy is omitted from
4082 /// the wire format entirely.
4083 pub fn is_empty(&self) -> bool {
4084 self.retry.is_none()
4085 }
4086
4087 /// Lower the operator-facing `retry` (humantime backoff) onto the
4088 /// engine vocabulary the agent's executor runs on (backoff in
4089 /// whole seconds). Single seam shared by the backend command
4090 /// builder and the agent's local scheduler so the two stamp the
4091 /// same [`crate::wire::RetrySpec`] onto every Command. Returns
4092 /// `None` when there is no retry policy or the backoff is
4093 /// unparseable (validate() rejects the latter at create time;
4094 /// this stays fail-safe = "no retry" for a hand-edited KV blob
4095 /// rather than panicking on the fire path).
4096 pub fn lowered_retry(&self) -> Option<crate::wire::RetrySpec> {
4097 let r = self.retry.as_ref()?;
4098 let backoff_secs = humantime::parse_duration(&r.backoff).ok()?.as_secs();
4099 Some(crate::wire::RetrySpec {
4100 max: r.max,
4101 backoff_secs,
4102 })
4103 }
4104}
4105
4106/// Fixed-backoff retry policy (#418 Phase 4). `max` is the number of
4107/// *additional* attempts after the first run (so `max: 3` = up to 4
4108/// total executions); `backoff` is the humantime delay slept between
4109/// attempts. The retry happens fire-side (inside `kanade fire` /
4110/// `handle_command`) on every OS for the PoC — the Windows-native
4111/// "restart on failure" Task Scheduler path is deferred to the
4112/// native-delegation phase (#418 decision H).
4113#[derive(Serialize, Deserialize, schemars::JsonSchema, Debug, Clone, PartialEq, Eq)]
4114pub struct Retry {
4115 /// Max additional attempts after the first failure. Bounded
4116 /// `1..=10` by [`Schedule::validate`] — a typo'd `max: 1000`
4117 /// with a short backoff would otherwise pin a flapping script in
4118 /// a tight loop for the whole window.
4119 pub max: u32,
4120 /// Humantime delay slept between attempts (`"10m"`, `"30s"`).
4121 pub backoff: String,
4122}
4123
4124/// Fleet-wide change-freeze (#418 Phase 5 — the "メンテナンス窓 /
4125/// 変更凍結" gap's global half). Where [`Constraints::window`] is a
4126/// *per-schedule* time-of-day gate, a `Freeze` is a *single, fleet-
4127/// global* "stop all automated change" switch the operator flips
4128/// during an incident or a year-end change-freeze. It lives in its
4129/// own KV singleton ([`crate::kv::KEY_FREEZE`]); when present and
4130/// active, both the backend scheduler and every agent's local
4131/// scheduler skip *every* fire.
4132///
4133/// Shapes:
4134/// * `{}` (no bounds) — frozen indefinitely until the operator
4135/// clears it (incident "big red button").
4136/// * `{ from, until }` — frozen only within `[from, until)`,
4137/// evaluated in `tz` (planned change-freeze; auto-thaws).
4138///
4139/// The KV key being *absent* means "not frozen" — so clearing the
4140/// freeze is a KV delete, and `is_active` only ever runs on a freeze
4141/// the operator actually set.
4142#[derive(Serialize, Deserialize, schemars::JsonSchema, Debug, Clone, Default, PartialEq, Eq)]
4143pub struct Freeze {
4144 /// Frozen from this instant (RFC3339 or bare `YYYY-MM-DD` in
4145 /// `tz`). `None` ⇒ frozen from the beginning of time.
4146 #[serde(default, skip_serializing_if = "Option::is_none")]
4147 pub from: Option<String>,
4148 /// Thawed from this instant on, exclusive. `None` ⇒ frozen with
4149 /// no scheduled end (manual clear required).
4150 #[serde(default, skip_serializing_if = "Option::is_none")]
4151 pub until: Option<String>,
4152 /// Operator-supplied note surfaced on the freeze-skip log and the
4153 /// SPA banner ("year-end change freeze", "INC-1234"). Advisory.
4154 #[serde(default, skip_serializing_if = "Option::is_none")]
4155 pub reason: Option<String>,
4156 /// Timezone the bare-date bounds are evaluated in (RFC3339 bounds
4157 /// carry their own offset). Defaults to host-local like a
4158 /// schedule's `tz`.
4159 #[serde(default)]
4160 pub tz: ScheduleTz,
4161}
4162
4163impl Freeze {
4164 /// Is the fleet frozen at `now`? An empty window (`from`/`until`
4165 /// both absent) is frozen unconditionally; otherwise membership of
4166 /// `[from, until)` in `tz`. Half-open like [`Active::contains`],
4167 /// but **fails CLOSED** on an unparseable bound — a freeze is a
4168 /// safety switch, so a corrupt window (only reachable via a
4169 /// hand-edited KV blob; `validate` rejects it at set time) must
4170 /// mean "frozen", not "fire normally" (coderabbit #472). This is
4171 /// the one deliberate divergence from `active`'s fail-OPEN
4172 /// behaviour, where an unparseable bound dormant-skips a schedule.
4173 pub fn is_active(&self, now: chrono::DateTime<chrono::Utc>) -> bool {
4174 // Parse a bound; an unparseable one short-circuits the whole
4175 // check to `true` (frozen) via the closure's `None` sentinel
4176 // handled below.
4177 let bound = |s: &Option<String>| -> Result<Option<chrono::DateTime<chrono::Utc>>, ()> {
4178 match s.as_deref() {
4179 None => Ok(None),
4180 Some(raw) => Active::parse_bound(raw, self.tz).map(Some).map_err(|_| ()),
4181 }
4182 };
4183 let (from, until) = match (bound(&self.from), bound(&self.until)) {
4184 (Ok(f), Ok(u)) => (f, u),
4185 // Any corrupt bound → fail closed (frozen).
4186 _ => return true,
4187 };
4188 if from.is_some_and(|f| now < f) {
4189 return false;
4190 }
4191 if until.is_some_and(|u| now >= u) {
4192 return false;
4193 }
4194 true
4195 }
4196
4197 /// Reject unparseable bounds / `from >= until` at set time (the
4198 /// API + CLI counterpart to [`Schedule::validate`]).
4199 pub fn validate(&self) -> Result<(), String> {
4200 let from = self
4201 .from
4202 .as_deref()
4203 .map(|s| Active::parse_bound(s, self.tz))
4204 .transpose()
4205 .map_err(|e| e.replace("active:", "freeze:"))?;
4206 let until = self
4207 .until
4208 .as_deref()
4209 .map(|s| Active::parse_bound(s, self.tz))
4210 .transpose()
4211 .map_err(|e| e.replace("active:", "freeze:"))?;
4212 if let (Some(f), Some(u)) = (from, until) {
4213 if f >= u {
4214 return Err(format!(
4215 "freeze.from ({}) must be strictly before freeze.until ({})",
4216 self.from.as_deref().unwrap_or_default(),
4217 self.until.as_deref().unwrap_or_default(),
4218 ));
4219 }
4220 }
4221 Ok(())
4222 }
4223}
4224
4225/// The system-generated poll cadence every reconcile-shaped `when`
4226/// lowers to. Operators never write this: the real inter-run
4227/// spacing is the `every` cooldown; this only bounds "how soon do
4228/// we notice somebody is due" (#418 decision B took the poll
4229/// period away from the operator).
4230pub const POLL_CRON: &str = "0 * * * * *";
4231
4232/// What a [`When`] lowers to — the exact (cron, mode, cooldown)
4233/// trio the pre-#418 engine ran on. Keeping the engine vocabulary
4234/// unchanged is what lets Phase 1 swap the operator surface without
4235/// touching the tick / dedup machinery.
4236pub struct Lowered {
4237 /// Cron handed to `tokio-cron-scheduler` — [`POLL_CRON`] for
4238 /// reconcile shapes, a 6/7-field cron for calendar shapes.
4239 pub cron: String,
4240 /// Dedup semantics for `decide_fire`.
4241 pub mode: ExecMode,
4242 /// Humantime re-arm interval (`None` = succeed once, skip
4243 /// forever).
4244 pub cooldown: Option<String>,
4245 /// Timezone to evaluate `cron` in (#418 Phase 2). The scheduler
4246 /// passes this to `Job::new_async_tz`. Reconcile shapes carry
4247 /// the schedule's tz too even though POLL_CRON is tz-agnostic,
4248 /// so the same value drives the `active`-window check.
4249 pub tz: ScheduleTz,
4250}
4251
4252impl Schedule {
4253 /// The error message if this schedule's `constraints.window` is
4254 /// set but unparseable, else `None`. The scheduler logs this at
4255 /// register time so a fail-closed (never-firing) schedule from a
4256 /// hand-edited KV blob is diagnosable (gemini #452 review).
4257 pub fn bad_window(&self) -> Option<String> {
4258 let w = self.constraints.window.as_deref()?;
4259 Constraints::parse_window(w).err()
4260 }
4261
4262 /// True when this is a `calendar` schedule whose fire time can
4263 /// never fall inside its `constraints.window` — the cron fires,
4264 /// the window check rejects it, and (firing only at that
4265 /// time-of-day) it effectively never runs. An easy misconfig to
4266 /// set up by accident; the scheduler warns at register time
4267 /// (claude #452 review). Reconcile shapes poll every minute, so
4268 /// they always catch the window opening and aren't affected.
4269 pub fn calendar_outside_window(&self) -> bool {
4270 let When::Calendar(c) = &self.when else {
4271 return false;
4272 };
4273 let Some(t) = c.fire_time() else {
4274 return false;
4275 };
4276 matches!(self.constraints.window_contains(t), Some(false))
4277 }
4278
4279 /// Up to `count` future instants this schedule will fire, as
4280 /// absolute UTC, strictly after `now` — the dry-run / preview
4281 /// surface (#418 "ドライラン / プレビュー"). Only **calendar**
4282 /// schedules have discrete fire times; reconcile shapes
4283 /// (`per_pc`/`per_target`) poll every minute gated by cooldown, so
4284 /// they return an empty vec and the caller describes the cadence
4285 /// instead. Occurrences outside the `active.{from,until}` window or
4286 /// the `constraints.window` are **skipped**, so the list reflects
4287 /// when the schedule will ACTUALLY run, not the raw cron ticks.
4288 /// Evaluated in the schedule's `tz`, exactly like the scheduler's
4289 /// `Job::new_async_tz`, and with the same croner config the
4290 /// scheduler / [`Schedule::validate`] use, so a preview can never
4291 /// disagree with a real fire. A schedule that can never fire (a
4292 /// calendar time wholly outside its window, a past one-shot,
4293 /// `enabled: false` is *not* considered here — callers gate on
4294 /// `enabled` separately) yields an empty vec.
4295 pub fn preview_fires(
4296 &self,
4297 now: chrono::DateTime<chrono::Utc>,
4298 count: usize,
4299 ) -> Vec<chrono::DateTime<chrono::Utc>> {
4300 use croner::parser::{CronParser, Seconds};
4301 if !matches!(self.when, When::Calendar(_)) {
4302 return Vec::new();
4303 }
4304 // Same lowering + croner config as `next_calendar_fire` and the
4305 // live scheduler, so a preview can never disagree with a real
4306 // fire. `preview_fires` adds the N-occurrence walk and the
4307 // active / window filtering on top of that single seam.
4308 let lowered = self.lowered();
4309 let Ok(cron) = CronParser::builder()
4310 .seconds(Seconds::Required)
4311 .dom_and_dow(true)
4312 .build()
4313 .parse(&lowered.cron)
4314 else {
4315 return Vec::new();
4316 };
4317 let accept = |utc: chrono::DateTime<chrono::Utc>| {
4318 self.active.contains(utc, self.tz) && self.constraints.allows(utc, self.tz)
4319 };
4320 match self.tz {
4321 ScheduleTz::Utc => Self::next_occurrences(&cron, now, count, accept),
4322 ScheduleTz::Local => {
4323 Self::next_occurrences(&cron, now.with_timezone(&chrono::Local), count, accept)
4324 }
4325 }
4326 }
4327
4328 /// Walk croner forward from `after` collecting up to `count`
4329 /// accepted occurrences (converted to UTC). Generic over the tz the
4330 /// cron is evaluated in so `preview_fires` can run it in either
4331 /// `Utc` or `Local` without duplicating the loop.
4332 fn next_occurrences<Tz>(
4333 cron: &croner::Cron,
4334 after: chrono::DateTime<Tz>,
4335 count: usize,
4336 accept: impl Fn(chrono::DateTime<chrono::Utc>) -> bool,
4337 ) -> Vec<chrono::DateTime<chrono::Utc>>
4338 where
4339 Tz: chrono::TimeZone,
4340 {
4341 // Bound the scan so an `active`/window dead-end (every future
4342 // tick rejected) can't spin forever: ~4096 raw ticks covers
4343 // >10y of a daily calendar while staying instant for croner.
4344 const SCAN_CAP: usize = 4096;
4345 let mut out = Vec::with_capacity(count.min(SCAN_CAP));
4346 let mut cursor = after;
4347 let mut scanned = 0usize;
4348 while out.len() < count && scanned < SCAN_CAP {
4349 scanned += 1;
4350 let Ok(next) = cron.find_next_occurrence(&cursor, false) else {
4351 break;
4352 };
4353 let utc = next.with_timezone(&chrono::Utc);
4354 if accept(utc) {
4355 out.push(utc);
4356 }
4357 // `find_next_occurrence(.., inclusive = false)` already
4358 // advances strictly past `cursor`, so handing it `next`
4359 // verbatim gets the following occurrence — no manual +1s
4360 // nudge (and `DateTime<Tz>` is `Copy`, so no clone).
4361 cursor = next;
4362 }
4363 out
4364 }
4365
4366 /// Lower the operator-facing `when` onto the engine vocabulary.
4367 /// Single seam shared by the backend scheduler and the agent's
4368 /// local scheduler so the two can never drift.
4369 pub fn lowered(&self) -> Lowered {
4370 let tz = self.tz;
4371 match &self.when {
4372 When::PerPc(p) => Lowered {
4373 cron: POLL_CRON.into(),
4374 mode: ExecMode::OncePerPc,
4375 cooldown: p.cooldown(),
4376 tz,
4377 },
4378 When::PerTarget(p) => Lowered {
4379 cron: POLL_CRON.into(),
4380 mode: ExecMode::OncePerTarget,
4381 cooldown: p.cooldown(),
4382 tz,
4383 },
4384 // `to_cron` only fails on a malformed `at` (rejected by
4385 // validate() at create time). For a hand-edited KV blob
4386 // that slipped past, emit a deliberately-invalid cron so
4387 // register()'s Job::new_async_tz fails → warn+skip,
4388 // rather than firing at the wrong time.
4389 When::Calendar(c) => Lowered {
4390 cron: c
4391 .to_cron()
4392 .unwrap_or_else(|_| "# invalid calendar at".into()),
4393 mode: ExecMode::EveryTick,
4394 cooldown: None,
4395 tz,
4396 },
4397 // Event triggers have no cron — the agent fires them from an
4398 // OS event source. The `# event-trigger` cron is never
4399 // registered (the scheduler branches on `is_event()` first),
4400 // but keep it deliberately-invalid as a belt-and-suspenders
4401 // so a stray registration would fail rather than misfire.
4402 When::On(_) => Lowered {
4403 cron: "# event-trigger (no cron)".into(),
4404 mode: ExecMode::Event,
4405 cooldown: None,
4406 tz,
4407 },
4408 }
4409 }
4410
4411 /// True when this schedule fires from an OS event (`when: { on }`)
4412 /// rather than a clock — the agent skips `tokio-cron` registration
4413 /// for these and drives them from boot / session-change instead.
4414 pub fn is_event(&self) -> bool {
4415 matches!(self.when, When::On(_))
4416 }
4417
4418 /// The OS event triggers this schedule listens for, or `&[]` when it
4419 /// is not an event schedule.
4420 pub fn event_triggers(&self) -> &[OnTrigger] {
4421 match &self.when {
4422 When::On(t) => t,
4423 _ => &[],
4424 }
4425 }
4426
4427 /// The next absolute (UTC) time this schedule fires, or `None` when
4428 /// it has no discrete upcoming fire to preview.
4429 ///
4430 /// Used by the KLP `maintenance.list` preview ("what's about to
4431 /// happen on my PC", SPEC §2.1). Returns `None` for:
4432 ///
4433 /// - reconcile shapes (`per_pc` / `per_target`) — they lower to the
4434 /// every-minute [`POLL_CRON`] and re-converge state continuously,
4435 /// so "next fire" is always ~60s away and means nothing to a user
4436 /// previewing upcoming maintenance;
4437 /// - a calendar schedule whose lowered cron won't parse (a
4438 /// hand-edited KV blob that slipped past [`Schedule::validate`]);
4439 /// - a cron with no future occurrence.
4440 ///
4441 /// The wall-clock fire is evaluated in the schedule's own `tz`
4442 /// (matching the live tick's `Job::new_async_tz`) then normalised
4443 /// to UTC for the wire. `inclusive = false`: strictly the *next*
4444 /// fire after `now`, never one matching the current instant.
4445 pub fn next_calendar_fire(
4446 &self,
4447 now: chrono::DateTime<chrono::Utc>,
4448 ) -> Option<chrono::DateTime<chrono::Utc>> {
4449 if !matches!(self.when, When::Calendar(_)) {
4450 return None;
4451 }
4452 let lowered = self.lowered();
4453 // Same parser configuration tokio-cron-scheduler 0.15 uses
4454 // internally, so this can never compute a fire the live
4455 // scheduler wouldn't (seconds required, DOM-and-DOW honored).
4456 let cron = croner::parser::CronParser::builder()
4457 .seconds(croner::parser::Seconds::Required)
4458 .dom_and_dow(true)
4459 .build()
4460 .parse(&lowered.cron)
4461 .ok()?;
4462 match lowered.tz {
4463 ScheduleTz::Utc => cron.find_next_occurrence(&now, false).ok(),
4464 ScheduleTz::Local => {
4465 let now_local = now.with_timezone(&chrono::Local);
4466 cron.find_next_occurrence(&now_local, false)
4467 .ok()
4468 .map(|t| t.with_timezone(&chrono::Utc))
4469 }
4470 }
4471 }
4472
4473 /// Cross-field semantic checks that don't fit pure serde derive
4474 /// — the [`Manifest::validate`] counterpart (#418 decision F;
4475 /// pre-Phase-1 a broken schedule was accepted at create time
4476 /// and silently warn-skipped at tick time). Run at every create
4477 /// site: `kanade schedule create` (client-side) and
4478 /// `POST /api/schedules`. The job_id-exists check lives in the
4479 /// API handler instead — it needs the JOBS KV.
4480 pub fn validate(&self) -> Result<(), String> {
4481 if matches!(self.runs_on, RunsOn::Agent) && matches!(self.when, When::PerTarget(_)) {
4482 return Err(
4483 "when.per_target needs fleet-wide completion data and is backend-only; \
4484 it cannot be combined with runs_on: agent (each agent self-schedules, \
4485 so per-target dedup would be deduping across a target of 1)"
4486 .into(),
4487 );
4488 }
4489 // #418 event triggers: the agent owns the OS event source
4490 // (boot / session-change), so `when: { on }` is agent-only and
4491 // needs at least one trigger.
4492 if let When::On(triggers) = &self.when {
4493 if !matches!(self.runs_on, RunsOn::Agent) {
4494 return Err(
4495 "when.on (OS event trigger) is fired by the agent's own event \
4496 source, so it requires runs_on: agent"
4497 .into(),
4498 );
4499 }
4500 if triggers.is_empty() {
4501 return Err(
4502 "when.on must list at least one trigger (e.g. [startup, logon])".into(),
4503 );
4504 }
4505 }
4506 if let Some(cd) = self.lowered().cooldown.as_deref() {
4507 humantime::parse_duration(cd)
4508 .map_err(|e| format!("when.every: invalid duration '{cd}': {e}"))?;
4509 }
4510 if let When::Calendar(c) = &self.when {
4511 // Lower the calendar form to its cron (catches a bad `at`
4512 // and the date+days conflict), then validate that cron
4513 // with the same parser configuration tokio-cron-scheduler
4514 // 0.15 uses internally (croner, seconds required,
4515 // DOM-and-DOW both honored, year optional) — create-time
4516 // validation can never accept what register() rejects.
4517 let cron = c.to_cron()?;
4518 croner::parser::CronParser::builder()
4519 .seconds(croner::parser::Seconds::Required)
4520 .dom_and_dow(true)
4521 .build()
4522 .parse(&cron)
4523 .map_err(|e| format!("when.at lowered to invalid cron '{cron}': {e}"))?;
4524 }
4525 // The other humantime strings on the schedule (claude #419
4526 // review): runtime degrades gracefully on both (bad jitter →
4527 // silent no-op, bad starting_deadline → warn + skipped tick),
4528 // but "rejected at create time" should cover every field the
4529 // operator can typo, not just `when`.
4530 if let Some(j) = &self.plan.jitter {
4531 humantime::parse_duration(j)
4532 .map_err(|e| format!("jitter: invalid duration '{j}': {e}"))?;
4533 }
4534 if let Some(sd) = &self.starting_deadline {
4535 humantime::parse_duration(sd)
4536 .map_err(|e| format!("starting_deadline: invalid duration '{sd}': {e}"))?;
4537 }
4538 let from = self
4539 .active
4540 .from
4541 .as_deref()
4542 .map(|s| Active::parse_bound(s, self.tz))
4543 .transpose()?;
4544 let until = self
4545 .active
4546 .until
4547 .as_deref()
4548 .map(|s| Active::parse_bound(s, self.tz))
4549 .transpose()?;
4550 if let (Some(f), Some(u)) = (from, until) {
4551 if f >= u {
4552 return Err(format!(
4553 "active.from ({}) must be strictly before active.until ({})",
4554 self.active.from.as_deref().unwrap_or_default(),
4555 self.active.until.as_deref().unwrap_or_default(),
4556 ));
4557 }
4558 }
4559 // #418 Phase 3: a bad maintenance window is rejected at create
4560 // time (parse_window also catches equal bounds).
4561 if let Some(w) = self.constraints.window.as_deref() {
4562 Constraints::parse_window(w)?;
4563 }
4564 // #418 holiday exclusion: reject a malformed skip date at create
4565 // time so the fail-closed `allows` path only ever bites a
4566 // hand-edited KV blob, not a fresh `kanade schedule create`.
4567 if let Some(err) = self.constraints.bad_skip_date() {
4568 return Err(err);
4569 }
4570 // #418: constraints.max_concurrent is a central running-instance
4571 // cap, so it needs the backend's counter — reject it on
4572 // runs_on: agent (decision E), and reject a meaningless 0.
4573 if let Some(mc) = self.constraints.max_concurrent {
4574 // Check the structural incompatibility (agent has no central
4575 // counter) before the value range, so a `max_concurrent: 0`
4576 // + `runs_on: agent` combo reports the more fundamental
4577 // problem first (claude #542).
4578 if matches!(self.runs_on, RunsOn::Agent) {
4579 return Err(
4580 "constraints.max_concurrent needs a central counter and is backend-only; \
4581 it cannot be combined with runs_on: agent (each agent self-schedules, \
4582 so there is no fleet-wide count to cap against)"
4583 .into(),
4584 );
4585 }
4586 if mc == 0 {
4587 return Err(
4588 "constraints.max_concurrent must be >= 1 (0 would never fire; \
4589 omit it for no cap)"
4590 .into(),
4591 );
4592 }
4593 }
4594 // #418: constraints.require (host-state env gates: ac_power /
4595 // idle / cpu_below) is sensed in-process by the agent, so it
4596 // needs runs_on: agent — the backend can't read a target host's
4597 // power / idle / cpu state. Symmetric with `when: { on }` (also
4598 // agent-only); inverse of max_concurrent (backend-only).
4599 if let Some(req) = &self.constraints.require {
4600 if !req.is_empty() && matches!(self.runs_on, RunsOn::Backend) {
4601 return Err(
4602 "constraints.require (host-state env gates: ac_power / idle / cpu_below) \
4603 is sensed in-process by the agent and needs runs_on: agent; the backend \
4604 cannot read a target host's power / idle / cpu state"
4605 .into(),
4606 );
4607 }
4608 // Reject a malformed idle duration at create time so the
4609 // fail-closed runtime path only ever bites a hand-edited
4610 // KV blob (mirror skip_dates / on_failure.retry).
4611 if let Some(err) = req.bad_idle() {
4612 return Err(err);
4613 }
4614 // cpu_below is a percent — reject out-of-range so a typo
4615 // can't make a schedule that never (>=100 is always-busy?
4616 // no — <0 never matches) or trivially fires.
4617 if let Some(c) = req.cpu_below
4618 && !(c > 0.0 && c <= 100.0)
4619 {
4620 return Err(format!(
4621 "constraints.require.cpu_below must be in (0, 100] percent (got {c}); \
4622 omit it for no CPU requirement"
4623 ));
4624 }
4625 }
4626 // #418 Phase 4: a bad on_failure.retry is rejected at create
4627 // time — backoff must be valid humantime, and max is bounded
4628 // so a typo can't pin a flapping script in a tight loop.
4629 if let Some(r) = &self.on_failure.retry {
4630 let backoff = humantime::parse_duration(&r.backoff).map_err(|e| {
4631 format!(
4632 "on_failure.retry.backoff: invalid duration '{}': {e}",
4633 r.backoff
4634 )
4635 })?;
4636 // The wire form lowers backoff to whole seconds, so a
4637 // sub-second value would silently become a 0s no-wait
4638 // (coderabbit #466). Reject it rather than honour a backoff
4639 // the operator can't actually get.
4640 if backoff.as_secs() < 1 {
4641 return Err(format!(
4642 "on_failure.retry.backoff must be >= 1s (got '{}'); sub-second backoffs \
4643 round to 0 on the wire",
4644 r.backoff
4645 ));
4646 }
4647 if !(1..=10).contains(&r.max) {
4648 return Err(format!(
4649 "on_failure.retry.max must be 1..=10 (got {}); it counts additional \
4650 attempts after the first run",
4651 r.max
4652 ));
4653 }
4654 }
4655 Ok(())
4656 }
4657}
4658
4659fn default_true() -> bool {
4660 true
4661}