agentics-domain 0.4.0

Domain types and validation models for the Agentics challenge platform.
Documentation
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
use serde::{Deserialize, Serialize};

use super::super::names::RunName;
use super::super::paths::{BundleRelativePath, RunInputPath, RunOutputPath};
use super::serde_helpers::{
    required_nullable, required_nullable_non_empty_vec, required_nullable_non_empty_vec_schema,
    required_nullable_schema, serialize_empty_vec_as_null,
};

/// Evaluator entrypoint and output-file contract for a bundle.
#[derive(Debug, Clone, Serialize, Deserialize, garde::Validate, schemars::JsonSchema)]
// Fields that carry no `#[garde(...)]` rule (here `result_file`) are exempt from validation.
#[garde(allow_unvalidated)]
// Unknown keys are a deserialization error rather than being silently ignored.
#[serde(deny_unknown_fields)]
pub struct EvaluatorSpec {
    // Command vector: must hold at least one element, and every element is passed through the
    // crate's `trimmed_non_empty` and `no_nul` validators (both defined outside this file).
    #[garde(
        length(min = 1),
        inner(
            custom(crate::validation::trimmed_non_empty),
            custom(crate::validation::no_nul)
        )
    )]
    pub command: Vec<String>,
    // Bundle-relative path of the evaluator's result file — presumably where the command above
    // writes its output; confirm against the worker that consumes it.
    pub result_file: BundleRelativePath,
}

/// Supported challenge execution topology.
#[derive(Debug, Clone, Copy, PartialEq, Eq, Serialize, Deserialize, schemars::JsonSchema)]
// Variants are (de)serialized under their snake_case names.
#[serde(rename_all = "snake_case")]
pub enum ChallengeExecutionMode {
    // Wire name: "separated_evaluator".
    SeparatedEvaluator,
    // Wire name: "piped_stdio".
    PipedStdio,
    // Wire name: "coexecuted_benchmark".
    CoexecutedBenchmark,
}

impl ChallengeExecutionMode {
    /// Return the stable runtime name used for container labels and bundle script directories.
    pub fn runtime_name(self) -> &'static str {
        match self {
            Self::SeparatedEvaluator => "separated-evaluator",
            Self::PipedStdio => "interactive-evaluator",
            Self::CoexecutedBenchmark => "coexecuted-evaluator",
        }
    }
}

/// Challenge-owned execution topology and run manifest locations for `zip_project`.
#[derive(Debug, Clone, Serialize, Deserialize, schemars::JsonSchema)]
// Internally tagged: the `mode` key (snake_case variant name) selects the variant, and the
// remaining keys of the same object are the fields of that variant's struct.
#[serde(tag = "mode", rename_all = "snake_case")]
pub enum ChallengeExecutionSpec {
    // mode = "separated_evaluator"
    SeparatedEvaluator(SeparatedEvaluatorExecutionSpec),
    // mode = "piped_stdio"
    PipedStdio(PipedStdioExecutionSpec),
    // mode = "coexecuted_benchmark"
    CoexecutedBenchmark(CoexecutedBenchmarkExecutionSpec),
}

impl ChallengeExecutionSpec {
    /// Return the current execution topology mode.
    pub fn mode(&self) -> ChallengeExecutionMode {
        match self {
            Self::SeparatedEvaluator(_) => ChallengeExecutionMode::SeparatedEvaluator,
            Self::PipedStdio(_) => ChallengeExecutionMode::PipedStdio,
            Self::CoexecutedBenchmark(_) => ChallengeExecutionMode::CoexecutedBenchmark,
        }
    }

    /// Borrow the current piped-stdio execution contract.
    pub fn piped_stdio(&self) -> Option<&PipedStdioExecutionSpec> {
        match self {
            Self::SeparatedEvaluator(_) => None,
            Self::PipedStdio(spec) => Some(spec),
            Self::CoexecutedBenchmark(_) => None,
        }
    }

    /// Borrow the current coexecuted-evaluator contract.
    pub fn coexecuted_benchmark(&self) -> Option<&CoexecutedBenchmarkExecutionSpec> {
        match self {
            Self::SeparatedEvaluator(_) | Self::PipedStdio(_) => None,
            Self::CoexecutedBenchmark(spec) => Some(spec),
        }
    }

    /// Borrow the trusted evaluator command contract for the current topology.
    pub fn trusted_evaluator(&self) -> &EvaluatorSpec {
        match self {
            Self::SeparatedEvaluator(spec) => &spec.separated_evaluator,
            Self::PipedStdio(spec) => &spec.interactive_evaluator,
            Self::CoexecutedBenchmark(spec) => &spec.coexecuted_evaluator,
        }
    }

    /// Borrow public validation run locator if declared.
    pub fn validation_runs(&self) -> Option<&BundleRelativePath> {
        match self {
            Self::SeparatedEvaluator(spec) => spec.validation_runs.as_ref(),
            Self::PipedStdio(_) | Self::CoexecutedBenchmark(_) => None,
        }
    }

    /// Borrow public validation setup contract if declared.
    pub fn validation_setup(&self) -> Option<&ChallengeSetupSpec> {
        match self {
            Self::SeparatedEvaluator(spec) => spec.validation_setup.as_ref(),
            Self::PipedStdio(_) | Self::CoexecutedBenchmark(_) => None,
        }
    }

    /// Borrow official benchmark run locator if declared.
    pub fn official_runs(&self) -> Option<&BundleRelativePath> {
        match self {
            Self::SeparatedEvaluator(spec) => spec.official_runs.as_ref(),
            Self::PipedStdio(_) | Self::CoexecutedBenchmark(_) => None,
        }
    }

    /// Borrow official benchmark setup contract if declared.
    pub fn official_evaluation_setup(&self) -> Option<&ChallengeSetupSpec> {
        match self {
            Self::SeparatedEvaluator(spec) => spec.official_evaluation_setup.as_ref(),
            Self::PipedStdio(_) | Self::CoexecutedBenchmark(_) => None,
        }
    }

    /// Return whether the official evaluator declares setup-generated official inputs.
    pub fn has_official_evaluation_setup(&self) -> bool {
        match self {
            Self::SeparatedEvaluator(spec) => spec.official_evaluation_setup.is_some(),
            Self::PipedStdio(spec) => spec.official_evaluation_setup.is_some(),
            Self::CoexecutedBenchmark(spec) => spec.official_evaluation_setup.is_some(),
        }
    }
}

/// Current separated-container evaluator topology.
#[derive(Debug, Clone, Serialize, Deserialize, schemars::JsonSchema)]
// Unknown keys are a deserialization error rather than being silently ignored.
#[serde(deny_unknown_fields)]
pub struct SeparatedEvaluatorExecutionSpec {
    // Trusted evaluator command and result-file contract for this topology.
    pub separated_evaluator: EvaluatorSpec,
    // All four `Option` fields below share one pattern: the schema marks the key as required and
    // deserialization goes through `required_nullable` (defined in `serde_helpers`, not visible
    // here) — presumably the key must be present but may be `null`; confirm in that module.

    // Locator of the public validation runs, if any.
    #[serde(deserialize_with = "required_nullable")]
    #[schemars(
        required,
        schema_with = "required_nullable_schema::<BundleRelativePath>"
    )]
    pub validation_runs: Option<BundleRelativePath>,
    // Setup command contract for public validation, if any.
    #[serde(deserialize_with = "required_nullable")]
    #[schemars(
        required,
        schema_with = "required_nullable_schema::<ChallengeSetupSpec>"
    )]
    pub validation_setup: Option<ChallengeSetupSpec>,
    // Locator of the official benchmark runs, if any. Not copied into the public spec.
    #[serde(deserialize_with = "required_nullable")]
    #[schemars(
        required,
        schema_with = "required_nullable_schema::<BundleRelativePath>"
    )]
    pub official_runs: Option<BundleRelativePath>,
    // Setup command contract for the official evaluation, if any. Not copied into the public spec.
    #[serde(deserialize_with = "required_nullable")]
    #[schemars(
        required,
        schema_with = "required_nullable_schema::<ChallengeSetupSpec>"
    )]
    pub official_evaluation_setup: Option<ChallengeSetupSpec>,
}

/// Interactive topology where a trusted interactive-evaluator exchanges stdio with one solution run.
#[derive(Debug, Clone, Serialize, Deserialize, schemars::JsonSchema)]
// Unknown keys are a deserialization error rather than being silently ignored.
#[serde(deny_unknown_fields)]
pub struct PipedStdioExecutionSpec {
    // Trusted evaluator command and result-file contract for this topology.
    pub interactive_evaluator: EvaluatorSpec,
    // Required boolean. This type places no constraint on its value.
    // NOTE(review): if it must be `true`, that is enforced elsewhere — confirm.
    pub acknowledge_stdio_protocol_framing: bool,
    // All four `Option` fields below share one pattern: the schema marks the key as required and
    // deserialization goes through `required_nullable` (defined in `serde_helpers`, not visible
    // here) — presumably the key must be present but may be `null`; confirm in that module.

    // Locator of the public validation session, if any.
    #[serde(deserialize_with = "required_nullable")]
    #[schemars(
        required,
        schema_with = "required_nullable_schema::<BundleRelativePath>"
    )]
    pub validation_session: Option<BundleRelativePath>,
    // Setup command contract for public validation, if any.
    #[serde(deserialize_with = "required_nullable")]
    #[schemars(
        required,
        schema_with = "required_nullable_schema::<PipedStdioSetupSpec>"
    )]
    pub validation_setup: Option<PipedStdioSetupSpec>,
    // Locator of the official session, if any. Not copied into the public spec.
    #[serde(deserialize_with = "required_nullable")]
    #[schemars(
        required,
        schema_with = "required_nullable_schema::<BundleRelativePath>"
    )]
    pub official_session: Option<BundleRelativePath>,
    // Setup command contract for the official evaluation, if any. Not copied into the public spec.
    #[serde(deserialize_with = "required_nullable")]
    #[schemars(
        required,
        schema_with = "required_nullable_schema::<PipedStdioSetupSpec>"
    )]
    pub official_evaluation_setup: Option<PipedStdioSetupSpec>,
}

/// Coexecuted topology where a trusted coexecuted-evaluator imports participant code in one container.
#[derive(Debug, Clone, Serialize, Deserialize, schemars::JsonSchema)]
// Unknown keys are a deserialization error rather than being silently ignored.
#[serde(deny_unknown_fields)]
pub struct CoexecutedBenchmarkExecutionSpec {
    // Trusted evaluator command and result-file contract for this topology.
    pub coexecuted_evaluator: EvaluatorSpec,
    // Required boolean. This type places no constraint on its value.
    // NOTE(review): if it must be `true`, that is enforced elsewhere — confirm.
    pub acknowledge_danger: bool,
    // Both `Option` fields below are marked required in the schema and deserialized through
    // `required_nullable` (defined in `serde_helpers`, not visible here) — presumably the key
    // must be present but may be `null`; confirm in that module.

    // Setup command contract for public validation, if any.
    #[serde(deserialize_with = "required_nullable")]
    #[schemars(
        required,
        schema_with = "required_nullable_schema::<CoexecutedBenchmarkSetupSpec>"
    )]
    pub validation_setup: Option<CoexecutedBenchmarkSetupSpec>,
    // Setup command contract for the official evaluation, if any. Not copied into the public spec.
    #[serde(deserialize_with = "required_nullable")]
    #[schemars(
        required,
        schema_with = "required_nullable_schema::<CoexecutedBenchmarkSetupSpec>"
    )]
    pub official_evaluation_setup: Option<CoexecutedBenchmarkSetupSpec>,
}

/// Public execution metadata that excludes official private benchmark locators.
#[derive(Debug, Clone, Serialize, Deserialize, schemars::JsonSchema)]
// Internally tagged with the same `mode` key and snake_case variant names as
// `ChallengeExecutionSpec`.
#[serde(tag = "mode", rename_all = "snake_case")]
pub enum PublicChallengeExecutionSpec {
    // mode = "separated_evaluator"
    SeparatedEvaluator(PublicSeparatedEvaluatorExecutionSpec),
    // mode = "piped_stdio"
    PipedStdio(PublicPipedStdioExecutionSpec),
    // mode = "coexecuted_benchmark"
    CoexecutedBenchmark(PublicCoexecutedBenchmarkExecutionSpec),
}

impl PublicChallengeExecutionSpec {
    /// Trusted evaluator command contract of whichever public topology is configured.
    ///
    /// Every variant carries exactly one [`EvaluatorSpec`], so this never fails.
    pub fn trusted_evaluator(&self) -> &EvaluatorSpec {
        match self {
            Self::CoexecutedBenchmark(coexecuted) => &coexecuted.coexecuted_evaluator,
            Self::PipedStdio(piped) => &piped.interactive_evaluator,
            Self::SeparatedEvaluator(separated) => &separated.separated_evaluator,
        }
    }
}

impl From<ChallengeExecutionSpec> for PublicChallengeExecutionSpec {
    fn from(execution: ChallengeExecutionSpec) -> Self {
        match execution {
            ChallengeExecutionSpec::SeparatedEvaluator(spec) => {
                Self::SeparatedEvaluator(PublicSeparatedEvaluatorExecutionSpec {
                    separated_evaluator: spec.separated_evaluator,
                    validation_runs: spec.validation_runs,
                    validation_setup: spec.validation_setup,
                })
            }
            ChallengeExecutionSpec::PipedStdio(spec) => {
                Self::PipedStdio(PublicPipedStdioExecutionSpec {
                    interactive_evaluator: spec.interactive_evaluator,
                    acknowledge_stdio_protocol_framing: spec.acknowledge_stdio_protocol_framing,
                    validation_session: spec.validation_session,
                    validation_setup: spec.validation_setup,
                })
            }
            ChallengeExecutionSpec::CoexecutedBenchmark(spec) => {
                Self::CoexecutedBenchmark(PublicCoexecutedBenchmarkExecutionSpec {
                    coexecuted_evaluator: spec.coexecuted_evaluator,
                    acknowledge_danger: spec.acknowledge_danger,
                    validation_setup: spec.validation_setup,
                })
            }
        }
    }
}

/// Public separated-evaluator topology metadata.
#[derive(Debug, Clone, Serialize, Deserialize, schemars::JsonSchema)]
// Unknown keys are a deserialization error rather than being silently ignored.
#[serde(deny_unknown_fields)]
pub struct PublicSeparatedEvaluatorExecutionSpec {
    // Trusted evaluator command and result-file contract.
    pub separated_evaluator: EvaluatorSpec,
    // Optional on the wire: a missing key deserializes to `None`, and `None` is omitted on output.
    #[serde(default, skip_serializing_if = "Option::is_none")]
    pub validation_runs: Option<BundleRelativePath>,
    // Optional on the wire: a missing key deserializes to `None`, and `None` is omitted on output.
    #[serde(default, skip_serializing_if = "Option::is_none")]
    pub validation_setup: Option<ChallengeSetupSpec>,
}

/// Public piped-stdio topology metadata.
#[derive(Debug, Clone, Serialize, Deserialize, schemars::JsonSchema)]
// Unknown keys are a deserialization error rather than being silently ignored.
#[serde(deny_unknown_fields)]
pub struct PublicPipedStdioExecutionSpec {
    // Trusted evaluator command and result-file contract.
    pub interactive_evaluator: EvaluatorSpec,
    // Required boolean, carried over verbatim from the full spec by the `From` conversion.
    pub acknowledge_stdio_protocol_framing: bool,
    // Optional on the wire: a missing key deserializes to `None`, and `None` is omitted on output.
    #[serde(default, skip_serializing_if = "Option::is_none")]
    pub validation_session: Option<BundleRelativePath>,
    // Optional on the wire: a missing key deserializes to `None`, and `None` is omitted on output.
    #[serde(default, skip_serializing_if = "Option::is_none")]
    pub validation_setup: Option<PipedStdioSetupSpec>,
}

/// Public coexecuted-evaluator topology metadata.
#[derive(Debug, Clone, Serialize, Deserialize, schemars::JsonSchema)]
// Unknown keys are a deserialization error rather than being silently ignored.
#[serde(deny_unknown_fields)]
pub struct PublicCoexecutedBenchmarkExecutionSpec {
    // Trusted evaluator command and result-file contract.
    pub coexecuted_evaluator: EvaluatorSpec,
    // Required boolean, carried over verbatim from the full spec by the `From` conversion.
    pub acknowledge_danger: bool,
    // Optional on the wire: a missing key deserializes to `None`, and `None` is omitted on output.
    #[serde(default, skip_serializing_if = "Option::is_none")]
    pub validation_setup: Option<CoexecutedBenchmarkSetupSpec>,
}

/// Optional separated-evaluator command that sets up generated benchmark inputs.
#[derive(Debug, Clone, Serialize, Deserialize, garde::Validate, schemars::JsonSchema)]
// Fields that carry no `#[garde(...)]` rule (here `result_runs_file`) are exempt from validation.
#[garde(allow_unvalidated)]
// Unknown keys are a deserialization error rather than being silently ignored.
#[serde(deny_unknown_fields)]
pub struct ChallengeSetupSpec {
    // Command vector: must hold at least one element, and every element is passed through the
    // crate's `trimmed_non_empty` and `no_nul` validators (both defined outside this file).
    #[garde(
        length(min = 1),
        inner(
            custom(crate::validation::trimmed_non_empty),
            custom(crate::validation::no_nul)
        )
    )]
    pub command: Vec<String>,
    /// Relative path, under the setup workspace, to the generated run manifest.
    pub result_runs_file: BundleRelativePath,
    /// Challenge-owner notes about seeds, versions, or external data provenance.
    // The key is marked required in the schema and deserialized through `required_nullable`;
    // the value is checked by `optional_trimmed_non_empty`. Both helpers live outside this file —
    // presumably `null` is accepted and a blank string is rejected; confirm there.
    #[serde(deserialize_with = "required_nullable")]
    #[schemars(required, schema_with = "required_nullable_schema::<String>")]
    #[garde(custom(crate::validation::optional_trimmed_non_empty))]
    pub reproducibility_notes: Option<String>,
}

/// Optional interactive-evaluator command that sets up one generated interactive session.
#[derive(Debug, Clone, Serialize, Deserialize, garde::Validate, schemars::JsonSchema)]
// Fields that carry no `#[garde(...)]` rule (here `result_session_file`) are exempt from
// validation.
#[garde(allow_unvalidated)]
// Unknown keys are a deserialization error rather than being silently ignored.
#[serde(deny_unknown_fields)]
pub struct PipedStdioSetupSpec {
    // Command vector: must hold at least one element, and every element is passed through the
    // crate's `trimmed_non_empty` and `no_nul` validators (both defined outside this file).
    #[garde(
        length(min = 1),
        inner(
            custom(crate::validation::trimmed_non_empty),
            custom(crate::validation::no_nul)
        )
    )]
    pub command: Vec<String>,
    /// Relative path, under the setup workspace, to the generated session manifest.
    pub result_session_file: BundleRelativePath,
    /// Challenge-owner notes about seeds, versions, or external data provenance.
    // The key is marked required in the schema and deserialized through `required_nullable`;
    // the value is checked by `optional_trimmed_non_empty`. Both helpers live outside this file —
    // presumably `null` is accepted and a blank string is rejected; confirm there.
    #[serde(deserialize_with = "required_nullable")]
    #[schemars(required, schema_with = "required_nullable_schema::<String>")]
    #[garde(custom(crate::validation::optional_trimmed_non_empty))]
    pub reproducibility_notes: Option<String>,
}

/// Optional coexecuted-evaluator command that sets up files for a coexecuted run.
#[derive(Debug, Clone, Serialize, Deserialize, garde::Validate, schemars::JsonSchema)]
// Every field here has an explicit garde rule; the attribute matches the sibling setup specs.
#[garde(allow_unvalidated)]
// Unknown keys are a deserialization error rather than being silently ignored.
#[serde(deny_unknown_fields)]
pub struct CoexecutedBenchmarkSetupSpec {
    // Command vector: must hold at least one element, and every element is passed through the
    // crate's `trimmed_non_empty` and `no_nul` validators (both defined outside this file).
    // Unlike the other setup specs, this one declares no result-manifest path.
    #[garde(
        length(min = 1),
        inner(
            custom(crate::validation::trimmed_non_empty),
            custom(crate::validation::no_nul)
        )
    )]
    pub command: Vec<String>,
    /// Challenge-owner notes about seeds, versions, or external data provenance.
    // The key is marked required in the schema and deserialized through `required_nullable`;
    // the value is checked by `optional_trimmed_non_empty`. Both helpers live outside this file —
    // presumably `null` is accepted and a blank string is rejected; confirm there.
    #[serde(deserialize_with = "required_nullable")]
    #[schemars(required, schema_with = "required_nullable_schema::<String>")]
    #[garde(custom(crate::validation::optional_trimmed_non_empty))]
    pub reproducibility_notes: Option<String>,
}

/// Challenge-owned list of evaluator-controlled solution invocations.
#[derive(Debug, Clone, Serialize, Deserialize, schemars::JsonSchema)]
// Unknown keys are a deserialization error rather than being silently ignored.
#[serde(deny_unknown_fields)]
pub struct ChallengeRunManifest {
    // The run entries, in manifest order. This type declares no minimum length and no
    // uniqueness rule for `run_name`.
    // NOTE(review): confirm whether those are checked by the code that loads the manifest.
    pub runs: Vec<ChallengeRunSpec>,
}

/// One solution invocation generated by the worker and later evaluated by the evaluator.
#[derive(Debug, Clone, Serialize, Deserialize, schemars::JsonSchema)]
// Unknown keys are a deserialization error rather than being silently ignored.
#[serde(deny_unknown_fields)]
pub struct ChallengeRunSpec {
    // Name identifying this run.
    pub run_name: RunName,
    // Which input/output interface the run uses (`stdio` or `file_system`).
    pub interface: ChallengeRunInterface,
    // Every field below is marked required in the schema and uses a custom deserializer from
    // `serde_helpers` (not visible here). Presumably the key must be present but may be `null`;
    // confirm in that module.
    // NOTE(review): nothing in this type ties `stdin_json` / `stdin_text` / `input_files` /
    // `output_files` to `interface` or makes the two stdin fields mutually exclusive — confirm
    // where that is validated.

    // Standard-input payload given as a JSON value, if any.
    #[serde(deserialize_with = "required_nullable")]
    #[schemars(
        required,
        schema_with = "required_nullable_schema::<serde_json::Value>"
    )]
    pub stdin_json: Option<serde_json::Value>,
    // Standard-input payload given as raw text, if any.
    #[serde(deserialize_with = "required_nullable")]
    #[schemars(required, schema_with = "required_nullable_schema::<String>")]
    pub stdin_text: Option<String>,
    // Input files for the run. Stored as a plain `Vec`; judging by the helper names, `null` on
    // the wire presumably maps to an empty `Vec`, an empty array is rejected, and an empty `Vec`
    // is written back as `null` — confirm in `serde_helpers`.
    #[serde(
        deserialize_with = "required_nullable_non_empty_vec",
        serialize_with = "serialize_empty_vec_as_null"
    )]
    #[schemars(
        required,
        schema_with = "required_nullable_non_empty_vec_schema::<ChallengeRunInputFile>"
    )]
    pub input_files: Vec<ChallengeRunInputFile>,
    // Output file paths for the run; same null/empty wire convention as `input_files`.
    #[serde(
        deserialize_with = "required_nullable_non_empty_vec",
        serialize_with = "serialize_empty_vec_as_null"
    )]
    #[schemars(
        required,
        schema_with = "required_nullable_non_empty_vec_schema::<RunOutputPath>"
    )]
    pub output_files: Vec<RunOutputPath>,
    // Free-form JSON object attached to the run, if any; its keys are not constrained here.
    #[serde(deserialize_with = "required_nullable")]
    #[schemars(
        required,
        schema_with = "required_nullable_schema::<serde_json::Map<String, serde_json::Value>>"
    )]
    pub metadata: Option<serde_json::Map<String, serde_json::Value>>,
}

/// Supported worker-managed solution input/output interfaces.
#[derive(Debug, Clone, Copy, PartialEq, Eq, Serialize, Deserialize, schemars::JsonSchema)]
// Variants are (de)serialized under their snake_case names.
#[serde(rename_all = "snake_case")]
pub enum ChallengeRunInterface {
    // Wire name: "stdio".
    Stdio,
    // Wire name: "file_system".
    FileSystem,
}

/// One input file materialized into `AGENTICS_INPUT_DIR` for a file-mode run.
#[derive(Debug, Clone, Serialize, Deserialize, schemars::JsonSchema)]
// Unknown keys are a deserialization error rather than being silently ignored.
#[serde(deny_unknown_fields)]
pub struct ChallengeRunInputFile {
    // Destination path of the file, typed as a run-input path.
    pub path: RunInputPath,
    // The three fields below are each optional on the wire: a missing key deserializes to `None`,
    // and `None` is omitted on output.
    // NOTE(review): they look like alternative content sources, but nothing in this type requires
    // exactly one of them to be set — confirm where that is validated.

    // Bundle-relative path to take the content from, if any.
    #[serde(default, skip_serializing_if = "Option::is_none")]
    pub source_path: Option<BundleRelativePath>,
    // Inline text content, if any.
    #[serde(default, skip_serializing_if = "Option::is_none")]
    pub content: Option<String>,
    // Inline content given as a JSON value, if any.
    #[serde(default, skip_serializing_if = "Option::is_none")]
    pub content_json: Option<serde_json::Value>,
}

/// Challenge-owned single interactive session manifest for `piped_stdio`.
#[derive(Debug, Clone, Serialize, Deserialize, schemars::JsonSchema)]
// Unknown keys are a deserialization error rather than being silently ignored.
#[serde(deny_unknown_fields)]
pub struct PipedStdioSessionManifest {
    // Name identifying the session; reuses the `RunName` type.
    pub session_name: RunName,
    // Input files for the session. Stored as a plain `Vec`; judging by the helper names, `null`
    // on the wire presumably maps to an empty `Vec`, an empty array is rejected, and an empty
    // `Vec` is written back as `null` — confirm in `serde_helpers`.
    #[serde(
        deserialize_with = "required_nullable_non_empty_vec",
        serialize_with = "serialize_empty_vec_as_null"
    )]
    #[schemars(
        required,
        schema_with = "required_nullable_non_empty_vec_schema::<ChallengeRunInputFile>"
    )]
    pub input_files: Vec<ChallengeRunInputFile>,
    // Free-form JSON object attached to the session, if any. The key is marked required in the
    // schema and deserialized through `required_nullable` — presumably present-but-nullable.
    #[serde(deserialize_with = "required_nullable")]
    #[schemars(
        required,
        schema_with = "required_nullable_schema::<serde_json::Map<String, serde_json::Value>>"
    )]
    pub metadata: Option<serde_json::Map<String, serde_json::Value>>,
}