Skip to main content

workflow_graph_shared/
yaml.rs

1//! YAML workflow definition parser.
2//!
3//! Workflow files use a GitHub Actions-inspired format:
4//!
5//! ```yaml
6//! name: CI Pipeline
7//! on: push
8//!
9//! jobs:
10//!   lint:
11//!     name: Lint
12//!     run: cargo clippy --all-targets
13//!
14//!   test:
15//!     name: Unit Tests
16//!     run: cargo test
17//!
18//!   build:
19//!     name: Build
20//!     needs: [lint, test]
21//!     run: cargo build --release
22//!
23//!   deploy:
24//!     name: Deploy
25//!     needs: [build]
26//!     steps:
27//!       - name: Deploy DB
28//!         run: ./scripts/migrate.sh
29//!       - name: Deploy App
30//!         run: ./scripts/deploy.sh
31//! ```
32
33use indexmap::IndexMap;
34use serde::Deserialize;
35
36use crate::{Job, JobStatus, Workflow};
37
/// Top-level workflow definition as written in a workflow file.
///
/// Produced by [`WorkflowDef::from_yaml`] / [`WorkflowDef::from_json`] and
/// converted to the runtime model by [`WorkflowDef::into_workflow`].
#[derive(Debug, Deserialize)]
pub struct WorkflowDef {
    /// Workflow name (required).
    pub name: String,
    /// Trigger specification, read from the `on` key (required).
    #[serde(rename = "on")]
    pub trigger: TriggerDef,
    /// Workflow-wide environment variables; empty when the key is absent.
    /// They are exported ahead of each job's own `env` when a command is built.
    #[serde(default)]
    pub env: IndexMap<String, String>,
    /// Jobs keyed by job ID (required; may be an empty map).
    pub jobs: IndexMap<String, JobDef>,
}
48
/// Trigger specification: a single event name, a list of event names, or a
/// mapping from event name to arbitrary configuration.
///
/// Deserialized untagged, so the variants are tried in declaration order and
/// the first one that matches the input shape wins.
#[derive(Debug, Deserialize)]
#[serde(untagged)]
pub enum TriggerDef {
    /// A bare string, e.g. `on: push`.
    Simple(String),
    /// A sequence of strings, e.g. `on: [push, pull_request]`.
    List(Vec<String>),
    /// A mapping keyed by event name. The values are kept as raw YAML values
    /// and are not interpreted in this file; only the keys are used by
    /// `display`.
    Structured(IndexMap<String, serde_yaml::Value>),
}
57
58impl TriggerDef {
59    pub fn display(&self) -> String {
60        match self {
61            TriggerDef::Simple(s) => format!("on: {s}"),
62            TriggerDef::List(v) => format!("on: [{}]", v.join(", ")),
63            TriggerDef::Structured(m) => {
64                let keys: Vec<&str> = m.keys().map(|k| k.as_str()).collect();
65                format!("on: [{}]", keys.join(", "))
66            }
67        }
68    }
69}
70
/// A single job definition in the workflow YAML, keyed by job ID under `jobs`.
///
/// A job supplies its command either as one `run` string or as a list of
/// `steps`; `build_command` rejects a job that has neither.
#[derive(Debug, Deserialize)]
pub struct JobDef {
    /// Display name (defaults to the job key if not set).
    pub name: Option<String>,
    /// Job dependencies — other job IDs that must succeed first.
    /// Accepts a single string or a list; absent means no dependencies.
    #[serde(default)]
    pub needs: Needs,
    /// Shell command to run (simple single-command job).
    /// Not used when `steps` is non-empty.
    pub run: Option<String>,
    /// Multi-step job (used instead of `run`). Empty when the key is absent.
    #[serde(default)]
    pub steps: Vec<StepDef>,
    /// Per-job environment variables, exported after the workflow-level ones.
    #[serde(default)]
    pub env: IndexMap<String, String>,
    /// Timeout in seconds.
    /// NOTE(review): parsed but not read by `into_workflow` or `build_command`
    /// in this file — confirm whether it is consumed elsewhere.
    pub timeout: Option<u64>,
    /// Condition for running this job (expression string), read from `if`.
    /// NOTE(review): parsed but not read by `into_workflow` or `build_command`
    /// in this file — confirm whether it is consumed elsewhere.
    #[serde(rename = "if")]
    pub condition: Option<String>,
    /// Worker labels required to execute this job.
    #[serde(default)]
    pub labels: Vec<String>,
    /// Maximum number of retries on failure (default 0).
    #[serde(default)]
    pub retries: u32,
}
99
/// Job dependencies: none, a single job ID, or a list of job IDs.
///
/// Deserialized untagged, so the variants are tried in declaration order.
/// `None` is also the `Default`, which is what a job gets when `needs` is
/// omitted.
#[derive(Debug, Default, Deserialize)]
#[serde(untagged)]
pub enum Needs {
    /// No dependencies.
    #[default]
    None,
    /// One dependency written as a bare string, e.g. `needs: build`.
    Single(String),
    /// Several dependencies written as a list, e.g. `needs: [lint, test]`.
    List(Vec<String>),
}
109
110impl Needs {
111    pub fn to_vec(&self) -> Vec<String> {
112        match self {
113            Needs::None => vec![],
114            Needs::Single(s) => vec![s.clone()],
115            Needs::List(v) => v.clone(),
116        }
117    }
118}
119
/// A single step within a job.
///
/// When a job's command is built, steps without a `run` are skipped; every
/// other step contributes its `env` exports, an `echo` banner, and its command.
#[derive(Debug, Deserialize)]
pub struct StepDef {
    /// Optional identifier; used as the banner label when `name` is not set.
    pub id: Option<String>,
    /// Optional display name; preferred over `id` for the banner label.
    pub name: Option<String>,
    /// Shell command for this step.
    pub run: Option<String>,
    /// Condition expression, read from `if`.
    /// NOTE(review): parsed but not read by `build_command` in this file —
    /// confirm whether it is consumed elsewhere.
    #[serde(rename = "if")]
    pub condition: Option<String>,
    /// Per-step environment variables; empty when the key is absent.
    #[serde(default)]
    pub env: IndexMap<String, String>,
}
131
132impl WorkflowDef {
133    /// Parse a YAML string into a workflow definition.
134    pub fn from_yaml(yaml: &str) -> Result<Self, String> {
135        serde_yaml::from_str(yaml).map_err(|e| format!("YAML parse error: {e}"))
136    }
137
138    /// Parse a JSON string into a workflow definition.
139    pub fn from_json(json: &str) -> Result<Self, String> {
140        serde_json::from_str(json).map_err(|e| format!("JSON parse error: {e}"))
141    }
142
143    /// Auto-detect format and parse. Tries JSON first (stricter), falls back to YAML.
144    pub fn parse(input: &str) -> Result<Self, String> {
145        let trimmed = input.trim_start();
146        if trimmed.starts_with('{') {
147            Self::from_json(input)
148        } else {
149            Self::from_yaml(input)
150        }
151    }
152
153    /// Auto-detect format based on file extension.
154    pub fn from_file_contents(contents: &str, filename: &str) -> Result<Self, String> {
155        if filename.ends_with(".json") {
156            Self::from_json(contents)
157        } else if filename.ends_with(".yml") || filename.ends_with(".yaml") {
158            Self::from_yaml(contents)
159        } else {
160            Self::parse(contents)
161        }
162    }
163
164    /// Convert to the runtime `Workflow` model.
165    ///
166    /// For jobs with `steps`, the steps are joined into a single shell script
167    /// separated by `&&`. For jobs with `run`, that command is used directly.
168    pub fn into_workflow(self, id: &str) -> Result<Workflow, String> {
169        let trigger = self.trigger.display();
170        let mut jobs = Vec::with_capacity(self.jobs.len());
171
172        for (job_id, job_def) in &self.jobs {
173            let name = job_def.name.clone().unwrap_or_else(|| job_id.clone());
174
175            let command = build_command(job_def, &self.env)?;
176            let depends_on = job_def.needs.to_vec();
177
178            // Validate dependencies exist
179            for dep in &depends_on {
180                if !self.jobs.contains_key(dep) {
181                    return Err(format!(
182                        "Job '{job_id}' depends on '{dep}', which doesn't exist"
183                    ));
184                }
185            }
186
187            jobs.push(Job {
188                id: job_id.clone(),
189                name,
190                status: JobStatus::Queued,
191                command,
192                duration_secs: None,
193                started_at: None,
194                depends_on,
195                output: None,
196                required_labels: job_def.labels.clone(),
197                max_retries: job_def.retries,
198                attempt: 0,
199            });
200        }
201
202        Ok(Workflow {
203            id: id.to_string(),
204            name: self.name,
205            trigger,
206            jobs,
207        })
208    }
209}
210
211/// Build the shell command for a job, combining env vars and steps/run.
212fn build_command(job: &JobDef, global_env: &IndexMap<String, String>) -> Result<String, String> {
213    // Collect env var exports
214    let mut env_exports = Vec::new();
215    for (k, v) in global_env {
216        env_exports.push(format!("export {k}={}", shell_quote(v)));
217    }
218    for (k, v) in &job.env {
219        env_exports.push(format!("export {k}={}", shell_quote(v)));
220    }
221
222    let commands = if !job.steps.is_empty() {
223        // Multi-step: join step commands
224        let step_cmds: Result<Vec<String>, String> = job
225            .steps
226            .iter()
227            .enumerate()
228            .filter_map(|(i, step)| {
229                step.run.as_ref().map(|cmd| {
230                    let mut parts = Vec::new();
231                    // Per-step env
232                    for (k, v) in &step.env {
233                        parts.push(format!("export {k}={}", shell_quote(v)));
234                    }
235                    let default_label = format!("step {}", i + 1);
236                    let label = step
237                        .name
238                        .as_deref()
239                        .or(step.id.as_deref())
240                        .unwrap_or(&default_label);
241                    parts.push(format!("echo '=== {label} ==='"));
242                    parts.push(cmd.trim().to_string());
243                    Ok(parts.join(" && "))
244                })
245            })
246            .collect();
247        step_cmds?
248    } else if let Some(run) = &job.run {
249        vec![run.trim().to_string()]
250    } else {
251        return Err("Job must have either 'run' or 'steps'".to_string());
252    };
253
254    let mut full = env_exports;
255    full.extend(commands);
256    Ok(full.join(" && "))
257}
258
/// Wrap `s` in single quotes so a POSIX shell treats it as one literal word.
///
/// A single quote cannot appear inside a single-quoted string, so each one is
/// emitted as `'\''`: close the quote, add a backslash-escaped quote, reopen.
fn shell_quote(s: &str) -> String {
    let mut quoted = String::with_capacity(s.len() + 2);
    quoted.push('\'');
    for ch in s.chars() {
        if ch == '\'' {
            quoted.push_str("'\\''");
        } else {
            quoted.push(ch);
        }
    }
    quoted.push('\'');
    quoted
}
262
#[cfg(test)]
mod tests {
    use super::*;

    /// Parse `yaml` and run the conversion, returning the raw result so that
    /// error-path tests can inspect it. Panics if the YAML itself is invalid.
    fn convert(yaml: &str, id: &str) -> Result<Workflow, String> {
        WorkflowDef::from_yaml(yaml).unwrap().into_workflow(id)
    }

    /// Parse and convert `yaml`, panicking on any failure.
    fn load(yaml: &str, id: &str) -> Workflow {
        convert(yaml, id).unwrap()
    }

    #[test]
    fn parse_simple_workflow() {
        let wf = load(
            r#"
name: CI
on: push

jobs:
  lint:
    name: Lint
    run: cargo clippy

  test:
    name: Test
    run: cargo test

  build:
    name: Build
    needs: [lint, test]
    run: cargo build --release
"#,
            "ci-1",
        );

        assert_eq!(wf.name, "CI");
        assert_eq!(wf.trigger, "on: push");
        assert_eq!(wf.jobs.len(), 3);
        // Jobs keep file order, so `build` is the third entry.
        assert_eq!(wf.jobs[2].depends_on, vec!["lint", "test"]);
    }

    #[test]
    fn parse_steps_workflow() {
        let wf = load(
            r#"
name: Deploy
on: push

jobs:
  deploy:
    name: Deploy All
    steps:
      - name: Migrate DB
        run: ./migrate.sh
      - name: Deploy App
        run: ./deploy.sh
"#,
            "deploy-1",
        );

        assert_eq!(wf.jobs.len(), 1);
        let command = &wf.jobs[0].command;
        // The step name shows up in the banner, the script in the command.
        assert!(command.contains("Migrate DB"));
        assert!(command.contains("./deploy.sh"));
    }

    #[test]
    fn invalid_dependency_errors() {
        let err = convert(
            r#"
name: Bad
on: push

jobs:
  build:
    needs: [nonexistent]
    run: echo hi
"#,
            "bad-1",
        )
        .unwrap_err();

        assert!(err.contains("nonexistent"));
    }

    #[test]
    fn job_without_run_or_steps_errors() {
        let err = convert(
            r#"
name: Bad
on: push

jobs:
  empty:
    name: Empty Job
"#,
            "bad-2",
        )
        .unwrap_err();

        assert!(err.contains("must have either 'run' or 'steps'"));
    }

    #[test]
    fn empty_jobs_map() {
        let wf = load(
            r#"
name: Empty
on: push

jobs: {}
"#,
            "empty-1",
        );

        assert_eq!(wf.jobs.len(), 0);
    }

    #[test]
    fn single_string_dependency() {
        let wf = load(
            r#"
name: Single Dep
on: push

jobs:
  a:
    run: echo a
  b:
    needs: a
    run: echo b
"#,
            "single-1",
        );

        assert_eq!(wf.jobs[1].depends_on, vec!["a"]);
    }

    #[test]
    fn special_characters_in_job_names() {
        let wf = load(
            r#"
name: Special Chars
on: push

jobs:
  build-linux_x86:
    name: "Build (Linux x86_64)"
    run: echo "building"
"#,
            "special-1",
        );

        let job = &wf.jobs[0];
        assert_eq!(job.id, "build-linux_x86");
        assert_eq!(job.name, "Build (Linux x86_64)");
    }

    #[test]
    fn labels_and_retries_parsed() {
        let wf = load(
            r#"
name: Config
on: push

jobs:
  deploy:
    name: Deploy
    run: ./deploy.sh
    labels: [linux, aws]
    retries: 3
"#,
            "config-1",
        );

        let job = &wf.jobs[0];
        assert_eq!(job.required_labels, vec!["linux", "aws"]);
        assert_eq!(job.max_retries, 3);
    }

    #[test]
    fn env_vars_in_command() {
        let wf = load(
            r#"
name: Env
on: push

env:
  GLOBAL: "value"

jobs:
  test:
    run: echo test
    env:
      LOCAL: "local_value"
"#,
            "env-1",
        );

        // Both the workflow-level and the job-level variable are exported.
        let command = &wf.jobs[0].command;
        assert!(command.contains("export GLOBAL="));
        assert!(command.contains("export LOCAL="));
    }

    #[test]
    fn json_format_parsing() {
        let json = r#"{
            "name": "JSON Workflow",
            "on": "push",
            "jobs": {
                "test": {
                    "run": "echo test"
                }
            }
        }"#;
        let wf = WorkflowDef::from_json(json)
            .unwrap()
            .into_workflow("json-1")
            .unwrap();

        assert_eq!(wf.name, "JSON Workflow");
        assert_eq!(wf.jobs.len(), 1);
    }

    #[test]
    fn malformed_yaml_returns_error() {
        let parsed = WorkflowDef::from_yaml("this is not valid yaml: [[[");
        assert!(parsed.is_err());
    }

    #[test]
    fn shell_quote_handles_single_quotes() {
        // An embedded quote is closed, escaped and reopened.
        assert_eq!(shell_quote("it's a test"), "'it'\\''s a test'");
    }
}