swink-agent-eval 0.9.0

Evaluation framework for swink-agent: trajectory tracing, golden path verification, and cost governance
Documentation
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
# pre-commit configuration that runs the swink-eval smoke suite locally.
#
# Both hooks use `language: system`, so pre-commit does not build an isolated
# environment for them: the `swink-eval` executable (and `bash` for the gate
# hook) must already be available on PATH.
#
# Stage names use the `pre-commit` / `pre-push` spelling introduced in
# pre-commit 3.2.0; the legacy `commit` / `push` aliases are deprecated.
repos:
  - repo: local
    hooks:
      # Runs the smoke eval set and prints the console report.
      - id: swink-eval-smoke
        name: swink-eval smoke suite
        entry: swink-eval run --set eval-sets/smoke.yaml --reporter console
        language: system
        # The suite is selected by --set, so no file names are appended.
        pass_filenames: false
        stages: [pre-commit, pre-push]

      # Runs the smoke eval set again, writes the result as JSON into a
      # private temporary directory, and hands that file to `swink-eval gate`
      # together with the local gate configuration. Because this hook only
      # runs at the pre-push stage, a non-zero exit from either command
      # blocks the push (not the commit).
      - id: swink-eval-gate
        name: swink-eval gate (local thresholds)
        # The temporary directory comes from mktemp rather than a fixed
        # /tmp path, so concurrent runs cannot clobber each other's result
        # file; the EXIT trap removes it whether the gate passes or fails.
        # stdout of the `run` step is discarded so only the gate's own
        # output is shown.
        entry: |
          bash -c '
          set -euo pipefail
          tmp="$(mktemp -d "${TMPDIR:-/tmp}/swink-eval.XXXXXX")"
          cleanup() { rm -rf -- "$tmp"; }
          trap cleanup EXIT
          result="$tmp/swink-eval.json"
          swink-eval run --set eval-sets/smoke.yaml --out "$result" --reporter console >/dev/null
          swink-eval gate --result "$result" --gate-config .github/eval/local-gate.json
          '
        language: system
        pass_filenames: false
        stages: [pre-push]