// harn_vm/stdlib.rs

1//! Standard library builtins for the Harn VM.
2
3mod agent_sessions;
4pub mod agent_state;
5pub(crate) mod agents;
6mod agents_daemon;
7pub(crate) mod assemble;
8pub mod asset_paths;
9mod bytes;
10mod calendar;
11mod channel_guardrails;
12mod channels;
13pub(crate) mod clock;
14mod collections;
15mod command_policy;
16mod compression;
17mod concurrency;
18mod connectors;
19mod cookies;
20mod crypto;
21mod csv;
22mod datetime;
23mod durable_step;
24mod event_log;
25pub(crate) mod files;
26mod flow;
27mod fs;
28mod git;
29pub(crate) mod harn_entry;
30pub(crate) mod hitl;
31mod hitl_read;
32pub mod host;
33pub(crate) mod io;
34mod iter;
35pub(crate) mod json;
36mod json_query;
37pub(crate) mod json_stream;
38mod junit;
39mod lifecycle_receipts;
40mod logging;
41pub mod long_running;
42mod math;
43pub(crate) mod memory;
44mod monitors;
45mod multipart;
46mod net_policy;
47mod oauth_dynreg;
48mod oauth_storage;
49mod observability;
50mod options;
51mod path;
52pub(crate) mod path_scope_guard;
53pub(crate) mod pool;
54mod postgres;
55pub mod process;
56mod project;
57mod project_catalog;
58mod project_enrich;
59mod regex;
60pub(crate) mod registration;
61mod review;
62mod runtime_scope;
63pub(crate) mod sandbox;
64pub mod secret_scan;
65mod sets;
66pub(crate) mod shapes;
67mod skills;
68mod strings;
69pub(crate) mod supervisor;
70pub mod template;
71mod testbench;
72mod testing;
73mod timing;
74pub mod token_redaction;
75pub(crate) mod tool_hooks;
76pub(crate) mod tools;
77pub mod tracing;
78mod transcript_compact;
79pub(crate) mod transcript_project;
80mod triggers_stdlib;
81mod tui;
82mod types;
83mod url_parse;
84mod vision;
85pub(crate) mod waitpoint;
86mod waitpoints;
87mod web;
88pub mod workflow_messages;
89
90use crate::http::register_http_builtins;
91use crate::llm::{register_deferred_llm_builtins, register_llm_builtins};
92use crate::mcp::register_mcp_builtins;
93use crate::mcp_server::register_mcp_server_builtins;
94use crate::vm::Vm;
95
96pub(crate) use crate::schema::{json_to_vm_value, schema_result_value};
97pub(crate) fn set_thread_source_dir(dir: &std::path::Path) {
98    process::set_thread_source_dir(dir);
99}
100
101/// Register core builtins: pure/deterministic, no I/O.
102pub fn register_core_stdlib(vm: &mut Vm) {
103    crate::runtime_context::register_runtime_context_builtins(vm);
104    types::register_type_builtins(vm);
105    math::register_math_builtins(vm);
106    strings::register_string_builtins(vm);
107    json::register_json_builtins(vm);
108    json_stream::register_json_stream_builtins(vm);
109    datetime::register_datetime_builtins(vm);
110    calendar::register_calendar_builtins(vm);
111    regex::register_regex_builtins(vm);
112    bytes::register_bytes_builtins(vm);
113    compression::register_compression_builtins(vm);
114    command_policy::register_command_policy_builtins(vm);
115    runtime_scope::register_runtime_scope_builtins(vm);
116    crypto::register_crypto_builtins(vm);
117    csv::register_csv_builtins(vm);
118    junit::register_junit_builtins(vm);
119    multipart::register_multipart_builtins(vm);
120    url_parse::register_url_builtins(vm);
121    web::register_web_builtins(vm);
122    cookies::register_cookie_builtins(vm);
123    path::register_path_helper_builtins(vm);
124    sets::register_set_builtins(vm);
125    collections::register_collection_builtins(vm);
126    iter::register_iter_builtins(vm);
127    event_log::register_event_log_builtins(vm);
128    durable_step::register_durable_step_builtins(vm);
129    channels::register_channel_builtins(vm);
130    channel_guardrails::register_channel_guardrail_builtins(vm);
131    shapes::register_shape_builtins(vm);
132    testing::register_testing_builtins(vm);
133    flow::register_flow_builtins(vm);
134    lifecycle_receipts::register_lifecycle_receipt_builtins(vm);
135    net_policy::register_net_policy_builtins(vm);
136}
137
138/// Register I/O builtins (requires OS access).
139pub fn register_io_stdlib(vm: &mut Vm) {
140    io::register_io_builtins(vm);
141    host::register_host_builtins(vm);
142    fs::register_fs_builtins(vm);
143    files::register_file_builtins(vm);
144    git::register_git_builtins(vm);
145    vision::register_vision_builtins(vm);
146    agent_state::register_agent_state_builtins(vm);
147    memory::register_memory_builtins(vm);
148    process::register_process_builtins(vm);
149    process::register_path_builtins(vm);
150    sandbox::register_sandbox_builtins(vm);
151    // Clock builtins overlay process::timestamp/elapsed so they honor
152    // mock_time / advance_time. Register AFTER process to take precedence.
153    clock::register_clock_builtins(vm);
154    testbench::register_testbench_builtins(vm);
155    project::register_project_builtins(vm);
156    tracing::register_tracing_builtins(vm);
157    observability::register_observability_builtins(vm);
158    timing::register_timing_builtins(vm);
159    tui::register_tui_builtins(vm);
160}
161
162fn register_agent_stdlib_before_llm(vm: &mut Vm) {
163    concurrency::register_concurrency_builtins(vm);
164    connectors::register_connector_builtins(vm);
165    review::register_review_builtins(vm);
166    secret_scan::register_secret_scan_builtins(vm);
167    tools::register_tool_builtins(vm);
168    tool_hooks::register_tool_hooks_builtins(vm);
169    crate::composition::register_composition_builtins(vm);
170    skills::register_skill_builtins(vm);
171    agents_daemon::register_daemon_builtins(vm);
172    triggers_stdlib::register_trigger_builtins(vm);
173    postgres::register_postgres_builtins(vm);
174    waitpoints::register_waitpoint_builtins(vm);
175    monitors::register_monitor_builtins(vm);
176    hitl::register_hitl_builtins(vm);
177    hitl_read::register_hitl_read_builtins(vm);
178    waitpoint::register_waitpoint_builtins(vm);
179    supervisor::register_supervisor_builtins(vm);
180    agents::register_agent_builtins(vm);
181    pool::register_pool_builtins(vm);
182    oauth_storage::register_oauth_storage_builtins(vm);
183    oauth_dynreg::register_oauth_dynreg_builtins(vm);
184    token_redaction::register_token_redaction_builtins(vm);
185    agent_sessions::register_agent_session_builtins(vm);
186    path_scope_guard::register_path_scope_guard_builtins(vm);
187    workflow_messages::register_workflow_message_builtins(vm);
188    transcript_compact::register_transcript_compaction_builtins(vm);
189    transcript_project::register_transcript_projection_builtins(vm);
190    assemble::register_assemble_context_builtin(vm);
191    crate::egress::register_egress_builtins(vm);
192    register_http_builtins(vm);
193}
194
195fn register_agent_stdlib_after_llm(vm: &mut Vm) {
196    register_mcp_builtins(vm);
197    register_mcp_server_builtins(vm);
198    crate::step_runtime::register_step_builtins(vm);
199}
200
201/// Register agent builtins (requires network access and async runtime).
202pub fn register_agent_stdlib(vm: &mut Vm) {
203    register_agent_stdlib_before_llm(vm);
204    register_llm_builtins(vm);
205    register_agent_stdlib_after_llm(vm);
206}
207
208fn register_agent_stdlib_with_deferred_llm(vm: &mut Vm) {
209    register_agent_stdlib_before_llm(vm);
210    register_deferred_llm_builtins(vm);
211    register_agent_stdlib_after_llm(vm);
212}
213
214/// Register all standard builtins on a VM (core + io + agent).
215pub fn register_vm_stdlib(vm: &mut Vm) {
216    register_core_stdlib(vm);
217    register_io_stdlib(vm);
218    register_agent_stdlib(vm);
219}
220
221/// Register the stdlib shape used by latency-sensitive CLI execution.
222pub fn register_vm_stdlib_with_deferred_llm(vm: &mut Vm) {
223    register_core_stdlib(vm);
224    register_io_stdlib(vm);
225    register_agent_stdlib_with_deferred_llm(vm);
226}
227
228pub(crate) fn rebind_execution_state_builtins(vm: &mut Vm) {
229    concurrency::register_concurrency_builtins(vm);
230}
231
232fn stdlib_probe_vm() -> Vm {
233    let mut vm = Vm::new();
234    register_vm_stdlib(&mut vm);
235    // Name-only/metadata introspection never accesses this path, but passing
236    // a real per-platform temp dir keeps registration logic honest if a
237    // callee someday validates its parent.
238    let tmp = std::env::temp_dir();
239    crate::store::register_store_builtins(&mut vm, &tmp);
240    crate::checkpoint::register_checkpoint_builtins(&mut vm, &tmp, "default");
241    crate::metadata::register_metadata_builtins(&mut vm, &tmp);
242    crate::metadata::register_scan_builtins(&mut vm);
243    vm
244}
245
246/// Return the canonical list of all stdlib builtin names. Used by
247/// harn-lint and harn-lsp to avoid hardcoded duplicate lists.
248pub fn stdlib_builtin_names() -> Vec<String> {
249    let vm = stdlib_probe_vm();
250    let mut names = vm.builtin_names();
251    // Special opcodes/keywords, not registered builtins, but linter
252    // should recognize them as valid function calls.
253    for extra in [
254        "spawn",
255        "await",
256        "cancel",
257        "cancel_graceful",
258        "__signal_interrupted",
259        "__signal_off_interrupt",
260        "__signal_on_interrupt",
261        "__signal_raise",
262        "is_cancelled",
263    ] {
264        names.push(extra.to_string());
265    }
266    names
267}
268
269/// Return discoverable metadata for registered stdlib builtins.
270pub fn stdlib_builtin_metadata() -> Vec<crate::vm::VmBuiltinMetadata> {
271    stdlib_probe_vm().builtin_metadata()
272}
273
274/// Reset thread-local stdlib state. Call between test runs.
275///
276/// Note: `long_running::reset_state()` is intentionally NOT called here
277/// because that store is process-global, not thread-local. Wiping it
278/// from a per-test reset hook lets one test cancel another test's
279/// in-flight worker thread (and lose its `agent_inbox::push`
280/// notification), which surfaces as `walk_dir_long_running` /
281/// `glob_long_running` timing out under parallel test load. The two
282/// call sites that genuinely need a clean handle store —
283/// `stdlib::fs::tests::{walk_dir_long_running,glob_long_running}` — call
284/// `long_running::reset_state()` explicitly while holding
285/// `LONG_RUNNING_TEST_LOCK`.
286pub fn reset_stdlib_state() {
287    logging::reset_logging_state();
288    process::reset_process_state();
289    clock::reset_clock_state();
290    io::reset_io_state();
291    sandbox::reset_sandbox_state();
292    fs::reset_fs_state();
293    json::reset_json_state();
294    json_stream::reset_json_stream_state();
295    host::reset_host_state();
296    observability::reset_observability_state();
297    timing::reset_timing_state();
298    durable_step::reset_durable_step_state();
299    crate::egress::reset_egress_policy_for_host();
300    hitl::reset_hitl_state();
301    crate::http::reset_http_state();
302    monitors::reset_monitor_state();
303    waitpoints::reset_waitpoint_state();
304    waitpoint::reset_waitpoint_state();
305    triggers_stdlib::reset_auto_resume_timeouts();
306    agents::reset_agent_worker_state();
307    pool::reset_pool_state();
308    postgres::reset_postgres_state();
309    supervisor::reset_supervisor_state();
310    agents::records::reset_eval_metrics();
311    agents::records::reset_friction_events();
312    tools::clear_current_tool_registry();
313    tools::clear_tool_synthesis_cache();
314    vision::reset_vision_state();
315    crate::skills::clear_current_skill_registry();
316    template::reset_prompt_registry();
317    crate::triggers::clear_webhook_intake_state();
318    crate::llm::cache::reset_in_process_cache_state();
319}