Skip to main content

harn_vm/
stdlib.rs

1//! Standard library builtins for the Harn VM.
2
3mod agent_sessions;
4pub mod agent_state;
5mod agents;
6mod agents_daemon;
7pub(crate) mod assemble;
8pub mod asset_paths;
9mod bytes;
10mod clock;
11mod collections;
12mod command_policy;
13mod compression;
14mod concurrency;
15mod connectors;
16mod cookies;
17mod crypto;
18mod csv;
19mod datetime;
20mod event_log;
21pub(crate) mod files;
22mod flow;
23mod fs;
24mod git;
25pub(crate) mod harn_entry;
26pub(crate) mod hitl;
27mod hitl_read;
28pub mod host;
29pub(crate) mod io;
30mod iter;
31pub(crate) mod json;
32mod json_query;
33mod junit;
34mod logging;
35pub mod long_running;
36mod math;
37mod memory;
38mod monitors;
39mod multipart;
40mod path;
41mod postgres;
42pub mod process;
43mod project;
44mod project_catalog;
45mod project_enrich;
46mod regex;
47pub(crate) mod registration;
48mod review;
49mod runtime_scope;
50pub(crate) mod sandbox;
51pub mod secret_scan;
52mod sets;
53pub(crate) mod shapes;
54mod skills;
55mod strings;
56pub(crate) mod supervisor;
57pub mod template;
58mod testing;
59pub(crate) mod tools;
60pub mod tracing;
61mod transcript_compact;
62mod triggers_stdlib;
63mod types;
64mod url_parse;
65mod vision;
66pub(crate) mod waitpoint;
67mod waitpoints;
68pub mod workflow_messages;
69
70use crate::http::register_http_builtins;
71use crate::llm::register_llm_builtins;
72use crate::mcp::register_mcp_builtins;
73use crate::mcp_server::register_mcp_server_builtins;
74use crate::vm::Vm;
75
76pub(crate) use crate::schema::{json_to_vm_value, schema_result_value};
77pub(crate) fn set_thread_source_dir(dir: &std::path::Path) {
78    process::set_thread_source_dir(dir);
79}
80
81/// Register core builtins: pure/deterministic, no I/O.
82pub fn register_core_stdlib(vm: &mut Vm) {
83    crate::runtime_context::register_runtime_context_builtins(vm);
84    types::register_type_builtins(vm);
85    math::register_math_builtins(vm);
86    strings::register_string_builtins(vm);
87    json::register_json_builtins(vm);
88    datetime::register_datetime_builtins(vm);
89    regex::register_regex_builtins(vm);
90    bytes::register_bytes_builtins(vm);
91    compression::register_compression_builtins(vm);
92    command_policy::register_command_policy_builtins(vm);
93    runtime_scope::register_runtime_scope_builtins(vm);
94    crypto::register_crypto_builtins(vm);
95    csv::register_csv_builtins(vm);
96    junit::register_junit_builtins(vm);
97    multipart::register_multipart_builtins(vm);
98    url_parse::register_url_builtins(vm);
99    cookies::register_cookie_builtins(vm);
100    path::register_path_helper_builtins(vm);
101    sets::register_set_builtins(vm);
102    collections::register_collection_builtins(vm);
103    iter::register_iter_builtins(vm);
104    event_log::register_event_log_builtins(vm);
105    shapes::register_shape_builtins(vm);
106    testing::register_testing_builtins(vm);
107    flow::register_flow_builtins(vm);
108}
109
110/// Register I/O builtins (requires OS access).
111pub fn register_io_stdlib(vm: &mut Vm) {
112    io::register_io_builtins(vm);
113    host::register_host_builtins(vm);
114    fs::register_fs_builtins(vm);
115    files::register_file_builtins(vm);
116    git::register_git_builtins(vm);
117    vision::register_vision_builtins(vm);
118    agent_state::register_agent_state_builtins(vm);
119    memory::register_memory_builtins(vm);
120    process::register_process_builtins(vm);
121    process::register_path_builtins(vm);
122    // Clock builtins overlay process::timestamp/elapsed so they honor
123    // mock_time / advance_time. Register AFTER process to take precedence.
124    clock::register_clock_builtins(vm);
125    project::register_project_builtins(vm);
126    tracing::register_tracing_builtins(vm);
127}
128
129/// Register agent builtins (requires network access and async runtime).
130pub fn register_agent_stdlib(vm: &mut Vm) {
131    concurrency::register_concurrency_builtins(vm);
132    connectors::register_connector_builtins(vm);
133    review::register_review_builtins(vm);
134    secret_scan::register_secret_scan_builtins(vm);
135    tools::register_tool_builtins(vm);
136    skills::register_skill_builtins(vm);
137    agents_daemon::register_daemon_builtins(vm);
138    triggers_stdlib::register_trigger_builtins(vm);
139    postgres::register_postgres_builtins(vm);
140    waitpoints::register_waitpoint_builtins(vm);
141    monitors::register_monitor_builtins(vm);
142    hitl::register_hitl_builtins(vm);
143    hitl_read::register_hitl_read_builtins(vm);
144    waitpoint::register_waitpoint_builtins(vm);
145    supervisor::register_supervisor_builtins(vm);
146    agents::register_agent_builtins(vm);
147    agent_sessions::register_agent_session_builtins(vm);
148    workflow_messages::register_workflow_message_builtins(vm);
149    transcript_compact::register_transcript_compaction_builtins(vm);
150    assemble::register_assemble_context_builtin(vm);
151    crate::egress::register_egress_builtins(vm);
152    register_http_builtins(vm);
153    register_llm_builtins(vm);
154    register_mcp_builtins(vm);
155    register_mcp_server_builtins(vm);
156    crate::step_runtime::register_step_builtins(vm);
157}
158
159/// Register all standard builtins on a VM (core + io + agent).
160pub fn register_vm_stdlib(vm: &mut Vm) {
161    register_core_stdlib(vm);
162    register_io_stdlib(vm);
163    register_agent_stdlib(vm);
164}
165
166fn stdlib_probe_vm() -> Vm {
167    let mut vm = Vm::new();
168    register_vm_stdlib(&mut vm);
169    // Name-only/metadata introspection never accesses this path, but passing
170    // a real per-platform temp dir keeps registration logic honest if a
171    // callee someday validates its parent.
172    let tmp = std::env::temp_dir();
173    crate::store::register_store_builtins(&mut vm, &tmp);
174    crate::checkpoint::register_checkpoint_builtins(&mut vm, &tmp, "default");
175    crate::metadata::register_metadata_builtins(&mut vm, &tmp);
176    crate::metadata::register_scan_builtins(&mut vm);
177    vm
178}
179
180/// Return the canonical list of all stdlib builtin names. Used by
181/// harn-lint and harn-lsp to avoid hardcoded duplicate lists.
182pub fn stdlib_builtin_names() -> Vec<String> {
183    let vm = stdlib_probe_vm();
184    let mut names = vm.builtin_names();
185    // Special opcodes/keywords, not registered builtins, but linter
186    // should recognize them as valid function calls.
187    for extra in [
188        "spawn",
189        "await",
190        "cancel",
191        "cancel_graceful",
192        "is_cancelled",
193    ] {
194        names.push(extra.to_string());
195    }
196    names
197}
198
199/// Return discoverable metadata for registered stdlib builtins.
200pub fn stdlib_builtin_metadata() -> Vec<crate::vm::VmBuiltinMetadata> {
201    stdlib_probe_vm().builtin_metadata()
202}
203
204/// Reset thread-local stdlib state. Call between test runs.
205///
206/// Note: `long_running::reset_state()` is intentionally NOT called here
207/// because that store is process-global, not thread-local. Wiping it
208/// from a per-test reset hook lets one test cancel another test's
209/// in-flight worker thread (and lose its `push_pending_feedback_global`
210/// notification), which surfaces as `walk_dir_long_running` /
211/// `glob_long_running` timing out under parallel test load. The two
212/// call sites that genuinely need a clean handle store —
213/// `stdlib::fs::tests::{walk_dir_long_running,glob_long_running}` — call
214/// `long_running::reset_state()` explicitly while holding
215/// `LONG_RUNNING_TEST_LOCK`.
216pub fn reset_stdlib_state() {
217    logging::reset_logging_state();
218    process::reset_process_state();
219    clock::reset_clock_state();
220    io::reset_io_state();
221    sandbox::reset_sandbox_state();
222    fs::reset_fs_state();
223    json::reset_json_state();
224    host::reset_host_state();
225    crate::egress::reset_egress_policy_for_host();
226    hitl::reset_hitl_state();
227    crate::http::reset_http_state();
228    monitors::reset_monitor_state();
229    waitpoints::reset_waitpoint_state();
230    waitpoint::reset_waitpoint_state();
231    postgres::reset_postgres_state();
232    supervisor::reset_supervisor_state();
233    agents::records::reset_eval_metrics();
234    agents::records::reset_friction_events();
235    tools::clear_current_tool_registry();
236    tools::clear_tool_synthesis_cache();
237    vision::reset_vision_state();
238    crate::skills::clear_current_skill_registry();
239    template::reset_prompt_registry();
240    crate::triggers::clear_webhook_intake_state();
241}