Skip to main content

harn_cli/commands/
playground.rs

1use std::collections::HashSet;
2use std::io::{self, Write};
3use std::path::{Path, PathBuf};
4use std::rc::Rc;
5
6use harn_parser::{DiagnosticSeverity, Node, SNode, TypeChecker};
7
8use crate::cli::PlaygroundArgs;
9use crate::commands::run::{
10    connect_mcp_servers, install_cli_llm_mock_mode, persist_cli_llm_mock_recording, CliLlmMockMode,
11};
12use crate::package;
13use crate::skill_loader::{
14    emit_loader_warnings, install_skills_global, load_skills, SkillLoaderInputs,
15};
16
17#[derive(Clone, Debug, PartialEq, Eq)]
18struct LlmOverride {
19    provider: String,
20    model: String,
21}
22
23/// Inputs to `execute_playground_inputs` — the in-process sibling of
24/// `harn playground`. Tests construct this directly instead of going through
25/// clap. The binary entry (`run_command`) builds this from `PlaygroundArgs`.
26#[derive(Clone, Debug)]
27pub struct PlaygroundInputs {
28    pub host: PathBuf,
29    pub script: PathBuf,
30    pub task: String,
31    /// Optional `provider:model` override, in the same format `--llm` accepts.
32    pub llm: Option<String>,
33    pub llm_mock_mode: CliLlmMockMode,
34}
35
36#[derive(Clone, Debug)]
37struct PlaygroundConfig {
38    host: PathBuf,
39    script: PathBuf,
40    task: String,
41    llm: Option<LlmOverride>,
42    llm_mock_mode: CliLlmMockMode,
43}
44
45pub(crate) async fn run_command(
46    args: PlaygroundArgs,
47    llm_mock_mode: CliLlmMockMode,
48) -> Result<(), String> {
49    let config = PlaygroundConfig {
50        host: canonicalize_or_err(&args.host)?,
51        script: canonicalize_or_err(&args.script)?,
52        task: args.task.unwrap_or_default(),
53        llm: args.llm.as_deref().map(parse_llm_override).transpose()?,
54        llm_mock_mode,
55    };
56
57    if args.watch {
58        run_watch(&config).await
59    } else {
60        let output = execute_playground(&config).await?;
61        if !output.is_empty() {
62            io::stdout()
63                .write_all(output.as_bytes())
64                .map_err(|error| format!("failed to write playground output: {error}"))?;
65        }
66        Ok(())
67    }
68}
69
70/// In-process entry point for `harn playground`. Returns the captured stdout
71/// the CLI dispatcher would have printed, or a rendered error string.
72///
73/// This is the path tests use to exercise the playground driver without
74/// spawning the `harn` binary. Watch mode is not supported here — it has no
75/// terminal output contract worth asserting on.
76pub async fn execute_playground_inputs(inputs: PlaygroundInputs) -> Result<String, String> {
77    let llm = inputs.llm.as_deref().map(parse_llm_override).transpose()?;
78    let config = PlaygroundConfig {
79        host: canonicalize_or_err(inputs.host.to_string_lossy().as_ref())?,
80        script: canonicalize_or_err(inputs.script.to_string_lossy().as_ref())?,
81        task: inputs.task,
82        llm,
83        llm_mock_mode: inputs.llm_mock_mode,
84    };
85    execute_playground(&config).await
86}
87
88async fn run_watch(config: &PlaygroundConfig) -> Result<(), String> {
89    use notify::{Event, EventKind, RecursiveMode, Watcher};
90
91    eprintln!(
92        "\x1b[2m[playground] running {} with host {}...\x1b[0m",
93        config.script.display(),
94        config.host.display()
95    );
96    emit_run_result(execute_playground(config).await);
97
98    let roots = watch_roots(&config.host, &config.script);
99    let (tx, mut rx) = tokio::sync::mpsc::channel::<()>(1);
100    let _watcher = {
101        let tx = tx.clone();
102        let mut watcher = notify::recommended_watcher(move |res: Result<Event, _>| {
103            if let Ok(event) = res {
104                if matches!(
105                    event.kind,
106                    EventKind::Modify(_) | EventKind::Create(_) | EventKind::Remove(_)
107                ) {
108                    let has_harn = event
109                        .paths
110                        .iter()
111                        .any(|path| path.extension().is_some_and(|ext| ext == "harn"));
112                    if has_harn {
113                        let _ = tx.blocking_send(());
114                    }
115                }
116            }
117        })
118        .map_err(|error| format!("failed to create playground watcher: {error}"))?;
119
120        for root in &roots {
121            watcher
122                .watch(root, RecursiveMode::Recursive)
123                .map_err(|error| format!("failed to watch {}: {error}", root.display()))?;
124        }
125        watcher
126    };
127
128    eprintln!(
129        "\x1b[2m[playground] watching {} (ctrl-c to stop)\x1b[0m",
130        roots
131            .iter()
132            .map(|path| path.display().to_string())
133            .collect::<Vec<_>>()
134            .join(", ")
135    );
136
137    loop {
138        rx.recv().await;
139        tokio::time::sleep(std::time::Duration::from_millis(200)).await;
140        while rx.try_recv().is_ok() {}
141
142        eprintln!();
143        eprintln!(
144            "\x1b[2m[playground] change detected, re-running {}...\x1b[0m",
145            config.script.display()
146        );
147        emit_run_result(execute_playground(config).await);
148    }
149}
150
151fn emit_run_result(result: Result<String, String>) {
152    match result {
153        Ok(output) => {
154            if !output.is_empty() {
155                let _ = io::stdout().write_all(output.as_bytes());
156            }
157        }
158        Err(error) => eprint!("{error}"),
159    }
160}
161
162async fn execute_playground(config: &PlaygroundConfig) -> Result<String, String> {
163    let (host_source, host_program) = crate::parse_source_file(&config.host.to_string_lossy());
164    typecheck_program(&host_source, &host_program, &config.host, &HashSet::new())?;
165    let host_exports = exported_host_functions(&host_program);
166
167    let (script_source, script_program) =
168        crate::parse_source_file(&config.script.to_string_lossy());
169    typecheck_program(
170        &script_source,
171        &script_program,
172        &config.script,
173        &host_exports,
174    )?;
175
176    let chunk = harn_vm::Compiler::new()
177        .compile(&script_program)
178        .map_err(|error| format!("error: compile error: {error}\n"))?;
179
180    let env_guard = ScopedEnv::apply(config);
181    let source_parent = config
182        .script
183        .parent()
184        .unwrap_or_else(|| Path::new("."))
185        .to_path_buf();
186    let project_root = harn_vm::stdlib::process::find_project_root(&source_parent);
187    let store_base = project_root.as_deref().unwrap_or(source_parent.as_path());
188    let execution_cwd = std::env::current_dir()
189        .unwrap_or_else(|_| PathBuf::from("."))
190        .to_string_lossy()
191        .into_owned();
192    let source_dir = source_parent.to_string_lossy().into_owned();
193
194    let local = tokio::task::LocalSet::new();
195    let result = local
196        .run_until(async {
197            install_cli_llm_mock_mode(&config.llm_mock_mode)
198                .map_err(|error| format!("error: {error}\n"))?;
199            let host_vm = configured_vm(
200                &config.host,
201                &host_source,
202                project_root.as_deref(),
203                store_base,
204            )
205            .await?;
206            let bridge = Rc::new(
207                harn_vm::bridge::HostBridge::from_harn_module(host_vm, &config.host)
208                    .await
209                    .map_err(|error| format!("error: {error}\n"))?,
210            );
211
212            let mut vm = configured_vm(
213                &config.script,
214                &script_source,
215                project_root.as_deref(),
216                store_base,
217            )
218            .await?;
219            vm.set_bridge(bridge.clone());
220            harn_vm::llm::install_current_host_bridge(bridge.clone());
221            harn_vm::stdlib::process::set_thread_execution_context(Some(
222                harn_vm::orchestration::RunExecutionRecord {
223                    cwd: Some(execution_cwd),
224                    source_dir: Some(source_dir),
225                    env: std::collections::BTreeMap::new(),
226                    adapter: None,
227                    repo_path: None,
228                    worktree_path: None,
229                    branch: None,
230                    base_ref: None,
231                    cleanup: None,
232                },
233            ));
234            let execution_result = match vm.execute(&chunk).await {
235                Ok(_) => Ok(vm.output().to_string()),
236                Err(error) => Err(vm.format_runtime_error(&error)),
237            };
238            harn_vm::llm::clear_current_host_bridge();
239            harn_vm::stdlib::process::set_thread_execution_context(None);
240            persist_cli_llm_mock_recording(&config.llm_mock_mode)
241                .map_err(|error| format!("error: {error}\n"))?;
242            execution_result
243        })
244        .await;
245    drop(env_guard);
246    result
247}
248
249async fn configured_vm(
250    path: &Path,
251    source: &str,
252    project_root: Option<&Path>,
253    store_base: &Path,
254) -> Result<harn_vm::Vm, String> {
255    let mut vm = harn_vm::Vm::new();
256    harn_vm::register_vm_stdlib(&mut vm);
257    crate::install_default_hostlib(&mut vm);
258    harn_vm::register_store_builtins(&mut vm, store_base);
259    harn_vm::register_metadata_builtins(&mut vm, store_base);
260    let pipeline_name = path
261        .file_stem()
262        .and_then(|stem| stem.to_str())
263        .unwrap_or("default");
264    harn_vm::register_checkpoint_builtins(&mut vm, store_base, pipeline_name);
265    vm.set_source_info(&path.to_string_lossy(), source);
266    if let Some(root) = project_root {
267        vm.set_project_root(root);
268    }
269    if let Some(parent) = path.parent() {
270        if !parent.as_os_str().is_empty() {
271            vm.set_source_dir(parent);
272        }
273    }
274    vm.set_global("argv", harn_vm::VmValue::List(Rc::new(Vec::new())));
275
276    let loaded = load_skills(&SkillLoaderInputs {
277        cli_dirs: Vec::new(),
278        source_path: Some(path.to_path_buf()),
279    });
280    emit_loader_warnings(&loaded.loader_warnings);
281    install_skills_global(&mut vm, &loaded);
282
283    let extensions = package::load_runtime_extensions(path);
284    package::install_runtime_extensions(&extensions);
285    if let Some(manifest) = extensions.root_manifest.as_ref() {
286        if !manifest.mcp.is_empty() {
287            connect_mcp_servers(&manifest.mcp, &mut vm).await;
288        }
289    }
290    package::install_manifest_triggers(&mut vm, &extensions)
291        .await
292        .map_err(|error| format!("failed to install manifest triggers: {error}"))?;
293
294    Ok(vm)
295}
296
297fn typecheck_program(
298    source: &str,
299    program: &[SNode],
300    path: &Path,
301    extra_names: &HashSet<String>,
302) -> Result<(), String> {
303    let graph = harn_modules::build(&[path.to_path_buf()]);
304    let mut checker = TypeChecker::new();
305    let mut imported = graph.imported_names_for_file(path).unwrap_or_default();
306    imported.extend(extra_names.iter().cloned());
307    if !imported.is_empty() {
308        checker = checker.with_imported_names(imported);
309    }
310    if let Some(imported) = graph.imported_type_declarations_for_file(path) {
311        checker = checker.with_imported_type_decls(imported);
312    }
313    if let Some(imported) = graph.imported_callable_declarations_for_file(path) {
314        checker = checker.with_imported_callable_decls(imported);
315    }
316
317    let diagnostics = checker.check(program);
318    let mut rendered = String::new();
319    let mut had_error = false;
320    for diagnostic in &diagnostics {
321        if diagnostic.severity == DiagnosticSeverity::Error {
322            had_error = true;
323        }
324        rendered.push_str(&harn_parser::diagnostic::render_type_diagnostic(
325            source,
326            &path.to_string_lossy(),
327            diagnostic,
328        ));
329    }
330
331    if had_error {
332        return Err(rendered);
333    }
334    if !rendered.is_empty() {
335        eprint!("{rendered}");
336    }
337    Ok(())
338}
339
340fn exported_host_functions(program: &[SNode]) -> HashSet<String> {
341    let mut public_names = HashSet::new();
342    let mut all_names = HashSet::new();
343    let mut has_pub_fn = false;
344
345    for node in program {
346        let inner = match &node.node {
347            Node::AttributedDecl { inner, .. } => inner.as_ref(),
348            _ => node,
349        };
350        let Node::FnDecl { name, is_pub, .. } = &inner.node else {
351            continue;
352        };
353        all_names.insert(name.clone());
354        if *is_pub {
355            has_pub_fn = true;
356            public_names.insert(name.clone());
357        }
358    }
359
360    if has_pub_fn {
361        public_names
362    } else {
363        all_names
364    }
365}
366
367fn watch_roots(host: &Path, script: &Path) -> Vec<PathBuf> {
368    let mut roots = Vec::new();
369    for candidate in [
370        host.parent().unwrap_or_else(|| Path::new(".")),
371        script.parent().unwrap_or_else(|| Path::new(".")),
372    ] {
373        if !roots.iter().any(|existing| existing == candidate) {
374            roots.push(candidate.to_path_buf());
375        }
376    }
377    roots
378}
379
380fn parse_llm_override(raw: &str) -> Result<LlmOverride, String> {
381    let (provider, model) = raw
382        .split_once(':')
383        .ok_or_else(|| "playground --llm expects provider:model".to_string())?;
384    let provider = provider.trim();
385    let model = model.trim();
386    if provider.is_empty() || model.is_empty() {
387        return Err("playground --llm expects provider:model".to_string());
388    }
389    Ok(LlmOverride {
390        provider: provider.to_string(),
391        model: model.to_string(),
392    })
393}
394
395fn canonicalize_or_err(path: &str) -> Result<PathBuf, String> {
396    std::fs::canonicalize(path).map_err(|error| format!("failed to resolve {path}: {error}"))
397}
398
399struct ScopedEnv {
400    previous: Vec<(String, Option<String>)>,
401}
402
403impl ScopedEnv {
404    fn apply(config: &PlaygroundConfig) -> Self {
405        let mut previous = Vec::new();
406        Self::set("HARN_TASK", Some(config.task.as_str()), &mut previous);
407        if let Some(llm) = &config.llm {
408            Self::set(
409                "HARN_LLM_PROVIDER",
410                Some(llm.provider.as_str()),
411                &mut previous,
412            );
413            Self::set("HARN_LLM_MODEL", Some(llm.model.as_str()), &mut previous);
414        }
415        Self { previous }
416    }
417
418    fn set(key: &str, value: Option<&str>, previous: &mut Vec<(String, Option<String>)>) {
419        previous.push((key.to_string(), std::env::var(key).ok()));
420        match value {
421            Some(value) => std::env::set_var(key, value),
422            None => std::env::remove_var(key),
423        }
424    }
425}
426
427impl Drop for ScopedEnv {
428    fn drop(&mut self) {
429        for (key, previous) in self.previous.iter().rev() {
430            match previous {
431                Some(value) => std::env::set_var(key, value),
432                None => std::env::remove_var(key),
433            }
434        }
435    }
436}
437
438#[cfg(test)]
439mod tests {
440    use super::*;
441
442    fn write_file(path: &Path, contents: &str) {
443        if let Some(parent) = path.parent() {
444            std::fs::create_dir_all(parent).unwrap();
445        }
446        std::fs::write(path, contents).unwrap();
447    }
448
449    #[test]
450    fn exported_host_functions_prefers_pub_names() {
451        let temp = tempfile::tempdir().unwrap();
452        let path = temp.path().join("host_pub.harn");
453        let source = r#"
454fn helper() {}
455pub fn run_shell(command) { return command }
456pub fn request_permission(tool_name, request_args) { return true }
457"#;
458        write_file(&path, source);
459        let (_, program) = crate::parse_source_file(path.to_string_lossy().as_ref());
460        let names = exported_host_functions(&program);
461        assert!(names.contains("run_shell"));
462        assert!(names.contains("request_permission"));
463        assert!(!names.contains("helper"));
464    }
465
466    #[test]
467    fn parse_llm_override_splits_provider_and_model() {
468        let parsed = parse_llm_override("ollama:qwen2.5-coder:latest").unwrap();
469        assert_eq!(parsed.provider, "ollama");
470        assert_eq!(parsed.model, "qwen2.5-coder:latest");
471    }
472
473    #[tokio::test(flavor = "current_thread")]
474    async fn playground_executes_host_backed_script() {
475        let _guard = crate::tests::common::env_lock::lock_env().lock().await;
476        let temp = tempfile::tempdir().unwrap();
477        let host = temp.path().join("host.harn");
478        let script = temp.path().join("pipeline.harn");
479        write_file(
480            &host,
481            r#"
482pub fn build_prompt(task) {
483  return "prompt: " + task
484}
485"#,
486        );
487        write_file(
488            &script,
489            r#"
490pipeline default(task) {
491  llm_mock({text: "done"})
492  let result = llm_call(build_prompt(env_or("HARN_TASK", "")), "You are concise.")
493  println(result.text)
494}
495"#,
496        );
497
498        let output = execute_playground(&PlaygroundConfig {
499            host,
500            script,
501            task: "ship it".to_string(),
502            llm: Some(LlmOverride {
503                provider: "mock".to_string(),
504                model: "mock".to_string(),
505            }),
506            llm_mock_mode: CliLlmMockMode::Off,
507        })
508        .await
509        .unwrap();
510
511        assert!(output.contains("done"));
512    }
513
514    #[tokio::test(flavor = "current_thread")]
515    async fn playground_reports_missing_capability_with_caller_context() {
516        let _guard = crate::tests::common::env_lock::lock_env().lock().await;
517        let temp = tempfile::tempdir().unwrap();
518        let host = temp.path().join("host.harn");
519        let script = temp.path().join("pipeline.harn");
520        write_file(
521            &host,
522            r#"
523pub fn helper() {
524  return "ok"
525}
526"#,
527        );
528        write_file(
529            &script,
530            r#"
531pipeline default(task) {
532  run_shell("pwd")
533}
534"#,
535        );
536
537        let error = execute_playground(&PlaygroundConfig {
538            host,
539            script,
540            task: String::new(),
541            llm: None,
542            llm_mock_mode: CliLlmMockMode::Off,
543        })
544        .await
545        .unwrap_err();
546
547        assert!(error.contains("run_shell"));
548        assert!(error.contains("pipeline.harn:3:3"));
549    }
550
551    #[tokio::test(flavor = "current_thread")]
552    async fn playground_replays_cli_llm_mock_fixtures() {
553        let _guard = crate::tests::common::env_lock::lock_env().lock().await;
554        let temp = tempfile::tempdir().unwrap();
555        let host = temp.path().join("host.harn");
556        let script = temp.path().join("pipeline.harn");
557        let fixtures = temp.path().join("fixtures.jsonl");
558        write_file(
559            &host,
560            r#"
561pub fn build_prompt(task) {
562  return "prompt: " + task
563}
564"#,
565        );
566        write_file(
567            &script,
568            r#"
569pipeline default(task) {
570  let result = llm_call(build_prompt(env_or("HARN_TASK", "")), "You are concise.")
571  println(result.text)
572}
573"#,
574        );
575        write_file(
576            &fixtures,
577            r#"{"text":"fixture replay","model":"fixture-model"}
578"#,
579        );
580
581        let output = execute_playground(&PlaygroundConfig {
582            host,
583            script,
584            task: "ship it".to_string(),
585            llm: Some(LlmOverride {
586                provider: "anthropic".to_string(),
587                model: "claude-sonnet".to_string(),
588            }),
589            llm_mock_mode: CliLlmMockMode::Replay {
590                fixture_path: fixtures,
591            },
592        })
593        .await
594        .unwrap();
595
596        assert!(output.contains("fixture replay"));
597    }
598}