Skip to main content

harn_cli/commands/
playground.rs

1use std::collections::HashSet;
2use std::io::{self, Write};
3use std::path::{Path, PathBuf};
4use std::rc::Rc;
5
6use harn_parser::{DiagnosticSeverity, Node, SNode, TypeChecker};
7
8use crate::cli::PlaygroundArgs;
9use crate::commands::run::{
10    connect_mcp_servers, install_cli_llm_mock_mode, persist_cli_llm_mock_recording, CliLlmMockMode,
11};
12use crate::package;
13use crate::skill_loader::{
14    emit_loader_warnings, install_skills_global, load_skills, SkillLoaderInputs,
15};
16
17#[derive(Clone, Debug, PartialEq, Eq)]
18struct LlmOverride {
19    provider: String,
20    model: String,
21}
22
23/// Inputs to `execute_playground_inputs` — the in-process sibling of
24/// `harn playground`. Tests construct this directly instead of going through
25/// clap. The binary entry (`run_command`) builds this from `PlaygroundArgs`.
26#[derive(Clone, Debug)]
27pub struct PlaygroundInputs {
28    pub host: PathBuf,
29    pub script: PathBuf,
30    pub task: String,
31    /// Optional `provider:model` override, in the same format `--llm` accepts.
32    pub llm: Option<String>,
33    pub llm_mock_mode: CliLlmMockMode,
34}
35
36#[derive(Clone, Debug)]
37struct PlaygroundConfig {
38    host: PathBuf,
39    script: PathBuf,
40    task: String,
41    llm: Option<LlmOverride>,
42    llm_mock_mode: CliLlmMockMode,
43}
44
45pub(crate) async fn run_command(
46    args: PlaygroundArgs,
47    llm_mock_mode: CliLlmMockMode,
48) -> Result<(), String> {
49    let config = PlaygroundConfig {
50        host: canonicalize_or_err(&args.host)?,
51        script: canonicalize_or_err(&args.script)?,
52        task: args.task.unwrap_or_default(),
53        llm: args.llm.as_deref().map(parse_llm_override).transpose()?,
54        llm_mock_mode,
55    };
56
57    if args.watch {
58        run_watch(&config).await
59    } else {
60        let output = execute_playground(&config).await?;
61        if !output.is_empty() {
62            io::stdout()
63                .write_all(output.as_bytes())
64                .map_err(|error| format!("failed to write playground output: {error}"))?;
65        }
66        Ok(())
67    }
68}
69
70/// In-process entry point for `harn playground`. Returns the captured stdout
71/// the CLI dispatcher would have printed, or a rendered error string.
72///
73/// This is the path tests use to exercise the playground driver without
74/// spawning the `harn` binary. Watch mode is not supported here — it has no
75/// terminal output contract worth asserting on.
76pub async fn execute_playground_inputs(inputs: PlaygroundInputs) -> Result<String, String> {
77    let llm = inputs.llm.as_deref().map(parse_llm_override).transpose()?;
78    let config = PlaygroundConfig {
79        host: canonicalize_or_err(inputs.host.to_string_lossy().as_ref())?,
80        script: canonicalize_or_err(inputs.script.to_string_lossy().as_ref())?,
81        task: inputs.task,
82        llm,
83        llm_mock_mode: inputs.llm_mock_mode,
84    };
85    execute_playground(&config).await
86}
87
88async fn run_watch(config: &PlaygroundConfig) -> Result<(), String> {
89    use notify::{Event, EventKind, RecursiveMode, Watcher};
90
91    eprintln!(
92        "\x1b[2m[playground] running {} with host {}...\x1b[0m",
93        config.script.display(),
94        config.host.display()
95    );
96    emit_run_result(execute_playground(config).await);
97
98    let roots = watch_roots(&config.host, &config.script);
99    let (tx, mut rx) = tokio::sync::mpsc::channel::<()>(1);
100    let _watcher = {
101        let tx = tx.clone();
102        let mut watcher = notify::recommended_watcher(move |res: Result<Event, _>| {
103            if let Ok(event) = res {
104                if matches!(
105                    event.kind,
106                    EventKind::Modify(_) | EventKind::Create(_) | EventKind::Remove(_)
107                ) {
108                    let has_harn = event
109                        .paths
110                        .iter()
111                        .any(|path| path.extension().is_some_and(|ext| ext == "harn"));
112                    if has_harn {
113                        let _ = tx.blocking_send(());
114                    }
115                }
116            }
117        })
118        .map_err(|error| format!("failed to create playground watcher: {error}"))?;
119
120        for root in &roots {
121            watcher
122                .watch(root, RecursiveMode::Recursive)
123                .map_err(|error| format!("failed to watch {}: {error}", root.display()))?;
124        }
125        watcher
126    };
127
128    eprintln!(
129        "\x1b[2m[playground] watching {} (ctrl-c to stop)\x1b[0m",
130        roots
131            .iter()
132            .map(|path| path.display().to_string())
133            .collect::<Vec<_>>()
134            .join(", ")
135    );
136
137    loop {
138        rx.recv().await;
139        tokio::time::sleep(std::time::Duration::from_millis(200)).await;
140        while rx.try_recv().is_ok() {}
141
142        eprintln!();
143        eprintln!(
144            "\x1b[2m[playground] change detected, re-running {}...\x1b[0m",
145            config.script.display()
146        );
147        emit_run_result(execute_playground(config).await);
148    }
149}
150
151fn emit_run_result(result: Result<String, String>) {
152    match result {
153        Ok(output) => {
154            if !output.is_empty() {
155                let _ = io::stdout().write_all(output.as_bytes());
156            }
157        }
158        Err(error) => eprint!("{error}"),
159    }
160}
161
162async fn execute_playground(config: &PlaygroundConfig) -> Result<String, String> {
163    let (host_source, host_program) = crate::parse_source_file(&config.host.to_string_lossy());
164    typecheck_program(&host_source, &host_program, &config.host, &HashSet::new())?;
165    let host_exports = exported_host_functions(&host_program);
166
167    let (script_source, script_program) =
168        crate::parse_source_file(&config.script.to_string_lossy());
169    typecheck_program(
170        &script_source,
171        &script_program,
172        &config.script,
173        &host_exports,
174    )?;
175
176    let chunk = harn_vm::Compiler::new()
177        .compile(&script_program)
178        .map_err(|error| format!("error: compile error: {error}\n"))?;
179
180    let env_guard = ScopedEnv::apply(config);
181    let source_parent = config
182        .script
183        .parent()
184        .unwrap_or_else(|| Path::new("."))
185        .to_path_buf();
186    let project_root = harn_vm::stdlib::process::find_project_root(&source_parent);
187    let store_base = project_root.as_deref().unwrap_or(source_parent.as_path());
188    let execution_cwd = std::env::current_dir()
189        .unwrap_or_else(|_| PathBuf::from("."))
190        .to_string_lossy()
191        .into_owned();
192    let source_dir = source_parent.to_string_lossy().into_owned();
193
194    let local = tokio::task::LocalSet::new();
195    let result = local
196        .run_until(async {
197            install_cli_llm_mock_mode(&config.llm_mock_mode)
198                .map_err(|error| format!("error: {error}\n"))?;
199            let host_vm = configured_vm(
200                &config.host,
201                &host_source,
202                project_root.as_deref(),
203                store_base,
204            )
205            .await?;
206            let bridge = Rc::new(
207                harn_vm::bridge::HostBridge::from_harn_module(host_vm, &config.host)
208                    .await
209                    .map_err(|error| format!("error: {error}\n"))?,
210            );
211
212            let mut vm = configured_vm(
213                &config.script,
214                &script_source,
215                project_root.as_deref(),
216                store_base,
217            )
218            .await?;
219            vm.set_bridge(bridge.clone());
220            harn_vm::llm::install_current_host_bridge(bridge.clone());
221            harn_vm::stdlib::process::set_thread_execution_context(Some(
222                harn_vm::orchestration::RunExecutionRecord {
223                    cwd: Some(execution_cwd),
224                    source_dir: Some(source_dir),
225                    env: std::collections::BTreeMap::new(),
226                    adapter: None,
227                    repo_path: None,
228                    worktree_path: None,
229                    branch: None,
230                    base_ref: None,
231                    cleanup: None,
232                },
233            ));
234            let execution_result = match vm.execute(&chunk).await {
235                Ok(_) => Ok(vm.output().to_string()),
236                Err(error) => Err(vm.format_runtime_error(&error)),
237            };
238            harn_vm::llm::clear_current_host_bridge();
239            harn_vm::stdlib::process::set_thread_execution_context(None);
240            persist_cli_llm_mock_recording(&config.llm_mock_mode)
241                .map_err(|error| format!("error: {error}\n"))?;
242            execution_result
243        })
244        .await;
245    drop(env_guard);
246    result
247}
248
249async fn configured_vm(
250    path: &Path,
251    source: &str,
252    project_root: Option<&Path>,
253    store_base: &Path,
254) -> Result<harn_vm::Vm, String> {
255    let mut vm = harn_vm::Vm::new();
256    harn_vm::register_vm_stdlib(&mut vm);
257    crate::install_default_hostlib(&mut vm);
258    harn_vm::register_store_builtins(&mut vm, store_base);
259    harn_vm::register_metadata_builtins(&mut vm, store_base);
260    let pipeline_name = path
261        .file_stem()
262        .and_then(|stem| stem.to_str())
263        .unwrap_or("default");
264    harn_vm::register_checkpoint_builtins(&mut vm, store_base, pipeline_name);
265    vm.set_source_info(&path.to_string_lossy(), source);
266    if let Some(root) = project_root {
267        vm.set_project_root(root);
268    }
269    if let Some(parent) = path.parent() {
270        if !parent.as_os_str().is_empty() {
271            vm.set_source_dir(parent);
272        }
273    }
274    vm.set_global("argv", harn_vm::VmValue::List(Rc::new(Vec::new())));
275    vm.set_harness(harn_vm::Harness::real());
276
277    let loaded = load_skills(&SkillLoaderInputs {
278        cli_dirs: Vec::new(),
279        source_path: Some(path.to_path_buf()),
280    });
281    emit_loader_warnings(&loaded.loader_warnings);
282    install_skills_global(&mut vm, &loaded);
283
284    let extensions = package::load_runtime_extensions(path);
285    package::install_runtime_extensions(&extensions);
286    if let Some(manifest) = extensions.root_manifest.as_ref() {
287        if !manifest.mcp.is_empty() {
288            connect_mcp_servers(&manifest.mcp, &mut vm).await;
289        }
290    }
291    package::install_manifest_triggers(&mut vm, &extensions)
292        .await
293        .map_err(|error| format!("failed to install manifest triggers: {error}"))?;
294
295    Ok(vm)
296}
297
298fn typecheck_program(
299    source: &str,
300    program: &[SNode],
301    path: &Path,
302    extra_names: &HashSet<String>,
303) -> Result<(), String> {
304    let graph = harn_modules::build(&[path.to_path_buf()]);
305    let mut checker = TypeChecker::new();
306    let mut imported = graph.imported_names_for_file(path).unwrap_or_default();
307    imported.extend(extra_names.iter().cloned());
308    if !imported.is_empty() {
309        checker = checker.with_imported_names(imported);
310    }
311    if let Some(imported) = graph.imported_type_declarations_for_file(path) {
312        checker = checker.with_imported_type_decls(imported);
313    }
314    if let Some(imported) = graph.imported_callable_declarations_for_file(path) {
315        checker = checker.with_imported_callable_decls(imported);
316    }
317
318    let diagnostics = checker.check(program);
319    let mut rendered = String::new();
320    let mut had_error = false;
321    for diagnostic in &diagnostics {
322        if diagnostic.severity == DiagnosticSeverity::Error {
323            had_error = true;
324        }
325        rendered.push_str(&harn_parser::diagnostic::render_type_diagnostic(
326            source,
327            &path.to_string_lossy(),
328            diagnostic,
329        ));
330    }
331
332    if had_error {
333        return Err(rendered);
334    }
335    if !rendered.is_empty() {
336        eprint!("{rendered}");
337    }
338    Ok(())
339}
340
341fn exported_host_functions(program: &[SNode]) -> HashSet<String> {
342    let mut public_names = HashSet::new();
343    let mut all_names = HashSet::new();
344    let mut has_pub_fn = false;
345
346    for node in program {
347        let inner = match &node.node {
348            Node::AttributedDecl { inner, .. } => inner.as_ref(),
349            _ => node,
350        };
351        let Node::FnDecl { name, is_pub, .. } = &inner.node else {
352            continue;
353        };
354        all_names.insert(name.clone());
355        if *is_pub {
356            has_pub_fn = true;
357            public_names.insert(name.clone());
358        }
359    }
360
361    if has_pub_fn {
362        public_names
363    } else {
364        all_names
365    }
366}
367
368fn watch_roots(host: &Path, script: &Path) -> Vec<PathBuf> {
369    let mut roots = Vec::new();
370    for candidate in [
371        host.parent().unwrap_or_else(|| Path::new(".")),
372        script.parent().unwrap_or_else(|| Path::new(".")),
373    ] {
374        if !roots.iter().any(|existing| existing == candidate) {
375            roots.push(candidate.to_path_buf());
376        }
377    }
378    roots
379}
380
381fn parse_llm_override(raw: &str) -> Result<LlmOverride, String> {
382    let (provider, model) = raw
383        .split_once(':')
384        .ok_or_else(|| "playground --llm expects provider:model".to_string())?;
385    let provider = provider.trim();
386    let model = model.trim();
387    if provider.is_empty() || model.is_empty() {
388        return Err("playground --llm expects provider:model".to_string());
389    }
390    Ok(LlmOverride {
391        provider: provider.to_string(),
392        model: model.to_string(),
393    })
394}
395
396fn canonicalize_or_err(path: &str) -> Result<PathBuf, String> {
397    std::fs::canonicalize(path).map_err(|error| format!("failed to resolve {path}: {error}"))
398}
399
400struct ScopedEnv {
401    previous: Vec<(String, Option<String>)>,
402}
403
404impl ScopedEnv {
405    fn apply(config: &PlaygroundConfig) -> Self {
406        let mut previous = Vec::new();
407        Self::set("HARN_TASK", Some(config.task.as_str()), &mut previous);
408        if let Some(llm) = &config.llm {
409            Self::set(
410                "HARN_LLM_PROVIDER",
411                Some(llm.provider.as_str()),
412                &mut previous,
413            );
414            Self::set("HARN_LLM_MODEL", Some(llm.model.as_str()), &mut previous);
415        }
416        Self { previous }
417    }
418
419    fn set(key: &str, value: Option<&str>, previous: &mut Vec<(String, Option<String>)>) {
420        previous.push((key.to_string(), std::env::var(key).ok()));
421        match value {
422            Some(value) => std::env::set_var(key, value),
423            None => std::env::remove_var(key),
424        }
425    }
426}
427
428impl Drop for ScopedEnv {
429    fn drop(&mut self) {
430        for (key, previous) in self.previous.iter().rev() {
431            match previous {
432                Some(value) => std::env::set_var(key, value),
433                None => std::env::remove_var(key),
434            }
435        }
436    }
437}
438
439#[cfg(test)]
440mod tests {
441    use super::*;
442
443    fn write_file(path: &Path, contents: &str) {
444        if let Some(parent) = path.parent() {
445            std::fs::create_dir_all(parent).unwrap();
446        }
447        std::fs::write(path, contents).unwrap();
448    }
449
450    #[test]
451    fn exported_host_functions_prefers_pub_names() {
452        let temp = tempfile::tempdir().unwrap();
453        let path = temp.path().join("host_pub.harn");
454        let source = r#"
455fn helper() {}
456pub fn run_shell(command) { return command }
457pub fn request_permission(tool_name, request_args) { return true }
458"#;
459        write_file(&path, source);
460        let (_, program) = crate::parse_source_file(path.to_string_lossy().as_ref());
461        let names = exported_host_functions(&program);
462        assert!(names.contains("run_shell"));
463        assert!(names.contains("request_permission"));
464        assert!(!names.contains("helper"));
465    }
466
467    #[test]
468    fn parse_llm_override_splits_provider_and_model() {
469        let parsed = parse_llm_override("ollama:qwen2.5-coder:latest").unwrap();
470        assert_eq!(parsed.provider, "ollama");
471        assert_eq!(parsed.model, "qwen2.5-coder:latest");
472    }
473
474    #[tokio::test(flavor = "current_thread")]
475    async fn playground_executes_host_backed_script() {
476        let _guard = crate::tests::common::env_lock::lock_env().lock().await;
477        let temp = tempfile::tempdir().unwrap();
478        let host = temp.path().join("host.harn");
479        let script = temp.path().join("pipeline.harn");
480        write_file(
481            &host,
482            r#"
483pub fn build_prompt(task) {
484  return "prompt: " + task
485}
486"#,
487        );
488        write_file(
489            &script,
490            r#"
491pipeline default(task) {
492  llm_mock({text: "done"})
493  let result = llm_call(build_prompt(env_or("HARN_TASK", "")), "You are concise.")
494  println(result.text)
495}
496"#,
497        );
498
499        let output = execute_playground(&PlaygroundConfig {
500            host,
501            script,
502            task: "ship it".to_string(),
503            llm: Some(LlmOverride {
504                provider: "mock".to_string(),
505                model: "mock".to_string(),
506            }),
507            llm_mock_mode: CliLlmMockMode::Off,
508        })
509        .await
510        .unwrap();
511
512        assert!(output.contains("done"));
513    }
514
515    #[tokio::test(flavor = "current_thread")]
516    async fn playground_reports_missing_capability_with_caller_context() {
517        let _guard = crate::tests::common::env_lock::lock_env().lock().await;
518        let temp = tempfile::tempdir().unwrap();
519        let host = temp.path().join("host.harn");
520        let script = temp.path().join("pipeline.harn");
521        write_file(
522            &host,
523            r#"
524pub fn helper() {
525  return "ok"
526}
527"#,
528        );
529        write_file(
530            &script,
531            r#"
532pipeline default(task) {
533  run_shell("pwd")
534}
535"#,
536        );
537
538        let error = execute_playground(&PlaygroundConfig {
539            host,
540            script,
541            task: String::new(),
542            llm: None,
543            llm_mock_mode: CliLlmMockMode::Off,
544        })
545        .await
546        .unwrap_err();
547
548        assert!(error.contains("run_shell"));
549        assert!(error.contains("pipeline.harn:3:3"));
550    }
551
552    #[tokio::test(flavor = "current_thread")]
553    async fn playground_replays_cli_llm_mock_fixtures() {
554        let _guard = crate::tests::common::env_lock::lock_env().lock().await;
555        let temp = tempfile::tempdir().unwrap();
556        let host = temp.path().join("host.harn");
557        let script = temp.path().join("pipeline.harn");
558        let fixtures = temp.path().join("fixtures.jsonl");
559        write_file(
560            &host,
561            r#"
562pub fn build_prompt(task) {
563  return "prompt: " + task
564}
565"#,
566        );
567        write_file(
568            &script,
569            r#"
570pipeline default(task) {
571  let result = llm_call(build_prompt(env_or("HARN_TASK", "")), "You are concise.")
572  println(result.text)
573}
574"#,
575        );
576        write_file(
577            &fixtures,
578            r#"{"text":"fixture replay","model":"fixture-model"}
579"#,
580        );
581
582        let output = execute_playground(&PlaygroundConfig {
583            host,
584            script,
585            task: "ship it".to_string(),
586            llm: Some(LlmOverride {
587                provider: "anthropic".to_string(),
588                model: "claude-sonnet".to_string(),
589            }),
590            llm_mock_mode: CliLlmMockMode::Replay {
591                fixture_path: fixtures,
592            },
593        })
594        .await
595        .unwrap();
596
597        assert!(output.contains("fixture replay"));
598    }
599}