Skip to main content

harn_cli/commands/
playground.rs

1use std::collections::HashSet;
2use std::io::{self, Write};
3use std::path::{Path, PathBuf};
4use std::rc::Rc;
5
6use harn_parser::{DiagnosticSeverity, Node, SNode, TypeChecker};
7
8use crate::cli::PlaygroundArgs;
9use crate::commands::run::{
10    connect_mcp_servers, install_cli_llm_mock_mode, persist_cli_llm_mock_recording, CliLlmMockMode,
11};
12use crate::package;
13use crate::skill_loader::{
14    emit_loader_warnings, install_skills_global, load_skills, SkillLoaderInputs,
15};
16
17#[derive(Clone, Debug, PartialEq, Eq)]
18struct LlmOverride {
19    provider: String,
20    model: String,
21}
22
23/// Inputs to `execute_playground_inputs` — the in-process sibling of
24/// `harn playground`. Tests construct this directly instead of going through
25/// clap. The binary entry (`run_command`) builds this from `PlaygroundArgs`.
26#[derive(Clone, Debug)]
27pub struct PlaygroundInputs {
28    pub host: PathBuf,
29    pub script: PathBuf,
30    pub task: String,
31    /// Optional `provider:model` override, in the same format `--llm` accepts.
32    pub llm: Option<String>,
33    pub llm_mock_mode: CliLlmMockMode,
34}
35
36#[derive(Clone, Debug)]
37struct PlaygroundConfig {
38    host: PathBuf,
39    script: PathBuf,
40    task: String,
41    llm: Option<LlmOverride>,
42    llm_mock_mode: CliLlmMockMode,
43}
44
45pub(crate) async fn run_command(
46    args: PlaygroundArgs,
47    llm_mock_mode: CliLlmMockMode,
48) -> Result<(), String> {
49    let config = PlaygroundConfig {
50        host: canonicalize_or_err(&args.host)?,
51        script: canonicalize_or_err(&args.script)?,
52        task: args.task.unwrap_or_default(),
53        llm: args.llm.as_deref().map(parse_llm_override).transpose()?,
54        llm_mock_mode,
55    };
56
57    if args.watch {
58        run_watch(&config).await
59    } else {
60        let output = execute_playground(&config).await?;
61        if !output.is_empty() {
62            io::stdout()
63                .write_all(output.as_bytes())
64                .map_err(|error| format!("failed to write playground output: {error}"))?;
65        }
66        Ok(())
67    }
68}
69
70/// In-process entry point for `harn playground`. Returns the captured stdout
71/// the CLI dispatcher would have printed, or a rendered error string.
72///
73/// This is the path tests use to exercise the playground driver without
74/// spawning the `harn` binary. Watch mode is not supported here — it has no
75/// terminal output contract worth asserting on.
76pub async fn execute_playground_inputs(inputs: PlaygroundInputs) -> Result<String, String> {
77    let llm = inputs.llm.as_deref().map(parse_llm_override).transpose()?;
78    let config = PlaygroundConfig {
79        host: canonicalize_or_err(inputs.host.to_string_lossy().as_ref())?,
80        script: canonicalize_or_err(inputs.script.to_string_lossy().as_ref())?,
81        task: inputs.task,
82        llm,
83        llm_mock_mode: inputs.llm_mock_mode,
84    };
85    execute_playground(&config).await
86}
87
88async fn run_watch(config: &PlaygroundConfig) -> Result<(), String> {
89    use notify::{Event, EventKind, RecursiveMode, Watcher};
90
91    eprintln!(
92        "\x1b[2m[playground] running {} with host {}...\x1b[0m",
93        config.script.display(),
94        config.host.display()
95    );
96    emit_run_result(execute_playground(config).await);
97
98    let roots = watch_roots(&config.host, &config.script);
99    let (tx, mut rx) = tokio::sync::mpsc::channel::<()>(1);
100    let _watcher = {
101        let tx = tx.clone();
102        let mut watcher = notify::recommended_watcher(move |res: Result<Event, _>| {
103            if let Ok(event) = res {
104                if matches!(
105                    event.kind,
106                    EventKind::Modify(_) | EventKind::Create(_) | EventKind::Remove(_)
107                ) {
108                    let has_harn = event
109                        .paths
110                        .iter()
111                        .any(|path| path.extension().is_some_and(|ext| ext == "harn"));
112                    if has_harn {
113                        let _ = tx.blocking_send(());
114                    }
115                }
116            }
117        })
118        .map_err(|error| format!("failed to create playground watcher: {error}"))?;
119
120        for root in &roots {
121            watcher
122                .watch(root, RecursiveMode::Recursive)
123                .map_err(|error| format!("failed to watch {}: {error}", root.display()))?;
124        }
125        watcher
126    };
127
128    eprintln!(
129        "\x1b[2m[playground] watching {} (ctrl-c to stop)\x1b[0m",
130        roots
131            .iter()
132            .map(|path| path.display().to_string())
133            .collect::<Vec<_>>()
134            .join(", ")
135    );
136
137    loop {
138        rx.recv().await;
139        tokio::time::sleep(std::time::Duration::from_millis(200)).await;
140        while rx.try_recv().is_ok() {}
141
142        eprintln!();
143        eprintln!(
144            "\x1b[2m[playground] change detected, re-running {}...\x1b[0m",
145            config.script.display()
146        );
147        emit_run_result(execute_playground(config).await);
148    }
149}
150
151fn emit_run_result(result: Result<String, String>) {
152    match result {
153        Ok(output) => {
154            if !output.is_empty() {
155                let _ = io::stdout().write_all(output.as_bytes());
156            }
157        }
158        Err(error) => eprint!("{error}"),
159    }
160}
161
162async fn execute_playground(config: &PlaygroundConfig) -> Result<String, String> {
163    let (host_source, host_program) = crate::parse_source_file(&config.host.to_string_lossy());
164    typecheck_program(&host_source, &host_program, &config.host, &HashSet::new())?;
165    let host_exports = exported_host_functions(&host_program);
166
167    let (script_source, script_program) =
168        crate::parse_source_file(&config.script.to_string_lossy());
169    typecheck_program(
170        &script_source,
171        &script_program,
172        &config.script,
173        &host_exports,
174    )?;
175
176    let chunk = harn_vm::Compiler::new()
177        .compile(&script_program)
178        .map_err(|error| format!("error: compile error: {error}\n"))?;
179
180    let env_guard = ScopedEnv::apply(config);
181    let source_parent = config
182        .script
183        .parent()
184        .unwrap_or_else(|| Path::new("."))
185        .to_path_buf();
186    let project_root = harn_vm::stdlib::process::find_project_root(&source_parent);
187    let store_base = project_root.as_deref().unwrap_or(source_parent.as_path());
188    let execution_cwd = std::env::current_dir()
189        .unwrap_or_else(|_| PathBuf::from("."))
190        .to_string_lossy()
191        .into_owned();
192    let source_dir = source_parent.to_string_lossy().into_owned();
193
194    let local = tokio::task::LocalSet::new();
195    let result = local
196        .run_until(async {
197            install_cli_llm_mock_mode(&config.llm_mock_mode)
198                .map_err(|error| format!("error: {error}\n"))?;
199            let host_vm = configured_vm(
200                &config.host,
201                &host_source,
202                project_root.as_deref(),
203                store_base,
204            )
205            .await?;
206            let bridge = Rc::new(
207                harn_vm::bridge::HostBridge::from_harn_module(host_vm, &config.host)
208                    .await
209                    .map_err(|error| format!("error: {error}\n"))?,
210            );
211
212            let mut vm = configured_vm(
213                &config.script,
214                &script_source,
215                project_root.as_deref(),
216                store_base,
217            )
218            .await?;
219            vm.set_bridge(bridge.clone());
220            harn_vm::llm::install_current_host_bridge(bridge.clone());
221            harn_vm::stdlib::process::set_thread_execution_context(Some(
222                harn_vm::orchestration::RunExecutionRecord {
223                    cwd: Some(execution_cwd),
224                    source_dir: Some(source_dir),
225                    env: std::collections::BTreeMap::new(),
226                    adapter: None,
227                    repo_path: None,
228                    worktree_path: None,
229                    branch: None,
230                    base_ref: None,
231                    cleanup: None,
232                },
233            ));
234            let execution_result = match vm.execute(&chunk).await {
235                Ok(_) => Ok(vm.output().to_string()),
236                Err(error) => Err(vm.format_runtime_error(&error)),
237            };
238            harn_vm::llm::clear_current_host_bridge();
239            harn_vm::stdlib::process::set_thread_execution_context(None);
240            persist_cli_llm_mock_recording(&config.llm_mock_mode)
241                .map_err(|error| format!("error: {error}\n"))?;
242            execution_result
243        })
244        .await;
245    drop(env_guard);
246    result
247}
248
249async fn configured_vm(
250    path: &Path,
251    source: &str,
252    project_root: Option<&Path>,
253    store_base: &Path,
254) -> Result<harn_vm::Vm, String> {
255    let mut vm = harn_vm::Vm::new();
256    harn_vm::register_vm_stdlib(&mut vm);
257    crate::install_default_hostlib(&mut vm);
258    harn_vm::register_store_builtins(&mut vm, store_base);
259    harn_vm::register_metadata_builtins(&mut vm, store_base);
260    let pipeline_name = path
261        .file_stem()
262        .and_then(|stem| stem.to_str())
263        .unwrap_or("default");
264    harn_vm::register_checkpoint_builtins(&mut vm, store_base, pipeline_name);
265    vm.set_source_info(&path.to_string_lossy(), source);
266    if let Some(root) = project_root {
267        vm.set_project_root(root);
268    }
269    if let Some(parent) = path.parent() {
270        if !parent.as_os_str().is_empty() {
271            vm.set_source_dir(parent);
272        }
273    }
274    vm.set_global("argv", harn_vm::VmValue::List(Rc::new(Vec::new())));
275
276    let loaded = load_skills(&SkillLoaderInputs {
277        cli_dirs: Vec::new(),
278        source_path: Some(path.to_path_buf()),
279    });
280    emit_loader_warnings(&loaded.loader_warnings);
281    install_skills_global(&mut vm, &loaded);
282
283    let extensions = package::load_runtime_extensions(path);
284    package::install_runtime_extensions(&extensions);
285    if let Some(manifest) = extensions.root_manifest.as_ref() {
286        if !manifest.mcp.is_empty() {
287            connect_mcp_servers(&manifest.mcp, &mut vm).await;
288        }
289    }
290    package::install_manifest_triggers(&mut vm, &extensions)
291        .await
292        .map_err(|error| format!("failed to install manifest triggers: {error}"))?;
293
294    Ok(vm)
295}
296
297fn typecheck_program(
298    source: &str,
299    program: &[SNode],
300    path: &Path,
301    extra_names: &HashSet<String>,
302) -> Result<(), String> {
303    let graph = harn_modules::build(&[path.to_path_buf()]);
304    let mut checker = TypeChecker::new();
305    let mut imported = graph.imported_names_for_file(path).unwrap_or_default();
306    imported.extend(extra_names.iter().cloned());
307    if !imported.is_empty() {
308        checker = checker.with_imported_names(imported);
309    }
310    if let Some(imported) = graph.imported_type_declarations_for_file(path) {
311        checker = checker.with_imported_type_decls(imported);
312    }
313
314    let diagnostics = checker.check(program);
315    let mut rendered = String::new();
316    let mut had_error = false;
317    for diagnostic in &diagnostics {
318        if diagnostic.severity == DiagnosticSeverity::Error {
319            had_error = true;
320        }
321        rendered.push_str(&harn_parser::diagnostic::render_type_diagnostic(
322            source,
323            &path.to_string_lossy(),
324            diagnostic,
325        ));
326    }
327
328    if had_error {
329        return Err(rendered);
330    }
331    if !rendered.is_empty() {
332        eprint!("{rendered}");
333    }
334    Ok(())
335}
336
337fn exported_host_functions(program: &[SNode]) -> HashSet<String> {
338    let mut public_names = HashSet::new();
339    let mut all_names = HashSet::new();
340    let mut has_pub_fn = false;
341
342    for node in program {
343        let inner = match &node.node {
344            Node::AttributedDecl { inner, .. } => inner.as_ref(),
345            _ => node,
346        };
347        let Node::FnDecl { name, is_pub, .. } = &inner.node else {
348            continue;
349        };
350        all_names.insert(name.clone());
351        if *is_pub {
352            has_pub_fn = true;
353            public_names.insert(name.clone());
354        }
355    }
356
357    if has_pub_fn {
358        public_names
359    } else {
360        all_names
361    }
362}
363
364fn watch_roots(host: &Path, script: &Path) -> Vec<PathBuf> {
365    let mut roots = Vec::new();
366    for candidate in [
367        host.parent().unwrap_or_else(|| Path::new(".")),
368        script.parent().unwrap_or_else(|| Path::new(".")),
369    ] {
370        if !roots.iter().any(|existing| existing == candidate) {
371            roots.push(candidate.to_path_buf());
372        }
373    }
374    roots
375}
376
377fn parse_llm_override(raw: &str) -> Result<LlmOverride, String> {
378    let (provider, model) = raw
379        .split_once(':')
380        .ok_or_else(|| "playground --llm expects provider:model".to_string())?;
381    let provider = provider.trim();
382    let model = model.trim();
383    if provider.is_empty() || model.is_empty() {
384        return Err("playground --llm expects provider:model".to_string());
385    }
386    Ok(LlmOverride {
387        provider: provider.to_string(),
388        model: model.to_string(),
389    })
390}
391
392fn canonicalize_or_err(path: &str) -> Result<PathBuf, String> {
393    std::fs::canonicalize(path).map_err(|error| format!("failed to resolve {path}: {error}"))
394}
395
396struct ScopedEnv {
397    previous: Vec<(String, Option<String>)>,
398}
399
400impl ScopedEnv {
401    fn apply(config: &PlaygroundConfig) -> Self {
402        let mut previous = Vec::new();
403        Self::set("HARN_TASK", Some(config.task.as_str()), &mut previous);
404        if let Some(llm) = &config.llm {
405            Self::set(
406                "HARN_LLM_PROVIDER",
407                Some(llm.provider.as_str()),
408                &mut previous,
409            );
410            Self::set("HARN_LLM_MODEL", Some(llm.model.as_str()), &mut previous);
411        }
412        Self { previous }
413    }
414
415    fn set(key: &str, value: Option<&str>, previous: &mut Vec<(String, Option<String>)>) {
416        previous.push((key.to_string(), std::env::var(key).ok()));
417        match value {
418            Some(value) => std::env::set_var(key, value),
419            None => std::env::remove_var(key),
420        }
421    }
422}
423
424impl Drop for ScopedEnv {
425    fn drop(&mut self) {
426        for (key, previous) in self.previous.iter().rev() {
427            match previous {
428                Some(value) => std::env::set_var(key, value),
429                None => std::env::remove_var(key),
430            }
431        }
432    }
433}
434
435#[cfg(test)]
436mod tests {
437    use super::*;
438
439    fn write_file(path: &Path, contents: &str) {
440        if let Some(parent) = path.parent() {
441            std::fs::create_dir_all(parent).unwrap();
442        }
443        std::fs::write(path, contents).unwrap();
444    }
445
446    #[test]
447    fn exported_host_functions_prefers_pub_names() {
448        let temp = tempfile::tempdir().unwrap();
449        let path = temp.path().join("host_pub.harn");
450        let source = r#"
451fn helper() {}
452pub fn run_shell(command) { return command }
453pub fn request_permission(tool_name, request_args) { return true }
454"#;
455        write_file(&path, source);
456        let (_, program) = crate::parse_source_file(path.to_string_lossy().as_ref());
457        let names = exported_host_functions(&program);
458        assert!(names.contains("run_shell"));
459        assert!(names.contains("request_permission"));
460        assert!(!names.contains("helper"));
461    }
462
463    #[test]
464    fn parse_llm_override_splits_provider_and_model() {
465        let parsed = parse_llm_override("ollama:qwen2.5-coder:latest").unwrap();
466        assert_eq!(parsed.provider, "ollama");
467        assert_eq!(parsed.model, "qwen2.5-coder:latest");
468    }
469
470    #[tokio::test(flavor = "current_thread")]
471    async fn playground_executes_host_backed_script() {
472        let _guard = crate::tests::common::env_lock::lock_env().lock().await;
473        let temp = tempfile::tempdir().unwrap();
474        let host = temp.path().join("host.harn");
475        let script = temp.path().join("pipeline.harn");
476        write_file(
477            &host,
478            r#"
479pub fn build_prompt(task) {
480  return "prompt: " + task
481}
482"#,
483        );
484        write_file(
485            &script,
486            r#"
487pipeline default(task) {
488  llm_mock({text: "done"})
489  let result = llm_call(build_prompt(env_or("HARN_TASK", "")), "You are concise.")
490  println(result.text)
491}
492"#,
493        );
494
495        let output = execute_playground(&PlaygroundConfig {
496            host,
497            script,
498            task: "ship it".to_string(),
499            llm: Some(LlmOverride {
500                provider: "mock".to_string(),
501                model: "mock".to_string(),
502            }),
503            llm_mock_mode: CliLlmMockMode::Off,
504        })
505        .await
506        .unwrap();
507
508        assert!(output.contains("done"));
509    }
510
511    #[tokio::test(flavor = "current_thread")]
512    async fn playground_reports_missing_capability_with_caller_context() {
513        let _guard = crate::tests::common::env_lock::lock_env().lock().await;
514        let temp = tempfile::tempdir().unwrap();
515        let host = temp.path().join("host.harn");
516        let script = temp.path().join("pipeline.harn");
517        write_file(
518            &host,
519            r#"
520pub fn helper() {
521  return "ok"
522}
523"#,
524        );
525        write_file(
526            &script,
527            r#"
528pipeline default(task) {
529  run_shell("pwd")
530}
531"#,
532        );
533
534        let error = execute_playground(&PlaygroundConfig {
535            host,
536            script,
537            task: String::new(),
538            llm: None,
539            llm_mock_mode: CliLlmMockMode::Off,
540        })
541        .await
542        .unwrap_err();
543
544        assert!(error.contains("run_shell"));
545        assert!(error.contains("pipeline.harn:3:3"));
546    }
547
548    #[tokio::test(flavor = "current_thread")]
549    async fn playground_replays_cli_llm_mock_fixtures() {
550        let _guard = crate::tests::common::env_lock::lock_env().lock().await;
551        let temp = tempfile::tempdir().unwrap();
552        let host = temp.path().join("host.harn");
553        let script = temp.path().join("pipeline.harn");
554        let fixtures = temp.path().join("fixtures.jsonl");
555        write_file(
556            &host,
557            r#"
558pub fn build_prompt(task) {
559  return "prompt: " + task
560}
561"#,
562        );
563        write_file(
564            &script,
565            r#"
566pipeline default(task) {
567  let result = llm_call(build_prompt(env_or("HARN_TASK", "")), "You are concise.")
568  println(result.text)
569}
570"#,
571        );
572        write_file(
573            &fixtures,
574            r#"{"text":"fixture replay","model":"fixture-model"}
575"#,
576        );
577
578        let output = execute_playground(&PlaygroundConfig {
579            host,
580            script,
581            task: "ship it".to_string(),
582            llm: Some(LlmOverride {
583                provider: "anthropic".to_string(),
584                model: "claude-sonnet".to_string(),
585            }),
586            llm_mock_mode: CliLlmMockMode::Replay {
587                fixture_path: fixtures,
588            },
589        })
590        .await
591        .unwrap();
592
593        assert!(output.contains("fixture replay"));
594    }
595}