#pragma once
#include "llama.h"
#include "common.h"
struct common_speculative;
std::string common_speculative_type_name_str();
enum common_speculative_type common_speculative_type_from_name(const std::string & name);
std::string common_speculative_type_to_str(enum common_speculative_type type);
bool common_speculative_is_compat(llama_context * ctx_tgt);
common_speculative * common_speculative_init(
common_params_speculative & params,
llama_context * ctx_tgt);
void common_speculative_free(common_speculative * spec);
void common_speculative_begin(common_speculative * spec, const llama_tokens & prompt);
llama_tokens common_speculative_draft(
common_speculative * spec,
const common_params_speculative & params,
const llama_tokens & prompt,
llama_token id_last);
void common_speculative_accept(common_speculative * spec, uint16_t n_accepted);
void common_speculative_print_stats(const common_speculative * spec);