pub async fn generate( endpoint: &str, model: &str, system_prompt: &str, user_prompt: &str, keep_alive: &str, ) -> Result<String, String>