Skip to main content

Crate orchard

Source
Expand description

Orchard — a Rust client for high-performance LLM inference on Apple Silicon.

Re-exports

pub use error::Error;
pub use error::Result;
pub use ipc::client::EventCallback;
pub use ipc::client::IPCClient;
pub use ipc::client::ResponseDelta;
pub use ipc::client::TokenLogProb;
pub use ipc::endpoints;
pub use ipc::serialization::build_batch_request_payload;
pub use ipc::serialization::CapabilityEntry;
pub use ipc::serialization::LayoutEntry;
pub use ipc::serialization::PromptPayload;
pub use ipc::serialization::RequestType;
pub use ipc::serialization::SegmentType;
pub use engine::fetch::EngineFetcher;
pub use engine::lifecycle::EnginePaths;
pub use engine::lifecycle::InferenceEngine;
pub use engine::multiprocess;
pub use model::registry::ModelEntry;
pub use model::registry::ModelInfo;
pub use model::registry::ModelLoadState;
pub use model::registry::ModelRegistry;
pub use model::resolver::ModelResolver;
pub use model::resolver::ResolvedModel;
pub use formatter::control_tokens::ControlTokens;
pub use formatter::control_tokens::Role;
pub use formatter::control_tokens::RoleTags;
pub use formatter::multimodal::build_multimodal_layout;
pub use formatter::multimodal::build_multimodal_messages;
pub use formatter::multimodal::CapabilityInput;
pub use formatter::multimodal::ContentType;
pub use formatter::multimodal::LayoutSegment;
pub use formatter::ChatFormatter;
pub use client::BatchChatResult;
pub use client::ChatResult;
pub use client::Client;
pub use client::ClientDelta;
pub use client::ClientResponse;
pub use client::ContentPartAddedEvent;
pub use client::ContentPartDoneEvent;
pub use client::FunctionCallArgumentsDeltaEvent;
pub use client::FunctionCallArgumentsDoneEvent;
pub use client::IncompleteDetails;
pub use client::InputTokensDetails;
pub use client::OutputFunctionCall;
pub use client::OutputItemAddedEvent;
pub use client::OutputItemDoneEvent;
pub use client::OutputMessage;
pub use client::OutputReasoning;
pub use client::OutputStatus;
pub use client::OutputTextContent;
pub use client::OutputTextDeltaEvent;
pub use client::OutputTextDoneEvent;
pub use client::OutputTokensDetails;
pub use client::ReasoningContent;
pub use client::ReasoningDeltaEvent;
pub use client::ReasoningDoneEvent;
pub use client::ReasoningSummaryTextContent;
pub use client::ReasoningSummaryTextDeltaEvent;
pub use client::ReasoningSummaryTextDoneEvent;
pub use client::ResponseCompletedEvent;
pub use client::ResponseCreatedEvent;
pub use client::ResponseError;
pub use client::ResponseEvent;
pub use client::ResponseFailedEvent;
pub use client::ResponseInProgressEvent;
pub use client::ResponseIncompleteEvent;
pub use client::ResponseInputItem;
pub use client::ResponseObject;
pub use client::ResponseOutputItem;
pub use client::ResponseSnapshot;
pub use client::ResponseUsage;
pub use client::ResponsesInput;
pub use client::ResponsesRequest;
pub use client::ResponsesResult;
pub use client::SamplingParams;
pub use client::StreamErrorDetail;
pub use client::StreamErrorEvent;
pub use client::UsageStats;

Modules

client
High-level client API for Orchard.
engine
Engine management for PIE (Proxy Inference Engine).
error
Unified error type for Orchard.
formatter
Chat formatting for LLM prompts.
ipc
IPC communication with PIE (Proxy Inference Engine).
model
Model management for Orchard.

Constants

VERSION
Library version