Struct GpuSpec

Source

/// GPU resource specification.
///
/// Supported vendors are `nvidia` (default), `amd`, `intel` and `apple`;
/// unknown vendors fall back to DRI render node passthrough.
pub struct GpuSpec {
    /// Number of GPUs to request.
    pub count: u32,
    /// GPU vendor (`nvidia`, `amd`, `intel`, `apple`); defaults to `nvidia`.
    pub vendor: String,
    /// GPU access mode (macOS only): `"native"`, `"vm"`, or `None` for
    /// auto-select. Ignored on Linux.
    pub mode: Option<String>,
    /// Pin to a specific GPU model (e.g. "A100", "H100"); substring match
    /// against detected GPU model names.
    pub model: Option<String>,
    /// Scheduling policy for GPU workloads: best-effort (default), gang, or
    /// spread.
    pub scheduling: Option<SchedulingPolicy>,
    /// Distributed GPU job coordination. When set, injects `MASTER_ADDR`,
    /// `WORLD_SIZE`, `RANK` and `LOCAL_RANK` env vars.
    pub distributed: Option<DistributedConfig>,
    /// GPU sharing mode: exclusive (default), mps, or time-slice.
    pub sharing: Option<GpuSharingMode>,
    /// Host directory for the NVIDIA MPS control pipe. Only consulted when
    /// `sharing == Mps`; defaults to `/tmp/nvidia-mps` when unset.
    pub mps_pipe_dir: Option<String>,
    /// Host directory for NVIDIA MPS log output. Only consulted when
    /// `sharing == Mps`; defaults to `/tmp/nvidia-log` when unset.
    pub mps_log_dir: Option<String>,
    /// CUDA device index this replica should see when `sharing == TimeSlice`;
    /// emitted via `CUDA_VISIBLE_DEVICES`.
    pub time_slice_index: Option<u32>,
    /// Optional host path to an NVIDIA time-slicing config YAML. When set, it
    /// is bind-mounted read-only at `/etc/nvidia/gpu-time-slicing.yaml`
    /// inside the container; the file is informational only.
    pub time_slicing_config_path: Option<String>,
}

Expand description

GPU resource specification

Supported vendors:

nvidia - NVIDIA GPUs via NVIDIA Container Toolkit (default)
amd - AMD GPUs via ROCm (/dev/kfd + /dev/dri/renderD*)
intel - Intel GPUs via VAAPI/i915 (/dev/dri/renderD*)
apple - Apple Silicon GPUs via Metal/MPS (macOS only)

Unknown vendors fall back to DRI render node passthrough.

§GPU mode (macOS only)

When vendor is "apple", the mode field controls how GPU access is provided:

"native" – Seatbelt sandbox with direct Metal/MPS access (lowest overhead)
"vm" – libkrun micro-VM with GPU forwarding (stronger isolation)
None (default) – Auto-select based on platform and vendor

On Linux, mode is ignored; GPU passthrough always uses device node binding.

Fields§

§count: u32

Number of GPUs to request

§vendor: String

GPU vendor (nvidia, amd, intel, apple) - defaults to nvidia

§mode: Option<String>

GPU access mode (macOS only): "native", "vm", or None for auto-select

§model: Option<String>

Pin to a specific GPU model (e.g. “A100”, “H100”). Substring match against detected GPU model names.

§scheduling: Option<SchedulingPolicy>

Scheduling policy for GPU workloads.

best-effort (default): place what fits
gang: all-or-nothing for distributed jobs
spread: distribute across nodes

§distributed: Option<DistributedConfig>

Distributed GPU job coordination. When set, injects MASTER_ADDR, WORLD_SIZE, RANK, LOCAL_RANK env vars.

§sharing: Option<GpuSharingMode>

GPU sharing mode: exclusive (default), mps, or time-slice.

§mps_pipe_dir: Option<String>

Host directory for the NVIDIA MPS control pipe.

Only consulted when sharing == Mps. Defaults to /tmp/nvidia-mps when unset. The directory MUST exist on the host (created by the nvidia-cuda-mps-control daemon). It is bind-mounted into the container at the same path and exported as CUDA_MPS_PIPE_DIRECTORY.

§mps_log_dir: Option<String>

Host directory for NVIDIA MPS log output.

Only consulted when sharing == Mps. Defaults to /tmp/nvidia-log when unset. The directory MUST exist on the host. It is bind-mounted into the container and exported as CUDA_MPS_LOG_DIRECTORY.

§time_slice_index: Option<u32>

CUDA device index this replica should see when sharing == TimeSlice.

Emitted as CUDA_VISIBLE_DEVICES=<slice_index>, overriding the default 0..count visibility list. Use this together with a host-side NVIDIA time-slicing config to advertise a single physical GPU as multiple virtual slices.

§time_slicing_config_path: Option<String>

Optional host path to an NVIDIA time-slicing config YAML.

When set, the file is bind-mounted read-only at /etc/nvidia/gpu-time-slicing.yaml inside the container so tools that inspect the slicing topology (e.g. monitoring sidecars) can read it. The file is not interpreted by ZLayer — it’s purely informational for the workload.

Struct GpuSpec Copy item path

§GPU mode (macOS only)

Fields§

Trait Implementations§

impl Clone for GpuSpec

fn clone(&self) -> GpuSpec

fn clone_from(&mut self, source: &Self)

impl Debug for GpuSpec

fn fmt(&self, f: &mut Formatter<'_>) -> Result

impl<'de> Deserialize<'de> for GpuSpec

fn deserialize<__D>(__deserializer: __D) -> Result<Self, __D::Error> where __D: Deserializer<'de>,

impl Eq for GpuSpec

impl PartialEq for GpuSpec

fn eq(&self, other: &GpuSpec) -> bool

fn ne(&self, other: &Rhs) -> bool

impl Serialize for GpuSpec

fn serialize<__S>(&self, __serializer: __S) -> Result<__S::Ok, __S::Error> where __S: Serializer,

impl StructuralPartialEq for GpuSpec

impl Validate for GpuSpec

fn validate(&self) -> Result<(), ValidationErrors>

impl<'v_a> ValidateArgs<'v_a> for GpuSpec

type Args = ()

fn validate_with_args(&self, args: Self::Args) -> Result<(), ValidationErrors>

Auto Trait Implementations§

impl Freeze for GpuSpec

impl RefUnwindSafe for GpuSpec

impl Send for GpuSpec

impl Sync for GpuSpec

impl Unpin for GpuSpec

impl UnsafeUnpin for GpuSpec

impl UnwindSafe for GpuSpec

Blanket Implementations§

impl<T> Any for T where T: 'static + ?Sized,

fn type_id(&self) -> TypeId

impl<T> Borrow<T> for T where T: ?Sized,

fn borrow(&self) -> &T

impl<T> BorrowMut<T> for T where T: ?Sized,

fn borrow_mut(&mut self) -> &mut T

impl<T> CloneToUninit for T where T: Clone,

unsafe fn clone_to_uninit(&self, dest: *mut u8)

impl<T> DeserializeOwned for T where T: for<'de> Deserialize<'de>,

impl<Q, K> Equivalent<K> for Q where Q: Eq + ?Sized, K: Borrow<Q> + ?Sized,

fn equivalent(&self, key: &K) -> bool

impl<Q, K> Equivalent<K> for Q where Q: Eq + ?Sized, K: Borrow<Q> + ?Sized,

fn equivalent(&self, key: &K) -> bool

impl<T> From<T> for T

fn from(t: T) -> T

impl<T> FromBase64 for T where T: for<'de> Deserialize<'de>,

fn from_base64<Input>(raw: &Input) -> Result<T, Error> where Input: AsRef<[u8]> + ?Sized,

impl<T> Instrument for T

fn instrument(self, span: Span) -> Instrumented<Self>

fn in_current_span(self) -> Instrumented<Self>

impl<T, U> Into<U> for T where U: From<T>,

fn into(self) -> U

impl<T> PolicyExt for T where T: ?Sized,

fn and<P, B, E>(self, other: P) -> And<T, P> where T: Sized + Policy<B, E>, P: Policy<B, E>,

fn or<P, B, E>(self, other: P) -> Or<T, P> where T: Sized + Policy<B, E>, P: Policy<B, E>,

impl<T> Same for T

type Output = T

impl<C> SignWithKey<String> for C where C: ToBase64,

fn sign_with_key(self, key: &impl SigningAlgorithm) -> Result<String, Error>

impl<T> ToBase64 for T where T: Serialize,

fn to_base64(&self) -> Result<Cow<'_, str>, Error>

impl<T> ToOwned for T where T: Clone,

type Owned = T

fn to_owned(&self) -> T

fn clone_into(&self, target: &mut T)

impl<T, U> TryFrom<U> for T where U: Into<T>,

type Error = Infallible

fn try_from(value: U) -> Result<T, <T as TryFrom<U>>::Error>

impl<T, U> TryInto<U> for T where U: TryFrom<T>,

type Error = <U as TryFrom<T>>::Error

fn try_into(self) -> Result<U, <U as TryFrom<T>>::Error>

impl<T> WithSubscriber for T

fn with_subscriber<S>(self, subscriber: S) -> WithDispatch<Self> where S: Into<Dispatch>,

fn with_current_subscriber(self) -> WithDispatch<Self>

Struct GpuSpec

fn deserialize<D>(deserializer: D) -> Result<Self, D::Error>
where D: Deserializer<'de>,

fn serialize<S>(&self, serializer: S) -> Result<S::Ok, S::Error>
where S: Serializer,

impl<T> Any for T
where T: 'static + ?Sized,

impl<T> Borrow<T> for T
where T: ?Sized,

impl<T> BorrowMut<T> for T
where T: ?Sized,

impl<T> CloneToUninit for T
where T: Clone,

impl<T> DeserializeOwned for T
where T: for<'de> Deserialize<'de>,

impl<Q, K> Equivalent<K> for Q
where Q: Eq + ?Sized, K: Borrow<Q> + ?Sized,

impl<Q, K> Equivalent<K> for Q
where Q: Eq + ?Sized, K: Borrow<Q> + ?Sized,

impl<T> FromBase64 for T
where T: for<'de> Deserialize<'de>,

fn from_base64<Input>(raw: &Input) -> Result<T, Error>
where Input: AsRef<[u8]> + ?Sized,

impl<T, U> Into<U> for T
where U: From<T>,

impl<T> PolicyExt for T
where T: ?Sized,

fn and<P, B, E>(self, other: P) -> And<T, P>
where T: Sized + Policy<B, E>, P: Policy<B, E>,

fn or<P, B, E>(self, other: P) -> Or<T, P>
where T: Sized + Policy<B, E>, P: Policy<B, E>,

impl<C> SignWithKey<String> for C
where C: ToBase64,

impl<T> ToBase64 for T
where T: Serialize,

impl<T> ToOwned for T
where T: Clone,

impl<T, U> TryFrom<U> for T
where U: Into<T>,

impl<T, U> TryInto<U> for T
where U: TryFrom<T>,

fn with_subscriber<S>(self, subscriber: S) -> WithDispatch<Self>
where S: Into<Dispatch>,