MultiGpuCoordinator

Struct MultiGpuCoordinator 

pub struct MultiGpuCoordinator {
    config: MultiGpuConfig,
    devices: RwLock<RawRwLock, Vec<DeviceInfo>>,
    kernel_device_map: RwLock<RawRwLock, HashMap<KernelId, usize>>,
    device_kernel_counts: RwLock<RawRwLock, Vec<AtomicUsize>>,
    round_robin_counter: AtomicUsize,
    total_kernels: AtomicU64,
    custom_selector: RwLock<RawRwLock, Option<Arc<dyn Fn(&[DeviceStatus], &LaunchOptions) -> usize + Send + Sync>>>,
}
Expand description

Multi-GPU coordinator for managing kernels across devices.

Fields§

§config: MultiGpuConfig§devices: RwLock<RawRwLock, Vec<DeviceInfo>>§kernel_device_map: RwLock<RawRwLock, HashMap<KernelId, usize>>§device_kernel_counts: RwLock<RawRwLock, Vec<AtomicUsize>>§round_robin_counter: AtomicUsize§total_kernels: AtomicU64§custom_selector: RwLock<RawRwLock, Option<Arc<dyn Fn(&[DeviceStatus], &LaunchOptions) -> usize + Send + Sync>>>

Implementations§

§

impl MultiGpuCoordinator

pub fn new(config: MultiGpuConfig) -> Arc<MultiGpuCoordinator>

Create a new multi-GPU coordinator.

pub fn register_device(&self, device: DeviceInfo)

Register a device with the coordinator.

pub fn unregister_device(&self, index: usize)

Unregister a device.

pub fn devices(&self) -> Vec<DeviceInfo>

Get all registered devices.

pub fn device(&self, index: usize) -> Option<DeviceInfo>

Get device info by index.

pub fn device_count(&self) -> usize

Get number of devices.

pub fn select_device( &self, options: &LaunchOptions, ) -> Result<usize, RingKernelError>

Select a device for launching a kernel.

pub fn assign_kernel(&self, kernel_id: KernelId, device_index: usize)

Assign a kernel to a device.

pub fn remove_kernel(&self, kernel_id: &KernelId)

Remove a kernel assignment.

pub fn get_kernel_device(&self, kernel_id: &KernelId) -> Option<usize>

Get device for a kernel.

pub fn kernels_on_device(&self, device_index: usize) -> Vec<KernelId>

Get all kernels on a device.

pub fn get_all_status(&self) -> Vec<DeviceStatus>

Get status of all devices.

pub fn get_device_status(&self, device_index: usize) -> Option<DeviceStatus>

Get status of a specific device.

pub fn set_custom_selector<F>(&self, selector: F)
where F: Fn(&[DeviceStatus], &LaunchOptions) -> usize + Send + Sync + 'static,

Set custom device selector.

pub fn stats(&self) -> MultiGpuStats

Get coordinator statistics.

pub fn can_p2p(&self, device_a: usize, device_b: usize) -> bool

Check if P2P is available between two devices.

pub fn update_device_memory(&self, device_index: usize, available_memory: u64)

Update device memory info.

Auto Trait Implementations§

Blanket Implementations§

§

impl<T> Any for T
where T: 'static + ?Sized,

§

fn type_id(&self) -> TypeId

Gets the TypeId of self. Read more
§

impl<T> ArchivePointee for T

§

type ArchivedMetadata = ()

The archived version of the pointer metadata for this type.
§

fn pointer_metadata( _: &<T as ArchivePointee>::ArchivedMetadata, ) -> <T as Pointee>::Metadata

Converts some archived metadata to the pointer metadata for itself.
§

impl<T> Borrow<T> for T
where T: ?Sized,

§

fn borrow(&self) -> &T

Immutably borrows from an owned value. Read more
§

impl<T> BorrowMut<T> for T
where T: ?Sized,

§

fn borrow_mut(&mut self) -> &mut T

Mutably borrows from an owned value. Read more
§

impl<F, W, T, D> Deserialize<With<T, W>, D> for F
where W: DeserializeWith<F, T, D>, D: Fallible + ?Sized, F: ?Sized,

§

fn deserialize( &self, deserializer: &mut D, ) -> Result<With<T, W>, <D as Fallible>::Error>

Deserializes using the given deserializer
§

impl<T> From<T> for T

§

fn from(t: T) -> T

Returns the argument unchanged.

§

impl<T> Instrument for T

§

fn instrument(self, span: Span) -> Instrumented<Self>

Instruments this type with the provided [Span], returning an Instrumented wrapper. Read more
§

fn in_current_span(self) -> Instrumented<Self>

Instruments this type with the current Span, returning an Instrumented wrapper. Read more
§

impl<T, U> Into<U> for T
where U: From<T>,

§

fn into(self) -> U

Calls U::from(self).

That is, this conversion is whatever the implementation of From<T> for U chooses to do.

§

impl<T> LayoutRaw for T

§

fn layout_raw(_: <T as Pointee>::Metadata) -> Result<Layout, LayoutError>

Gets the layout of the type.
§

impl<T> Pointee for T

§

type Metadata = ()

The type for metadata in pointers and references to Self.
§

impl<T, U> TryFrom<U> for T
where U: Into<T>,

§

type Error = Infallible

The type returned in the event of a conversion error.
§

fn try_from(value: U) -> Result<T, <T as TryFrom<U>>::Error>

Performs the conversion.
§

impl<T, U> TryInto<U> for T
where U: TryFrom<T>,

§

type Error = <U as TryFrom<T>>::Error

The type returned in the event of a conversion error.
§

fn try_into(self) -> Result<U, <U as TryFrom<T>>::Error>

Performs the conversion.
§

impl<V, T> VZip<V> for T
where V: MultiLane<T>,

§

fn vzip(self) -> V

§

impl<T> WithSubscriber for T

§

fn with_subscriber<S>(self, subscriber: S) -> WithDispatch<Self>
where S: Into<Dispatch>,

Attaches the provided Subscriber to this type, returning a [WithDispatch] wrapper. Read more
§

fn with_current_subscriber(self) -> WithDispatch<Self>

Attaches the current default Subscriber to this type, returning a [WithDispatch] wrapper. Read more