Struct numa_gpu::runtime::cuda::CudaUnifiedIterator2

source · [−]

pub struct CudaUnifiedIterator2<'a, R: Copy + DeviceCopy, S: Copy + DeviceCopy> { /* private fields */ }

Expand description

CUDA iterator for two mutable unified memory inputs.

Prefetches data from main memory to device memory at chunk-sized granularity.

Preconditions

All inputs are required to have the same length.

Thread safety

Only one CPU thread is used within the iterator, thus thread-safety only applies to the CUDA kernel. See the fold() documentation for details.

Implementations

source

impl<'a, R: Copy + DeviceCopy, S: Copy + DeviceCopy> CudaUnifiedIterator2<'a, R, S>

source

pub fn fold<F>(&mut self, f: F) -> Result<CudaTransferStrategyMeasurement> where
F: FnMut((LaunchableSlice<'_, R>, LaunchableSlice<'_, S>), &Stream) -> Result<()>,

Apply a GPU function that produces a single, final value.

The function passed to fold() takes two arguments: a data value, and a CUDA stream. In the case of CudaUnifiedIterator2, the data value is specified as a two-tuple of launchable slices. The slices are guaranteed to have the same length.

The function passed to fold() is meant to launch a CUDA kernel function on the given CUDA stream.

In contrast to Rust’s standard library fold() iterator, the state in this iterator is implicit in GPU memory.

Thread safety

Prefetching and kernel execution are asynchronous operations. They are performed on two or more CUDA streams to achieve parallelism, i.e., prefetching and execution overlap.

However, Rust cannot guarantee thread-safety of CUDA kernels. Thus, the user must ensure that the CUDA kernels are safe to execute on multiple CUDA streams, e.g. by using atomic operations when accessing device memory.

Trait Implementations

source

impl<'a, R: Debug + Copy + DeviceCopy, S: Debug + Copy + DeviceCopy> Debug for CudaUnifiedIterator2<'a, R, S>

source

fn fmt(&self, f: &mut Formatter<'_>) -> Result

Formats the value using the given formatter. Read more

Auto Trait Implementations

impl<'a, R, S> RefUnwindSafe for CudaUnifiedIterator2<'a, R, S> where
R: RefUnwindSafe,
S: RefUnwindSafe,

impl<'a, R, S> Send for CudaUnifiedIterator2<'a, R, S>

impl<'a, R, S> !Sync for CudaUnifiedIterator2<'a, R, S>

impl<'a, R, S> Unpin for CudaUnifiedIterator2<'a, R, S>

impl<'a, R, S> !UnwindSafe for CudaUnifiedIterator2<'a, R, S>

Blanket Implementations

source

impl<T> Any for T where
T: 'static + ?Sized,

source

pub fn type_id(&self) -> TypeId

Gets the TypeId of self. Read more

source

impl<T> Borrow<T> for T where
T: ?Sized,

const: unstable · source

pub fn borrow(&self) -> &T

Immutably borrows from an owned value. Read more

source

impl<T> BorrowMut<T> for T where
T: ?Sized,

const: unstable · source

pub fn borrow_mut(&mut self) -> &mut T

Mutably borrows from an owned value. Read more

source

impl<T> From<T> for T

const: unstable · source

pub fn from(t: T) -> T

Returns the argument unchanged.

source

impl<T, U> Into<U> for T where
U: From<T>,

const: unstable · source

pub fn into(self) -> U

Calls U::from(self).

That is, this conversion is whatever the implementation of From<T> for U chooses to do.

impl<T> Pointable for T

pub const ALIGN: usize

The alignment of pointer.

type Init = T

The type for initializers.

pub unsafe fn init(init: <T as Pointable>::Init) -> usize

Initializes a value with the given initializer. Read more

pub unsafe fn deref<'a>(ptr: usize) -> &'a T

Dereferences the given pointer. Read more

pub unsafe fn deref_mut<'a>(ptr: usize) -> &'a mut T

Mutably dereferences the given pointer. Read more

pub unsafe fn drop(ptr: usize)

Drops the object pointed to by the given pointer. Read more

source

impl<T, U> TryFrom<U> for T where
U: Into<T>,

type Error = Infallible

The type returned in the event of a conversion error.

const: unstable · source

pub fn try_from(value: U) -> Result<T, <T as TryFrom<U>>::Error>

Performs the conversion.

source

impl<T, U> TryInto<U> for T where
U: TryFrom<T>,

type Error = <U as TryFrom<T>>::Error

The type returned in the event of a conversion error.

const: unstable · source

pub fn try_into(self) -> Result<U, <U as TryFrom<T>>::Error>

Performs the conversion.

Struct numa_gpu::runtime::cuda::CudaUnifiedIterator2

Preconditions

Thread safety

Implementations

impl<'a, R: Copy + DeviceCopy, S: Copy + DeviceCopy> CudaUnifiedIterator2<'a, R, S>

pub fn fold<F>(&mut self, f: F) -> Result<CudaTransferStrategyMeasurement> where
F: FnMut((LaunchableSlice<'_, R>, LaunchableSlice<'_, S>), &Stream) -> Result<()>,

Thread safety

Trait Implementations

impl<'a, R: Debug + Copy + DeviceCopy, S: Debug + Copy + DeviceCopy> Debug for CudaUnifiedIterator2<'a, R, S>

fn fmt(&self, f: &mut Formatter<'_>) -> Result

Auto Trait Implementations

impl<'a, R, S> RefUnwindSafe for CudaUnifiedIterator2<'a, R, S> where
R: RefUnwindSafe,
S: RefUnwindSafe,

impl<'a, R, S> Send for CudaUnifiedIterator2<'a, R, S>

impl<'a, R, S> !Sync for CudaUnifiedIterator2<'a, R, S>

impl<'a, R, S> Unpin for CudaUnifiedIterator2<'a, R, S>

impl<'a, R, S> !UnwindSafe for CudaUnifiedIterator2<'a, R, S>

Blanket Implementations

impl<T> Any for T where
T: 'static + ?Sized,

pub fn type_id(&self) -> TypeId

impl<T> Borrow<T> for T where
T: ?Sized,

pub fn borrow(&self) -> &T

impl<T> BorrowMut<T> for T where
T: ?Sized,

pub fn borrow_mut(&mut self) -> &mut T

impl<T> From<T> for T

pub fn from(t: T) -> T

impl<T, U> Into<U> for T where
U: From<T>,

pub fn into(self) -> U

impl<T> Pointable for T

pub const ALIGN: usize

type Init = T

pub unsafe fn init(init: <T as Pointable>::Init) -> usize

pub unsafe fn deref<'a>(ptr: usize) -> &'a T

pub unsafe fn deref_mut<'a>(ptr: usize) -> &'a mut T

pub unsafe fn drop(ptr: usize)

impl<T, U> TryFrom<U> for T where
U: Into<T>,

type Error = Infallible

pub fn try_from(value: U) -> Result<T, <T as TryFrom<U>>::Error>

impl<T, U> TryInto<U> for T where
U: TryFrom<T>,

type Error = <U as TryFrom<T>>::Error

pub fn try_into(self) -> Result<U, <U as TryFrom<T>>::Error>

Struct numa_gpu::runtime::cuda::CudaUnifiedIterator2

Implementations

impl<'a, R: Copy + DeviceCopy, S: Copy + DeviceCopy> CudaUnifiedIterator2<'a, R, S>

pub fn fold<F>(&mut self, f: F) -> Result<CudaTransferStrategyMeasurement> where F: FnMut((LaunchableSlice<'_, R>, LaunchableSlice<'_, S>), &Stream) -> Result<()>,

Trait Implementations

impl<'a, R: Debug + Copy + DeviceCopy, S: Debug + Copy + DeviceCopy> Debug for CudaUnifiedIterator2<'a, R, S>

fn fmt(&self, f: &mut Formatter<'_>) -> Result

Auto Trait Implementations

impl<'a, R, S> RefUnwindSafe for CudaUnifiedIterator2<'a, R, S> where R: RefUnwindSafe, S: RefUnwindSafe,

impl<'a, R, S> Send for CudaUnifiedIterator2<'a, R, S>

impl<'a, R, S> !Sync for CudaUnifiedIterator2<'a, R, S>

impl<'a, R, S> Unpin for CudaUnifiedIterator2<'a, R, S>

impl<'a, R, S> !UnwindSafe for CudaUnifiedIterator2<'a, R, S>

Blanket Implementations

impl<T> Any for T where T: 'static + ?Sized,

pub fn type_id(&self) -> TypeId

impl<T> Borrow<T> for T where T: ?Sized,

pub fn borrow(&self) -> &T

impl<T> BorrowMut<T> for T where T: ?Sized,

pub fn borrow_mut(&mut self) -> &mut T

impl<T> From<T> for T

pub fn from(t: T) -> T

impl<T, U> Into<U> for T where U: From<T>,

pub fn into(self) -> U

impl<T> Pointable for T

pub const ALIGN: usize

type Init = T

pub unsafe fn init(init: <T as Pointable>::Init) -> usize

pub unsafe fn deref<'a>(ptr: usize) -> &'a T

pub unsafe fn deref_mut<'a>(ptr: usize) -> &'a mut T

pub unsafe fn drop(ptr: usize)

impl<T, U> TryFrom<U> for T where U: Into<T>,

type Error = Infallible

pub fn try_from(value: U) -> Result<T, <T as TryFrom<U>>::Error>

impl<T, U> TryInto<U> for T where U: TryFrom<T>,

type Error = <U as TryFrom<T>>::Error

pub fn try_into(self) -> Result<U, <U as TryFrom<T>>::Error>

pub fn fold<F>(&mut self, f: F) -> Result<CudaTransferStrategyMeasurement> where
F: FnMut((LaunchableSlice<'_, R>, LaunchableSlice<'_, S>), &Stream) -> Result<()>,

impl<'a, R, S> RefUnwindSafe for CudaUnifiedIterator2<'a, R, S> where
R: RefUnwindSafe,
S: RefUnwindSafe,

impl<T> Any for T where
T: 'static + ?Sized,

impl<T> Borrow<T> for T where
T: ?Sized,

impl<T> BorrowMut<T> for T where
T: ?Sized,

impl<T, U> Into<U> for T where
U: From<T>,

impl<T, U> TryFrom<U> for T where
U: Into<T>,

impl<T, U> TryInto<U> for T where
U: TryFrom<T>,