Skip to main content

MultiHeadAttnFwdRequest

atomr_accel_cuda::kernel::cudnn::attention

Struct MultiHeadAttnFwdRequest

pub struct MultiHeadAttnFwdRequest<T: CudnnSupported> {
    pub q: GpuRef<T>,
    pub k: GpuRef<T>,
    pub v: GpuRef<T>,
    pub o: GpuRef<T>,
    pub stats: Option<GpuRef<T>>,
    pub bias: Option<GpuRef<T>>,
    pub layout: TensorLayout,
    pub params: AttentionParams,
    pub reply: Sender<Result<(), GpuError>>,
    pub _ty: PhantomData<T>,
}

Expand description

Multi-head attention (MHA) forward request.

Fields§

§q: GpuRef<T>

§k: GpuRef<T>

§v: GpuRef<T>

§o: GpuRef<T>

§stats: Option<GpuRef<T>>

Optional softmax statistics saved for the backward pass.

§bias: Option<GpuRef<T>>

Optional bias added to attention scores.

§layout: TensorLayout

§params: AttentionParams

§reply: Sender<Result<(), GpuError>>

§_ty: PhantomData<T>

Implementations§

impl<T: CudnnSupported> MultiHeadAttnFwdRequest<T>

pub fn graph_spec(&self) -> OperationGraphSpec

Trait Implementations§

impl<T: CudnnSupported> CudnnDispatch for MultiHeadAttnFwdRequest<T>

fn dtype_name(&self) -> &'static str

fn op_kind(&self) -> &'static str

fn dispatch(self: Box<Self>, _ctx: &CudnnDispatchCtx<'_>)

Auto Trait Implementations§

impl<T> Freeze for MultiHeadAttnFwdRequest<T>

impl<T> !RefUnwindSafe for MultiHeadAttnFwdRequest<T>

impl<T> Send for MultiHeadAttnFwdRequest<T>

impl<T> Sync for MultiHeadAttnFwdRequest<T>

impl<T> Unpin for MultiHeadAttnFwdRequest<T>
where T: Unpin,

impl<T> UnsafeUnpin for MultiHeadAttnFwdRequest<T>

impl<T> !UnwindSafe for MultiHeadAttnFwdRequest<T>

Blanket Implementations§

impl<T> Any for T
where T: 'static + ?Sized,

fn type_id(&self) -> TypeId

Gets the TypeId of self. Read more

impl<T> Borrow<T> for T
where T: ?Sized,

fn borrow(&self) -> &T

Immutably borrows from an owned value. Read more

impl<T> BorrowMut<T> for T
where T: ?Sized,

fn borrow_mut(&mut self) -> &mut T

Mutably borrows from an owned value. Read more

impl<T> From<T> for T

fn from(t: T) -> T

Returns the argument unchanged.

impl<T> Instrument for T

fn instrument(self, span: Span) -> Instrumented<Self>

Instruments this type with the provided Span, returning an Instrumented wrapper. Read more

fn in_current_span(self) -> Instrumented<Self>

Instruments this type with the current Span, returning an Instrumented wrapper. Read more

impl<T, U> Into<U> for T
where U: From<T>,

fn into(self) -> U

Calls U::from(self).

That is, this conversion is whatever the implementation of From<T> for U chooses to do.

impl<T, U> TryFrom<U> for T
where U: Into<T>,

type Error = Infallible

The type returned in the event of a conversion error.

fn try_from(value: U) -> Result<T, <T as TryFrom<U>>::Error>

Performs the conversion.

impl<T, U> TryInto<U> for T
where U: TryFrom<T>,

type Error = <U as TryFrom<T>>::Error

The type returned in the event of a conversion error.

fn try_into(self) -> Result<U, <U as TryFrom<T>>::Error>

Performs the conversion.

impl<T> WithSubscriber for T

fn with_subscriber<S>(self, subscriber: S) -> WithDispatch<Self>
where S: Into<Dispatch>,

Attaches the provided Subscriber to this type, returning a WithDispatch wrapper. Read more

fn with_current_subscriber(self) -> WithDispatch<Self>

Attaches the current default Subscriber to this type, returning a WithDispatch wrapper. Read more

impl<T> Extension for T
where T: Any + Send + Sync,