Struct MultiHeadAttention

Source

pub struct MultiHeadAttention {
    pub num_heads: i32,
    pub query_proj: MaybeQuantized<Linear>,
    pub key_proj: MaybeQuantized<Linear>,
    pub value_proj: MaybeQuantized<Linear>,
    pub output_proj: MaybeQuantized<Linear>,
}

Expand description

Implements the scaled dot product attention with multiple heads.

Fields§

§num_heads: i32

Number of attention heads

§query_proj: MaybeQuantized<Linear>

Query projection layer

§key_proj: MaybeQuantized<Linear>

Key projection layer

§value_proj: MaybeQuantized<Linear>

Value projection layer

§output_proj: MaybeQuantized<Linear>

Output projection layer

Implementations§

Source §

impl MultiHeadAttention

Source

pub fn new( dims: impl Into<i32>, num_heads: impl Into<i32>, ) -> Result<Self, <<Self as Buildable>::Builder as Builder<Self>>::Error>

Creates a new instance of MultiHeadAttention.

Source §

impl MultiHeadAttention

Source

pub const DEFAULT_BIAS: bool = false

Default value for the bias field

Source

pub fn create_additive_causal_mask<T>(n: i32) -> Result<Array, Exception>
where T: ArrayElement + LowerBounded, Array: FromScalar<T>,

Creates an attention mask for use with MultiHeadAttention.

Trait Implementations§

Source §

impl Buildable for MultiHeadAttention

Source §

type Builder = MultiHeadAttentionBuilder

The builder type for this buildable type

Source §

impl Builder<MultiHeadAttention> for MultiHeadAttentionBuilder

Source §

type Error = MultiHeadAttentionBuildError

Error type returned when building fails

Source §

fn build(self) -> Result<MultiHeadAttention, Self::Error>

Build the type

Source §

impl Clone for MultiHeadAttention

Source §

fn clone(&self) -> MultiHeadAttention

Returns a duplicate of the value. Read more

1.0.0 · Source§

fn clone_from(&mut self, source: &Self)

Performs copy-assignment from source. Read more

Source §

impl Debug for MultiHeadAttention

Source §

fn fmt(&self, f: &mut Formatter<'_>) -> Result

Formats the value using the given formatter. Read more

Source §

impl<'a, Input> Module<Input> for MultiHeadAttention
where Input: Into<MultiHeadAttentionInput<'a>>,

Source §

type Error = Exception

Error type for the module.

Source §

type Output = Array

Output type of the module.

Source §

fn forward(&mut self, input: Input) -> Result<Self::Output, Self::Error>

Forward pass of the module.

Source §

fn training_mode(&mut self, mode: bool)

Set whether the module is in training mode. Read more

Source §

impl ModuleParameters for MultiHeadAttention

Source §

fn num_parameters(&self) -> usize

Get the total number of parameters in the module. Read more

Source §

fn freeze_parameters(&mut self, recursive: bool)

Freeze all parameters in the module.

Source §

fn unfreeze_parameters(&mut self, recursive: bool)

Unfreeze all parameters in the module.

Source §

fn parameters(&self) -> ModuleParamRef<'_>

Get references to the module parameters.

Source §

fn parameters_mut(&mut self) -> ModuleParamMut<'_>

Get mutable references to the module parameters.

Source §

fn trainable_parameters(&self) -> ModuleParamRef<'_>

Get references to the trainable parameters. A parameter is trainable if it is NOT frozen.

Source §

fn all_frozen(&self) -> Option<bool>

Check if all parameters in the module are frozen. Returns None if there are no parameters.

Source §

fn any_frozen(&self) -> Option<bool>

Check if any parameter in the module is frozen. Returns None if there are no parameters.

Source §

fn update(&mut self, parameters: ModuleParam)

Update the module parameters.

Source §

fn update_flattened(&mut self, flattened_parameters: FlattenedModuleParam)

Update the module parameters from a flattened representation.

Source §

impl Quantizable for MultiHeadAttention

Source §

type Quantized = MultiHeadAttention

The quantized type.

Source §

type QuantizationError = Exception

The error type for quantization.

Source §

fn try_into_quantized( self, group_size: i32, bits: i32, ) -> Result<Self::Quantized, Self::QuantizationError>

Quantize the module with the specified group size and number of bits.

Source §

const DEFAULT_GROUP_SIZE: i32 = 64i32

The default group size for quantization.

Source §

const DEFAULT_BITS: i32 = 4i32

The default number of bits for quantization.

Auto Trait Implementations§

§

impl UnwindSafe for MultiHeadAttention

Blanket Implementations§

Source §

impl<T> Any for T
where T: 'static + ?Sized,

Source §

fn type_id(&self) -> TypeId

Gets the TypeId of self. Read more

Source §

impl<T> Borrow<T> for T
where T: ?Sized,

Source §

fn borrow(&self) -> &T

Immutably borrows from an owned value. Read more

Source §

impl<T> BorrowMut<T> for T
where T: ?Sized,

Source §

fn borrow_mut(&mut self) -> &mut T

Mutably borrows from an owned value. Read more

Source §

impl<T> CloneToUninit for T
where T: Clone,

Source §

unsafe fn clone_to_uninit(&self, dest: *mut u8)

🔬This is a nightly-only experimental API. (clone_to_uninit)

Performs copy-assignment from self to dest. Read more

Source §

impl<T> DynClone for T
where T: Clone,

Source §

fn __clone_box(&self, _: Private) -> *mut ()

Source §

impl<T> From<T> for T

Source §

fn from(t: T) -> T

Returns the argument unchanged.

Source §

impl<T, U> Into<U> for T
where U: From<T>,

Source §

fn into(self) -> U

Calls U::from(self).

That is, this conversion is whatever the implementation of From<T> for U chooses to do.

Source §

impl<T> IntoEither for T

Source §

fn into_either(self, into_left: bool) -> Either<Self, Self>

Converts self into a Left variant of Either<Self, Self> if into_left is true. Converts self into a Right variant of Either<Self, Self> otherwise. Read more

Source §

fn into_either_with<F>(self, into_left: F) -> Either<Self, Self>
where F: FnOnce(&Self) -> bool,

Converts self into a Left variant of Either<Self, Self> if into_left(&self) returns true. Converts self into a Right variant of Either<Self, Self> otherwise. Read more

Source §