◆ qkv_ptr
void* bert::Fused_multihead_attention_params::qkv_ptr |
◆ packed_mask_ptr
void* bert::Fused_multihead_attention_params::packed_mask_ptr |
◆ o_ptr
void* bert::Fused_multihead_attention_params::o_ptr |
◆ qkv_stride_in_bytes
int64_t bert::Fused_multihead_attention_params::qkv_stride_in_bytes |
◆ packed_mask_stride_in_bytes
int64_t bert::Fused_multihead_attention_params::packed_mask_stride_in_bytes |
◆ o_stride_in_bytes
int64_t bert::Fused_multihead_attention_params::o_stride_in_bytes |
◆ b
int bert::Fused_multihead_attention_params::b |
◆ h
int bert::Fused_multihead_attention_params::h |
◆ s
int bert::Fused_multihead_attention_params::s |
◆ d
int bert::Fused_multihead_attention_params::d |
◆ scale_bmm1
uint32_t bert::Fused_multihead_attention_params::scale_bmm1 |
◆ scale_softmax
uint32_t bert::Fused_multihead_attention_params::scale_softmax |
◆ scale_bmm2
uint32_t bert::Fused_multihead_attention_params::scale_bmm2 |
◆ enable_i2f_trick
bool bert::Fused_multihead_attention_params::enable_i2f_trick |
The documentation for this struct was generated from the following file:
- fused_multihead_attention.h