easydel.kernels.gpu_ops.__init__

easydel.kernels.gpu_ops.__init__

easydel.kernels.gpu_ops.__init__.triton_flash_attention(q: Optional[Union[Array, ndarray, bool, number]], k: Optional[Union[Array, ndarray, bool, number]], v: Optional[Union[Array, ndarray, bool, number]], attention_mask: Optional[Union[Array, ndarray, bool, number]] = None, bias: Optional[Union[Array, ndarray, bool, number]] = None, softmax_scale: Optional[float] = None, dropout_prob: float = 0.0, causal: bool = False, dropout_seed: Optional[int] = None, varlen_mode: bool = True) -> Union[Array, ndarray, bool, number]