Template Function at::symint::_flash_attention_forward(const at::Tensor&, const at::Tensor&, const at::Tensor&, const ::std::optional<at::Tensor>&, const ::std::optional<at::Tensor>&, c10::SymInt, c10::SymInt, double, bool, bool, ::std::optional<double>, ::std::optional<c10::SymInt>, ::std::optional<c10::SymInt>, const ::std::optional<at::Tensor>&, const ::std::optional<at::Tensor>&)
Defined in File Functions.h
Function Documentation
-
template<typename T, typename = std::enable_if_t<std::is_same_v<T, c10::SymInt>>>
::std::tuple<at::Tensor, at::Tensor, at::Tensor, at::Tensor, at::Tensor> at::symint::_flash_attention_forward(const at::Tensor &query, const at::Tensor &key, const at::Tensor &value, const ::std::optional<at::Tensor> &cum_seq_q, const ::std::optional<at::Tensor> &cum_seq_k, c10::SymInt max_q, c10::SymInt max_k, double dropout_p, bool is_causal, bool return_debug_mask, ::std::optional<double> scale = ::std::nullopt, ::std::optional<c10::SymInt> window_size_left = ::std::nullopt, ::std::optional<c10::SymInt> window_size_right = ::std::nullopt, const ::std::optional<at::Tensor> &seqused_k = {}, const ::std::optional<at::Tensor> &alibi_slopes = {})