_native_decoder_only_multi_head_attention_cuda_dispatch.h source code [pytorch/build/aten/src/ATen/ops/_native_decoder_only_multi_head_attention_cuda_dispatch.h]

1	#pragma once
2	// @generated by torchgen/gen.py from DispatchKeyFunction.h
3
4	// NB: The implementing C++ file is RegisterDispatchKey.cpp
5
6	// The only #includes we need are for custom classes that have defaults in the C++ API
7	#include <c10/core/MemoryFormat.h>
8	#include <c10/core/Scalar.h>
9	#include <ATen/core/Reduction.h>
10
11	// Forward declarations of any types needed in the operator signatures.
12	// We can't directly include these classes because it will cause circular include dependencies.
13	// This file is included by TensorBody.h, which defines the Tensor class.
14	#include <ATen/core/ATen_fwd.h>
15
16	namespace at {
17
18	namespace cuda {
19
20	TORCH_API ::std::tuple<at::Tensor,at::Tensor,at::Tensor,at::Tensor> _native_decoder_only_multi_head_attention(const at::Tensor & query, const at::Tensor & key, const at::Tensor & value, int64_t embed_dim, int64_t num_head, const at::Tensor & qkv_weight, const at::Tensor & qkv_bias, const at::Tensor & proj_weight, const at::Tensor & proj_bias, const c10::optional<at::Tensor> & mask={}, const c10::optional<at::Tensor> & incr_key={}, const c10::optional<at::Tensor> & incr_value={}, bool need_weights=true, bool average_attn_weights=true);
21
22	} // namespace cuda
23	} // namespace at
24

Browse the source code of pytorch/build/aten/src/ATen/ops/_native_decoder_only_multi_head_attention_cuda_dispatch.h