Spaces:

ziqima
/

Find3D

Running

App Files Files Community

Find3D / Pointcept /libs /pointops2 /src /attention /attention_cuda_kernel.h

ziqima

initial commit

4893ce0 about 1 year ago

raw

history blame

1.79 kB

	#ifndef _ATTENTION_CUDA_KERNEL
	#define _ATTENTION_CUDA_KERNEL
	#include <vector>
	#include <torch/serialize/tensor.h>
	#include <ATen/cuda/CUDAContext.h>

	// Tensor-level entry point for the forward pass of attention "step 1".
	//
	// Receives four integer size arguments (N, M, h, C), the q and k tensors,
	// two index tensors and the attn tensor.
	// NOTE(review): presumably attn_tensor is the output and index0/index1
	// pair rows of q with rows of k -- the definition is not in this header,
	// confirm against the implementation file.
	// NOTE(review): the exact meaning of N, M, h and C (likely element/pair
	// counts, head count and channel count) is not established here -- confirm.
	void attention_step1_forward_cuda(
	    int N, int M, int h, int C,
	    at::Tensor q_tensor,
	    at::Tensor k_tensor,
	    at::Tensor index0_tensor,
	    at::Tensor index1_tensor,
	    at::Tensor attn_tensor);
	// Tensor-level entry point for the backward pass of attention "step 1".
	//
	// Receives four integer size arguments (N, M, h, C), the incoming gradient
	// tensor, the two index tensors, the q and k tensors, and two gradient
	// tensors named after q and k.
	// NOTE(review): presumably grad_q_tensor and grad_k_tensor are the outputs
	// that receive the gradients w.r.t. q and k -- the definition is not in
	// this header, confirm against the implementation file.
	void attention_step1_backward_cuda(
	    int N, int M, int h, int C,
	    at::Tensor grad_out_tensor,
	    at::Tensor index0_tensor,
	    at::Tensor index1_tensor,
	    at::Tensor q_tensor,
	    at::Tensor k_tensor,
	    at::Tensor grad_q_tensor,
	    at::Tensor grad_k_tensor);

	// Tensor-level entry point for the forward pass of attention "step 2".
	//
	// Receives four integer size arguments (N, M, h, C), the attn and v
	// tensors, two index tensors and the output tensor.
	// NOTE(review): presumably output_tensor receives the attn-weighted
	// combination of v selected through index0/index1 -- the definition is not
	// in this header, confirm against the implementation file.
	void attention_step2_forward_cuda(
	    int N, int M, int h, int C,
	    at::Tensor attn_tensor,
	    at::Tensor v_tensor,
	    at::Tensor index0_tensor,
	    at::Tensor index1_tensor,
	    at::Tensor output_tensor);
	// Tensor-level entry point for the backward pass of attention "step 2".
	//
	// Receives four integer size arguments (N, M, h, C), the incoming gradient
	// tensor, the two index tensors, the attn and v tensors, and two gradient
	// tensors named after attn and v.
	// NOTE(review): presumably grad_attn_tensor and grad_v_tensor are the
	// outputs that receive the gradients w.r.t. attn and v -- the definition
	// is not in this header, confirm against the implementation file.
	void attention_step2_backward_cuda(
	    int N, int M, int h, int C,
	    at::Tensor grad_out_tensor,
	    at::Tensor index0_tensor,
	    at::Tensor index1_tensor,
	    at::Tensor attn_tensor,
	    at::Tensor v_tensor,
	    at::Tensor grad_attn_tensor,
	    at::Tensor grad_v_tensor);

	#ifdef __cplusplus
	extern "C" {
	#endif

	// Raw-pointer launcher declarations, given C linkage so the names are not
	// mangled between translation units.
	//
	// Every array argument is a pointer: read-only inputs are pointer-to-const,
	// and the buffers a launcher fills in (attn, grad_q, grad_k, output,
	// grad_attn, grad_v) are pointer-to-mutable. Passing these as by-value
	// scalars could neither carry a tensor's data nor return a result.
	// NOTE(review): presumably these are device pointers taken from the
	// tensors handed to the corresponding *_cuda wrappers -- confirm at the
	// call sites and in the .cu definitions.
	// NOTE(review): the meaning of N, M, h and C is not established in this
	// header -- confirm against the kernels.

	// Step 1, forward: inputs q, k, index0, index1; result buffer attn.
	void attention_step1_forward_cuda_launcher(
	    int N, int M, int h, int C,
	    const float *q,
	    const float *k,
	    const int *index0,
	    const int *index1,
	    float *attn);

	// Step 1, backward: inputs grad_out, index0, index1, q, k; result buffers
	// grad_q and grad_k.
	void attention_step1_backward_cuda_launcher(
	    int N, int M, int h, int C,
	    const float *grad_out,
	    const int *index0,
	    const int *index1,
	    const float *q,
	    const float *k,
	    float *grad_q,
	    float *grad_k);

	// Step 2, forward: inputs attn, v, index0, index1; result buffer output.
	void attention_step2_forward_cuda_launcher(
	    int N, int M, int h, int C,
	    const float *attn,
	    const float *v,
	    const int *index0,
	    const int *index1,
	    float *output);

	// Step 2, backward: inputs grad_out, index0, index1, attn, v; result
	// buffers grad_attn and grad_v.
	void attention_step2_backward_cuda_launcher(
	    int N, int M, int h, int C,
	    const float *grad_out,
	    const int *index0,
	    const int *index1,
	    const float *attn,
	    const float *v,
	    float *grad_attn,
	    float *grad_v);

	#ifdef __cplusplus
	}
	#endif
	#endif