#pragma once
#include <cuda.h>
#include <cuda_runtime.h>
#include <cuda_fp16.h>
#include <c10/macros/Export.h>
// Use TORCH_CUDA_CPP_API or TORCH_CUDA_CU_API (from c10/macros/Export.h) to
// export symbols declared in this folder.