#pragma once #include #include #include #include #include #include #include namespace torch::jit::fuser { // Creates a CPU or CUDA kernel for the given graph. // Returns the C++ or CUDA string implementing the kernel. TORCH_API std::string generateKernel( const std::string& name, const Graph& graph, const std::vector>>& inputs, const std::vector>& outputs, const bool use_cuda); } // namespace torch::jit::fuser