#pragma once #include void __KERNEL_NAME_NORMALIZED__(torch::Tensor &out, torch::Tensor const &input);