#include <torch/extension.h>

#include <vector>

#include "inplace_abn.h"
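
// Per-channel mean and variance of x, dispatched to the half-precision CUDA,
// regular CUDA, or CPU implementation declared in inplace_abn.h.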
std::vector<at::Tensor> mean_var(at::Tensor x) {
  if (x.is_cuda()) {
    if (x.scalar_type() == at::ScalarType::Half) {
      return mean_var_cuda_h(x);
    } else {
      return mean_var_cuda(x);
    }
  } else {
    return mean_var_cpu(x);
  }
}
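
// In-place forward pass: normalizes x with the given mean/var and, when
// affine is set, applies weight and bias; dispatched by device and dtype.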
at::Tensor forward(at::Tensor x, at::Tensor mean, at::Tensor var, at::Tensor weight, at::Tensor bias,
                   bool affine, float eps) {
  if (x.is_cuda()) {
    if (x.scalar_type() == at::ScalarType::Half) {
      return forward_cuda_h(x, mean, var, weight, bias, affine, eps);
    } else {
      return forward_cuda(x, mean, var, weight, bias, affine, eps);
    }
  } else {
    return forward_cpu(x, mean, var, weight, bias, affine, eps);
  }
}
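
// First part of the backward computation: per-channel reductions edz and eydz
// of the output gradient dz, later consumed by backward().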
std::vector<at::Tensor> edz_eydz(at::Tensor z, at::Tensor dz, at::Tensor weight, at::Tensor bias,
                                 bool affine, float eps) {
  if (z.is_cuda()) {
    if (z.scalar_type() == at::ScalarType::Half) {
      return edz_eydz_cuda_h(z, dz, weight, bias, affine, eps);
    } else {
      return edz_eydz_cuda(z, dz, weight, bias, affine, eps);
    }
  } else {
    return edz_eydz_cpu(z, dz, weight, bias, affine, eps);
  }
}
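
// Second part of the backward computation: combines z, dz, var and the
// edz/eydz reductions into the gradient with respect to the input.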
at::Tensor backward(at::Tensor z, at::Tensor dz, at::Tensor var, at::Tensor weight, at::Tensor bias,
                    at::Tensor edz, at::Tensor eydz, bool affine, float eps) {
  if (z.is_cuda()) {
    if (z.scalar_type() == at::ScalarType::Half) {
      return backward_cuda_h(z, dz, var, weight, bias, edz, eydz, affine, eps);
    } else {
      return backward_cuda(z, dz, var, weight, bias, edz, eydz, affine, eps);
    }
  } else {
    return backward_cpu(z, dz, var, weight, bias, edz, eydz, affine, eps);
  }
}
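
// In-place leaky ReLU on z via ATen; leaky_relu_ handles both CPU and CUDA tensors.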
void leaky_relu_forward(at::Tensor z, float slope) {
  at::leaky_relu_(z, slope);
}
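
// Backward of the in-place leaky ReLU: per the binding below, this both
// computes the gradient and inverts z back to its pre-activation value.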
void leaky_relu_backward(at::Tensor z, at::Tensor dz, float slope) {
  if (z.is_cuda()) {
    if (z.scalar_type() == at::ScalarType::Half) {
      return leaky_relu_backward_cuda_h(z, dz, slope);
    } else {
      return leaky_relu_backward_cuda(z, dz, slope);
    }
  } else {
    return leaky_relu_backward_cpu(z, dz, slope);
  }
}
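
// In-place ELU on z via ATen; elu_ handles both CPU and CUDA tensors.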
void elu_forward(at::Tensor z) {
  at::elu_(z);
}
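
// Backward of the in-place ELU (gradient computation and inversion, per the
// binding below). Unlike the other backward functions, no dedicated
// half-precision CUDA variant is dispatched here.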
void elu_backward(at::Tensor z, at::Tensor dz) {
  if (z.is_cuda()) {
    return elu_backward_cuda(z, dz);
  } else {
    return elu_backward_cpu(z, dz);
  }
}
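
// Expose the dispatch functions above to Python as a Torch extension module.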
PYBIND11_MODULE(TORCH_EXTENSION_NAME, m) {
  m.def("mean_var", &mean_var, "Mean and variance computation");
  m.def("forward", &forward, "In-place forward computation");
  m.def("edz_eydz", &edz_eydz, "First part of backward computation");
  m.def("backward", &backward, "Second part of backward computation");
  m.def("leaky_relu_forward", &leaky_relu_forward, "Leaky relu forward computation");
  m.def("leaky_relu_backward", &leaky_relu_backward, "Leaky relu backward computation and inversion");
  m.def("elu_forward", &elu_forward, "Elu forward computation");
  m.def("elu_backward", &elu_backward, "Elu backward computation and inversion");
}