#define TORCH_ASSERT_NO_OPERATORS #define _USE_MATH_DEFINES #include #include #include #include #include #include #include #include #include #include #include namespace at::native { namespace { void leaky_relu_kernel(TensorIteratorBase& iter, const Scalar& negval_) { AT_DISPATCH_FLOATING_TYPES_AND2( at::ScalarType::Half, at::ScalarType::BFloat16, iter.dtype(), "leaky_relu_cuda", [&]() { using opmath_t = at::opmath_type; auto negval = negval_.to(); gpu_kernel(iter, [negval] GPU_LAMBDA(scalar_t a) -> scalar_t { opmath_t aop = static_cast(a); return aop > opmath_t(0) ? aop : aop * negval; }); }); } void leaky_relu_backward_kernel( TensorIteratorBase& iter, const Scalar& negval_) { AT_DISPATCH_FLOATING_TYPES_AND2( at::ScalarType::Half, at::ScalarType::BFloat16, iter.dtype(), "leaky_relu_backward_cuda", [&]() { using opmath_t = at::opmath_type; auto negval = negval_.to(); gpu_kernel( iter, [negval] GPU_LAMBDA(scalar_t a, scalar_t b) -> scalar_t { opmath_t aop = static_cast(a); opmath_t bop = static_cast(b); return aop > opmath_t(0) ? bop : bop * negval; }); }); } } // namespace REGISTER_DISPATCH(leaky_relu_stub, &leaky_relu_kernel) REGISTER_DISPATCH(leaky_relu_backward_stub, &leaky_relu_backward_kernel) } // namespace at::native