#define TORCH_ASSERT_NO_OPERATORS #define _USE_MATH_DEFINES #include #include #include #include #include #include #include #include #include #include #include namespace at::native { namespace { void hardtanh_backward_kernel( TensorIterator& iter, const Scalar& min, const Scalar& max) { AT_DISPATCH_FLOATING_TYPES_AND2( at::ScalarType::Half, at::ScalarType::BFloat16, iter.dtype(), "hardtanh_backward_cuda", [&]() { using opmath_t = at::opmath_type; auto min_val = min.to(); auto max_val = max.to(); gpu_kernel( iter, [min_val, max_val] GPU_LAMBDA(scalar_t a, scalar_t b) -> scalar_t { opmath_t aop = static_cast(a); opmath_t bop = static_cast(b); return (bop <= min_val) || (bop >= max_val) ? opmath_t(0) : aop; }); }); } } // namespace REGISTER_DISPATCH(hardtanh_backward_stub, &hardtanh_backward_kernel) } // namespace at::native