#define TORCH_ASSERT_NO_OPERATORS #define _USE_MATH_DEFINES #include #include #include #include #include #include #include #include #include #include #include namespace at::native { namespace { template void threshold_kernel_impl( TensorIteratorBase& iter, scalar_t threshold, scalar_t value) { gpu_kernel_with_scalars( iter, [=] GPU_LAMBDA(scalar_t x, scalar_t other) -> scalar_t { return x <= threshold ? value : other; }); } static void threshold_kernel_cuda( TensorIteratorBase& iter, const Scalar& threshold, const Scalar& value) { AT_DISPATCH_ALL_TYPES_AND2( at::ScalarType::Half, at::ScalarType::BFloat16, iter.dtype(), "threshold_cuda", [&] { threshold_kernel_impl( iter, threshold.to(), value.to()); }); } } // namespace REGISTER_DISPATCH(threshold_stub, &threshold_kernel_cuda) } // namespace at::native