#define TORCH_ASSERT_NO_OPERATORS #include #include #include #include #include #include namespace at::native { template struct AbsFunctor { __device__ __forceinline__ scalar_t operator() (const scalar_t a) const { return std::abs(a); } }; constexpr char abs_name[] = "abs_kernel"; void abs_kernel_cuda(TensorIteratorBase& iter) { auto dtype = iter.dtype(); if (at::isComplexType(dtype)) { #if AT_USE_JITERATOR() static const auto abs_string = jiterator_stringify( template T abs_kernel(T x) { return std::abs(x); }); AT_DISPATCH_COMPLEX_TYPES_AND(kComplexHalf, dtype, "abs_cuda", [&]() { jitted_gpu_kernel< /*name=*/abs_name, /*return_dtype=*/scalar_t, /*common_dtype=*/scalar_t, /*arity=*/1>(iter, abs_string); }); #else AT_DISPATCH_COMPLEX_TYPES_AND(kComplexHalf, dtype, "abs_cuda", [&]() { using opmath_t = at::opmath_type; gpu_kernel(iter, AbsFunctor()); }); #endif } else { AT_DISPATCH_ALL_TYPES_AND3( ScalarType::Half, ScalarType::BFloat16, ScalarType::Bool, iter.dtype(), "abs_cuda", [&]() { gpu_kernel(iter, AbsFunctor()); }); } } REGISTER_DISPATCH(abs_stub, &abs_kernel_cuda) } // namespace at::native