#define TORCH_ASSERT_NO_OPERATORS #include #include #include #include #include #include #include #include #include #include namespace at::native { #if AT_USE_JITERATOR() constexpr char sin_name[] = "sin_impl"; #endif void sin_kernel_cuda(TensorIteratorBase& iter) { auto common_dtype = iter.common_dtype(); if (at::isComplexType(common_dtype)) { #if AT_USE_JITERATOR() static const auto sin_string = jiterator_stringify( template T sin_impl(T a) { return std::sin(a); }); AT_DISPATCH_COMPLEX_TYPES_AND( kComplexHalf, common_dtype, "sin_name", [&]() { jitted_gpu_kernel< /*name=*/sin_name, /*return_dtype=*/scalar_t, /*common_dtype=*/scalar_t, /*arity=*/1>(iter, sin_string); }); #else AT_DISPATCH_COMPLEX_TYPES_AND( kComplexHalf, common_dtype, "sin_name", [&]() { gpu_kernel(iter, [] GPU_LAMBDA(scalar_t a) -> scalar_t { using opmath_t = at::opmath_type; return ::sin(static_cast(a)); }); }); #endif } else { AT_DISPATCH_FLOATING_TYPES_AND2( ScalarType::Half, ScalarType::BFloat16, common_dtype, "sin_cuda", [&]() { gpu_kernel( iter, [] GPU_LAMBDA(scalar_t a) -> scalar_t { return ::sin(a); }); }); } } REGISTER_DISPATCH(sin_stub, &sin_kernel_cuda) } // namespace at::native