// required for old g++ to compile PRId64 macros, see // https://github.com/pytorch/pytorch/issues/3571 // for context #ifndef __STDC_FORMAT_MACROS #define __STDC_FORMAT_MACROS #endif // an external backend might generate file within its code tree // and check all the source files within the tree with clang-format. // so, disable it since the backend might have a different config. // clang-format off // NOTE: This condition is true for all PyTorch internal libraries, it // just excludes external projects such as torch_xla which // re-use some of the PyTorch codegen machinery. #if defined(CAFFE2_BUILD_MAIN_LIB) || \ defined(TORCH_CUDA_BUILD_MAIN_LIB) || \ defined(TORCH_HIP_BUILD_MAIN_LIB) || \ defined(TORCH_XPU_BUILD_MAIN_LIB) || \ defined(TORCH_CUDA_CU_BUILD_MAIN_LIB) || \ defined(TORCH_CUDA_CPP_BUILD_MAIN_LIB) #define TORCH_ASSERT_ONLY_METHOD_OPERATORS #endif // @generated by tools/setup_helpers/generate_code.py from RegisterDispatchKey.cpp #include #include #include #include #include #include #include #include #include #include #include #include #include #include #include #include #include #include #include #include #include #include #include #include #include #include #include namespace at { namespace { C10_DIAGNOSTIC_PUSH_AND_IGNORED_IF_DEFINED("-Wunused-function") void resize_out(const Tensor &out, IntArrayRef sizes, IntArrayRef strides, const TensorOptions &options) { TORCH_CHECK(options.dtype() == out.dtype(), "Expected out tensor to have dtype ", options.dtype(), ", but got ", out.dtype(), " instead"); TORCH_CHECK(options.device() == out.device(), "Expected out tensor to have device ", options.device(), ", but got ", out.device(), " instead"); const bool resized = at::native::resize_output(out, sizes); // Only restride if a resize occurred; otherwise we ignore the (advisory) // strides from the meta function and directly use the output tensor's // preexisting strides if (resized) { if (!strides.empty()) { TORCH_INTERNAL_ASSERT(!options.memory_format_opt().has_value()); // TODO: avoid the redispatch here out.as_strided_(sizes, strides); } else if (options.memory_format_opt().has_value()) { out.unsafeGetTensorImpl()->empty_tensor_restride(*options.memory_format_opt()); } } } void check_inplace(const Tensor &self, IntArrayRef sizes, const TensorOptions &options) { // These checks are needed on those operators that: // 1) don't use 'TensorIterator' (e.g. 'addmm' and 'baddbmm') // 2) have particular typing rules (e.g. 'cumsum' and 'cumprod') // For other operators (e.g. 'add'), 'TensorIterator' already checks // these things separately. TORCH_CHECK(options.dtype() == self.dtype(), "Bad in-place call: ", "input tensor dtype ", self.dtype(), " and output tensor dtype ", options.dtype(), " should match"); TORCH_CHECK(options.device() == self.device(), "Bad in-place call: ", "input tensor device ", self.device(), " and output tensor device ", options.device(), " should match"); TORCH_CHECK(sizes == self.sizes(), "Bad in-place call: ", "input tensor size ", self.sizes(), " and output tensor size ", sizes, " should match"); } C10_DIAGNOSTIC_POP() } // namespace } // namespace at // See template file RegisterDispatchDefinitions.ini namespace at { // NB: TORCH_LIBRARY_IMPL must be in an anonymous namespace to avoid // ambiguity with conflicting identifiers that may have been defined in // at namespace already. namespace { namespace { at::Tensor wrapper_AutogradLazy__max_pool3d(const at::Tensor & self, at::IntArrayRef kernel_size, at::IntArrayRef stride, at::IntArrayRef padding, at::IntArrayRef dilation, bool ceil_mode) { // No device check // DeviceGuard omitted return torch::lazy::LazyNativeFunctions::max_pool3d(self, kernel_size, stride, padding, dilation, ceil_mode); } } // anonymous namespace namespace { ::std::tuple wrapper_AutogradLazy__native_group_norm(const at::Tensor & input, const ::std::optional & weight, const ::std::optional & bias, c10::SymInt N, c10::SymInt C, c10::SymInt HxW, int64_t group, double eps) { // No device check // DeviceGuard omitted return torch::lazy::LazyNativeFunctions::native_group_norm(input, weight, bias, N.guard_int(__FILE__, __LINE__), C.guard_int(__FILE__, __LINE__), HxW.guard_int(__FILE__, __LINE__), group, eps); } } // anonymous namespace ::std::tuple wrapper_AutogradLazy_out_native_group_norm_out(const at::Tensor & input, const ::std::optional & weight, const ::std::optional & bias, c10::SymInt N, c10::SymInt C, c10::SymInt HxW, int64_t group, double eps, at::Tensor & out0, at::Tensor & out1, at::Tensor & out2) { auto wrapper_AutogradLazy_out_native_group_norm_out_tmp = wrapper_AutogradLazy__native_group_norm(input, weight, bias, N, C, HxW, group, eps); at::_copy_from_and_resize(std::get<0>(wrapper_AutogradLazy_out_native_group_norm_out_tmp), out0); at::_copy_from_and_resize(std::get<1>(wrapper_AutogradLazy_out_native_group_norm_out_tmp), out1); at::_copy_from_and_resize(std::get<2>(wrapper_AutogradLazy_out_native_group_norm_out_tmp), out2); return ::std::tuple(out0, out1, out2); } } // anonymous namespace TORCH_API void RegisterTorchScriptAutogradLazyNativeFunctions(); TORCH_API void RegisterTorchScriptAutogradLazyNativeFunctions() { static auto m = MAKE_TORCH_LIBRARY_IMPL(aten, AutogradLazy); m.impl("max_pool3d", TORCH_FN(wrapper_AutogradLazy__max_pool3d)); m.impl("native_group_norm", TORCH_FN(wrapper_AutogradLazy__native_group_norm)); m.impl("native_group_norm.out", TORCH_FN(wrapper_AutogradLazy_out_native_group_norm_out)); } namespace autogradlazy { } // namespace autogradlazy } // namespace at