// C shim entry points that forward AOTInductor calls to CPU MKLDNN / oneDNN
// (and, where enabled, MKL) fused kernels.
//
// NOTE(review): this copy of the file looks damaged and should be repaired
// against the upstream source before it is built:
//   * the #include directives carry no header names;
//   * template argument lists appear to be missing (e.g.
//     `template static c10::List convert_to_c10_List`, `c10::List> ..._list`,
//     and the bare pointer_to_optional(...) / pointer_to_list(...) calls) --
//     presumably stripped together with the include targets; TODO confirm;
//   * the original line breaks are gone, so as written the first preprocessor
//     directive shares its line with code and the `// AT_MKL_ENABLED` comment
//     runs on over the final #endif and the last function.
//
// Shape shared by every exported function below:
//   * The return type is AOTITorchError and the whole body is wrapped in
//     AOTI_TORCH_CONVERT_EXCEPTION_TO_ERROR_CODE (defined elsewhere;
//     presumably it turns a thrown exception into an error code -- confirm).
//   * AtenTensorHandle arguments are dereferenced with
//     *tensor_handle_to_tensor_pointer(h).
//   * Pointer-typed arguments (AtenTensorHandle* B, double* alpha,
//     const char** attr/algorithm, const int32_t* output_dtype, ...) are passed
//     through pointer_to_optional (helper defined elsewhere; presumably a null
//     pointer yields an empty optional -- confirm).
//   * (pointer, *_len_) pairs become lists via pointer_to_list, or via
//     convert_to_c10_List in the qconv wrappers.
//   * `const double**` scalar arrays are copied one element at a time into a
//     c10::List, applying pointer_to_optional to each entry.
//   * Each result is handed back through the ret* out-parameter as
//     new_tensor_handle(std::move(result)).
//
// Contents, in order:
//   convert_to_c10_List
//       File-local helper: reserves `len` slots and emplaces scalars[0..len)
//       into a c10::List, which it returns.
//   aoti_torch_cpu_mkldnn__convolution_pointwise_binary
//       -> at::native::mkldnn_convolution_pointwise_binary (X, other, W, ...).
//   aoti_torch_cpu_mkldnn__convolution_pointwise_binary_
//       -> at::native::mkldnn_convolution_pointwise_binary_. Note the leading
//       arguments are (other, X, W), not (X, other, W) as in the variant
//       without the trailing underscore.
//   aoti_torch_cpu_mkldnn__convolution_pointwise
//       -> at::native::mkldnn_convolution_pointwise.
//   aoti_torch_cpu_mkldnn__convolution_transpose_pointwise
//       -> at::native::mkldnn_convolution_transpose_pointwise; additionally
//       forwards output_padding.
//   aoti_torch_cpu_mkldnn_rnn_layer
//       -> at::cpu::mkldnn_rnn_layer; elements 0..3 of the returned tuple are
//       moved into ret0..ret3.
//   aoti_torch_cpu__linear_pointwise
//       -> at::native::mkldnn_linear_pointwise.
//   aoti_torch_cpu__linear_pointwise_binary
//       -> at::native::mkldnn_linear_pointwise_binary.
//   aoti_torch_cpu__qlinear_pointwise_tensor
//       -> at::native::QLinearOnednn::run_pointwise_tensor; post_op_name and
//       post_op_algorithm are passed through as plain `const char*`.
//   aoti_torch_cpu__qlinear_pointwise_binary_tensor
//       -> at::native::QLinearOnednn::run_pointwise_binary_tensor; `other` and
//       `B` are both pointer arguments routed through pointer_to_optional.
//   aoti_torch_cpu__qconv_pointwise_tensor
//       -> at::native::QConvoneDNN::run_pointwise_tensor; stride / padding /
//       dilation go through convert_to_c10_List.
//   aoti_torch_cpu__qconv2d_pointwise_binary_tensor
//       -> at::native::QConvoneDNN::run_pointwise_binary_tensor; `accum` is a
//       plain handle and is dereferenced directly.
//   aoti_torch_cpu__mkl_linear
//       -> at::native::mkl_linear; nested inside an extra #if AT_MKL_ENABLED().
//   aoti_torch_cpu__weight_int4pack_mm_cpu_tensor
//       -> at::native::_weight_int4pack_mm_cpu_tensor; placed after the
//       `#endif // AT_MKLDNN_ENABLED()` marker, i.e. outside the MKLDNN guard
//       that opens with `#if AT_MKLDNN_ENABLED()` near the top.
#include #include #ifndef AT_PER_OPERATOR_HEADERS #include #else #include #endif #include #include #include #include using namespace torch::aot_inductor; #if AT_MKLDNN_ENABLED() template static c10::List convert_to_c10_List(const T* scalars, const int64_t len) { c10::List scalars_list; scalars_list.reserve(len); for (int64_t i = 0; i < len; i++) { scalars_list.emplace_back(scalars[i]); } return scalars_list; } AOTITorchError aoti_torch_cpu_mkldnn__convolution_pointwise_binary( AtenTensorHandle X, AtenTensorHandle other, AtenTensorHandle W, AtenTensorHandle* B, const int64_t* padding, int64_t padding_len_, const int64_t* stride, int64_t stride_len_, const int64_t* dilation, int64_t dilation_len_, int64_t groups, const char* binary_attr, double* alpha, const char** unary_attr, const double** unary_scalars, int64_t unary_scalars_len_, const char** unary_algorithm, AtenTensorHandle* ret0) { AOTI_TORCH_CONVERT_EXCEPTION_TO_ERROR_CODE({ c10::List> unary_scalars_list; unary_scalars_list.reserve(unary_scalars_len_); for (int64_t i = 0; i < unary_scalars_len_; i++) { unary_scalars_list.emplace_back(pointer_to_optional(unary_scalars[i])); } auto tmp_result = at::native::mkldnn_convolution_pointwise_binary( *tensor_handle_to_tensor_pointer(X), *tensor_handle_to_tensor_pointer(other), *tensor_handle_to_tensor_pointer(W), pointer_to_optional(B), pointer_to_list(padding, padding_len_), pointer_to_list(stride, stride_len_), pointer_to_list(dilation, dilation_len_), groups, binary_attr, pointer_to_optional(alpha), pointer_to_optional(unary_attr), unary_scalars_list, pointer_to_optional(unary_algorithm)); *ret0 = new_tensor_handle(std::move(tmp_result)); }); } AOTITorchError aoti_torch_cpu_mkldnn__convolution_pointwise_binary_( AtenTensorHandle other, AtenTensorHandle X, AtenTensorHandle W, AtenTensorHandle* B, const int64_t* padding, int64_t padding_len_, const int64_t* stride, int64_t stride_len_, const int64_t* dilation, int64_t dilation_len_, int64_t groups, const char* 
binary_attr, double* alpha, const char** unary_attr, const double** unary_scalars, int64_t unary_scalars_len_, const char** unary_algorithm, AtenTensorHandle* ret0) { AOTI_TORCH_CONVERT_EXCEPTION_TO_ERROR_CODE({ c10::List> unary_scalars_list; unary_scalars_list.reserve(unary_scalars_len_); for (int64_t i = 0; i < unary_scalars_len_; i++) { unary_scalars_list.emplace_back(pointer_to_optional(unary_scalars[i])); } auto tmp_result = at::native::mkldnn_convolution_pointwise_binary_( *tensor_handle_to_tensor_pointer(other), *tensor_handle_to_tensor_pointer(X), *tensor_handle_to_tensor_pointer(W), pointer_to_optional(B), pointer_to_list(padding, padding_len_), pointer_to_list(stride, stride_len_), pointer_to_list(dilation, dilation_len_), groups, binary_attr, pointer_to_optional(alpha), pointer_to_optional(unary_attr), unary_scalars_list, pointer_to_optional(unary_algorithm)); *ret0 = new_tensor_handle(std::move(tmp_result)); }); } AOTITorchError aoti_torch_cpu_mkldnn__convolution_pointwise( AtenTensorHandle X, AtenTensorHandle W, AtenTensorHandle* B, const int64_t* padding, int64_t padding_len_, const int64_t* stride, int64_t stride_len_, const int64_t* dilation, int64_t dilation_len_, int64_t groups, const char* attr, const double** scalars, int64_t scalars_len_, const char** algorithm, AtenTensorHandle* ret0) { AOTI_TORCH_CONVERT_EXCEPTION_TO_ERROR_CODE({ c10::List> scalars_list; scalars_list.reserve(scalars_len_); for (int64_t i = 0; i < scalars_len_; i++) { scalars_list.emplace_back(pointer_to_optional(scalars[i])); } auto tmp_result = at::native::mkldnn_convolution_pointwise( *tensor_handle_to_tensor_pointer(X), *tensor_handle_to_tensor_pointer(W), pointer_to_optional(B), pointer_to_list(padding, padding_len_), pointer_to_list(stride, stride_len_), pointer_to_list(dilation, dilation_len_), groups, attr, scalars_list, pointer_to_optional(algorithm)); *ret0 = new_tensor_handle(std::move(tmp_result)); }); } AOTITorchError 
aoti_torch_cpu_mkldnn__convolution_transpose_pointwise( AtenTensorHandle X, AtenTensorHandle W, AtenTensorHandle* B, const int64_t* padding, int64_t padding_len_, const int64_t* output_padding, int64_t output_padding_len_, const int64_t* stride, int64_t stride_len_, const int64_t* dilation, int64_t dilation_len_, int64_t groups, const char* attr, const double** scalars, int64_t scalars_len_, const char** algorithm, AtenTensorHandle* ret0) { AOTI_TORCH_CONVERT_EXCEPTION_TO_ERROR_CODE({ c10::List> scalars_list; scalars_list.reserve(scalars_len_); for (int64_t i = 0; i < scalars_len_; i++) { scalars_list.emplace_back(pointer_to_optional(scalars[i])); } auto tmp_result = at::native::mkldnn_convolution_transpose_pointwise( *tensor_handle_to_tensor_pointer(X), *tensor_handle_to_tensor_pointer(W), pointer_to_optional(B), pointer_to_list(padding, padding_len_), pointer_to_list(output_padding, output_padding_len_), pointer_to_list(stride, stride_len_), pointer_to_list(dilation, dilation_len_), groups, attr, scalars_list, pointer_to_optional(algorithm)); *ret0 = new_tensor_handle(std::move(tmp_result)); }); } AOTITorchError aoti_torch_cpu_mkldnn_rnn_layer( AtenTensorHandle input, AtenTensorHandle weight0, AtenTensorHandle weight1, AtenTensorHandle weight2, AtenTensorHandle weight3, AtenTensorHandle hx_, AtenTensorHandle cx_, int32_t reverse, const int64_t* batch_sizes, int64_t batch_sizes_len_, int64_t mode, int64_t hidden_size, int64_t num_layers, int32_t has_biases, int32_t bidirectional, int32_t batch_first, int32_t train, AtenTensorHandle* ret0, AtenTensorHandle* ret1, AtenTensorHandle* ret2, AtenTensorHandle* ret3) { AOTI_TORCH_CONVERT_EXCEPTION_TO_ERROR_CODE({ auto tmp_result = at::cpu::mkldnn_rnn_layer( *tensor_handle_to_tensor_pointer(input), *tensor_handle_to_tensor_pointer(weight0), *tensor_handle_to_tensor_pointer(weight1), *tensor_handle_to_tensor_pointer(weight2), *tensor_handle_to_tensor_pointer(weight3), *tensor_handle_to_tensor_pointer(hx_), 
*tensor_handle_to_tensor_pointer(cx_), reverse, pointer_to_list(batch_sizes, batch_sizes_len_), mode, hidden_size, num_layers, has_biases, bidirectional, batch_first, train); *ret0 = new_tensor_handle(std::move(std::get<0>(tmp_result))); *ret1 = new_tensor_handle(std::move(std::get<1>(tmp_result))); *ret2 = new_tensor_handle(std::move(std::get<2>(tmp_result))); *ret3 = new_tensor_handle(std::move(std::get<3>(tmp_result))); }); } AOTITorchError aoti_torch_cpu__linear_pointwise( AtenTensorHandle X, AtenTensorHandle W, AtenTensorHandle* B, const char* attr, const double** scalars, int64_t scalars_len_, const char** algorithm, AtenTensorHandle* ret0) { AOTI_TORCH_CONVERT_EXCEPTION_TO_ERROR_CODE({ c10::List> scalars_list; scalars_list.reserve(scalars_len_); for (int64_t i = 0; i < scalars_len_; i++) { scalars_list.emplace_back(pointer_to_optional(scalars[i])); } auto tmp_result = at::native::mkldnn_linear_pointwise( *tensor_handle_to_tensor_pointer(X), *tensor_handle_to_tensor_pointer(W), pointer_to_optional(B), attr, scalars_list, pointer_to_optional(algorithm)); *ret0 = new_tensor_handle(std::move(tmp_result)); }); } AOTITorchError aoti_torch_cpu__linear_pointwise_binary( AtenTensorHandle X, AtenTensorHandle other, AtenTensorHandle W, AtenTensorHandle* B, const char* attr, AtenTensorHandle* ret0) { AOTI_TORCH_CONVERT_EXCEPTION_TO_ERROR_CODE({ auto tmp_result = at::native::mkldnn_linear_pointwise_binary( *tensor_handle_to_tensor_pointer(X), *tensor_handle_to_tensor_pointer(other), *tensor_handle_to_tensor_pointer(W), pointer_to_optional(B), attr); *ret0 = new_tensor_handle(std::move(tmp_result)); }); } AOTITorchError aoti_torch_cpu__qlinear_pointwise_tensor( AtenTensorHandle X, AtenTensorHandle act_scale, AtenTensorHandle act_zero_point, AtenTensorHandle onednn_weight, AtenTensorHandle weight_scales, AtenTensorHandle weight_zero_points, AtenTensorHandle* B, double output_scale, int64_t output_zero_point, const int32_t* output_dtype, const char* post_op_name, const 
double** post_op_args, int64_t post_op_args_len_, const char* post_op_algorithm, AtenTensorHandle* ret0) { AOTI_TORCH_CONVERT_EXCEPTION_TO_ERROR_CODE({ c10::List> scalars_list; scalars_list.reserve(post_op_args_len_); for (int64_t i = 0; i < post_op_args_len_; i++) { scalars_list.emplace_back(pointer_to_optional(post_op_args[i])); } auto tmp_result = at::native::QLinearOnednn::run_pointwise_tensor( *tensor_handle_to_tensor_pointer(X), *tensor_handle_to_tensor_pointer(act_scale), *tensor_handle_to_tensor_pointer(act_zero_point), *tensor_handle_to_tensor_pointer(onednn_weight), *tensor_handle_to_tensor_pointer(weight_scales), *tensor_handle_to_tensor_pointer(weight_zero_points), pointer_to_optional(B), output_scale, output_zero_point, pointer_to_optional(output_dtype), post_op_name, scalars_list, post_op_algorithm); *ret0 = new_tensor_handle(std::move(tmp_result)); }); } AOTITorchError aoti_torch_cpu__qlinear_pointwise_binary_tensor( AtenTensorHandle X, AtenTensorHandle act_scale, AtenTensorHandle act_zero_point, AtenTensorHandle onednn_weight, AtenTensorHandle weight_scales, AtenTensorHandle weight_zero_points, AtenTensorHandle* other, AtenTensorHandle* B, double output_scale, int64_t output_zero_point, const int32_t* output_dtype, double other_scale, int64_t other_zero_point, const char* binary_post_op, double binary_alpha, const char* unary_post_op, const double** unary_post_op_args, int64_t unary_post_op_args_len_, const char* unary_post_op_algorithm, AtenTensorHandle* ret0) { AOTI_TORCH_CONVERT_EXCEPTION_TO_ERROR_CODE({ c10::List> scalars_list; scalars_list.reserve(unary_post_op_args_len_); for (int64_t i = 0; i < unary_post_op_args_len_; i++) { scalars_list.emplace_back(pointer_to_optional(unary_post_op_args[i])); } auto tmp_result = at::native::QLinearOnednn::run_pointwise_binary_tensor( *tensor_handle_to_tensor_pointer(X), *tensor_handle_to_tensor_pointer(act_scale), *tensor_handle_to_tensor_pointer(act_zero_point), 
*tensor_handle_to_tensor_pointer(onednn_weight), *tensor_handle_to_tensor_pointer(weight_scales), *tensor_handle_to_tensor_pointer(weight_zero_points), pointer_to_optional(other), pointer_to_optional(B), output_scale, output_zero_point, pointer_to_optional(output_dtype), other_scale, other_zero_point, binary_post_op, binary_alpha, unary_post_op, scalars_list, unary_post_op_algorithm); *ret0 = new_tensor_handle(std::move(tmp_result)); }); } AOTITorchError aoti_torch_cpu__qconv_pointwise_tensor( AtenTensorHandle X, AtenTensorHandle act_scale, AtenTensorHandle act_zero_point, AtenTensorHandle onednn_weight, AtenTensorHandle weight_scales, AtenTensorHandle weight_zero_points, AtenTensorHandle* B, const int64_t* stride_args, int64_t stride_len_, const int64_t* padding_args, int64_t padding_len_, const int64_t* dilation_args, int64_t dilation_len_, int64_t groups, double output_scale, int64_t output_zero_point, const int32_t* output_dtype, const char* attr, const double** post_op_args, int64_t post_op_args_len_, const char** algorithm, AtenTensorHandle* ret0) { AOTI_TORCH_CONVERT_EXCEPTION_TO_ERROR_CODE({ c10::List> scalars_list; scalars_list.reserve(post_op_args_len_); for (int64_t i = 0; i < post_op_args_len_; i++) { scalars_list.emplace_back(pointer_to_optional(post_op_args[i])); } c10::List stride_list = convert_to_c10_List(stride_args, stride_len_); c10::List padding_list = convert_to_c10_List(padding_args, padding_len_); c10::List dilation_list = convert_to_c10_List(dilation_args, dilation_len_); auto tmp_result = at::native::QConvoneDNN::run_pointwise_tensor( *tensor_handle_to_tensor_pointer(X), *tensor_handle_to_tensor_pointer(act_scale), *tensor_handle_to_tensor_pointer(act_zero_point), *tensor_handle_to_tensor_pointer(onednn_weight), *tensor_handle_to_tensor_pointer(weight_scales), *tensor_handle_to_tensor_pointer(weight_zero_points), pointer_to_optional(B), stride_list, padding_list, dilation_list, groups, output_scale, output_zero_point, 
pointer_to_optional(output_dtype), attr, scalars_list, pointer_to_optional(algorithm)); *ret0 = new_tensor_handle(std::move(tmp_result)); }); } AOTITorchError aoti_torch_cpu__qconv2d_pointwise_binary_tensor( AtenTensorHandle X, AtenTensorHandle act_scale, AtenTensorHandle act_zero_point, AtenTensorHandle onednn_weight, AtenTensorHandle weight_scales, AtenTensorHandle weight_zero_points, AtenTensorHandle accum, AtenTensorHandle* B, const int64_t* stride_args, int64_t stride_len_, const int64_t* padding_args, int64_t padding_len_, const int64_t* dilation_args, int64_t dilation_len_, int64_t groups, double output_scale, int64_t output_zero_point, const int32_t* output_dtype, double accum_scale, int64_t accum_zero_point, const char* binary_attr, double* alpha, const char** unary_attr, const double** unary_scalars, int64_t unary_scalars_len_, const char** unary_algorithm, AtenTensorHandle* ret0) { AOTI_TORCH_CONVERT_EXCEPTION_TO_ERROR_CODE({ c10::List> unary_scalars_list; unary_scalars_list.reserve(unary_scalars_len_); for (int64_t i = 0; i < unary_scalars_len_; i++) { unary_scalars_list.emplace_back(pointer_to_optional(unary_scalars[i])); } c10::List stride_list = convert_to_c10_List(stride_args, stride_len_); c10::List padding_list = convert_to_c10_List(padding_args, padding_len_); c10::List dilation_list = convert_to_c10_List(dilation_args, dilation_len_); auto tmp_result = at::native::QConvoneDNN::run_pointwise_binary_tensor( *tensor_handle_to_tensor_pointer(X), *tensor_handle_to_tensor_pointer(act_scale), *tensor_handle_to_tensor_pointer(act_zero_point), *tensor_handle_to_tensor_pointer(onednn_weight), *tensor_handle_to_tensor_pointer(weight_scales), *tensor_handle_to_tensor_pointer(weight_zero_points), *tensor_handle_to_tensor_pointer(accum), pointer_to_optional(B), stride_list, padding_list, dilation_list, groups, output_scale, output_zero_point, pointer_to_optional(output_dtype), accum_scale, accum_zero_point, binary_attr, pointer_to_optional(alpha), 
pointer_to_optional(unary_attr), unary_scalars_list, pointer_to_optional(unary_algorithm)); *ret0 = new_tensor_handle(std::move(tmp_result)); }); } #if AT_MKL_ENABLED() AOTITorchError aoti_torch_cpu__mkl_linear( AtenTensorHandle X, AtenTensorHandle W, AtenTensorHandle origin_W, AtenTensorHandle* B, int64_t prepack_batch_size, AtenTensorHandle* ret0) { AOTI_TORCH_CONVERT_EXCEPTION_TO_ERROR_CODE({ auto tmp_result = at::native::mkl_linear( *tensor_handle_to_tensor_pointer(X), *tensor_handle_to_tensor_pointer(W), *tensor_handle_to_tensor_pointer(origin_W), pointer_to_optional(B), prepack_batch_size); *ret0 = new_tensor_handle(std::move(tmp_result)); }); } #endif // AT_MKL_ENABLED #endif // AT_MKLDNN_ENABLED() AOTITorchError aoti_torch_cpu__weight_int4pack_mm_cpu_tensor( AtenTensorHandle X, AtenTensorHandle w, AtenTensorHandle qGroupSize, AtenTensorHandle qScaleAndZeros, AtenTensorHandle* ret0) { AOTI_TORCH_CONVERT_EXCEPTION_TO_ERROR_CODE({ auto tmp_result = at::native::_weight_int4pack_mm_cpu_tensor( *tensor_handle_to_tensor_pointer(X), *tensor_handle_to_tensor_pointer(w), *tensor_handle_to_tensor_pointer(qGroupSize), *tensor_handle_to_tensor_pointer(qScaleAndZeros)); *ret0 = new_tensor_handle(std::move(tmp_result)); }); }