#if !defined(TORCH_STABLE_ONLY) && !defined(TORCH_TARGET_VERSION) #pragma once #include #include #include #include #include namespace at::native { namespace { C10_ALWAYS_INLINE void _check_rms_norm_inputs_symint( const Tensor& input, c10::SymIntArrayRef normalized_shape, const Tensor& weight /* optional */) { const int normalized_ndim = normalized_shape.size(); TORCH_CHECK( normalized_ndim >= 1, "Expected normalized_shape to be at least 1-dimensional, i.e., ", "containing at least one element, but got normalized_shape = ", normalized_shape); if (weight.defined()) { TORCH_SYM_CHECK( sym_equals(weight.sym_sizes(), normalized_shape), "Expected weight to be of same shape as normalized_shape, but got ", "weight of shape ", weight.sym_sizes(), " and normalized_shape = ", normalized_shape); } const auto input_ndim = input.dim(); const auto input_shape = input.sym_sizes(); TORCH_CHECK_VALUE( input_ndim >= normalized_ndim, "Input tensor must have at least ", normalized_ndim, " dimensions, but got ", input_ndim); auto expect_input_shape_msg = c10::str( "Given normalized_shape=", normalized_shape, ", expected input with shape [*", c10::Join(", ", normalized_shape), "], but got input of size", input_shape); TORCH_SYM_CHECK( sym_equals(input_shape.slice(input_ndim - normalized_ndim), normalized_shape), expect_input_shape_msg); } C10_ALWAYS_INLINE std::pair _check_layer_norm_inputs( const Tensor& input, IntArrayRef normalized_shape, const Tensor& weight /* optional */, const Tensor& bias /* optional */) { const int normalized_ndim = normalized_shape.size(); TORCH_CHECK( normalized_ndim >= 1, "Expected normalized_shape to be at least 1-dimensional, i.e., ", "containing at least one element, but got normalized_shape = ", normalized_shape); TORCH_CHECK( !weight.defined() || weight.sizes().equals(normalized_shape), "Expected weight to be of same shape as normalized_shape, but got ", "weight of shape ", weight.sizes(), " and normalized_shape = ", normalized_shape); TORCH_CHECK( !bias.defined() || bias.sizes().equals(normalized_shape), "Expected bias to be of same shape as normalized_shape, but got ", "bias of shape ", bias.sizes(), " and normalized_shape = ", normalized_shape); const auto input_shape = input.sizes(); const auto input_ndim = input.dim(); if (input_ndim < normalized_ndim || !input_shape.slice(input_ndim - normalized_ndim) .equals(normalized_shape)) { std::stringstream ss; ss << "Given normalized_shape=" << normalized_shape << ", expected input with shape [*"; for (auto size : normalized_shape) { ss << ", " << size; } ss << "], but got input of size" << input_shape; TORCH_CHECK(false, ss.str()); } const int axis = input_ndim - normalized_ndim; const int64_t M = c10::multiply_integers(input_shape.cbegin(), input_shape.cbegin() + axis); const int64_t N = c10::multiply_integers(input_shape.cbegin() + axis, input_shape.cend()); return std::make_pair(M, N); } } // namespace void layer_norm_cpu_out( at::Tensor& out, const at::Tensor& input, const Tensor& gamma, const Tensor& beta, double eps, int64_t M, int64_t N); std::tuple rms_norm_composite( const Tensor& input, IntArrayRef normalized_shape, const std::optional& weight_opt /* optional */, std::optional eps); Tensor rms_norm_symint( const Tensor& input, c10::SymIntArrayRef normalized_shape, const std::optional& weight_opt /* optional */, std::optional eps); using forward_fn = void (*)( const Tensor& /* X */, const Tensor& /* gamma */, const Tensor& /* beta */, int64_t /* M */, int64_t /* N */, double /* eps */, Tensor* /* Y */, Tensor* /* mean */, Tensor* /* rstd */); using backward_fn = void (*)( const Tensor& /* dY */, const Tensor& /* X */, const Tensor& /* mean */, const Tensor& /* rstd */, const Tensor& /* gamma */, int64_t /* M */, int64_t /* N */, Tensor* /* dX */, Tensor* /* dgamma */, Tensor* /* dbeta */); DECLARE_DISPATCH(forward_fn, LayerNormKernel) DECLARE_DISPATCH(backward_fn, LayerNormBackwardKernel) } // namespace at::native #else #error "This file should not be included when either TORCH_STABLE_ONLY or TORCH_TARGET_VERSION is defined." #endif // !defined(TORCH_STABLE_ONLY) && !defined(TORCH_TARGET_VERSION)