Movatterモバイル変換


[0]ホーム

URL:


Skip to content

Navigation Menu

Sign in
Appearance settings

Search code, repositories, users, issues, pull requests...

Provide feedback

We read every piece of feedback, and take your input very seriously.

Saved searches

Use saved searches to filter your results more quickly

Sign up
Appearance settings

Commit e4fe67f

Browse files
Revert "[MPS] Make fused rms_norm traceable (#150661)"
This reverts commit 682f09e. Reverted #150661 on behalf of https://github.com/malfet because the decomp has started to fail again ([comment](#150661 (comment)))
1 parent 32c79da · commit e4fe67f

File tree

6 files changed

+24
-20
lines changed

6 files changed

+24
-20
lines changed

‎aten/src/ATen/native/layer_norm.cpp‎

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -16,7 +16,6 @@
1616
#include <ATen/ops/empty_like.h>
1717
#include <ATen/ops/empty_like_native.h>
1818
#include <ATen/ops/layer_norm_native.h>
19-
#include <ATen/ops/_fused_rms_norm.h>
2019
#include <ATen/ops/native_batch_norm.h>
2120
#include <ATen/ops/native_layer_norm.h>
2221
#include <ATen/ops/native_layer_norm_backward_native.h>
@@ -28,6 +27,7 @@
2827
#endif
2928

3029
#ifdef USE_MPS
30+
#include <ATen/native/mps/operations/RMSNorm.h>
3131
#include <c10/core/GradMode.h>
3232
#endif
3333

@@ -281,7 +281,7 @@ Tensor rms_norm_symint(
281281

282282
if (!(GradMode::is_enabled() && any_inputs_require_grad) && !any_nested && is_input_fp && is_weight_fp) {
283283
auto eps_val = eps.value_or(std::numeric_limits<double>::epsilon());
284-
return at::_fused_rms_norm(input.contiguous(), normalized_shape.size(), weight.contiguous(), eps_val);
284+
return mps::rms_norm_mps_kernel(input.contiguous(), normalized_shape, weight.contiguous(), eps_val);
285285
}
286286
}
287287
#endif
Lines changed: 14 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -0,0 +1,14 @@
1+
#pragma once
2+
3+
#include <ATen/core/Tensor.h>
4+
#include <c10/core/SymIntArrayRef.h>
5+
6+
namespace at::native::mps {
7+
8+
Tensor rms_norm_mps_kernel(
9+
    const Tensor& input,
10+
    c10::SymIntArrayRef normalized_shape,
11+
    const Tensor& weight,
12+
    const double eps);
13+
14+
} // namespace at::native::mps

‎aten/src/ATen/native/mps/operations/RMSNorm.mm‎

Lines changed: 8 additions & 5 deletions
Original file line number | Diff line number | Diff line change
@@ -4,24 +4,27 @@
44
#include <ATen/Functions.h>
55
#include <ATen/NativeFunctions.h>
66
#else
7-
#include <ATen/ops/_fused_rms_norm_native.h>
87
#include <ATen/ops/empty_like.h>
98
#endif
109
#include <ATen/native/mps/OperationUtils.h>
10+
#include <ATen/native/mps/operations/RMSNorm.h>
1111
#include <fmt/format.h>
1212

13-
namespace at::native {
14-
using namespace mps;
13+
namespace at::native::mps {
1514

1615
#ifndef PYTORCH_JIT_COMPILE_SHADERS
1716
static auto& lib = MetalShaderLibrary::getBundledLibrary();
1817
#else
1918
#include <ATen/native/mps/RMSNorm_metallib.h>
2019
#endif
2120

22-
Tensor _fused_rms_norm_mps(const Tensor& input, const int64_t normalized_ndim, const Tensor& weight, const double eps) {
21+
Tensor rms_norm_mps_kernel(const Tensor& input,
22+
                           c10::SymIntArrayRef normalized_shape,
23+
                           const Tensor& weight,
24+
                           const double eps) {
2325
  TORCH_CHECK(input.is_contiguous() && weight.is_contiguous(), "Expected contiguous input and weight tensors");
2426
  auto output = at::empty_like(input);
27+
  const int normalized_ndim = normalized_shape.size();
2528
  const auto input_shape = input.sizes();
2629
  const auto input_ndim = input.dim();
2730
  const int axis = input_ndim - normalized_ndim;
@@ -61,4 +64,4 @@ Tensor _fused_rms_norm_mps(const Tensor& input, const int64_t normalized_ndim, c
6164
  return output;
6265
}
6366

64-
} // namespace at::native
67+
} // namespace at::native::mps

‎aten/src/ATen/native/native_functions.yaml‎

Lines changed: 0 additions & 4 deletions
Original file line number | Diff line number | Diff line change
@@ -3301,10 +3301,6 @@
33013301
dispatch:
33023302
CompositeImplicitAutograd: rms_norm_symint
33033303

3304-
- func: _fused_rms_norm(Tensor input, int normalized_shape_ndim, Tensor weight, float eps) -> Tensor
3305-
dispatch:
3306-
MPS: _fused_rms_norm_mps
3307-
33083304
- func: nan_to_num(Tensor self, float? nan=None, float? posinf=None, float? neginf=None) -> Tensor
33093305
variants: function, method
33103306
dispatch:

‎test/inductor/test_mps_basic.py‎

Lines changed: 0 additions & 8 deletions
Original file line number | Diff line number | Diff line change
@@ -152,14 +152,6 @@ def inc_(x):
152152

153153
        self.common(inc_, (torch.rand(1024),))
154154

155-
    def test_rms_norm_nograd(self):
156-
        # Regression test for https://github.com/pytorch/pytorch/issues/150629
157-
        def fn(x, w):
158-
            with torch.no_grad():
159-
                return torch.nn.functional.rms_norm(x, x.shape, w)
160-
161-
        self.common(fn, (torch.rand(10), torch.ones(10)))
162-
163155

164156
if __name__ == "__main__":
165157
    from torch._dynamo.test_case import run_tests

‎torch/_inductor/lowering.py‎

Lines changed: 0 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -2625,7 +2625,6 @@ def is_aligned(x):
26252625
make_fallback(aten.exponential.default, warn=False)  # (fails accuracy on test_torch.py)
26262626
make_fallback(aten._pdist_forward)  # Has decomp. Needs benchmarks
26272627
make_fallback(aten.soft_margin_loss_backward, warn=False)  # py_impl?
2628-
make_fallback(aten._fused_rms_norm, warn=False)  # (MPS-only and faster than decomp)
26292628

26302629

26312630
# 1.5) Easy or Impossible

0 commit comments

Comments
 (0)

[8]ページ先頭

©2009-2025 Movatter.jp