
Commit f32562c

PaulZhang12 authored and facebook-github-bot committed

[Inductor] Add envvar to disable decomposeK (#154421)

Summary:
Pull Request resolved: #154421

Add an env var to the Inductor config to disable the decomposeK autotuning choice.

Test Plan: `buck test 'fbcode//mode/opt' fbcode//caffe2/test/inductor:max_autotune -- --exact 'caffe2/test/inductor:max_autotune - test_max_autotune_decompose_k_dynamic_False_sizes2 (caffe2.test.inductor.test_max_autotune.TestMaxAutotune)' --run-disabled`

Reviewed By: eellison

Differential Revision: D75174823

1 parent 0db9c64, commit f32562c
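As a usage note (not part of the commit): the diffs in this commit add a kill switch that can be set either through the `TORCHINDUCTOR_DISABLE_DECOMPOSE_K` environment variable or through `torch._inductor.config` (the new test uses `config.patch(disable_decompose_k=True)`). The following stdlib-only sketch mirrors the env-var parsing added in `torch/_inductor/config.py`, so it runs without a PyTorch build; it is an illustration of the parsing rule, not the Inductor code itself.

```python
import os

# The commit's kill switch: setting the variable to "1" disables the
# decomposeK autotuning choice for GEMMs.
os.environ["TORCHINDUCTOR_DISABLE_DECOMPOSE_K"] = "1"

# Mirrors the config line added in torch/_inductor/config.py: only the
# exact string "1" enables the flag; unset or any other value leaves it off.
disable_decompose_k = os.environ.get("TORCHINDUCTOR_DISABLE_DECOMPOSE_K") == "1"
print(disable_decompose_k)  # True
```

Note that, as with other `TORCHINDUCTOR_*` variables parsed this way, the flag is read when the config module is imported, so the variable should be set before importing `torch`.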

File tree

3 files changed: +27 −0 lines changed

test/inductor/test_max_autotune.py

Lines changed: 23 additions & 0 deletions

```diff
@@ -1366,6 +1366,29 @@ def test_func3(x, y, z, m, l):
         self.assertEqual(hits(), 0)
         self.assertEqual(misses(), 7)
 
+    @skipIfXpu
+    @unittest.skipIf(TEST_WITH_ROCM, "decompose_k not supported on ROCm")
+    @unittest.skipIf(
+        config.cpp_wrapper, "decompose_k not supported for cpp_wrapper yet"
+    )
+    @config.patch(
+        max_autotune=True,
+        max_autotune_gemm_backends="TRITON",
+        autotune_fallback_to_aten=False,
+        disable_decompose_k=True,
+    )
+    def test_max_autotune_disable_decompose_K(self):
+        M, N, K = (32, 32, 32768)
+
+        a = torch.randn(M, K, dtype=torch.float16, device="cuda", requires_grad=True)
+        b = torch.randn(K, N, dtype=torch.float16, device="cuda", requires_grad=True)
+
+        compiled_func = torch.compile(lambda a, b: a @ b)
+        out, code = run_and_get_code(compiled_func, a, b)
+
+        for codegen in code:
+            FileCheck().check_not("decompose_k").run(codegen)
+
 
 class TestMaxAutotunePrecompile(TestCase):
     def test_precompilation_threads(self):
```

torch/_inductor/config.py

Lines changed: 3 additions & 0 deletions

```diff
@@ -396,6 +396,9 @@ def prologue_fusion_enabled() -> bool:
 # enable slow autotuning passes to select gemm algorithms
 max_autotune_gemm = os.environ.get("TORCHINDUCTOR_MAX_AUTOTUNE_GEMM") == "1"
 
+# disable decomposeK autotune choice for gemm
+disable_decompose_k = os.environ.get("TORCHINDUCTOR_DISABLE_DECOMPOSE_K") == "1"
+
 # Modifies the number of autotuning choices displayed, set to None for all
 autotune_num_choices_displayed: Optional[int] = 10
```

torch/_inductor/utils.py

Lines changed: 1 addition & 0 deletions

```diff
@@ -1595,6 +1595,7 @@ def use_decompose_k_choice(m: _IntLike, n: _IntLike, k: _IntLike) -> bool:
         )
         and not V.graph.aot_mode  # TODO: Support AOTI for decomposeK
         and not V.graph.cpp_wrapper
+        and not config.disable_decompose_k
     )
```

0 commit comments
