- Notifications
You must be signed in to change notification settings - Fork1.9k
Commit81aeb50
File tree
4 files changed
+9
-14
lines changed- 3rdparty
- tensorrt_llm/_torch/auto_deploy/models
- tests/unittest/_torch/auto_deploy
- _utils_test
- unit/singlegpu/models
4 files changed
+9
-14
lines changed- CHANGELOG.md-14
- README.md+2-5
- examples/77_blackwell_fmha/CMakeLists.txt+3-5
- examples/77_blackwell_fmha/collective/fmha_fusion.hpp+2-2
- examples/python/CuTeDSL/ampere/all_reduce.py+314
- examples/python/CuTeDSL/ampere/distributed_vector_add.py+189
- include/cutlass/epilogue/collective/builders/sm100_builder.inl+4-8
- include/cutlass/epilogue/dispatch_policy.hpp-4
- include/cutlass/version.h+1-1
- media/docs/cpp/cute/02_layout_algebra.md+2-2
- media/docs/cpp/cute/03_tensor.md+1-1
- media/docs/cpp/pipeline.md+1-1
- pyproject.toml+1-1
- python/CuTeDSL/base_dsl/ast_helpers.py-35
- python/CuTeDSL/base_dsl/ast_preprocessor.py+49-56
- python/CuTeDSL/base_dsl/runtime/cuda.py+1-7
- python/CuTeDSL/base_dsl/utils/logger.py+1-2
- python/CuTeDSL/cutlass/__init__.py-2
- python/CuTeDSL/cutlass_dsl/__init__.py-2
- python/CuTeDSL/requirements.txt+1-1
- python/cutlass/__init__.py+1-1
- python/cutlass/backend/__init__.py
- python/cutlass/backend/arguments.py
- python/cutlass/backend/c_types.py
- python/cutlass/backend/compiler.py
- python/cutlass/backend/conv2d_operation.py
- python/cutlass/backend/epilogue.py
- python/cutlass/backend/evt/__init__.py
- python/cutlass/backend/evt/backend/__init__.py
- python/cutlass/backend/evt/backend/emitter_base.py
- python/cutlass/backend/evt/backend/sm100_emitter.py
- python/cutlass/backend/evt/backend/sm100_nodes.py
- python/cutlass/backend/evt/backend/sm80_emitter.py
- python/cutlass/backend/evt/backend/sm80_nodes.py
- python/cutlass/backend/evt/backend/sm90_emitter.py
- python/cutlass/backend/evt/backend/sm90_nodes.py
- python/cutlass/backend/evt/epilogue.py
- python/cutlass/backend/evt/frontend/__init__.py
- python/cutlass/backend/evt/frontend/frontend_base.py
- python/cutlass/backend/evt/frontend/python_ast.py
- python/cutlass/backend/evt/ir/__init__.py
- python/cutlass/backend/evt/ir/compute_nodes.py
- python/cutlass/backend/evt/ir/dag_ir.py
- python/cutlass/backend/evt/ir/layout_algorithm.py
- python/cutlass/backend/evt/ir/layout_nodes.py
- python/cutlass/backend/evt/ir/load_nodes.py
- python/cutlass/backend/evt/ir/node.py
- python/cutlass/backend/evt/ir/store_nodes.py
- python/cutlass/backend/evt/ir/tensor.py
- python/cutlass/backend/evt/passes/__init__.py
- python/cutlass/backend/evt/passes/graph_drawer.py
- python/cutlass/backend/evt/passes/pass_argument_type.py
- python/cutlass/backend/evt/passes/pass_dag_2_tree.py
- python/cutlass/backend/evt/passes/pass_fix_element_d.py
- python/cutlass/backend/evt/passes/pass_get_impl.py
- python/cutlass/backend/evt/passes/pass_layout_elimination.py
- python/cutlass/backend/evt/passes/pass_manager.py
- python/cutlass/backend/evt/passes/pass_no_op_elimination.py
- python/cutlass/backend/evt/passes/pass_preprocess_red.py
- python/cutlass/backend/evt/passes/pass_shape_type_propagation.py
- python/cutlass/backend/evt/passes/smem_size_calculator.py
- python/cutlass/backend/evt/passes/util.py
- python/cutlass/backend/frontend.py
- python/cutlass/backend/gemm_operation.py
- python/cutlass/backend/library.py
- python/cutlass/backend/memory_manager.py
- python/cutlass/backend/operation.py
- python/cutlass/backend/reduction_operation.py
- python/cutlass/backend/type_hint.py
- python/cutlass/backend/utils/__init__.py
- python/cutlass/backend/utils/device.py
- python/cutlass/emit/__init__.py
- python/cutlass/emit/common.py
- python/cutlass/emit/pytorch.py
- python/cutlass/epilogue/__init__.py
- python/cutlass/epilogue/epilogue.py
- python/cutlass/epilogue/evt_ops.py
- python/cutlass/library_defaults.py
- python/cutlass/op/__init__.py
- python/cutlass/op/conv.py
- python/cutlass/op/gemm.py
- python/cutlass/op/gemm_grouped.py
- python/cutlass/op/op.py
- python/cutlass/shape.py
- python/cutlass/swizzle.py
- python/cutlass/utils/__init__.py
- python/cutlass/utils/check.py
- python/cutlass/utils/datatypes.py
- python/cutlass/utils/lazy_import.py
- python/cutlass/utils/profiler.py
- python/cutlass_library/generator.py+1-2
- python/cutlass_library/library.py-14
- python/setup_library.py+1-1
- python/setup_pycute.py+1-1
- setup.cfg+1-1
- test/unit/gemm/device/sm100_gemm_f8_f8_f8_tensor_op_f32_blockwise.cu+8-30
| Original file line number | Diff line number | Diff line change | |
|---|---|---|---|
| |||
107 | 107 | | |
108 | 108 | | |
109 | 109 | | |
110 | | - | |
111 | | - | |
112 | | - | |
113 | | - | |
114 | | - | |
115 | | - | |
116 | | - | |
117 | | - | |
118 | | - | |
119 | 110 | | |
120 | 111 | | |
121 | 112 | | |
| |||
159 | 150 | | |
160 | 151 | | |
161 | 152 | | |
| 153 | + | |
| 154 | + | |
| 155 | + | |
| 156 | + | |
162 | 157 | | |
163 | 158 | | |
164 | 159 | | |
| |||
278 | 273 | | |
279 | 274 | | |
280 | 275 | | |
281 | | - | |
| 276 | + | |
282 | 277 | | |
283 | 278 | | |
284 | 279 | | |
| |||
Lines changed: 2 additions & 2 deletions
| Original file line number | Diff line number | Diff line change | |
|---|---|---|---|
| |||
465 | 465 | | |
466 | 466 | | |
467 | 467 | | |
468 | | - | |
| 468 | + | |
469 | 469 | | |
470 | 470 | | |
471 | 471 | | |
| |||
484 | 484 | | |
485 | 485 | | |
486 | 486 | | |
487 | | - | |
| 487 | + | |
488 | 488 | | |
489 | 489 | | |
490 | 490 | | |
| |||
Lines changed: 1 addition & 1 deletion
| Original file line number | Diff line number | Diff line change | |
|---|---|---|---|
| |||
48 | 48 | | |
49 | 49 | | |
50 | 50 | | |
51 | | - | |
| 51 | + | |
52 | 52 | | |
53 | 53 | | |
54 | 54 | | |
| |||
0 commit comments
Comments
(0)