Skip to content

Commit ac438c7

Browse files
ezhulenev authored and copybara-github committed
[xla:gpu] Update cutlass version and include util headers
PiperOrigin-RevId: 591825221
1 parent d7cd841 commit ac438c7

File tree

3 files changed

+20
-5
lines changed

3 files changed

+20
-5
lines changed

third_party/cutlass.BUILD

Lines changed: 15 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -17,8 +17,21 @@ filegroup(
1717
]),
1818
)
1919

20+
filegroup(
21+
name = "cutlass_util_header_files",
22+
srcs = glob([
23+
"tools/util/include/**",
24+
]),
25+
)
26+
2027
cc_library(
2128
name = "cutlass",
22-
hdrs = [":cutlass_header_files"],
23-
strip_include_prefix = "/include",
29+
hdrs = [
30+
":cutlass_header_files",
31+
":cutlass_util_header_files",
32+
],
33+
includes = [
34+
"include",
35+
"tools/util/include",
36+
],
2437
)

workspace2.bzl

Lines changed: 3 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -42,9 +42,9 @@ def _tf_repositories():
4242
tf_http_archive(
4343
name = "cutlass_archive",
4444
build_file = "//third_party:cutlass.BUILD",
45-
sha256 = "ea1b7f96919460a5d80b09c1b246652539a8605600b2be4cccc02c254bccbe50",
46-
strip_prefix = "cutlass-5783d6dbd0c34032371cce2bd999fc76007520d7",
47-
urls = tf_mirror_urls("https://github.com/chsigg/cutlass/archive/5783d6dbd0c34032371cce2bd999fc76007520d7.tar.gz"),
45+
sha256 = "84cf3fcc47c440a8dde016eb458f8d6b93b3335d9c3a7a16f388333823f1eae0",
46+
strip_prefix = "cutlass-afa7b7241aabe598b725c65480bd9fa71121732c",
47+
urls = tf_mirror_urls("https://github.com/chsigg/cutlass/archive/afa7b7241aabe598b725c65480bd9fa71121732c.tar.gz"),
4848
)
4949

5050
tf_http_archive(

xla/service/gpu/kernels/cutlass_gemm_adaptor.cu.h

Lines changed: 2 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -20,10 +20,12 @@ limitations under the License.
2020
#include <cstdint>
2121
#include <memory>
2222

23+
#include "cute/layout.hpp" // IWYU pragma: keep
2324
#include "cutlass/cutlass.h"
2425
#include "cutlass/gemm/gemm_enumerated_types.h"
2526
#include "cutlass/gemm_coord.h"
2627
#include "cutlass/layout/matrix.h"
28+
#include "cutlass/util/packed_stride.hpp" // IWYU pragma: keep
2729
#include "xla/service/gpu/kernels/cutlass_gemm.h"
2830

2931
namespace xla::gpu::kernel::gemm_universal {

0 commit comments

Comments
 (0)