Skip to content

Commit

Permalink
Update to Cutlass 3.5
Browse files Browse the repository at this point in the history
  • Loading branch information
tridao committed May 26, 2024
1 parent af62706 commit d732be1
Show file tree
Hide file tree
Showing 7 changed files with 7 additions and 8 deletions.
2 changes: 1 addition & 1 deletion csrc/cutlass
Submodule cutlass updated 548 files
2 changes: 1 addition & 1 deletion csrc/flash_attn/src/flash_bwd_kernel.h
Original file line number Diff line number Diff line change
Expand Up @@ -4,7 +4,7 @@

#pragma once

-#include <cute/algorithm/copy.hpp>
+#include <cute/tensor.hpp>

#include <cutlass/cutlass.h>
#include <cutlass/array.h>
Expand Down
2 changes: 1 addition & 1 deletion csrc/flash_attn/src/flash_bwd_preprocess_kernel.h
Original file line number Diff line number Diff line change
Expand Up @@ -4,7 +4,7 @@

#pragma once

-#include <cute/algorithm/copy.hpp>
+#include <cute/tensor.hpp>

#include <cutlass/cutlass.h>
#include <cutlass/array.h>
Expand Down
2 changes: 1 addition & 1 deletion csrc/flash_attn/src/flash_fwd_kernel.h
Original file line number Diff line number Diff line change
Expand Up @@ -4,7 +4,7 @@

#pragma once

-#include <cute/algorithm/copy.hpp>
+#include <cute/tensor.hpp>

#include <cutlass/cutlass.h>
#include <cutlass/array.h>
Expand Down
2 changes: 1 addition & 1 deletion csrc/flash_attn/src/kernel_traits.h
Original file line number Diff line number Diff line change
Expand Up @@ -4,7 +4,7 @@

#pragma once

-#include "cute/algorithm/copy.hpp"
+#include "cute/tensor.hpp"

#include "cutlass/cutlass.h"
#include "cutlass/layout/layout.h"
Expand Down
2 changes: 1 addition & 1 deletion csrc/flash_attn/src/rotary.h
Original file line number Diff line number Diff line change
Expand Up @@ -4,7 +4,7 @@

#pragma once

-#include <cute/algorithm/copy.hpp>
+#include <cute/tensor.hpp>

#include "utils.h"

Expand Down
3 changes: 1 addition & 2 deletions csrc/flash_attn/src/utils.h
Original file line number Diff line number Diff line change
Expand Up @@ -14,8 +14,7 @@
#include <cuda_bf16.h>
#endif

-#include <cute/algorithm/copy.hpp>
-#include <cute/algorithm/gemm.hpp>
+#include <cute/tensor.hpp>

#include <cutlass/array.h>
#include <cutlass/cutlass.h>
Expand Down

0 comments on commit d732be1

Please sign in to comment.