Skip to content

Commit 6e6439b

Browse files
committed
Set warp size to 32
Signed-off-by: Hosang Yoon <hosang.yoon@amd.com>
1 parent f61ad93 commit 6e6439b

File tree

4 files changed

+6
-6
lines changed

4 files changed

+6
-6
lines changed

csrc/attention/attention_kernels.cuh

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -36,7 +36,7 @@ typedef __hip_bfloat16 __nv_bfloat16;
3636
#ifndef USE_ROCM
3737
#define WARP_SIZE 32
3838
#else
39-
#define WARP_SIZE warpSize
39+
#define WARP_SIZE 32
4040
#endif
4141

4242
#define MAX(a, b) ((a) > (b) ? (a) : (b))

csrc/attention/paged_attention_v1.cu

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -22,7 +22,7 @@
2222
#ifndef USE_ROCM
2323
#define WARP_SIZE 32
2424
#else
25-
#define WARP_SIZE warpSize
25+
#define WARP_SIZE 32
2626
#endif
2727

2828
#define MAX(a, b) ((a) > (b) ? (a) : (b))
@@ -212,4 +212,4 @@ void paged_attention_v1(
212212
#undef WARP_SIZE
213213
#undef MAX
214214
#undef MIN
215-
#undef DIVIDE_ROUND_UP
215+
#undef DIVIDE_ROUND_UP

csrc/attention/paged_attention_v2.cu

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -22,7 +22,7 @@
2222
#ifndef USE_ROCM
2323
#define WARP_SIZE 32
2424
#else
25-
#define WARP_SIZE warpSize
25+
#define WARP_SIZE 32
2626
#endif
2727

2828
#define MAX(a, b) ((a) > (b) ? (a) : (b))
@@ -222,4 +222,4 @@ void paged_attention_v2(
222222
#undef WARP_SIZE
223223
#undef MAX
224224
#undef MIN
225-
#undef DIVIDE_ROUND_UP
225+
#undef DIVIDE_ROUND_UP

csrc/cuda_compat.h

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -7,7 +7,7 @@
77
#ifndef USE_ROCM
88
#define WARP_SIZE 32
99
#else
10-
#define WARP_SIZE warpSize
10+
#define WARP_SIZE 32
1111
#endif
1212

1313
#ifndef USE_ROCM

0 commit comments

Comments
 (0)