We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 62508c5, commit 84cfdb2 (Copy full SHA for 84cfdb2)
csrc/permute_cols.cu
@@ -10,7 +10,7 @@ static constexpr int div_ceil(int a, int b) { return (a + b - 1) / b; }
10
11
// For a given "a" of size [M,K] performs a permutation of the K columns based
12
// on the given "perm" indices.
13
-// Currently only supports 16bit types (since we permute halfs)
+// Currently only supports 16bit types (since we permute half types)
14
__global__ void permute_cols_kernel(int4 const* __restrict__ a_int4_ptr,
15
int const* __restrict__ perm_int_ptr,
16
int4* __restrict__ out_int4_ptr, int size_m,
0 commit comments