@@ -53,7 +53,7 @@ which should eliminate any need for large allocations within this method.
53
53
col_ptr = pointer (col)
54
54
w_ptr = pointer (w)
55
55
y_ptr = pointer (y, (batch_idx - 1 )* M* N + 1 )
56
- gemm! (Val (false ), Val (false ), M, N, K, alpha, col_ptr, w_ptr, beta, y_ptr)
56
+ @timeit_debug to " gemm! " gemm! (Val (false ), Val (false ), M, N, K, alpha, col_ptr, w_ptr, beta, y_ptr)
57
57
end
58
58
return y
59
59
end
@@ -99,7 +99,7 @@ See the documentation for `conv_im2col!()` for explanation of optional parameter
99
99
col_ptr = pointer (col)
100
100
dy_ptr = pointer (dy,(batch_idx - 1 )* K* N + 1 )
101
101
dw_ptr = pointer (dw)
102
- gemm! (Val (true ), Val (false ), M, N, K, alpha, col_ptr, dy_ptr, beta, dw_ptr)
102
+ @timeit_debug to " gemm! " gemm! (Val (true ), Val (false ), M, N, K, alpha, col_ptr, dy_ptr, beta, dw_ptr)
103
103
104
104
# Because we accumulate over batches in this loop, we must set `beta` equal
105
105
# to `1.0` from this point on.
@@ -144,7 +144,7 @@ See the documentation for `conv_im2col!()` for explanation of other parameters.
144
144
dy_ptr = pointer (dy, (batch_idx - 1 )* M* K + 1 )
145
145
w_ptr = pointer (w)
146
146
col_ptr = pointer (col)
147
- gemm! (Val (false ), Val (true ), M, N, K, alpha, dy_ptr, w_ptr, T (0 ), col_ptr)
147
+ @timeit_debug to " gemm! " gemm! (Val (false ), Val (true ), M, N, K, alpha, dy_ptr, w_ptr, T (0 ), col_ptr)
148
148
@timeit_debug to " col2im!" col2im! (view (dx, :, :, :, :, batch_idx), col, cdims)
149
149
end
150
150
return dx
@@ -363,4 +363,4 @@ function col2im!(x::AbstractArray{T,4}, col::AbstractArray{T,2},
363
363
end
364
364
end
365
365
end
366
- end
366
+ end
0 commit comments