Fix typo in persistent RNN kernel checks
Stewart Hall committed Jun 30, 2016
1 parent 8a5b2c4 commit 79ab17f
Showing 1 changed file with 2 additions and 2 deletions.
--- a/neon/backends/nervanagpu.py
+++ b/neon/backends/nervanagpu.py
@@ -2468,7 +2468,7 @@ def compound_rnn_unroll_fprop(self, W_recur, h_prev_s, h_ff_s, h_s, bias,
         num_blocks = (-(-h_s[0].shape[0] // 128)) * (-(-h_s[0].shape[1] // 32))
         num_blocks = (-(-num_blocks // 4))
 
-        if (activation.classnm == 'Rectlinclip' and num_blocks < self.sm_count and
+        if (activation.classnm == 'Rectlinclip' and num_blocks <= self.sm_count and
                 not self.use_cudac_kernels):
             if h_s[0].base is not h_ff_s[0].base:
                 if len(h_s[0].base.shape) == 3:
@@ -2543,7 +2543,7 @@ def compound_rnn_unroll_bprop(self, W_recur, delta_prev_s, delta_s, h_s,
         num_blocks = (-(-delta_s[0].shape[0] // 128)) * (-(-delta_s[0].shape[1] // 32))
         num_blocks = (-(-num_blocks // 4))
 
-        if (activation.classnm == 'Rectlinclip' and num_blocks < self.sm_count and
+        if (activation.classnm == 'Rectlinclip' and num_blocks <= self.sm_count and
                 not self.use_cudac_kernels):
             # Compute activation bprop for first timestep since there is
             # no compounded GEMM
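Why the change from < to <=: a persistent kernel keeps all of its blocks resident on the GPU for the whole unroll, so the usual constraint is that the blocks fit onto the available streaming multiprocessors, which includes the exact-fit case num_blocks == self.sm_count that the old strict comparison excluded. The block-count arithmetic above uses the negated-floor-division idiom for ceiling division. Below is a minimal standalone sketch of the fixed check; the shape and SM values are hypothetical stand-ins, not values from the commit.

    # Ceiling division via negated floor division: -(-a // b) == ceil(a / b).
    def ceil_div(a, b):
        return -(-a // b)

    # Hypothetical stand-ins; in nervanagpu.py these would come from
    # h_s[0].shape and self.sm_count.
    hidden_size = 1152   # h_s[0].shape[0]
    batch_size = 32      # h_s[0].shape[1]
    sm_count = 24        # streaming multiprocessors on the GPU

    # Mirror the diff's arithmetic: ceil over tiles of 128 and 32,
    # then group the tiles four per block.
    num_blocks = ceil_div(hidden_size, 128) * ceil_div(batch_size, 32)
    num_blocks = ceil_div(num_blocks, 4)    # 9 * 1 tiles -> 3 blocks

    # The fixed check: take the persistent-kernel path up to and
    # including an exact fit of blocks onto SMs.
    use_persistent_kernel = num_blocks <= sm_count
    print(num_blocks, use_persistent_kernel)   # 3 True

With the old strict comparison, a workload producing exactly sm_count blocks would have fallen back to the non-persistent path even though it fits.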
