From 5498f64e04e42d234f848ff76f523b2e4e88347d Mon Sep 17 00:00:00 2001 From: Salem Derisavi Date: Mon, 25 Sep 2017 14:33:00 -0400 Subject: [PATCH] fixed algorithm. padding should be on both sides --- tutorials/optimize/opt_conv_cuda.py | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/tutorials/optimize/opt_conv_cuda.py b/tutorials/optimize/opt_conv_cuda.py index 3b04b0722408..ecacc59e4673 100644 --- a/tutorials/optimize/opt_conv_cuda.py +++ b/tutorials/optimize/opt_conv_cuda.py @@ -36,10 +36,10 @@ # Algorithm A = tvm.placeholder((in_size, in_size, in_channel, batch), name='A') W = tvm.placeholder((kernel, kernel, in_channel, out_channel), name='W') -out_size = (in_size - kernel + pad) // stride + 1 +out_size = (in_size - kernel + 2*pad) // stride + 1 # Pad input Apad = tvm.compute( - (in_size + pad, in_size + pad, in_channel, batch), + (in_size + 2*pad, in_size + 2*pad, in_channel, batch), lambda yy, xx, cc, nn: tvm.select( tvm.all(yy >= pad, yy - pad < in_size, xx >= pad, xx - pad < in_size),