diff options
author | Boris Fomitchev <bfomitchev@nvidia.com> | 2016-11-10 04:50:02 +0300 |
---|---|---|
committer | Boris Fomitchev <bfomitchev@nvidia.com> | 2016-11-10 04:50:02 +0300 |
commit | f746b7943dc728c12a1db9e339ff0d5c74b61f2d (patch) | |
tree | 7dce1f9dd420a45c5f1686fc357efe6f4b79c534 /SpatialConvolution.lua | |
parent | d6e0ce57c32b6944140aeefcf696ed218c1b220e (diff) |
Improved existing 16->32 fallback. Added performance-based fallback.
Diffstat (limited to 'SpatialConvolution.lua')
-rw-r--r-- | SpatialConvolution.lua | 7 |
1 file changed, 4 insertions, 3 deletions
```diff
diff --git a/SpatialConvolution.lua b/SpatialConvolution.lua
index 9b24591..830a7e6 100644
--- a/SpatialConvolution.lua
+++ b/SpatialConvolution.lua
@@ -127,12 +127,13 @@ function SpatialConvolution:createIODescriptors(input)
         self.pad = {self.padH, self.padW}
         self.stride = {self.dH, self.dW}
 
-        self.convDesc = cudnn.setConvolutionDescriptor(
-           { padA = self.pad,
+        self.convDescData = { padA = self.pad,
              filterStrideA = self.stride,
              upscaleA = {1,1},
              dataType = cudnn.configmap(torch.type(self.weight))
-           })
+        }
+
+        self.convDesc = cudnn.setConvolutionDescriptor(self.convDescData)
 
         -- get output shape, resize output
         local oSize = torch.IntTensor(4)
```