Welcome to mirror list, hosted at ThFree Co, Russian Federation.

github.com/soumith/cudnn.torch.git - Unnamed repository; edit this file 'description' to name the repository.
summary | refs | log | tree | commit | diff
diff options
context:
space:
mode:
author Boris Fomitchev <bfomitchev@nvidia.com> 2016-11-10 04:50:02 +0300
committer Boris Fomitchev <bfomitchev@nvidia.com> 2016-11-10 04:50:02 +0300
commit f746b7943dc728c12a1db9e339ff0d5c74b61f2d (patch)
tree 7dce1f9dd420a45c5f1686fc357efe6f4b79c534 /SpatialConvolution.lua
parent d6e0ce57c32b6944140aeefcf696ed218c1b220e (diff)
Improved existing 16->32 fallback. Added performance-based fallback.
Diffstat (limited to 'SpatialConvolution.lua')
-rw-r--r-- SpatialConvolution.lua 7
1 files changed, 4 insertions, 3 deletions
diff --git a/SpatialConvolution.lua b/SpatialConvolution.lua
index 9b24591..830a7e6 100644
--- a/SpatialConvolution.lua
+++ b/SpatialConvolution.lua
@@ -127,12 +127,13 @@ function SpatialConvolution:createIODescriptors(input)
self.pad = {self.padH, self.padW}
self.stride = {self.dH, self.dW}
- self.convDesc = cudnn.setConvolutionDescriptor(
- { padA = self.pad,
+ self.convDescData = { padA = self.pad,
filterStrideA = self.stride,
upscaleA = {1,1},
dataType = cudnn.configmap(torch.type(self.weight))
- })
+ }
+
+ self.convDesc = cudnn.setConvolutionDescriptor(self.convDescData)
-- get output shape, resize output
local oSize = torch.IntTensor(4)