Welcome to mirror list, hosted at ThFree Co, Russian Federation.

bench_groups.lua « test - github.com/soumith/cudnn.torch.git - Unnamed repository; edit this file 'description' to name the repository.
summaryrefslogtreecommitdiff
blob: cfcaa41a4b236ac7c4f3c8776c78286daa9a3402 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
require 'cudnn'

-- Benchmark: times ten forward passes of a grouped cudnn.SpatialConvolution
-- and prints the elapsed wall-clock seconds of each pass, followed by the
-- size of the final output tensor.
--
-- Constructor arguments below are presumably
-- (nInputPlane, nOutputPlane, kW, kH, dW, dH, padW, padH, groups), i.e. a
-- 512->512 convolution with a 13x13 kernel split into 512 groups
-- -- TODO confirm against the cudnn.torch version in use.
local m = cudnn.SpatialConvolution(512, 512, 13, 13, 1, 1, 1, 1, 512)

-- All-zero input; assumed layout is batch x planes x height x width.
local inp = torch.zeros(1, 512, 512, 512)

-- Move both the input and the module onto the GPU.
inp = inp:cuda()
m = m:cuda()

cutorch.reserveStreams(10)
-- cutorch.setStream(2) -- disables groups parallelization

-- Drain any outstanding GPU work (e.g. the host->device copies above) so it
-- is not attributed to the first timed iteration.
cutorch.synchronize()

-- Use wall-clock time: os.clock() reports CPU time of the host process,
-- which is not a reliable measure of how long the GPU took.
local timer = torch.Timer()
local o
for _ = 1, 10 do
   timer:reset()
   o = m:forward(inp)
   -- Kernel launches are asynchronous; wait for completion before reading
   -- the timer so the full forward pass is measured.
   cutorch.synchronize()
   print(timer:time().real)
end

print(#o)