local Dropout, Parent = torch.class('nn.Dropout', 'nn.Module') function Dropout:__init(p,v1) Parent.__init(self) self.p = p or 0.5 self.train = true -- version 2 scales output during training instead of evaluation self.v2 = not v1 if self.p >= 1 or self.p < 0 then error(' illegal percentage, must be 0 <= p < 1') end self.noise = torch.Tensor() end function Dropout:updateOutput(input) self.output:resizeAs(input):copy(input) if self.train then self.noise:resizeAs(input) self.noise:bernoulli(1-self.p) if self.v2 then self.noise:div(1-self.p) end self.output:cmul(self.noise) elseif not self.v2 then self.output:mul(1-self.p) end return self.output end function Dropout:updateGradInput(input, gradOutput) if self.train then self.gradInput:resizeAs(gradOutput):copy(gradOutput) self.gradInput:cmul(self.noise) -- simply mask the gradients with the noise vector else error('backprop only defined while training') end return self.gradInput end function Dropout:setp(p) self.p = p end