1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
|
#ifndef TH_GENERIC_FILE
#define TH_GENERIC_FILE "generic/Tanh.c"
#else
/*
 * Forward pass of Tanh: output = tanh(input), element by element.
 *
 * Lua arguments:
 *   1 - module table; its "output" field must hold a tensor of this type
 *   2 - input tensor
 *
 * The "output" tensor is resized to the shape of input and overwritten.
 * Returns 1 (the number of results reported to Lua).
 */
static int nn_(Tanh_updateOutput)(lua_State *L)
{
  THTensor *input = luaT_checkudata(L, 2, torch_(Tensor_id));
  THTensor *output = luaT_getfieldcheckudata(L, 1, "output", torch_(Tensor_id));

  THTensor_(resizeAs)(output, input);

  if (input->nDimension == 1 || !THTensor_(isContiguous)(input) || !THTensor_(isContiguous)(output))
  {
    /* 1-D or non-contiguous tensors: let the generic apply macro do the walk. */
    TH_TENSOR_APPLY2(real, output, real, input, \
                     *output_data = tanh(*input_data););
  }
  else
  {
    /*
     * Both tensors are contiguous and were just given the same shape, so
     * they are walked as flat arrays of nElement values.  Indexing through
     * size[0]/stride[0] instead would touch dimension 0 of a tensor that may
     * have no dimensions at all, and would depend on stride[0] being equal
     * to the number of elements per row.
     */
    real *output_data = THTensor_(data)(output);
    real *input_data = THTensor_(data)(input);
    /* Hoisted: the OpenMP loop bound must not change during the loop. */
    long count = THTensor_(nElement)(input);
    long i;

#pragma omp parallel for private(i)
    for (i = 0; i < count; i++)
      output_data[i] = tanh(input_data[i]);
  }
  return 1;
}
/*
 * Backward pass of Tanh: gradInput = gradOutput * (1 - output^2),
 * element by element.
 *
 * Lua arguments:
 *   1 - module table; its "output" and "gradInput" fields must hold tensors
 *       of this type
 *   3 - gradOutput tensor
 *
 * The formula uses the module's stored "output" as z, i.e. it expects that
 * field to hold tanh(input) from the forward pass (d/dx tanh(x) = 1 - tanh(x)^2).
 * "gradInput" is resized to the shape of output and overwritten.
 * Raises a Lua argument error when gradOutput and output differ in element
 * count.  Returns 1 (the number of results reported to Lua).
 */
static int nn_(Tanh_updateGradInput)(lua_State *L)
{
  THTensor *gradOutput = luaT_checkudata(L, 3, torch_(Tensor_id));
  THTensor *output = luaT_getfieldcheckudata(L, 1, "output", torch_(Tensor_id));
  THTensor *gradInput = luaT_getfieldcheckudata(L, 1, "gradInput", torch_(Tensor_id));

  /*
   * The contiguous path below reads nElement(output) values from gradOutput
   * by flat index; a smaller gradOutput would be read past its end.
   */
  luaL_argcheck(L, THTensor_(nElement)(gradOutput) == THTensor_(nElement)(output), 3,
                "gradOutput must have the same number of elements as output");

  THTensor_(resizeAs)(gradInput, output);

  if (output->nDimension == 1 ||
      !THTensor_(isContiguous)(output) ||
      !THTensor_(isContiguous)(gradOutput) ||
      !THTensor_(isContiguous)(gradInput))
  {
    /* 1-D or non-contiguous tensors: let the generic apply macro do the walk. */
    TH_TENSOR_APPLY3(real, gradInput, real, gradOutput, real, output, \
                     real z = *output_data; \
                     *gradInput_data = *gradOutput_data * (1. - z*z););
  }
  else
  {
    /*
     * All three tensors are contiguous and hold the same number of elements,
     * so they are walked as flat arrays.  Indexing through size[0]/stride[0]
     * instead would touch dimension 0 of a tensor that may have no
     * dimensions, and would apply output's stride[0] to the other tensors.
     */
    real *gradOutput_data = THTensor_(data)(gradOutput);
    real *gradInput_data = THTensor_(data)(gradInput);
    real *output_data = THTensor_(data)(output);
    /* Hoisted: the OpenMP loop bound must not change during the loop. */
    long count = THTensor_(nElement)(output);
    long i;

#pragma omp parallel for private(i)
    for (i = 0; i < count; i++)
    {
      real z = output_data[i];
      gradInput_data[i] = gradOutput_data[i] * (1. - z*z);
    }
  }
  return 1;
}
/*
 * Registration table pairing the Lua-visible names of the Tanh functions
 * with their C implementations; passed to luaT_registeratname in Tanh_init.
 */
static const struct luaL_Reg nn_(Tanh__) [] = {
{"Tanh_updateOutput", nn_(Tanh_updateOutput)},
{"Tanh_updateGradInput", nn_(Tanh_updateGradInput)},
/* End-of-table marker. */
{NULL, NULL}
};
/*
 * Registers the Tanh functions for this tensor type with the Lua state L.
 */
static void nn_(Tanh_init)(lua_State *L)
{
/* Push the metaclass identified by torch_(Tensor_id) onto the Lua stack. */
luaT_pushmetaclass(L, torch_(Tensor_id));
/* Register the table's functions under the name "nn".
   NOTE(review): presumably they land in an "nn" field of the metaclass
   pushed above -- confirm against the luaT implementation. */
luaT_registeratname(L, nn_(Tanh__), "nn");
/* Pop one value so the stack is back to its depth on entry. */
lua_pop(L,1);
}
#endif
|