initial revamp of torch7 tree

author: Ronan Collobert <ronan@collobert.com> 2012-01-25 17:55:20 +0400
committer: Ronan Collobert <ronan@collobert.com> 2012-01-25 17:55:20 +0400
commit: 7a296748a34549fc8e70719c6c3533597ceff8c4 (patch)
tree: e9d87c6097381f487a1acc6525c5a08d456b7c02 /Tensor.c
1 files changed, 213 insertions, 0 deletions
diff --git a/Tensor.c b/Tensor.c
new file mode 100644
index 0000000..a3c3c4c
--- /dev/null
+++ b/Tensor.c
@@ -0,0 +1,213 @@
+#include "THC.h"
+#include "THFile.h"
+#include "luaT.h"
+
+/* ids */
+static const void *torch_File_id = NULL;
+static const void *torch_LongStorage_id = NULL;
+static const void *torch_CudaStorage_id = NULL;
+
+static const void *torch_ByteTensor_id = NULL;
+static const void *torch_CharTensor_id = NULL;
+static const void *torch_ShortTensor_id = NULL;
+static const void *torch_IntTensor_id = NULL;
+static const void *torch_LongTensor_id = NULL;
+static const void *torch_FloatTensor_id = NULL;
+static const void *torch_DoubleTensor_id = NULL;
+static const void *torch_CudaTensor_id = NULL;
+
+/* everything is as the generic Storage.c, except few things (see below) */
+
+#define real float
+#define Real Cuda
+
+#define torch_Storage_(NAME) TH_CONCAT_4(torch_,Real,Storage_,NAME)
+#define torch_Storage_id TH_CONCAT_3(torch_,Real,Storage_id)
+#define STRING_torchStorage TH_CONCAT_STRING_3(torch.,Real,Storage)
+#define torch_Tensor_(NAME) TH_CONCAT_4(torch_,Real,Tensor_,NAME)
+#define torch_Tensor_id TH_CONCAT_3(torch_,Real,Tensor_id)
+#define STRING_torchTensor TH_CONCAT_STRING_3(torch.,Real,Tensor)
+
+#define TH_GENERIC_FILE "generic/Tensor.c"
+#include "generic/Tensor.c"
+#undef TH_GENERIC_FILE
+
+#undef real
+#undef Real
+
+/* now we overwrite some methods specific to CudaTensor */
+
+#define CUDA_IMPLEMENT_TENSOR_COPY(TYPEC)                              \
+  static int cutorch_##TYPEC##Tensor_copy(lua_State *L)                 \
+  {                                                                     \
+    TH##TYPEC##Tensor *storage = luaT_checkudata(L, 1, torch_##TYPEC##Tensor_id); \
+    void *src;                                                          \
+    if( (src = luaT_toudata(L, 2, torch_##TYPEC##Tensor_id)) )          \
+      TH##TYPEC##Tensor_copy(storage, src);                             \
+    else if( (src = luaT_toudata(L, 2, torch_ByteTensor_id)) )          \
+      TH##TYPEC##Tensor_copyByte(storage, src);                         \
+    else if( (src = luaT_toudata(L, 2, torch_CharTensor_id)) )          \
+      TH##TYPEC##Tensor_copyChar(storage, src);                         \
+    else if( (src = luaT_toudata(L, 2, torch_ShortTensor_id)) )         \
+      TH##TYPEC##Tensor_copyShort(storage, src);                        \
+    else if( (src = luaT_toudata(L, 2, torch_IntTensor_id)) )           \
+      TH##TYPEC##Tensor_copyInt(storage, src);                          \
+    else if( (src = luaT_toudata(L, 2, torch_LongTensor_id)) )          \
+      TH##TYPEC##Tensor_copyLong(storage, src);                         \
+    else if( (src = luaT_toudata(L, 2, torch_FloatTensor_id)) )         \
+      TH##TYPEC##Tensor_copyFloat(storage, src);                        \
+    else if( (src = luaT_toudata(L, 2, torch_DoubleTensor_id)) )        \
+      TH##TYPEC##Tensor_copyDouble(storage, src);                       \
+    else if( (src = luaT_toudata(L, 2, torch_CudaTensor_id)) )          \
+      TH##TYPEC##Tensor_copyCuda(storage, src);                         \
+    else                                                                \
+      luaL_typerror(L, 2, "torch.*Tensor");                             \
+                                                                        \
+    lua_settop(L, 1);                                                   \
+    return 1;                                                           \
+  }
+
+CUDA_IMPLEMENT_TENSOR_COPY(Byte)
+CUDA_IMPLEMENT_TENSOR_COPY(Char)
+CUDA_IMPLEMENT_TENSOR_COPY(Short)
+CUDA_IMPLEMENT_TENSOR_COPY(Int)
+CUDA_IMPLEMENT_TENSOR_COPY(Long)
+CUDA_IMPLEMENT_TENSOR_COPY(Float)
+CUDA_IMPLEMENT_TENSOR_COPY(Double)
+CUDA_IMPLEMENT_TENSOR_COPY(Cuda)
+
+static void THFloatTensor_computesz(THFloatTensor *self, long **sz_, long **st_)
+{
+  long *sz, *st, *szh;
+  int i;
+  
+  sz = THAlloc(sizeof(long)*self->nDimension);
+  st = THAlloc(sizeof(long)*self->nDimension);
+  szh = THAlloc(sizeof(long)*self->nDimension);
+
+  for(i = self->nDimension-1; i >= 0; i--)
+  {
+    if(i == self->nDimension-1)
+      szh[i] = 1;
+    else
+      szh[i] = szh[i+1]*self->size[i+1];
+  }
+
+  memcpy(sz, szh, self->nDimension * sizeof(long));
+  memcpy(st, self->stride, self->nDimension * sizeof(long));
+  THFree(szh);
+
+  *sz_ = sz;
+  *st_ = st;
+}
+
+void THFloatTensor_kernel_copy(float *dst, 
+                                         long *dst_sz, long *dst_st, int dst_dim,
+                                         float *src,
+                                         long *src_sz, long *src_st, int src_dim,
+                                         long n_elem)
+{
+  long k;
+
+  for(k = 0; k < n_elem; k++)
+  {
+    long dst_idx = 0;
+    long dst_rest = k;
+    int dim;
+
+    for(dim = 0; dim < dst_dim; dim++)
+    {
+      dst_idx += (dst_rest/dst_sz[dim])*dst_st[dim];
+      dst_rest = dst_rest % dst_sz[dim];
+    }
+
+    long src_idx = 0;
+    long src_rest = k;
+    for(dim = 0; dim < src_dim; dim++)
+    {
+      src_idx += (src_rest/src_sz[dim])*src_st[dim];
+      src_rest = src_rest % src_sz[dim];
+    }
+
+    dst[dst_idx] = src[src_idx];
+  }
+}
+
+static int cuda_FloatTensor_fakecopy(lua_State *L)
+{
+  THFloatTensor *self = luaT_checkudata(L, 1, torch_FloatTensor_id);
+  THFloatTensor *src = luaT_checkudata(L, 2, torch_FloatTensor_id);
+  long *d_self_sz, *d_self_st, *d_src_sz, *d_src_st;
+  long nElement = THFloatTensor_nElement(self);
+
+  THArgCheck(THFloatTensor_nElement(self) == THFloatTensor_nElement(src), 2, "sizes do not match"); 
+
+  THFloatTensor_computesz(self, &d_self_sz, &d_self_st);
+  THFloatTensor_computesz(src, &d_src_sz, &d_src_st);
+
+  THFloatTensor_kernel_copy(THFloatTensor_data(self), 
+                            d_self_sz, d_self_st, self->nDimension,
+                            THFloatTensor_data(src),
+                            d_src_sz, d_src_st, src->nDimension,
+                            nElement);
+  
+  THFree(d_self_sz);
+  THFree(d_self_st);
+  THFree(d_src_sz);
+  THFree(d_src_st);
+
+  lua_settop(L, 1);
+  return 1;
+}
+
+void cutorch_CudaTensor_init(lua_State* L)
+{
+  /* the ids */
+  torch_ByteTensor_id = luaT_checktypename2id(L, "torch.ByteTensor");
+  torch_CharTensor_id = luaT_checktypename2id(L, "torch.CharTensor");
+  torch_ShortTensor_id = luaT_checktypename2id(L, "torch.ShortTensor");
+  torch_IntTensor_id = luaT_checktypename2id(L, "torch.IntTensor");
+  torch_LongTensor_id = luaT_checktypename2id(L, "torch.LongTensor");
+  torch_FloatTensor_id = luaT_checktypename2id(L, "torch.FloatTensor");
+  torch_DoubleTensor_id = luaT_checktypename2id(L, "torch.DoubleTensor");
+  
+  /* the standard stuff */
+  torch_CudaTensor_init(L);
+
+  /* additional methods */
+  luaT_pushmetaclass(L, torch_FloatTensor_id);
+  lua_pushcfunction(L, cuda_FloatTensor_fakecopy);
+  lua_setfield(L, -2, "fakecopy");
+  lua_pop(L, 1);
+
+  /* the copy methods */
+  {
+    int i;
+
+    const void* ids[8] = {torch_ByteTensor_id,
+                          torch_CharTensor_id,
+                          torch_ShortTensor_id,
+                          torch_IntTensor_id,
+                          torch_LongTensor_id,
+                          torch_FloatTensor_id,
+                          torch_DoubleTensor_id,
+                          torch_CudaTensor_id};
+    
+    static int (*funcs[8])(lua_State*) = {cutorch_ByteTensor_copy,
+                                          cutorch_CharTensor_copy,
+                                          cutorch_ShortTensor_copy,
+                                          cutorch_IntTensor_copy,
+                                          cutorch_LongTensor_copy,
+                                          cutorch_FloatTensor_copy,
+                                          cutorch_DoubleTensor_copy,
+                                          cutorch_CudaTensor_copy};
+
+    for(i = 0; i < 8; i++)
+    {
+      luaT_pushmetaclass(L, ids[i]);
+      lua_pushcfunction(L, funcs[i]);
+      lua_setfield(L, -2, "copy");
+      lua_pop(L, 1);
+    }
+  }
+}
author	Ronan Collobert <ronan@collobert.com>	2012-01-25 17:55:20 +0400
committer	Ronan Collobert <ronan@collobert.com>	2012-01-25 17:55:20 +0400
commit	7a296748a34549fc8e70719c6c3533597ceff8c4 (patch)
tree	e9d87c6097381f487a1acc6525c5a08d456b7c02 /Tensor.c