/* * Copyright 2011-2013 Blender Foundation * * Licensed under the Apache License, Version 2.0 (the "License"); * you may not use this file except in compliance with the License. * You may obtain a copy of the License at * * http://www.apache.org/licenses/LICENSE-2.0 * * Unless required by applicable law or agreed to in writing, software * distributed under the License is distributed on an "AS IS" BASIS, * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. * See the License for the specific language governing permissions and * limitations under the License. */ #ifndef __KERNEL_COMPAT_CUDA_H__ #define __KERNEL_COMPAT_CUDA_H__ #define __KERNEL_GPU__ #define __KERNEL_CUDA__ #define CCL_NAMESPACE_BEGIN #define CCL_NAMESPACE_END /* Selective nodes compilation. */ #ifndef __NODES_MAX_GROUP__ # define __NODES_MAX_GROUP__ NODE_GROUP_LEVEL_MAX #endif #ifndef __NODES_FEATURES__ # define __NODES_FEATURES__ NODE_FEATURE_ALL #endif #include #include /* Qualifier wrappers for different names on different devices */ #define ccl_device __device__ __inline__ #define ccl_device_inline __device__ __inline__ #define ccl_device_noinline __device__ __noinline__ #define ccl_global #define ccl_constant #define ccl_may_alias #define ccl_addr_space /* No assert supported for CUDA */ #define kernel_assert(cond) /* Types */ #include "util_half.h" #include "util_types.h" /* Textures */ typedef texture texture_float4; typedef texture texture_float2; typedef texture texture_float; typedef texture texture_uint; typedef texture texture_int; typedef texture texture_uint4; typedef texture texture_uchar4; typedef texture texture_image_float4; typedef texture texture_image_uchar4; /* Macros to handle different memory storage on different devices */ /* In order to use full 6GB of memory on Titan cards, use arrays instead * of textures. On earlier cards this seems slower, but on Titan it is * actually slightly faster in tests. */ #if __CUDA_ARCH__ < 300 #define __KERNEL_CUDA_TEX_STORAGE__ #endif #ifdef __KERNEL_CUDA_TEX_STORAGE__ #define kernel_tex_fetch(t, index) tex1Dfetch(t, index) #else #define kernel_tex_fetch(t, index) t[(index)] #endif #define kernel_tex_image_interp(t, x, y) tex2D(t, x, y) #define kernel_data __data /* Use fast math functions */ #define cosf(x) __cosf(((float)(x))) #define sinf(x) __sinf(((float)(x))) #define powf(x, y) __powf(((float)(x)), ((float)(y))) #define tanf(x) __tanf(((float)(x))) #define logf(x) __logf(((float)(x))) #define expf(x) __expf(((float)(x))) #endif /* __KERNEL_COMPAT_CUDA_H__ */