diff options
author | Sergey Sharybin <sergey.vfx@gmail.com> | 2016-02-12 20:33:43 +0300 |
---|---|---|
committer | Sergey Sharybin <sergey.vfx@gmail.com> | 2016-03-25 15:55:42 +0300 |
commit | 700722f68633d270584af5463a804742537e30ed (patch) | |
tree | 5b80a5a51dd278e649647f8d0a64c07d570e8eaa /intern/cycles/kernel/kernels | |
parent | 0e47e0cc9e9b19a30717042d97cb3b8fb50132ff (diff) |
Cycles: Cleanup, indent nested preprocessor directives
Quite straightforward; the main trick happens in path_source_replace_includes().
Reviewers: brecht, dingto, lukasstockner97, juicyfruit
Differential Revision: https://developer.blender.org/D1794
Diffstat (limited to 'intern/cycles/kernel/kernels')
-rw-r--r-- | intern/cycles/kernel/kernels/cpu/kernel.cpp | 2 | ||||
-rw-r--r-- | intern/cycles/kernel/kernels/cpu/kernel_avx.cpp | 15 | ||||
-rw-r--r-- | intern/cycles/kernel/kernels/cpu/kernel_avx2.cpp | 15 | ||||
-rw-r--r-- | intern/cycles/kernel/kernels/cpu/kernel_sse2.cpp | 3 | ||||
-rw-r--r-- | intern/cycles/kernel/kernels/cpu/kernel_sse3.cpp | 7 | ||||
-rw-r--r-- | intern/cycles/kernel/kernels/cpu/kernel_sse41.cpp | 9 | ||||
-rw-r--r-- | intern/cycles/kernel/kernels/cuda/kernel.cu | 80 | ||||
-rw-r--r-- | intern/cycles/kernel/kernels/opencl/kernel.cl | 22 |
8 files changed, 74 insertions, 79 deletions
diff --git a/intern/cycles/kernel/kernels/cpu/kernel.cpp b/intern/cycles/kernel/kernels/cpu/kernel.cpp index 5c6dc31b949..643eefcdc6c 100644 --- a/intern/cycles/kernel/kernels/cpu/kernel.cpp +++ b/intern/cycles/kernel/kernels/cpu/kernel.cpp @@ -18,7 +18,7 @@ /* On x86-64, we can assume SSE2, so avoid the extra kernel and compile this one with SSE2 intrinsics */ #if defined(__x86_64__) || defined(_M_X64) -#define __KERNEL_SSE2__ +# define __KERNEL_SSE2__ #endif /* quiet unused define warnings */ diff --git a/intern/cycles/kernel/kernels/cpu/kernel_avx.cpp b/intern/cycles/kernel/kernels/cpu/kernel_avx.cpp index a4e43b180fb..533ab46b741 100644 --- a/intern/cycles/kernel/kernels/cpu/kernel_avx.cpp +++ b/intern/cycles/kernel/kernels/cpu/kernel_avx.cpp @@ -20,18 +20,17 @@ /* SSE optimization disabled for now on 32 bit, see bug #36316 */ #if !(defined(__GNUC__) && (defined(i386) || defined(_M_IX86))) -#define __KERNEL_SSE2__ -#define __KERNEL_SSE3__ -#define __KERNEL_SSSE3__ -#define __KERNEL_SSE41__ -#define __KERNEL_AVX__ +# define __KERNEL_SSE2__ +# define __KERNEL_SSE3__ +# define __KERNEL_SSSE3__ +# define __KERNEL_SSE41__ +# define __KERNEL_AVX__ #endif - + #include "util_optimization.h" - + #ifdef WITH_CYCLES_OPTIMIZED_KERNEL_AVX # include "kernel.h" # define KERNEL_ARCH cpu_avx # include "kernel_cpu_impl.h" - #endif /* WITH_CYCLES_OPTIMIZED_KERNEL_AVX */ diff --git a/intern/cycles/kernel/kernels/cpu/kernel_avx2.cpp b/intern/cycles/kernel/kernels/cpu/kernel_avx2.cpp index fd6c753b34c..7351e2bad6b 100644 --- a/intern/cycles/kernel/kernels/cpu/kernel_avx2.cpp +++ b/intern/cycles/kernel/kernels/cpu/kernel_avx2.cpp @@ -17,15 +17,15 @@ /* Optimized CPU kernel entry points. This file is compiled with AVX2 * optimization flags and nearly all functions inlined, while kernel.cpp * is compiled without for other CPU's. 
*/ - + /* SSE optimization disabled for now on 32 bit, see bug #36316 */ #if !(defined(__GNUC__) && (defined(i386) || defined(_M_IX86))) -#define __KERNEL_SSE2__ -#define __KERNEL_SSE3__ -#define __KERNEL_SSSE3__ -#define __KERNEL_SSE41__ -#define __KERNEL_AVX__ -#define __KERNEL_AVX2__ +# define __KERNEL_SSE2__ +# define __KERNEL_SSE3__ +# define __KERNEL_SSSE3__ +# define __KERNEL_SSE41__ +# define __KERNEL_AVX__ +# define __KERNEL_AVX2__ #endif #include "util_optimization.h" @@ -34,5 +34,4 @@ # include "kernel.h" # define KERNEL_ARCH cpu_avx2 # include "kernel_cpu_impl.h" - #endif /* WITH_CYCLES_OPTIMIZED_KERNEL_AVX2 */ diff --git a/intern/cycles/kernel/kernels/cpu/kernel_sse2.cpp b/intern/cycles/kernel/kernels/cpu/kernel_sse2.cpp index 7e843dc1c7c..a5f2d6e7294 100644 --- a/intern/cycles/kernel/kernels/cpu/kernel_sse2.cpp +++ b/intern/cycles/kernel/kernels/cpu/kernel_sse2.cpp @@ -20,7 +20,7 @@ /* SSE optimization disabled for now on 32 bit, see bug #36316 */ #if !(defined(__GNUC__) && (defined(i386) || defined(_M_IX86))) -#define __KERNEL_SSE2__ +# define __KERNEL_SSE2__ #endif #include "util_optimization.h" @@ -29,5 +29,4 @@ # include "kernel.h" # define KERNEL_ARCH cpu_sse2 # include "kernel_cpu_impl.h" - #endif /* WITH_CYCLES_OPTIMIZED_KERNEL_SSE2 */ diff --git a/intern/cycles/kernel/kernels/cpu/kernel_sse3.cpp b/intern/cycles/kernel/kernels/cpu/kernel_sse3.cpp index cc5656ed5be..86f9ce991f8 100644 --- a/intern/cycles/kernel/kernels/cpu/kernel_sse3.cpp +++ b/intern/cycles/kernel/kernels/cpu/kernel_sse3.cpp @@ -20,9 +20,9 @@ /* SSE optimization disabled for now on 32 bit, see bug #36316 */ #if !(defined(__GNUC__) && (defined(i386) || defined(_M_IX86))) -#define __KERNEL_SSE2__ -#define __KERNEL_SSE3__ -#define __KERNEL_SSSE3__ +# define __KERNEL_SSE2__ +# define __KERNEL_SSE3__ +# define __KERNEL_SSSE3__ #endif #include "util_optimization.h" @@ -31,5 +31,4 @@ # include "kernel.h" # define KERNEL_ARCH cpu_sse3 # include "kernel_cpu_impl.h" - #endif /* 
WITH_CYCLES_OPTIMIZED_KERNEL_SSE3 */ diff --git a/intern/cycles/kernel/kernels/cpu/kernel_sse41.cpp b/intern/cycles/kernel/kernels/cpu/kernel_sse41.cpp index 252e16873aa..c174406047d 100644 --- a/intern/cycles/kernel/kernels/cpu/kernel_sse41.cpp +++ b/intern/cycles/kernel/kernels/cpu/kernel_sse41.cpp @@ -20,10 +20,10 @@ /* SSE optimization disabled for now on 32 bit, see bug #36316 */ #if !(defined(__GNUC__) && (defined(i386) || defined(_M_IX86))) -#define __KERNEL_SSE2__ -#define __KERNEL_SSE3__ -#define __KERNEL_SSSE3__ -#define __KERNEL_SSE41__ +# define __KERNEL_SSE2__ +# define __KERNEL_SSE3__ +# define __KERNEL_SSSE3__ +# define __KERNEL_SSE41__ #endif #include "util_optimization.h" @@ -32,5 +32,4 @@ # include "kernel.h" # define KERNEL_ARCH cpu_sse41 # include "kernel_cpu_impl.h" - #endif /* WITH_CYCLES_OPTIMIZED_KERNEL_SSE41 */ diff --git a/intern/cycles/kernel/kernels/cuda/kernel.cu b/intern/cycles/kernel/kernels/cuda/kernel.cu index 29067a666c4..259b634f939 100644 --- a/intern/cycles/kernel/kernels/cuda/kernel.cu +++ b/intern/cycles/kernel/kernels/cuda/kernel.cu @@ -31,67 +31,67 @@ /* 2.0 and 2.1 */ #if __CUDA_ARCH__ == 200 || __CUDA_ARCH__ == 210 -#define CUDA_MULTIPRESSOR_MAX_REGISTERS 32768 -#define CUDA_MULTIPROCESSOR_MAX_BLOCKS 8 -#define CUDA_BLOCK_MAX_THREADS 1024 -#define CUDA_THREAD_MAX_REGISTERS 63 +# define CUDA_MULTIPRESSOR_MAX_REGISTERS 32768 +# define CUDA_MULTIPROCESSOR_MAX_BLOCKS 8 +# define CUDA_BLOCK_MAX_THREADS 1024 +# define CUDA_THREAD_MAX_REGISTERS 63 /* tunable parameters */ -#define CUDA_THREADS_BLOCK_WIDTH 16 -#define CUDA_KERNEL_MAX_REGISTERS 32 -#define CUDA_KERNEL_BRANCHED_MAX_REGISTERS 40 +# define CUDA_THREADS_BLOCK_WIDTH 16 +# define CUDA_KERNEL_MAX_REGISTERS 32 +# define CUDA_KERNEL_BRANCHED_MAX_REGISTERS 40 /* 3.0 and 3.5 */ #elif __CUDA_ARCH__ == 300 || __CUDA_ARCH__ == 350 -#define CUDA_MULTIPRESSOR_MAX_REGISTERS 65536 -#define CUDA_MULTIPROCESSOR_MAX_BLOCKS 16 -#define CUDA_BLOCK_MAX_THREADS 1024 -#define 
CUDA_THREAD_MAX_REGISTERS 63 +# define CUDA_MULTIPRESSOR_MAX_REGISTERS 65536 +# define CUDA_MULTIPROCESSOR_MAX_BLOCKS 16 +# define CUDA_BLOCK_MAX_THREADS 1024 +# define CUDA_THREAD_MAX_REGISTERS 63 /* tunable parameters */ -#define CUDA_THREADS_BLOCK_WIDTH 16 -#define CUDA_KERNEL_MAX_REGISTERS 63 -#define CUDA_KERNEL_BRANCHED_MAX_REGISTERS 63 +# define CUDA_THREADS_BLOCK_WIDTH 16 +# define CUDA_KERNEL_MAX_REGISTERS 63 +# define CUDA_KERNEL_BRANCHED_MAX_REGISTERS 63 /* 3.2 */ #elif __CUDA_ARCH__ == 320 -#define CUDA_MULTIPRESSOR_MAX_REGISTERS 32768 -#define CUDA_MULTIPROCESSOR_MAX_BLOCKS 16 -#define CUDA_BLOCK_MAX_THREADS 1024 -#define CUDA_THREAD_MAX_REGISTERS 63 +# define CUDA_MULTIPRESSOR_MAX_REGISTERS 32768 +# define CUDA_MULTIPROCESSOR_MAX_BLOCKS 16 +# define CUDA_BLOCK_MAX_THREADS 1024 +# define CUDA_THREAD_MAX_REGISTERS 63 /* tunable parameters */ -#define CUDA_THREADS_BLOCK_WIDTH 16 -#define CUDA_KERNEL_MAX_REGISTERS 63 -#define CUDA_KERNEL_BRANCHED_MAX_REGISTERS 63 +# define CUDA_THREADS_BLOCK_WIDTH 16 +# define CUDA_KERNEL_MAX_REGISTERS 63 +# define CUDA_KERNEL_BRANCHED_MAX_REGISTERS 63 /* 3.7 */ #elif __CUDA_ARCH__ == 370 -#define CUDA_MULTIPRESSOR_MAX_REGISTERS 65536 -#define CUDA_MULTIPROCESSOR_MAX_BLOCKS 16 -#define CUDA_BLOCK_MAX_THREADS 1024 -#define CUDA_THREAD_MAX_REGISTERS 255 +# define CUDA_MULTIPRESSOR_MAX_REGISTERS 65536 +# define CUDA_MULTIPROCESSOR_MAX_BLOCKS 16 +# define CUDA_BLOCK_MAX_THREADS 1024 +# define CUDA_THREAD_MAX_REGISTERS 255 /* tunable parameters */ -#define CUDA_THREADS_BLOCK_WIDTH 16 -#define CUDA_KERNEL_MAX_REGISTERS 63 -#define CUDA_KERNEL_BRANCHED_MAX_REGISTERS 63 +# define CUDA_THREADS_BLOCK_WIDTH 16 +# define CUDA_KERNEL_MAX_REGISTERS 63 +# define CUDA_KERNEL_BRANCHED_MAX_REGISTERS 63 /* 5.0, 5.2 and 5.3 */ #elif __CUDA_ARCH__ == 500 || __CUDA_ARCH__ == 520 || __CUDA_ARCH__ == 530 -#define CUDA_MULTIPRESSOR_MAX_REGISTERS 65536 -#define CUDA_MULTIPROCESSOR_MAX_BLOCKS 32 -#define CUDA_BLOCK_MAX_THREADS 1024 -#define 
CUDA_THREAD_MAX_REGISTERS 255 +# define CUDA_MULTIPRESSOR_MAX_REGISTERS 65536 +# define CUDA_MULTIPROCESSOR_MAX_BLOCKS 32 +# define CUDA_BLOCK_MAX_THREADS 1024 +# define CUDA_THREAD_MAX_REGISTERS 255 /* tunable parameters */ -#define CUDA_THREADS_BLOCK_WIDTH 16 -#define CUDA_KERNEL_MAX_REGISTERS 40 -#define CUDA_KERNEL_BRANCHED_MAX_REGISTERS 63 +# define CUDA_THREADS_BLOCK_WIDTH 16 +# define CUDA_KERNEL_MAX_REGISTERS 40 +# define CUDA_KERNEL_BRANCHED_MAX_REGISTERS 63 /* unknown architecture */ #else -#error "Unknown or unsupported CUDA architecture, can't determine launch bounds" +# error "Unknown or unsupported CUDA architecture, can't determine launch bounds" #endif /* compute number of threads per block and minimum blocks per multiprocessor @@ -106,19 +106,19 @@ /* sanity checks */ #if CUDA_THREADS_BLOCK_WIDTH*CUDA_THREADS_BLOCK_WIDTH > CUDA_BLOCK_MAX_THREADS -#error "Maximum number of threads per block exceeded" +# error "Maximum number of threads per block exceeded" #endif #if CUDA_MULTIPRESSOR_MAX_REGISTERS/(CUDA_THREADS_BLOCK_WIDTH*CUDA_THREADS_BLOCK_WIDTH*CUDA_KERNEL_MAX_REGISTERS) > CUDA_MULTIPROCESSOR_MAX_BLOCKS -#error "Maximum number of blocks per multiprocessor exceeded" +# error "Maximum number of blocks per multiprocessor exceeded" #endif #if CUDA_KERNEL_MAX_REGISTERS > CUDA_THREAD_MAX_REGISTERS -#error "Maximum number of registers per thread exceeded" +# error "Maximum number of registers per thread exceeded" #endif #if CUDA_KERNEL_BRANCHED_MAX_REGISTERS > CUDA_THREAD_MAX_REGISTERS -#error "Maximum number of registers per thread exceeded" +# error "Maximum number of registers per thread exceeded" #endif /* kernels */ diff --git a/intern/cycles/kernel/kernels/opencl/kernel.cl b/intern/cycles/kernel/kernels/opencl/kernel.cl index bfa1d8e2e8f..aad06ed5c76 100644 --- a/intern/cycles/kernel/kernels/opencl/kernel.cl +++ b/intern/cycles/kernel/kernels/opencl/kernel.cl @@ -24,21 +24,21 @@ #include "../../kernel_film.h" #if 
defined(__COMPILE_ONLY_MEGAKERNEL__) || !defined(__NO_BAKING__) -#include "../../kernel_path.h" -#include "../../kernel_path_branched.h" +# include "../../kernel_path.h" +# include "../../kernel_path_branched.h" #else /* __COMPILE_ONLY_MEGAKERNEL__ */ /* Include only actually used headers for the case * when path tracing kernels are not needed. */ -#include "../../kernel_random.h" -#include "../../kernel_differential.h" -#include "../../kernel_montecarlo.h" -#include "../../kernel_projection.h" -#include "../../geom/geom.h" - -#include "../../kernel_accumulate.h" -#include "../../kernel_camera.h" -#include "../../kernel_shader.h" +# include "../../kernel_random.h" +# include "../../kernel_differential.h" +# include "../../kernel_montecarlo.h" +# include "../../kernel_projection.h" +# include "../../geom/geom.h" + +# include "../../kernel_accumulate.h" +# include "../../kernel_camera.h" +# include "../../kernel_shader.h" #endif /* defined(__COMPILE_ONLY_MEGAKERNEL__) || !defined(__NO_BAKING__) */ #include "../../kernel_bake.h" |