diff options
Diffstat (limited to 'intern/cycles/util/types_float4_impl.h')
-rw-r--r-- | intern/cycles/util/types_float4_impl.h | 109 |
1 files changed, 109 insertions, 0 deletions
diff --git a/intern/cycles/util/types_float4_impl.h b/intern/cycles/util/types_float4_impl.h new file mode 100644 index 00000000000..d75715332e5 --- /dev/null +++ b/intern/cycles/util/types_float4_impl.h @@ -0,0 +1,109 @@ +/* + * Copyright 2011-2017 Blender Foundation + * + * Licensed under the Apache License, Version 2.0 (the "License"); + * you may not use this file except in compliance with the License. + * You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. + */ + +#ifndef __UTIL_TYPES_FLOAT4_IMPL_H__ +#define __UTIL_TYPES_FLOAT4_IMPL_H__ + +#ifndef __UTIL_TYPES_H__ +# error "Do not include this file directly, include util/types.h instead." +#endif + +#ifndef __KERNEL_GPU__ +# include <cstdio> +#endif + +CCL_NAMESPACE_BEGIN + +#ifndef __KERNEL_GPU__ +# ifdef __KERNEL_SSE__ +__forceinline float4::float4() +{ +} + +__forceinline float4::float4(const __m128 &a) : m128(a) +{ +} + +__forceinline float4::operator const __m128 &() const +{ + return m128; +} + +__forceinline float4::operator __m128 &() +{ + return m128; +} + +__forceinline float4 &float4::operator=(const float4 &a) +{ + m128 = a.m128; + return *this; +} +# endif /* __KERNEL_SSE__ */ + +__forceinline float float4::operator[](int i) const +{ + util_assert(i >= 0); + util_assert(i < 4); + return *(&x + i); +} + +__forceinline float &float4::operator[](int i) +{ + util_assert(i >= 0); + util_assert(i < 4); + return *(&x + i); +} + +ccl_device_inline float4 make_float4(float f) +{ +# ifdef __KERNEL_SSE__ + float4 a(_mm_set1_ps(f)); +# else + float4 a = {f, f, f, f}; +# endif + return a; +} + +ccl_device_inline float4 make_float4(float x, float y, float z, float w) +{ +# ifdef __KERNEL_SSE__ + float4 a(_mm_set_ps(w, z, y, x)); +# else + float4 a = {x, y, z, w}; +# endif + return a; +} + +ccl_device_inline float4 make_float4(const int4 &i) +{ +# ifdef __KERNEL_SSE__ + float4 a(_mm_cvtepi32_ps(i.m128)); +# else + float4 a = {(float)i.x, (float)i.y, (float)i.z, (float)i.w}; +# endif + return a; +} + +ccl_device_inline void print_float4(const char *label, const float4 &a) +{ + printf("%s: %.8f %.8f %.8f %.8f\n", label, (double)a.x, (double)a.y, (double)a.z, (double)a.w); +} +#endif /* __KERNEL_GPU__ */ + +CCL_NAMESPACE_END + +#endif /* __UTIL_TYPES_FLOAT4_IMPL_H__ */ |