diff options
Diffstat (limited to 'intern/cycles/util/util_types_float4_impl.h')
-rw-r--r-- | intern/cycles/util/util_types_float4_impl.h | 117 |
1 files changed, 117 insertions, 0 deletions
diff --git a/intern/cycles/util/util_types_float4_impl.h b/intern/cycles/util/util_types_float4_impl.h new file mode 100644 index 00000000000..ff3ec4d4ecf --- /dev/null +++ b/intern/cycles/util/util_types_float4_impl.h @@ -0,0 +1,117 @@ +/* + * Copyright 2011-2017 Blender Foundation + * + * Licensed under the Apache License, Version 2.0 (the "License"); + * you may not use this file except in compliance with the License. + * You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. + */ + +#ifndef __UTIL_TYPES_FLOAT4_IMPL_H__ +#define __UTIL_TYPES_FLOAT4_IMPL_H__ + +#ifndef __UTIL_TYPES_H__ +# error "Do not include this file directly, include util_types.h instead." +#endif + +#ifndef __KERNEL_GPU__ +# include <cstdio> +#endif + +CCL_NAMESPACE_BEGIN + +#ifndef __KERNEL_GPU__ +#ifdef __KERNEL_SSE__ +__forceinline float4::float4() +{ +} + +__forceinline float4::float4(const float4& a) + : m128(a.m128) +{ +} + +__forceinline float4::float4(const __m128& a) + : m128(a) +{ +} + +__forceinline float4::operator const __m128&(void) const +{ + return m128; +} + +__forceinline float4::operator __m128&(void) +{ + return m128; +} + +__forceinline float4& float4::operator =(const float4& a) +{ + m128 = a.m128; + return *this; +} +#endif /* __KERNEL_SSE__ */ + +__forceinline float float4::operator[](int i) const +{ + util_assert(i >= 0); + util_assert(i < 4); + return *(&x + i); +} + +__forceinline float& float4::operator[](int i) +{ + util_assert(i >= 0); + util_assert(i < 4); + return *(&x + i); +} + +ccl_device_inline float4 make_float4(float f) +{ +#ifdef __KERNEL_SSE__ + float4 a(_mm_set1_ps(f)); +#else + float4 a = {f, f, f, f}; +#endif + return a; +} + +ccl_device_inline float4 make_float4(float x, float y, float z, float w) +{ +#ifdef __KERNEL_SSE__ + float4 a(_mm_set_ps(w, z, y, x)); +#else + float4 a = {x, y, z, w}; +#endif + return a; +} + +ccl_device_inline float4 make_float4(const int4& i) +{ +#ifdef __KERNEL_SSE__ + float4 a(_mm_cvtepi32_ps(i.m128)); +#else + float4 a = {(float)i.x, (float)i.y, (float)i.z, (float)i.w}; +#endif + return a; +} + +ccl_device_inline void print_float4(const char *label, const float4& a) +{ + printf("%s: %.8f %.8f %.8f %.8f\n", + label, + (double)a.x, (double)a.y, (double)a.z, (double)a.w); +} +#endif /* __KERNEL_GPU__ */ + +CCL_NAMESPACE_END + +#endif /* __UTIL_TYPES_FLOAT4_IMPL_H__ */ |