Files
test/intern/cycles/util/optimization.h
Thomas Dinges 30a22b92ca Cycles: Rename SSE4.1 kernel to SSE4.2
This commit updates all defines, compiler flags and cleans up some code for unused CPU capabilities.

There should be no functional change, unless it's run on a CPU that supports sse41 but not sse42. It will fallback to the SSE2 kernel in this case.

In preparation for the new SSE4.2 minimum in Blender 4.2.

Pull Request: https://projects.blender.org/blender/blender/pulls/118043
2024-02-09 17:25:58 +01:00

57 lines
1.3 KiB
C

/* SPDX-FileCopyrightText: 2011-2022 Blender Foundation
*
* SPDX-License-Identifier: Apache-2.0 */
#ifndef __UTIL_OPTIMIZATION_H__
#define __UTIL_OPTIMIZATION_H__
#ifndef __KERNEL_GPU__
/* x86
*
* Compile a regular, SSE2 and SSE3 kernel. */
# if defined(i386) || defined(_M_IX86)
/* We require minimum SSE2 support on x86, so auto enable. */
# define __KERNEL_SSE2__
# ifdef WITH_KERNEL_SSE2
# define WITH_CYCLES_OPTIMIZED_KERNEL_SSE2
# endif
/* x86-64
*
* Compile a regular (includes SSE2), SSE 4.2 and AVX2 kernel. */
# elif defined(__x86_64__) || defined(_M_X64)
/* SSE2 is always available on x86-64 CPUs, so auto enable */
# define __KERNEL_SSE2__
/* no SSE2 kernel on x86-64, part of regular kernel */
# ifdef WITH_KERNEL_SSE42
# define WITH_CYCLES_OPTIMIZED_KERNEL_SSE42
# endif
# ifdef WITH_KERNEL_AVX2
# define WITH_CYCLES_OPTIMIZED_KERNEL_AVX2
# endif
/* Arm Neon
*
* Compile a SSE4 kernel emulated with Neon. Most code is shared with
* SSE, some specializations for performance and compatibility are made
* made testing for __KERNEL_NEON__. */
# elif defined(__ARM_NEON) && defined(WITH_SSE2NEON)
# define __KERNEL_NEON__
# define __KERNEL_SSE__
# define __KERNEL_SSE2__
# define __KERNEL_SSE3__
# define __KERNEL_SSE42__
# endif
#endif
#endif /* __UTIL_OPTIMIZATION_H__ */