* WITH_CPU_SSE was renamed to WITH_CPU_SIMD, and now covers both SSE and Neon.
* For macOS, sse2neon.h is included as part of the precompiled libraries.
* For Linux, it is enabled if the sse2neon.h header file is detected. However, this library does not have official releases and is not shipped with any Linux distribution, so manual installation and configuration is required to get this working.

Ref D8237, T78710
37 lines
1.1 KiB
C++
37 lines
1.1 KiB
C++
/*
 * This program is free software; you can redistribute it and/or
 * modify it under the terms of the GNU General Public License
 * as published by the Free Software Foundation; either version 2
 * of the License, or (at your option) any later version.
 *
 * This program is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
 * GNU General Public License for more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with this program; if not, write to the Free Software Foundation,
 * Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA.
 */
|
|
|
|
#pragma once
|
|
|
|
/** \file
 * \ingroup bli
 *
 * SIMD instruction support.
 */
|
|
|
|
/* Select the SSE2 implementation for the current target.
 *
 * `BLI_HAVE_SSE2` is defined when SSE2 intrinsics are usable after including
 * this header, either natively or emulated on top of ARM Neon. It is left
 * undefined otherwise, so users are expected to test it with `#ifdef`. */
#if defined(__ARM_NEON) && defined(WITH_SSE2NEON)
/* SSE/SSE2 emulation on ARM Neon. Match SSE precision.
 *
 * Each option is only defined when it has not been set already (for example
 * on the compiler command line), which avoids macro redefinition diagnostics
 * and keeps an explicit build-level choice intact. The options are defined
 * before the include so that `sse2neon.h` sees them. */
#  ifndef SSE2NEON_PRECISE_MINMAX
#    define SSE2NEON_PRECISE_MINMAX 1
#  endif
#  ifndef SSE2NEON_PRECISE_DIV
#    define SSE2NEON_PRECISE_DIV 1
#  endif
#  ifndef SSE2NEON_PRECISE_SQRT
#    define SSE2NEON_PRECISE_SQRT 1
#  endif
#  include <sse2neon.h>
#  define BLI_HAVE_SSE2
#elif defined(__SSE2__)
/* Native SSE2 on Intel/AMD. */
#  include <emmintrin.h>
#  define BLI_HAVE_SSE2
#endif
|