mirror of
https://github.com/webmproject/libwebp.git
synced 2025-03-06 17:52:50 +01:00
267 lines
8.6 KiB
C
267 lines
8.6 KiB
C
// Copyright 2022 Google Inc. All Rights Reserved.
|
|
//
|
|
// Use of this source code is governed by a BSD-style license
|
|
// that can be found in the COPYING file in the root of the source
|
|
// tree. An additional intellectual property rights grant can be found
|
|
// in the file PATENTS. All contributing project authors may
|
|
// be found in the AUTHORS file in the root of the source tree.
|
|
// -----------------------------------------------------------------------------
|
|
//
|
|
// CPU detection functions and macros.
|
|
//
|
|
// Author: Skal (pascal.massimino@gmail.com)
|
|
|
|
#ifndef WEBP_DSP_CPU_H_
|
|
#define WEBP_DSP_CPU_H_
|
|
|
|
#include <stddef.h>
|
|
|
|
#ifdef HAVE_CONFIG_H
|
|
#include "src/webp/config.h"
|
|
#endif
|
|
|
|
#include "src/webp/types.h"
|
|
|
|
#if defined(__GNUC__)
|
|
#define LOCAL_GCC_VERSION ((__GNUC__ << 8) | __GNUC_MINOR__)
|
|
#define LOCAL_GCC_PREREQ(maj, min) (LOCAL_GCC_VERSION >= (((maj) << 8) | (min)))
|
|
#else
|
|
#define LOCAL_GCC_VERSION 0
|
|
#define LOCAL_GCC_PREREQ(maj, min) 0
|
|
#endif
|
|
|
|
#if defined(__clang__)
|
|
#define LOCAL_CLANG_VERSION ((__clang_major__ << 8) | __clang_minor__)
|
|
#define LOCAL_CLANG_PREREQ(maj, min) \
|
|
(LOCAL_CLANG_VERSION >= (((maj) << 8) | (min)))
|
|
#else
|
|
#define LOCAL_CLANG_VERSION 0
|
|
#define LOCAL_CLANG_PREREQ(maj, min) 0
|
|
#endif
|
|
|
|
#ifndef __has_builtin
|
|
#define __has_builtin(x) 0
|
|
#endif
|
|
|
|
//------------------------------------------------------------------------------
|
|
// x86 defines.
|
|
|
|
#if !defined(HAVE_CONFIG_H)
|
|
#if defined(_MSC_VER) && _MSC_VER > 1310 && \
|
|
(defined(_M_X64) || defined(_M_IX86))
|
|
#define WEBP_MSC_SSE2 // Visual C++ SSE2 targets
|
|
#endif
|
|
|
|
#if defined(_MSC_VER) && _MSC_VER >= 1500 && \
|
|
(defined(_M_X64) || defined(_M_IX86))
|
|
#define WEBP_MSC_SSE41 // Visual C++ SSE4.1 targets
|
|
#endif
|
|
#endif
|
|
|
|
// WEBP_HAVE_* are used to indicate the presence of the instruction set in dsp
|
|
// files without intrinsics, allowing the corresponding Init() to be called.
|
|
// Files containing intrinsics will need to be built targeting the instruction
|
|
// set so should succeed on one of the earlier tests.
|
|
#if (defined(__SSE2__) || defined(WEBP_MSC_SSE2)) && \
|
|
(!defined(HAVE_CONFIG_H) || defined(WEBP_HAVE_SSE2))
|
|
#define WEBP_USE_SSE2
|
|
#endif
|
|
|
|
#if defined(WEBP_USE_SSE2) && !defined(WEBP_HAVE_SSE2)
|
|
#define WEBP_HAVE_SSE2
|
|
#endif
|
|
|
|
#if (defined(__SSE4_1__) || defined(WEBP_MSC_SSE41)) && \
|
|
(!defined(HAVE_CONFIG_H) || defined(WEBP_HAVE_SSE41))
|
|
#define WEBP_USE_SSE41
|
|
#endif
|
|
|
|
#if defined(WEBP_USE_SSE41) && !defined(WEBP_HAVE_SSE41)
|
|
#define WEBP_HAVE_SSE41
|
|
#endif
|
|
|
|
#undef WEBP_MSC_SSE41
|
|
#undef WEBP_MSC_SSE2
|
|
|
|
//------------------------------------------------------------------------------
|
|
// Arm defines.
|
|
|
|
// The intrinsics currently cause compiler errors with arm-nacl-gcc and the
|
|
// inline assembly would need to be modified for use with Native Client.
|
|
#if ((defined(__ARM_NEON__) || defined(__aarch64__)) && \
|
|
(!defined(HAVE_CONFIG_H) || defined(WEBP_HAVE_NEON))) && \
|
|
!defined(__native_client__)
|
|
#define WEBP_USE_NEON
|
|
#endif
|
|
|
|
#if !defined(WEBP_USE_NEON) && defined(__ANDROID__) && \
|
|
defined(__ARM_ARCH_7A__) && defined(HAVE_CPU_FEATURES_H)
|
|
#define WEBP_ANDROID_NEON // Android targets that may have NEON
|
|
#define WEBP_USE_NEON
|
|
#endif
|
|
|
|
// Note: ARM64 is supported in Visual Studio 2017, but requires the direct
|
|
// inclusion of arm64_neon.h; Visual Studio 2019 includes this file in
|
|
// arm_neon.h. Compile errors were seen with Visual Studio 2019 16.4 with
|
|
// vtbl4_u8(); a fix was made in 16.6.
|
|
#if defined(_MSC_VER) && \
|
|
((_MSC_VER >= 1700 && defined(_M_ARM)) || \
|
|
(_MSC_VER >= 1926 && (defined(_M_ARM64) || defined(_M_ARM64EC))))
|
|
#define WEBP_USE_NEON
|
|
#define WEBP_USE_INTRINSICS
|
|
#endif
|
|
|
|
#if defined(__aarch64__) || defined(_M_ARM64) || defined(_M_ARM64EC)
|
|
#define WEBP_AARCH64 1
|
|
#else
|
|
#define WEBP_AARCH64 0
|
|
#endif
|
|
|
|
#if defined(WEBP_USE_NEON) && !defined(WEBP_HAVE_NEON)
|
|
#define WEBP_HAVE_NEON
|
|
#endif
|
|
|
|
//------------------------------------------------------------------------------
|
|
// MIPS defines.
|
|
|
|
#if defined(__mips__) && !defined(__mips64) && defined(__mips_isa_rev) && \
|
|
(__mips_isa_rev >= 1) && (__mips_isa_rev < 6)
|
|
#define WEBP_USE_MIPS32
|
|
#if (__mips_isa_rev >= 2)
|
|
#define WEBP_USE_MIPS32_R2
|
|
#if defined(__mips_dspr2) || (defined(__mips_dsp_rev) && __mips_dsp_rev >= 2)
|
|
#define WEBP_USE_MIPS_DSP_R2
|
|
#endif
|
|
#endif
|
|
#endif
|
|
|
|
#if defined(__mips_msa) && defined(__mips_isa_rev) && (__mips_isa_rev >= 5)
|
|
#define WEBP_USE_MSA
|
|
#endif
|
|
|
|
//------------------------------------------------------------------------------
|
|
|
|
#ifndef WEBP_DSP_OMIT_C_CODE
|
|
#define WEBP_DSP_OMIT_C_CODE 1
|
|
#endif
|
|
|
|
#if defined(WEBP_USE_NEON) && WEBP_DSP_OMIT_C_CODE
|
|
#define WEBP_NEON_OMIT_C_CODE 1
|
|
#else
|
|
#define WEBP_NEON_OMIT_C_CODE 0
|
|
#endif
|
|
|
|
#if !(LOCAL_CLANG_PREREQ(3, 8) || LOCAL_GCC_PREREQ(4, 8) || WEBP_AARCH64)
|
|
#define WEBP_NEON_WORK_AROUND_GCC 1
|
|
#else
|
|
#define WEBP_NEON_WORK_AROUND_GCC 0
|
|
#endif
|
|
|
|
//------------------------------------------------------------------------------
|
|
|
|
// This macro prevents thread_sanitizer from reporting known concurrent writes.
|
|
#define WEBP_TSAN_IGNORE_FUNCTION
|
|
#if defined(__has_feature)
|
|
#if __has_feature(thread_sanitizer)
|
|
#undef WEBP_TSAN_IGNORE_FUNCTION
|
|
#define WEBP_TSAN_IGNORE_FUNCTION __attribute__((no_sanitize_thread))
|
|
#endif
|
|
#endif
|
|
|
|
#if defined(__has_feature)
|
|
#if __has_feature(memory_sanitizer)
|
|
#define WEBP_MSAN
|
|
#endif
|
|
#endif
|
|
|
|
#if defined(WEBP_USE_THREAD) && !defined(_WIN32)
|
|
#include <pthread.h> // NOLINT
|
|
|
|
#define WEBP_DSP_INIT(func) \
|
|
do { \
|
|
static volatile VP8CPUInfo func##_last_cpuinfo_used = \
|
|
(VP8CPUInfo)&func##_last_cpuinfo_used; \
|
|
static pthread_mutex_t func##_lock = PTHREAD_MUTEX_INITIALIZER; \
|
|
if (pthread_mutex_lock(&func##_lock)) break; \
|
|
if (func##_last_cpuinfo_used != VP8GetCPUInfo) func(); \
|
|
func##_last_cpuinfo_used = VP8GetCPUInfo; \
|
|
(void)pthread_mutex_unlock(&func##_lock); \
|
|
} while (0)
|
|
#else // !(defined(WEBP_USE_THREAD) && !defined(_WIN32))
|
|
#define WEBP_DSP_INIT(func) \
|
|
do { \
|
|
static volatile VP8CPUInfo func##_last_cpuinfo_used = \
|
|
(VP8CPUInfo)&func##_last_cpuinfo_used; \
|
|
if (func##_last_cpuinfo_used == VP8GetCPUInfo) break; \
|
|
func(); \
|
|
func##_last_cpuinfo_used = VP8GetCPUInfo; \
|
|
} while (0)
|
|
#endif // defined(WEBP_USE_THREAD) && !defined(_WIN32)
|
|
|
|
// Defines an Init + helper function that control multiple initialization of
|
|
// function pointers / tables.
|
|
/* Usage:
|
|
WEBP_DSP_INIT_FUNC(InitFunc) {
|
|
...function body
|
|
}
|
|
*/
|
|
#define WEBP_DSP_INIT_FUNC(name) \
|
|
static WEBP_TSAN_IGNORE_FUNCTION void name##_body(void); \
|
|
WEBP_TSAN_IGNORE_FUNCTION void name(void) { WEBP_DSP_INIT(name##_body); } \
|
|
static WEBP_TSAN_IGNORE_FUNCTION void name##_body(void)
|
|
|
|
#define WEBP_UBSAN_IGNORE_UNDEF
|
|
#define WEBP_UBSAN_IGNORE_UNSIGNED_OVERFLOW
|
|
#if defined(__clang__) && defined(__has_attribute)
|
|
#if __has_attribute(no_sanitize)
|
|
// This macro prevents the undefined behavior sanitizer from reporting
|
|
// failures. This is only meant to silence unaligned loads on platforms that
|
|
// are known to support them.
|
|
#undef WEBP_UBSAN_IGNORE_UNDEF
|
|
#define WEBP_UBSAN_IGNORE_UNDEF __attribute__((no_sanitize("undefined")))
|
|
|
|
// This macro prevents the undefined behavior sanitizer from reporting
|
|
// failures related to unsigned integer overflows. This is only meant to
|
|
// silence cases where this well defined behavior is expected.
|
|
#undef WEBP_UBSAN_IGNORE_UNSIGNED_OVERFLOW
|
|
#define WEBP_UBSAN_IGNORE_UNSIGNED_OVERFLOW \
|
|
__attribute__((no_sanitize("unsigned-integer-overflow")))
|
|
#endif
|
|
#endif
|
|
|
|
// If 'ptr' is NULL, returns NULL. Otherwise returns 'ptr + off'.
|
|
// Prevents undefined behavior sanitizer nullptr-with-nonzero-offset warning.
|
|
#if !defined(WEBP_OFFSET_PTR)
|
|
#define WEBP_OFFSET_PTR(ptr, off) (((ptr) == NULL) ? NULL : ((ptr) + (off)))
|
|
#endif
|
|
|
|
// Regularize the definition of WEBP_SWAP_16BIT_CSP (backward compatibility)
|
|
#if !defined(WEBP_SWAP_16BIT_CSP)
|
|
#define WEBP_SWAP_16BIT_CSP 0
|
|
#endif
|
|
|
|
// some endian fix (e.g.: mips-gcc doesn't define __BIG_ENDIAN__)
|
|
#if !defined(WORDS_BIGENDIAN) && \
|
|
(defined(__BIG_ENDIAN__) || defined(_M_PPC) || \
|
|
(defined(__BYTE_ORDER__) && (__BYTE_ORDER__ == __ORDER_BIG_ENDIAN__)))
|
|
#define WORDS_BIGENDIAN
|
|
#endif
|
|
|
|
typedef enum {
|
|
kSSE2,
|
|
kSSE3,
|
|
kSlowSSSE3, // special feature for slow SSSE3 architectures
|
|
kSSE4_1,
|
|
kAVX,
|
|
kAVX2,
|
|
kNEON,
|
|
kMIPS32,
|
|
kMIPSdspR2,
|
|
kMSA
|
|
} CPUFeature;
|
|
|
|
// returns true if the CPU supports the feature.
|
|
typedef int (*VP8CPUInfo)(CPUFeature feature);
|
|
|
|
#endif // WEBP_DSP_CPU_H_
|