2015-12-09 00:51:59 +00:00
|
|
|
/*===---- immintrin.h - Intel intrinsics -----------------------------------===
|
|
|
|
*
|
2019-07-19 20:50:45 +00:00
|
|
|
* Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
|
|
|
|
* See https://llvm.org/LICENSE.txt for license information.
|
|
|
|
* SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
|
2015-12-09 00:51:59 +00:00
|
|
|
*
|
|
|
|
*===-----------------------------------------------------------------------===
|
|
|
|
*/
|
|
|
|
|
|
|
|
#ifndef __IMMINTRIN_H
|
|
|
|
#define __IMMINTRIN_H
|
|
|
|
|
2022-02-03 21:18:29 +00:00
|
|
|
#if !defined(__i386__) && !defined(__x86_64__)
|
|
|
|
#error "This header is only meant to be used on x86 and x64 architecture"
|
|
|
|
#endif
|
|
|
|
|
2020-12-16 09:43:57 +00:00
|
|
|
#include <x86gprintrin.h>
|
|
|
|
|
2020-08-05 00:17:48 +00:00
|
|
|
#if !(defined(_MSC_VER) || defined(__SCE__)) || __has_feature(modules) || \
|
|
|
|
defined(__MMX__)
|
2015-12-09 00:51:59 +00:00
|
|
|
#include <mmintrin.h>
|
|
|
|
#endif
|
|
|
|
|
2020-08-05 00:17:48 +00:00
|
|
|
#if !(defined(_MSC_VER) || defined(__SCE__)) || __has_feature(modules) || \
|
|
|
|
defined(__SSE__)
|
2015-12-09 00:51:59 +00:00
|
|
|
#include <xmmintrin.h>
|
|
|
|
#endif
|
|
|
|
|
2020-08-05 00:17:48 +00:00
|
|
|
#if !(defined(_MSC_VER) || defined(__SCE__)) || __has_feature(modules) || \
|
|
|
|
defined(__SSE2__)
|
2015-12-09 00:51:59 +00:00
|
|
|
#include <emmintrin.h>
|
|
|
|
#endif
|
|
|
|
|
2020-08-05 00:17:48 +00:00
|
|
|
#if !(defined(_MSC_VER) || defined(__SCE__)) || __has_feature(modules) || \
|
|
|
|
defined(__SSE3__)
|
2015-12-09 00:51:59 +00:00
|
|
|
#include <pmmintrin.h>
|
|
|
|
#endif
|
|
|
|
|
2020-08-05 00:17:48 +00:00
|
|
|
#if !(defined(_MSC_VER) || defined(__SCE__)) || __has_feature(modules) || \
|
|
|
|
defined(__SSSE3__)
|
2015-12-09 00:51:59 +00:00
|
|
|
#include <tmmintrin.h>
|
|
|
|
#endif
|
|
|
|
|
2020-08-05 00:17:48 +00:00
|
|
|
#if !(defined(_MSC_VER) || defined(__SCE__)) || __has_feature(modules) || \
|
2017-06-16 18:35:00 +00:00
|
|
|
(defined(__SSE4_2__) || defined(__SSE4_1__))
|
2015-12-09 00:51:59 +00:00
|
|
|
#include <smmintrin.h>
|
|
|
|
#endif
|
|
|
|
|
2020-08-05 00:17:48 +00:00
|
|
|
#if !(defined(_MSC_VER) || defined(__SCE__)) || __has_feature(modules) || \
|
2017-06-16 18:35:00 +00:00
|
|
|
(defined(__AES__) || defined(__PCLMUL__))
|
2015-12-09 00:51:59 +00:00
|
|
|
#include <wmmintrin.h>
|
|
|
|
#endif
|
|
|
|
|
2020-08-05 00:17:48 +00:00
|
|
|
#if !(defined(_MSC_VER) || defined(__SCE__)) || __has_feature(modules) || \
|
|
|
|
defined(__CLFLUSHOPT__)
|
2017-06-16 18:35:00 +00:00
|
|
|
#include <clflushoptintrin.h>
|
|
|
|
#endif
|
|
|
|
|
2020-08-05 00:17:48 +00:00
|
|
|
#if !(defined(_MSC_VER) || defined(__SCE__)) || __has_feature(modules) || \
|
|
|
|
defined(__CLWB__)
|
2017-10-24 01:43:18 +00:00
|
|
|
#include <clwbintrin.h>
|
|
|
|
#endif
|
|
|
|
|
2020-08-05 00:17:48 +00:00
|
|
|
#if !(defined(_MSC_VER) || defined(__SCE__)) || __has_feature(modules) || \
|
|
|
|
defined(__AVX__)
|
2015-12-09 00:51:59 +00:00
|
|
|
#include <avxintrin.h>
|
|
|
|
#endif
|
|
|
|
|
2020-08-05 00:17:48 +00:00
|
|
|
#if !(defined(_MSC_VER) || defined(__SCE__)) || __has_feature(modules) || \
|
|
|
|
defined(__AVX2__)
|
2015-12-09 00:51:59 +00:00
|
|
|
#include <avx2intrin.h>
|
2018-08-05 06:20:05 +00:00
|
|
|
#endif
|
2015-12-09 00:51:59 +00:00
|
|
|
|
2020-08-05 00:17:48 +00:00
|
|
|
#if !(defined(_MSC_VER) || defined(__SCE__)) || __has_feature(modules) || \
|
|
|
|
defined(__F16C__)
|
2018-08-05 06:20:05 +00:00
|
|
|
#include <f16cintrin.h>
|
|
|
|
#endif
|
2017-06-16 18:35:00 +00:00
|
|
|
|
2020-01-22 22:42:02 +00:00
|
|
|
/* No feature check desired due to internal checks */
|
2015-12-09 00:51:59 +00:00
|
|
|
#include <bmiintrin.h>
|
|
|
|
|
2020-08-05 00:17:48 +00:00
|
|
|
#if !(defined(_MSC_VER) || defined(__SCE__)) || __has_feature(modules) || \
|
|
|
|
defined(__BMI2__)
|
2015-12-09 00:51:59 +00:00
|
|
|
#include <bmi2intrin.h>
|
|
|
|
#endif
|
|
|
|
|
2020-08-05 00:17:48 +00:00
|
|
|
#if !(defined(_MSC_VER) || defined(__SCE__)) || __has_feature(modules) || \
|
|
|
|
defined(__LZCNT__)
|
2015-12-09 00:51:59 +00:00
|
|
|
#include <lzcntintrin.h>
|
|
|
|
#endif
|
|
|
|
|
2020-08-05 00:17:48 +00:00
|
|
|
#if !(defined(_MSC_VER) || defined(__SCE__)) || __has_feature(modules) || \
|
|
|
|
defined(__POPCNT__)
|
2018-08-05 06:20:05 +00:00
|
|
|
#include <popcntintrin.h>
|
|
|
|
#endif
|
|
|
|
|
2020-08-05 00:17:48 +00:00
|
|
|
#if !(defined(_MSC_VER) || defined(__SCE__)) || __has_feature(modules) || \
|
|
|
|
defined(__FMA__)
|
2015-12-09 00:51:59 +00:00
|
|
|
#include <fmaintrin.h>
|
|
|
|
#endif
|
|
|
|
|
2020-08-05 00:17:48 +00:00
|
|
|
#if !(defined(_MSC_VER) || defined(__SCE__)) || __has_feature(modules) || \
|
|
|
|
defined(__AVX512F__)
|
2015-12-09 00:51:59 +00:00
|
|
|
#include <avx512fintrin.h>
|
|
|
|
#endif
|
|
|
|
|
2020-08-05 00:17:48 +00:00
|
|
|
#if !(defined(_MSC_VER) || defined(__SCE__)) || __has_feature(modules) || \
|
|
|
|
defined(__AVX512VL__)
|
2015-12-09 00:51:59 +00:00
|
|
|
#include <avx512vlintrin.h>
|
|
|
|
#endif
|
|
|
|
|
2020-08-05 00:17:48 +00:00
|
|
|
#if !(defined(_MSC_VER) || defined(__SCE__)) || __has_feature(modules) || \
|
|
|
|
defined(__AVX512BW__)
|
2015-12-09 00:51:59 +00:00
|
|
|
#include <avx512bwintrin.h>
|
|
|
|
#endif
|
|
|
|
|
2020-08-05 00:17:48 +00:00
|
|
|
#if !(defined(_MSC_VER) || defined(__SCE__)) || __has_feature(modules) || \
|
|
|
|
defined(__AVX512BITALG__)
|
2018-02-23 18:15:16 +00:00
|
|
|
#include <avx512bitalgintrin.h>
|
|
|
|
#endif
|
|
|
|
|
2020-08-05 00:17:48 +00:00
|
|
|
#if !(defined(_MSC_VER) || defined(__SCE__)) || __has_feature(modules) || \
|
|
|
|
defined(__AVX512CD__)
|
2015-12-09 00:51:59 +00:00
|
|
|
#include <avx512cdintrin.h>
|
|
|
|
#endif
|
|
|
|
|
2020-08-05 00:17:48 +00:00
|
|
|
#if !(defined(_MSC_VER) || defined(__SCE__)) || __has_feature(modules) || \
|
|
|
|
defined(__AVX512VPOPCNTDQ__)
|
2017-09-30 22:20:12 +00:00
|
|
|
#include <avx512vpopcntdqintrin.h>
|
|
|
|
#endif
|
|
|
|
|
2020-08-05 00:17:48 +00:00
|
|
|
#if !(defined(_MSC_VER) || defined(__SCE__)) || __has_feature(modules) || \
|
2018-02-23 18:15:16 +00:00
|
|
|
(defined(__AVX512VL__) && defined(__AVX512VPOPCNTDQ__))
|
|
|
|
#include <avx512vpopcntdqvlintrin.h>
|
|
|
|
#endif
|
|
|
|
|
2020-08-05 00:17:48 +00:00
|
|
|
#if !(defined(_MSC_VER) || defined(__SCE__)) || __has_feature(modules) || \
|
|
|
|
defined(__AVX512VNNI__)
|
2018-02-23 18:15:16 +00:00
|
|
|
#include <avx512vnniintrin.h>
|
|
|
|
#endif
|
|
|
|
|
2020-08-05 00:17:48 +00:00
|
|
|
#if !(defined(_MSC_VER) || defined(__SCE__)) || __has_feature(modules) || \
|
2018-02-23 18:15:16 +00:00
|
|
|
(defined(__AVX512VL__) && defined(__AVX512VNNI__))
|
|
|
|
#include <avx512vlvnniintrin.h>
|
|
|
|
#endif
|
|
|
|
|
2020-12-16 09:43:57 +00:00
|
|
|
#if !(defined(_MSC_VER) || defined(__SCE__)) || __has_feature(modules) || \
|
|
|
|
defined(__AVXVNNI__)
|
|
|
|
#include <avxvnniintrin.h>
|
|
|
|
#endif
|
|
|
|
|
2020-08-05 00:17:48 +00:00
|
|
|
#if !(defined(_MSC_VER) || defined(__SCE__)) || __has_feature(modules) || \
|
|
|
|
defined(__AVX512DQ__)
|
2015-12-09 00:51:59 +00:00
|
|
|
#include <avx512dqintrin.h>
|
|
|
|
#endif
|
|
|
|
|
2020-08-05 00:17:48 +00:00
|
|
|
#if !(defined(_MSC_VER) || defined(__SCE__)) || __has_feature(modules) || \
|
2018-02-23 18:15:16 +00:00
|
|
|
(defined(__AVX512VL__) && defined(__AVX512BITALG__))
|
|
|
|
#include <avx512vlbitalgintrin.h>
|
|
|
|
#endif
|
|
|
|
|
2020-08-05 00:17:48 +00:00
|
|
|
#if !(defined(_MSC_VER) || defined(__SCE__)) || __has_feature(modules) || \
|
2017-06-16 18:35:00 +00:00
|
|
|
(defined(__AVX512VL__) && defined(__AVX512BW__))
|
2015-12-09 00:51:59 +00:00
|
|
|
#include <avx512vlbwintrin.h>
|
|
|
|
#endif
|
|
|
|
|
2020-08-05 00:17:48 +00:00
|
|
|
#if !(defined(_MSC_VER) || defined(__SCE__)) || __has_feature(modules) || \
|
2017-06-16 18:35:00 +00:00
|
|
|
(defined(__AVX512VL__) && defined(__AVX512CD__))
|
|
|
|
#include <avx512vlcdintrin.h>
|
|
|
|
#endif
|
|
|
|
|
2020-08-05 00:17:48 +00:00
|
|
|
#if !(defined(_MSC_VER) || defined(__SCE__)) || __has_feature(modules) || \
|
2017-06-16 18:35:00 +00:00
|
|
|
(defined(__AVX512VL__) && defined(__AVX512DQ__))
|
2015-12-09 00:51:59 +00:00
|
|
|
#include <avx512vldqintrin.h>
|
|
|
|
#endif
|
|
|
|
|
2020-08-05 00:17:48 +00:00
|
|
|
#if !(defined(_MSC_VER) || defined(__SCE__)) || __has_feature(modules) || \
|
|
|
|
defined(__AVX512ER__)
|
2015-12-09 00:51:59 +00:00
|
|
|
#include <avx512erintrin.h>
|
|
|
|
#endif
|
|
|
|
|
2020-08-05 00:17:48 +00:00
|
|
|
#if !(defined(_MSC_VER) || defined(__SCE__)) || __has_feature(modules) || \
|
|
|
|
defined(__AVX512IFMA__)
|
2017-06-16 18:35:00 +00:00
|
|
|
#include <avx512ifmaintrin.h>
|
|
|
|
#endif
|
|
|
|
|
2020-08-05 00:17:48 +00:00
|
|
|
#if !(defined(_MSC_VER) || defined(__SCE__)) || __has_feature(modules) || \
|
2017-06-16 18:35:00 +00:00
|
|
|
(defined(__AVX512IFMA__) && defined(__AVX512VL__))
|
|
|
|
#include <avx512ifmavlintrin.h>
|
|
|
|
#endif
|
|
|
|
|
2023-01-26 20:15:35 +00:00
|
|
|
#if !(defined(_MSC_VER) || defined(__SCE__)) || __has_feature(modules) || \
|
|
|
|
defined(__AVXIFMA__)
|
|
|
|
#include <avxifmaintrin.h>
|
|
|
|
#endif
|
|
|
|
|
2020-08-05 00:17:48 +00:00
|
|
|
#if !(defined(_MSC_VER) || defined(__SCE__)) || __has_feature(modules) || \
|
|
|
|
defined(__AVX512VBMI__)
|
2017-06-16 18:35:00 +00:00
|
|
|
#include <avx512vbmiintrin.h>
|
|
|
|
#endif
|
|
|
|
|
2020-08-05 00:17:48 +00:00
|
|
|
#if !(defined(_MSC_VER) || defined(__SCE__)) || __has_feature(modules) || \
|
2017-06-16 18:35:00 +00:00
|
|
|
(defined(__AVX512VBMI__) && defined(__AVX512VL__))
|
|
|
|
#include <avx512vbmivlintrin.h>
|
|
|
|
#endif
|
|
|
|
|
2020-08-05 00:17:48 +00:00
|
|
|
#if !(defined(_MSC_VER) || defined(__SCE__)) || __has_feature(modules) || \
|
|
|
|
defined(__AVX512VBMI2__)
|
2018-02-23 18:15:16 +00:00
|
|
|
#include <avx512vbmi2intrin.h>
|
|
|
|
#endif
|
|
|
|
|
2020-08-05 00:17:48 +00:00
|
|
|
#if !(defined(_MSC_VER) || defined(__SCE__)) || __has_feature(modules) || \
|
2018-02-23 18:15:16 +00:00
|
|
|
(defined(__AVX512VBMI2__) && defined(__AVX512VL__))
|
|
|
|
#include <avx512vlvbmi2intrin.h>
|
|
|
|
#endif
|
|
|
|
|
2020-08-05 00:17:48 +00:00
|
|
|
#if !(defined(_MSC_VER) || defined(__SCE__)) || __has_feature(modules) || \
|
|
|
|
defined(__AVX512PF__)
|
2017-06-16 18:35:00 +00:00
|
|
|
#include <avx512pfintrin.h>
|
|
|
|
#endif
|
|
|
|
|
2023-01-26 20:15:35 +00:00
|
|
|
#if !(defined(_MSC_VER) || defined(__SCE__)) || __has_feature(modules) || \
|
|
|
|
defined(__AVX512FP16__)
|
2022-02-03 21:18:29 +00:00
|
|
|
#include <avx512fp16intrin.h>
|
|
|
|
#endif
|
|
|
|
|
2023-01-26 20:15:35 +00:00
|
|
|
#if !(defined(_MSC_VER) || defined(__SCE__)) || __has_feature(modules) || \
|
|
|
|
(defined(__AVX512VL__) && defined(__AVX512FP16__))
|
2022-02-03 21:18:29 +00:00
|
|
|
#include <avx512vlfp16intrin.h>
|
|
|
|
#endif
|
|
|
|
|
2020-08-05 00:17:48 +00:00
|
|
|
#if !(defined(_MSC_VER) || defined(__SCE__)) || __has_feature(modules) || \
|
|
|
|
defined(__AVX512BF16__)
|
2019-07-19 20:50:45 +00:00
|
|
|
#include <avx512bf16intrin.h>
|
|
|
|
#endif
|
|
|
|
|
2020-08-05 00:17:48 +00:00
|
|
|
#if !(defined(_MSC_VER) || defined(__SCE__)) || __has_feature(modules) || \
|
2019-07-19 20:50:45 +00:00
|
|
|
(defined(__AVX512VL__) && defined(__AVX512BF16__))
|
|
|
|
#include <avx512vlbf16intrin.h>
|
|
|
|
#endif
|
|
|
|
|
2020-08-05 00:17:48 +00:00
|
|
|
#if !(defined(_MSC_VER) || defined(__SCE__)) || __has_feature(modules) || \
|
|
|
|
defined(__PKU__)
|
2017-06-16 18:35:00 +00:00
|
|
|
#include <pkuintrin.h>
|
|
|
|
#endif
|
|
|
|
|
2021-08-16 01:00:10 +00:00
|
|
|
#if !(defined(_MSC_VER) || defined(__SCE__)) || __has_feature(modules) || \
|
|
|
|
defined(__VPCLMULQDQ__)
|
|
|
|
#include <vpclmulqdqintrin.h>
|
|
|
|
#endif
|
|
|
|
|
2020-08-05 00:17:48 +00:00
|
|
|
#if !(defined(_MSC_VER) || defined(__SCE__)) || __has_feature(modules) || \
|
|
|
|
defined(__VAES__)
|
2018-02-23 18:15:16 +00:00
|
|
|
#include <vaesintrin.h>
|
|
|
|
#endif
|
|
|
|
|
2020-08-05 00:17:48 +00:00
|
|
|
#if !(defined(_MSC_VER) || defined(__SCE__)) || __has_feature(modules) || \
|
|
|
|
defined(__GFNI__)
|
2018-02-23 18:15:16 +00:00
|
|
|
#include <gfniintrin.h>
|
|
|
|
#endif
|
|
|
|
|
2023-01-26 20:15:35 +00:00
|
|
|
#if !(defined(_MSC_VER) || defined(__SCE__)) || __has_feature(modules) || \
|
|
|
|
defined(__AVXVNNIINT8__)
|
|
|
|
#include <avxvnniint8intrin.h>
|
|
|
|
#endif
|
|
|
|
|
|
|
|
#if !(defined(_MSC_VER) || defined(__SCE__)) || __has_feature(modules) || \
|
|
|
|
defined(__AVXNECONVERT__)
|
|
|
|
#include <avxneconvertintrin.h>
|
|
|
|
#endif
|
|
|
|
|
2023-08-11 23:20:14 +00:00
|
|
|
#if !(defined(_MSC_VER) || defined(__SCE__)) || __has_feature(modules) || \
|
|
|
|
defined(__SHA512__)
|
|
|
|
#include <sha512intrin.h>
|
|
|
|
#endif
|
|
|
|
|
|
|
|
#if !(defined(_MSC_VER) || defined(__SCE__)) || __has_feature(modules) || \
|
|
|
|
defined(__SM3__)
|
|
|
|
#include <sm3intrin.h>
|
|
|
|
#endif
|
|
|
|
|
|
|
|
#if !(defined(_MSC_VER) || defined(__SCE__)) || __has_feature(modules) || \
|
|
|
|
defined(__SM4__)
|
|
|
|
#include <sm4intrin.h>
|
|
|
|
#endif
|
|
|
|
|
|
|
|
#if !(defined(_MSC_VER) || defined(__SCE__)) || __has_feature(modules) || \
|
|
|
|
defined(__AVXVNNIINT16__)
|
|
|
|
#include <avxvnniint16intrin.h>
|
|
|
|
#endif
|
|
|
|
|
2020-08-05 00:17:48 +00:00
|
|
|
#if !(defined(_MSC_VER) || defined(__SCE__)) || __has_feature(modules) || \
|
|
|
|
defined(__RDPID__)
|
2024-04-25 21:59:29 +00:00
|
|
|
/// Reads the value of the IA32_TSC_AUX MSR (0xc0000103).
///
/// \headerfile <immintrin.h>
///
/// This intrinsic corresponds to the <c> RDPID </c> instruction.
///
/// \returns The 32-bit contents of the MSR.
static __inline__ unsigned int __attribute__((__always_inline__, __nodebug__, __target__("rdpid")))
_rdpid_u32(void) {
  return __builtin_ia32_rdpid();
}
|
|
|
|
#endif // __RDPID__
|
|
|
|
|
2020-08-05 00:17:48 +00:00
|
|
|
#if !(defined(_MSC_VER) || defined(__SCE__)) || __has_feature(modules) || \
|
|
|
|
defined(__RDRND__)
|
2023-08-11 23:20:14 +00:00
|
|
|
/// Returns a 16-bit hardware-generated random value.
///
/// \headerfile <immintrin.h>
///
/// This intrinsic corresponds to the <c> RDRAND </c> instruction.
///
/// \param __p
///    A pointer to a 16-bit memory location to place the random value.
/// \returns 1 if the value was successfully generated, 0 otherwise.
static __inline__ int __attribute__((__always_inline__, __nodebug__, __target__("rdrnd")))
_rdrand16_step(unsigned short *__p)
{
  /* The builtin stores the value through __p and yields the status. */
  return (int)__builtin_ia32_rdrand16_step(__p);
}
|
|
|
|
|
2023-08-11 23:20:14 +00:00
|
|
|
/// Returns a 32-bit hardware-generated random value.
///
/// \headerfile <immintrin.h>
///
/// This intrinsic corresponds to the <c> RDRAND </c> instruction.
///
/// \param __p
///    A pointer to a 32-bit memory location to place the random value.
/// \returns 1 if the value was successfully generated, 0 otherwise.
static __inline__ int __attribute__((__always_inline__, __nodebug__, __target__("rdrnd")))
_rdrand32_step(unsigned int *__p)
{
  /* The builtin stores the value through __p and yields the status. */
  return (int)__builtin_ia32_rdrand32_step(__p);
}
|
|
|
|
|
2023-08-11 23:20:14 +00:00
|
|
|
/// Returns a 64-bit hardware-generated random value.
///
/// \headerfile <immintrin.h>
///
/// This intrinsic corresponds to the <c> RDRAND </c> instruction.
///
/// When not compiling for x86-64, the 64-bit value is assembled from two
/// 32-bit <c> RDRAND </c> reads; if either read fails, 0 is stored to the
/// destination and 0 is returned.
///
/// \param __p
///    A pointer to a 64-bit memory location to place the random value.
/// \returns 1 if the value was successfully generated, 0 otherwise.
static __inline__ int __attribute__((__always_inline__, __nodebug__, __target__("rdrnd")))
_rdrand64_step(unsigned long long *__p)
{
#ifdef __x86_64__
  return (int)__builtin_ia32_rdrand64_step(__p);
#else
  // We need to emulate the functionality of 64-bit rdrand with 2 32-bit
  // rdrand instructions. Both reads are issued unconditionally; the result is
  // only reported as valid when both of them succeeded.
  unsigned int __lo, __hi;
  unsigned int __res_lo = __builtin_ia32_rdrand32_step(&__lo);
  unsigned int __res_hi = __builtin_ia32_rdrand32_step(&__hi);
  if (__res_lo && __res_hi) {
    *__p = ((unsigned long long)__hi << 32) | (unsigned long long)__lo;
    return 1;
  }
  // At least one half failed: hand back a zeroed destination and a failure
  // status.
  *__p = 0;
  return 0;
#endif
}
|
2017-09-30 22:20:12 +00:00
|
|
|
#endif /* __RDRND__ */
|
|
|
|
|
2020-08-05 00:17:48 +00:00
|
|
|
#if !(defined(_MSC_VER) || defined(__SCE__)) || __has_feature(modules) || \
|
|
|
|
defined(__FSGSBASE__)
|
2015-12-09 00:51:59 +00:00
|
|
|
#ifdef __x86_64__
|
2023-08-11 23:20:14 +00:00
|
|
|
/// Reads the FS base register.
///
/// \headerfile <immintrin.h>
///
/// This intrinsic corresponds to the <c> RDFSBASE </c> instruction.
///
/// \returns The lower 32 bits of the FS base register.
static __inline__ unsigned int __attribute__((__always_inline__, __nodebug__, __target__("fsgsbase")))
_readfsbase_u32(void)
{
  return __builtin_ia32_rdfsbase32();
}
|
|
|
|
|
2023-08-11 23:20:14 +00:00
|
|
|
/// Reads the FS base register.
///
/// \headerfile <immintrin.h>
///
/// This intrinsic corresponds to the <c> RDFSBASE </c> instruction.
///
/// \returns The contents of the FS base register.
static __inline__ unsigned long long __attribute__((__always_inline__, __nodebug__, __target__("fsgsbase")))
_readfsbase_u64(void)
{
  return __builtin_ia32_rdfsbase64();
}
|
|
|
|
|
2023-08-11 23:20:14 +00:00
|
|
|
/// Reads the GS base register.
///
/// \headerfile <immintrin.h>
///
/// This intrinsic corresponds to the <c> RDGSBASE </c> instruction.
///
/// \returns The lower 32 bits of the GS base register.
static __inline__ unsigned int __attribute__((__always_inline__, __nodebug__, __target__("fsgsbase")))
_readgsbase_u32(void)
{
  return __builtin_ia32_rdgsbase32();
}
|
|
|
|
|
2023-08-11 23:20:14 +00:00
|
|
|
/// Reads the GS base register.
///
/// \headerfile <immintrin.h>
///
/// This intrinsic corresponds to the <c> RDGSBASE </c> instruction.
///
/// \returns The contents of the GS base register.
static __inline__ unsigned long long __attribute__((__always_inline__, __nodebug__, __target__("fsgsbase")))
_readgsbase_u64(void)
{
  return __builtin_ia32_rdgsbase64();
}
|
|
|
|
|
2023-08-11 23:20:14 +00:00
|
|
|
/// Modifies the FS base register.
///
/// \headerfile <immintrin.h>
///
/// This intrinsic corresponds to the <c> WRFSBASE </c> instruction.
///
/// \param __V
///    Value to use for the lower 32 bits of the FS base register.
static __inline__ void __attribute__((__always_inline__, __nodebug__, __target__("fsgsbase")))
_writefsbase_u32(unsigned int __V)
{
  __builtin_ia32_wrfsbase32(__V);
}
|
|
|
|
|
2023-08-11 23:20:14 +00:00
|
|
|
/// Modifies the FS base register.
///
/// \headerfile <immintrin.h>
///
/// This intrinsic corresponds to the <c> WRFSBASE </c> instruction.
///
/// \param __V
///    Value to use for the FS base register.
static __inline__ void __attribute__((__always_inline__, __nodebug__, __target__("fsgsbase")))
_writefsbase_u64(unsigned long long __V)
{
  __builtin_ia32_wrfsbase64(__V);
}
|
|
|
|
|
2023-08-11 23:20:14 +00:00
|
|
|
/// Modifies the GS base register.
///
/// \headerfile <immintrin.h>
///
/// This intrinsic corresponds to the <c> WRGSBASE </c> instruction.
///
/// \param __V
///    Value to use for the lower 32 bits of the GS base register.
static __inline__ void __attribute__((__always_inline__, __nodebug__, __target__("fsgsbase")))
_writegsbase_u32(unsigned int __V)
{
  __builtin_ia32_wrgsbase32(__V);
}
|
|
|
|
|
2023-08-11 23:20:14 +00:00
|
|
|
/// Modifies the GS base register.
///
/// \headerfile <immintrin.h>
///
/// This intrinsic corresponds to the <c> WRGSBASE </c> instruction.
///
/// \param __V
///    Value to use for the GS base register.
static __inline__ void __attribute__((__always_inline__, __nodebug__, __target__("fsgsbase")))
_writegsbase_u64(unsigned long long __V)
{
  __builtin_ia32_wrgsbase64(__V);
}
|
2017-06-16 18:35:00 +00:00
|
|
|
|
2015-12-09 00:51:59 +00:00
|
|
|
#endif
|
|
|
|
#endif /* __FSGSBASE__ */
|
|
|
|
|
2020-08-05 00:17:48 +00:00
|
|
|
#if !(defined(_MSC_VER) || defined(__SCE__)) || __has_feature(modules) || \
|
|
|
|
defined(__MOVBE__)
|
2019-02-07 23:49:42 +00:00
|
|
|
|
|
|
|
/* The structs used below force the load/store to be unaligned. This is
 * accomplished with the __packed__ attribute. The __may_alias__ attribute
 * prevents TBAA metadata from being generated based on the struct and the type
 * of the field inside of it.
 */
|
|
|
|
|
2024-04-25 21:59:29 +00:00
|
|
|
/// Load a 16-bit value from memory and swap its bytes.
///
/// \headerfile <x86intrin.h>
///
/// This intrinsic corresponds to the <c> MOVBE </c> instruction.
///
/// \param __P
///    A pointer to the 16-bit value to load.
/// \returns The byte-swapped value.
static __inline__ short __attribute__((__always_inline__, __nodebug__, __target__("movbe")))
_loadbe_i16(void const * __P) {
  /* __packed__ makes the access through this wrapper unaligned;
   * __may_alias__ keeps TBAA metadata from being derived from it. */
  struct __loadu_i16 {
    unsigned short __v;
  } __attribute__((__packed__, __may_alias__));
  return (short)__builtin_bswap16(((const struct __loadu_i16*)__P)->__v);
}
|
|
|
|
|
2024-04-25 21:59:29 +00:00
|
|
|
/// Swap the bytes of a 16-bit value and store it to memory.
///
/// \headerfile <x86intrin.h>
///
/// This intrinsic corresponds to the <c> MOVBE </c> instruction.
///
/// \param __P
///    A pointer to the memory for storing the swapped value.
/// \param __D
///    The 16-bit value to be byte-swapped.
static __inline__ void __attribute__((__always_inline__, __nodebug__, __target__("movbe")))
_storebe_i16(void * __P, short __D) {
  /* __packed__ makes the access through this wrapper unaligned;
   * __may_alias__ keeps TBAA metadata from being derived from it. */
  struct __storeu_i16 {
    unsigned short __v;
  } __attribute__((__packed__, __may_alias__));
  ((struct __storeu_i16*)__P)->__v = __builtin_bswap16((unsigned short)__D);
}
|
|
|
|
|
2024-04-25 21:59:29 +00:00
|
|
|
/// Load a 32-bit value from memory and swap its bytes.
///
/// \headerfile <x86intrin.h>
///
/// This intrinsic corresponds to the <c> MOVBE </c> instruction.
///
/// \param __P
///    A pointer to the 32-bit value to load.
/// \returns The byte-swapped value.
static __inline__ int __attribute__((__always_inline__, __nodebug__, __target__("movbe")))
_loadbe_i32(void const * __P) {
  /* __packed__ makes the access through this wrapper unaligned;
   * __may_alias__ keeps TBAA metadata from being derived from it. */
  struct __loadu_i32 {
    unsigned int __v;
  } __attribute__((__packed__, __may_alias__));
  return (int)__builtin_bswap32(((const struct __loadu_i32*)__P)->__v);
}
|
|
|
|
|
2024-04-25 21:59:29 +00:00
|
|
|
/// Swap the bytes of a 32-bit value and store it to memory.
///
/// \headerfile <x86intrin.h>
///
/// This intrinsic corresponds to the <c> MOVBE </c> instruction.
///
/// \param __P
///    A pointer to the memory for storing the swapped value.
/// \param __D
///    The 32-bit value to be byte-swapped.
static __inline__ void __attribute__((__always_inline__, __nodebug__, __target__("movbe")))
_storebe_i32(void * __P, int __D) {
  /* __packed__ makes the access through this wrapper unaligned;
   * __may_alias__ keeps TBAA metadata from being derived from it. */
  struct __storeu_i32 {
    unsigned int __v;
  } __attribute__((__packed__, __may_alias__));
  ((struct __storeu_i32*)__P)->__v = __builtin_bswap32((unsigned int)__D);
}
|
|
|
|
|
|
|
|
#ifdef __x86_64__
|
2024-04-25 21:59:29 +00:00
|
|
|
/// Load a 64-bit value from memory and swap its bytes.
///
/// \headerfile <x86intrin.h>
///
/// This intrinsic corresponds to the <c> MOVBE </c> instruction.
///
/// \param __P
///    A pointer to the 64-bit value to load.
/// \returns The byte-swapped value.
static __inline__ long long __attribute__((__always_inline__, __nodebug__, __target__("movbe")))
_loadbe_i64(void const * __P) {
  /* __packed__ makes the access through this wrapper unaligned;
   * __may_alias__ keeps TBAA metadata from being derived from it. */
  struct __loadu_i64 {
    unsigned long long __v;
  } __attribute__((__packed__, __may_alias__));
  return (long long)__builtin_bswap64(((const struct __loadu_i64*)__P)->__v);
}
|
|
|
|
|
2024-04-25 21:59:29 +00:00
|
|
|
/// Swap the bytes of a 64-bit value and store it to memory.
///
/// \headerfile <x86intrin.h>
///
/// This intrinsic corresponds to the <c> MOVBE </c> instruction.
///
/// \param __P
///    A pointer to the memory for storing the swapped value.
/// \param __D
///    The 64-bit value to be byte-swapped.
static __inline__ void __attribute__((__always_inline__, __nodebug__, __target__("movbe")))
_storebe_i64(void * __P, long long __D) {
  /* __packed__ makes the access through this wrapper unaligned;
   * __may_alias__ keeps TBAA metadata from being derived from it. */
  struct __storeu_i64 {
    unsigned long long __v;
  } __attribute__((__packed__, __may_alias__));
  ((struct __storeu_i64*)__P)->__v = __builtin_bswap64((unsigned long long)__D);
}
|
|
|
|
#endif
|
|
|
|
#endif /* __MOVBE__ */
|
|
|
|
|
2020-08-05 00:17:48 +00:00
|
|
|
#if !(defined(_MSC_VER) || defined(__SCE__)) || __has_feature(modules) || \
|
|
|
|
defined(__RTM__)
|
2015-12-09 00:51:59 +00:00
|
|
|
#include <rtmintrin.h>
|
|
|
|
#include <xtestintrin.h>
|
|
|
|
#endif
|
|
|
|
|
2020-08-05 00:17:48 +00:00
|
|
|
#if !(defined(_MSC_VER) || defined(__SCE__)) || __has_feature(modules) || \
|
|
|
|
defined(__SHA__)
|
2015-12-09 00:51:59 +00:00
|
|
|
#include <shaintrin.h>
|
|
|
|
#endif
|
|
|
|
|
2020-08-05 00:17:48 +00:00
|
|
|
#if !(defined(_MSC_VER) || defined(__SCE__)) || __has_feature(modules) || \
|
|
|
|
defined(__FXSR__)
|
2015-12-09 00:51:59 +00:00
|
|
|
#include <fxsrintrin.h>
|
2017-06-16 18:35:00 +00:00
|
|
|
#endif
|
|
|
|
|
2019-07-19 20:50:45 +00:00
|
|
|
/* No feature check desired due to internal MSC_VER checks */
|
2017-06-16 18:35:00 +00:00
|
|
|
#include <xsaveintrin.h>
|
|
|
|
|
2020-08-05 00:17:48 +00:00
|
|
|
#if !(defined(_MSC_VER) || defined(__SCE__)) || __has_feature(modules) || \
|
|
|
|
defined(__XSAVEOPT__)
|
2017-06-16 18:35:00 +00:00
|
|
|
#include <xsaveoptintrin.h>
|
|
|
|
#endif
|
|
|
|
|
2020-08-05 00:17:48 +00:00
|
|
|
#if !(defined(_MSC_VER) || defined(__SCE__)) || __has_feature(modules) || \
|
|
|
|
defined(__XSAVEC__)
|
2017-06-16 18:35:00 +00:00
|
|
|
#include <xsavecintrin.h>
|
|
|
|
#endif
|
|
|
|
|
2020-08-05 00:17:48 +00:00
|
|
|
#if !(defined(_MSC_VER) || defined(__SCE__)) || __has_feature(modules) || \
|
|
|
|
defined(__XSAVES__)
|
2017-06-16 18:35:00 +00:00
|
|
|
#include <xsavesintrin.h>
|
|
|
|
#endif
|
2015-12-09 00:51:59 +00:00
|
|
|
|
2020-08-05 00:17:48 +00:00
|
|
|
#if !(defined(_MSC_VER) || defined(__SCE__)) || __has_feature(modules) || \
|
|
|
|
defined(__SHSTK__)
|
2018-02-23 18:15:16 +00:00
|
|
|
#include <cetintrin.h>
|
|
|
|
#endif
|
|
|
|
|
2024-04-25 21:59:29 +00:00
|
|
|
/* Intrinsics inside adcintrin.h are available at all times. */
|
|
|
|
#include <adcintrin.h>
|
|
|
|
|
|
|
|
#if !(defined(_MSC_VER) || defined(__SCE__)) || __has_feature(modules) || \
|
|
|
|
defined(__ADX__)
|
2015-12-09 00:51:59 +00:00
|
|
|
#include <adxintrin.h>
|
2024-04-25 21:59:29 +00:00
|
|
|
#endif
|
2015-12-09 00:51:59 +00:00
|
|
|
|
2020-08-05 00:17:48 +00:00
|
|
|
#if !(defined(_MSC_VER) || defined(__SCE__)) || __has_feature(modules) || \
|
|
|
|
defined(__RDSEED__)
|
2018-08-05 06:20:05 +00:00
|
|
|
#include <rdseedintrin.h>
|
|
|
|
#endif
|
|
|
|
|
2020-08-05 00:17:48 +00:00
|
|
|
#if !(defined(_MSC_VER) || defined(__SCE__)) || __has_feature(modules) || \
|
|
|
|
defined(__WBNOINVD__)
|
2018-08-05 06:20:05 +00:00
|
|
|
#include <wbnoinvdintrin.h>
|
|
|
|
#endif
|
|
|
|
|
2020-08-05 00:17:48 +00:00
|
|
|
#if !(defined(_MSC_VER) || defined(__SCE__)) || __has_feature(modules) || \
|
|
|
|
defined(__CLDEMOTE__)
|
2018-08-05 06:20:05 +00:00
|
|
|
#include <cldemoteintrin.h>
|
|
|
|
#endif
|
|
|
|
|
2020-08-05 00:17:48 +00:00
|
|
|
#if !(defined(_MSC_VER) || defined(__SCE__)) || __has_feature(modules) || \
|
|
|
|
defined(__WAITPKG__)
|
2018-08-05 06:20:05 +00:00
|
|
|
#include <waitpkgintrin.h>
|
|
|
|
#endif
|
|
|
|
|
2020-08-05 00:17:48 +00:00
|
|
|
#if !(defined(_MSC_VER) || defined(__SCE__)) || __has_feature(modules) || \
|
|
|
|
defined(__MOVDIRI__) || defined(__MOVDIR64B__)
|
2018-08-05 06:20:05 +00:00
|
|
|
#include <movdirintrin.h>
|
|
|
|
#endif
|
|
|
|
|
2020-08-05 00:17:48 +00:00
|
|
|
#if !(defined(_MSC_VER) || defined(__SCE__)) || __has_feature(modules) || \
|
|
|
|
defined(__PCONFIG__)
|
2018-08-05 06:20:05 +00:00
|
|
|
#include <pconfigintrin.h>
|
|
|
|
#endif
|
|
|
|
|
2020-08-05 00:17:48 +00:00
|
|
|
#if !(defined(_MSC_VER) || defined(__SCE__)) || __has_feature(modules) || \
|
|
|
|
defined(__SGX__)
|
2018-08-05 06:20:05 +00:00
|
|
|
#include <sgxintrin.h>
|
|
|
|
#endif
|
|
|
|
|
2020-08-05 00:17:48 +00:00
|
|
|
#if !(defined(_MSC_VER) || defined(__SCE__)) || __has_feature(modules) || \
|
|
|
|
defined(__PTWRITE__)
|
2018-08-05 06:20:05 +00:00
|
|
|
#include <ptwriteintrin.h>
|
|
|
|
#endif
|
|
|
|
|
2020-08-05 00:17:48 +00:00
|
|
|
#if !(defined(_MSC_VER) || defined(__SCE__)) || __has_feature(modules) || \
|
|
|
|
defined(__INVPCID__)
|
2018-08-05 06:20:05 +00:00
|
|
|
#include <invpcidintrin.h>
|
|
|
|
#endif
|
2023-01-26 20:15:35 +00:00
|
|
|
#if !(defined(_MSC_VER) || defined(__SCE__)) || __has_feature(modules) || \
|
2023-03-18 23:01:09 +00:00
|
|
|
defined(__AMX_FP16__)
|
2023-01-26 20:15:35 +00:00
|
|
|
#include <amxfp16intrin.h>
|
|
|
|
#endif
|
2018-08-05 06:20:05 +00:00
|
|
|
|
2020-12-16 09:43:57 +00:00
|
|
|
#if !(defined(_MSC_VER) || defined(__SCE__)) || __has_feature(modules) || \
|
|
|
|
defined(__KL__) || defined(__WIDEKL__)
|
|
|
|
#include <keylockerintrin.h>
|
|
|
|
#endif
|
|
|
|
|
2020-08-05 00:17:48 +00:00
|
|
|
#if !(defined(_MSC_VER) || defined(__SCE__)) || __has_feature(modules) || \
|
2023-03-18 23:01:09 +00:00
|
|
|
defined(__AMX_TILE__) || defined(__AMX_INT8__) || defined(__AMX_BF16__)
|
2020-08-05 00:17:48 +00:00
|
|
|
#include <amxintrin.h>
|
|
|
|
#endif
|
|
|
|
|
2023-08-11 23:20:14 +00:00
|
|
|
#if !(defined(_MSC_VER) || defined(__SCE__)) || __has_feature(modules) || \
|
|
|
|
defined(__AMX_COMPLEX__)
|
|
|
|
#include <amxcomplexintrin.h>
|
|
|
|
#endif
|
|
|
|
|
2020-08-05 00:17:48 +00:00
|
|
|
#if !(defined(_MSC_VER) || defined(__SCE__)) || __has_feature(modules) || \
|
|
|
|
defined(__AVX512VP2INTERSECT__)
|
2019-07-19 20:50:45 +00:00
|
|
|
#include <avx512vp2intersectintrin.h>
|
|
|
|
#endif
|
|
|
|
|
2020-08-05 00:17:48 +00:00
|
|
|
#if !(defined(_MSC_VER) || defined(__SCE__)) || __has_feature(modules) || \
|
|
|
|
(defined(__AVX512VL__) && defined(__AVX512VP2INTERSECT__))
|
2019-07-19 20:50:45 +00:00
|
|
|
#include <avx512vlvp2intersectintrin.h>
|
|
|
|
#endif
|
|
|
|
|
2020-08-05 00:17:48 +00:00
|
|
|
#if !(defined(_MSC_VER) || defined(__SCE__)) || __has_feature(modules) || \
|
|
|
|
defined(__ENQCMD__)
|
2019-07-19 20:50:45 +00:00
|
|
|
#include <enqcmdintrin.h>
|
|
|
|
#endif
|
|
|
|
|
2020-08-05 00:17:48 +00:00
|
|
|
#if !(defined(_MSC_VER) || defined(__SCE__)) || __has_feature(modules) || \
|
|
|
|
defined(__SERIALIZE__)
|
|
|
|
#include <serializeintrin.h>
|
|
|
|
#endif
|
|
|
|
|
|
|
|
#if !(defined(_MSC_VER) || defined(__SCE__)) || __has_feature(modules) || \
|
|
|
|
defined(__TSXLDTRK__)
|
|
|
|
#include <tsxldtrkintrin.h>
|
|
|
|
#endif
|
|
|
|
|
2019-07-19 20:50:45 +00:00
|
|
|
#if defined(_MSC_VER) && __has_extension(gnu_asm)
|
2018-08-05 06:20:05 +00:00
|
|
|
/* Define the default attributes for these intrinsics */
|
|
|
|
/* Attribute set attached to each static inline helper defined in this
 * MSVC-compatibility section: always inline the helper into its caller and
 * mark it __nodebug__. The macro is local to this section and is #undef'd
 * once the helpers have been defined. */
#define __DEFAULT_FN_ATTRS __attribute__((__always_inline__, __nodebug__))
|
|
|
|
#ifdef __cplusplus
|
|
|
|
extern "C" {
|
|
|
|
#endif
|
|
|
|
/*----------------------------------------------------------------------------*\
|
|
|
|
|* Interlocked Exchange HLE
|
|
|
|
\*----------------------------------------------------------------------------*/
|
|
|
|
#if defined(__i386__) || defined(__x86_64__)
|
|
|
|
static __inline__ long __DEFAULT_FN_ATTRS
|
|
|
|
_InterlockedExchange_HLEAcquire(long volatile *_Target, long _Value) {
|
2022-02-03 21:18:29 +00:00
|
|
|
__asm__ __volatile__(".byte 0xf2 ; lock ; xchg {%0, %1|%1, %0}"
|
2018-08-05 06:20:05 +00:00
|
|
|
: "+r" (_Value), "+m" (*_Target) :: "memory");
|
|
|
|
return _Value;
|
|
|
|
}
|
|
|
|
static __inline__ long __DEFAULT_FN_ATTRS
|
|
|
|
_InterlockedExchange_HLERelease(long volatile *_Target, long _Value) {
|
2022-02-03 21:18:29 +00:00
|
|
|
__asm__ __volatile__(".byte 0xf3 ; lock ; xchg {%0, %1|%1, %0}"
|
2018-08-05 06:20:05 +00:00
|
|
|
: "+r" (_Value), "+m" (*_Target) :: "memory");
|
|
|
|
return _Value;
|
|
|
|
}
|
|
|
|
#endif
|
|
|
|
#if defined(__x86_64__)
|
|
|
|
static __inline__ __int64 __DEFAULT_FN_ATTRS
|
|
|
|
_InterlockedExchange64_HLEAcquire(__int64 volatile *_Target, __int64 _Value) {
|
2022-02-03 21:18:29 +00:00
|
|
|
__asm__ __volatile__(".byte 0xf2 ; lock ; xchg {%0, %1|%1, %0}"
|
2018-08-05 06:20:05 +00:00
|
|
|
: "+r" (_Value), "+m" (*_Target) :: "memory");
|
|
|
|
return _Value;
|
|
|
|
}
|
|
|
|
static __inline__ __int64 __DEFAULT_FN_ATTRS
|
|
|
|
_InterlockedExchange64_HLERelease(__int64 volatile *_Target, __int64 _Value) {
|
2022-02-03 21:18:29 +00:00
|
|
|
__asm__ __volatile__(".byte 0xf3 ; lock ; xchg {%0, %1|%1, %0}"
|
2018-08-05 06:20:05 +00:00
|
|
|
: "+r" (_Value), "+m" (*_Target) :: "memory");
|
|
|
|
return _Value;
|
|
|
|
}
|
|
|
|
#endif
|
|
|
|
/*----------------------------------------------------------------------------*\
|
|
|
|
|* Interlocked Compare Exchange HLE
|
|
|
|
\*----------------------------------------------------------------------------*/
|
|
|
|
#if defined(__i386__) || defined(__x86_64__)
|
|
|
|
static __inline__ long __DEFAULT_FN_ATTRS
|
|
|
|
_InterlockedCompareExchange_HLEAcquire(long volatile *_Destination,
|
|
|
|
long _Exchange, long _Comparand) {
|
2022-02-03 21:18:29 +00:00
|
|
|
__asm__ __volatile__(".byte 0xf2 ; lock ; cmpxchg {%2, %1|%1, %2}"
|
2018-08-05 06:20:05 +00:00
|
|
|
: "+a" (_Comparand), "+m" (*_Destination)
|
|
|
|
: "r" (_Exchange) : "memory");
|
|
|
|
return _Comparand;
|
|
|
|
}
|
|
|
|
static __inline__ long __DEFAULT_FN_ATTRS
|
|
|
|
_InterlockedCompareExchange_HLERelease(long volatile *_Destination,
|
|
|
|
long _Exchange, long _Comparand) {
|
2022-02-03 21:18:29 +00:00
|
|
|
__asm__ __volatile__(".byte 0xf3 ; lock ; cmpxchg {%2, %1|%1, %2}"
|
2018-08-05 06:20:05 +00:00
|
|
|
: "+a" (_Comparand), "+m" (*_Destination)
|
|
|
|
: "r" (_Exchange) : "memory");
|
|
|
|
return _Comparand;
|
|
|
|
}
|
|
|
|
#endif
|
|
|
|
#if defined(__x86_64__)
|
|
|
|
static __inline__ __int64 __DEFAULT_FN_ATTRS
|
|
|
|
_InterlockedCompareExchange64_HLEAcquire(__int64 volatile *_Destination,
|
|
|
|
__int64 _Exchange, __int64 _Comparand) {
|
2022-02-03 21:18:29 +00:00
|
|
|
__asm__ __volatile__(".byte 0xf2 ; lock ; cmpxchg {%2, %1|%1, %2}"
|
2018-08-05 06:20:05 +00:00
|
|
|
: "+a" (_Comparand), "+m" (*_Destination)
|
|
|
|
: "r" (_Exchange) : "memory");
|
|
|
|
return _Comparand;
|
|
|
|
}
|
|
|
|
static __inline__ __int64 __DEFAULT_FN_ATTRS
|
|
|
|
_InterlockedCompareExchange64_HLERelease(__int64 volatile *_Destination,
|
|
|
|
__int64 _Exchange, __int64 _Comparand) {
|
2022-02-03 21:18:29 +00:00
|
|
|
__asm__ __volatile__(".byte 0xf3 ; lock ; cmpxchg {%2, %1|%1, %2}"
|
2018-08-05 06:20:05 +00:00
|
|
|
: "+a" (_Comparand), "+m" (*_Destination)
|
|
|
|
: "r" (_Exchange) : "memory");
|
|
|
|
return _Comparand;
|
|
|
|
}
|
|
|
|
#endif
|
|
|
|
#ifdef __cplusplus
|
|
|
|
}
|
|
|
|
#endif
|
|
|
|
|
|
|
|
#undef __DEFAULT_FN_ATTRS
|
|
|
|
|
2019-07-19 20:50:45 +00:00
|
|
|
#endif /* defined(_MSC_VER) && __has_extension(gnu_asm) */
|
2018-08-05 06:20:05 +00:00
|
|
|
|
2015-12-09 00:51:59 +00:00
|
|
|
#endif /* __IMMINTRIN_H */
|