Visible to Intel only — GUID: GUID-CE4D8580-2831-4147-92BC-4A54BA9271C4
Visible to Intel only — GUID: GUID-CE4D8580-2831-4147-92BC-4A54BA9271C4
Intrinsics for FP Conversion Operations
The prototypes for Intel® Advanced Vector Extensions 512 (Intel® AVX-512) intrinsics are located in the zmmintrin.h header file.
To use these intrinsics, include the immintrin.h file as follows:
#include <immintrin.h>
Intrinsic Name |
Operation |
Corresponding |
---|---|---|
_mm512_cvtps_pd_mm512_mask_cvtps_pd_mm512_maskz_cvtps_pd _mm512_cvt_roundps_pd, _mm512_mask_cvt_roundps_pd, _mm512_maskz_cvt_roundps_pd |
Converts rounded float32 to float 64. |
VCVTPS2PD |
_mm512_cvt_roundps_epi32, _mm512_mask_cvt_roundps_epi32, _mm512_maskz_cvt_roundps_epi32 _mm512_cvtt_roundps_epi32, _mm512_mask_cvtt_roundps_epi32, _mm512_maskz_cvtt_roundps_epi32 |
Converts rounded float32 to int32. |
VCVTPS2DQ/VCVTTPS2DQ |
_mm512_cvt_roundps_epu32, _mm512_mask_cvt_roundps_epu32, _mm512_maskz_cvt_roundps_epu32 _mm512_cvtt_roundps_epu32, _mm512_mask_cvtt_roundps_epu32, _mm512_maskz_cvtt_roundps_epu32 |
Converts rounded float32 to unsigned int32. |
VCVTPS2UDQ/VCVTTPS2UDQ |
_mm_cvt_roundsd_i32, _mm_cvt_roundsd_i64 _mm_cvtt_roundsd_i32, _mm_cvtt_roundsd_i64 |
Converts rounded scalar float64 to int32/int64. |
VCVTSD2SI/VCVTTSD2SI |
_mm_cvt_roundsd_u32, _mm_cvt_roundsd_u64 _mm_cvtt_roundsd_u32, _mm_cvtt_roundsd_u64 |
Converts rounded scalar float64 to unsigned int32/int64. |
VCVTSD2USI/VCVTTSD2USI |
_mm_cvt_roundss_i32, _mm_cvt_roundss_i64 _mm_cvtt_roundss_i32, _mm_cvtt_roundss_i64 |
Converts rounded scalar float32 to int32/int64. |
VCVTSS2SI/VCVTTSS2SI |
_mm_cvt_roundss_u32, _mm_cvt_roundss_u64 _mm_cvtt_roundss_u32, _mm_cvtt_roundss_u64 |
Converts rounded scalar float32 to unsigned int32/int64. |
VCVTSS2USI/VCVTTSS2USI |
_mm512_cvtpd_ps_mm512_mask_cvtpd_ps_mm512_maskz_cvtpd_ps _mm512_cvt_roundpd_ps, _mm512_mask_cvt_roundpd_ps, _mm512_maskz_cvt_roundpd_ps |
Converts rounded float64 to float32. |
VCVTPD2PS |
_mm512_cvt_roundpd_epi32, _mm512_mask_cvt_roundpd_epi32, _mm512_maskz_cvt_roundpd_epi32 _mm512_cvtt_roundpd_epi32, _mm512_mask_cvtt_roundpd_epi32, _mm512_maskz_cvtt_roundpd_epi32 |
Converts rounded float64 to int32. |
VCVTPD2DQ/VCVTTPD2DQ |
_mm512_cvt_roundpd_epu32, _mm512_mask_cvt_roundpd_epu32, _mm512_maskz_cvt_roundpd_epu32 _mm512_cvtt_roundpd_epu32, _mm512_mask_cvtt_roundpd_epu32, _mm512_maskz_cvtt_roundpd_epu32 |
Converts rounded float64 to unsigned int32. |
VCVTPD2UDQ/VCVTTPD2UDQ |
_mm512_cvtph_ps_mm512_mask_cvtph_ps_mm512_maskz_cvtph_ps _mm512_cvt_roundph_ps, _mm512_mask_cvt_roundph_ps, _mm512_maskz_cvt_roundph_ps |
Converts rounded float64 to float32. |
VCVTPH2PS |
_mm512_cvt_roundps_ph, _mm512_mask_cvt_roundps_ph, _mm512_maskz_cvt_roundps_ph |
Converts rounded float32 to scalar float32. |
VCVTPS2PH |
_mm_mask_cvtss_sd_mm_maskz_cvtss_sd _mm_cvt_roundss_sd, _mm_mask_cvt_roundss_sd, _mm_maskz_cvt_roundss_sd |
Converts rounded scalar float32 to scalar float64. |
VCVTSS2SD |
_mm_cvt_roundsd_ss, _mm_mask_cvt_roundsd_ss, _mm_maskz_cvt_roundsd_ss |
Converts rounded scalar float64 to scalar float32. |
VCVTSD2SS |
_mm512_cvtepu32_ps_mm512_mask_cvtepu32_ps_mm512_maskz_cvtepu32_ps _mm512_cvt_roundepu32_ps_mm512_mask_cvt_roundepu32_ps_mm512_maskz_cvt_roundepu32_ps |
Converts packed unsigned int32 to float32. |
VCVTUDQ2PS |
_mm512_cvtss_f32 |
Extracts a float32 value from the first vector element of an __m512. It does so in the most efficient manner possible in the context used. |
MOVSS/VMOVSS |
_mm512_cvtsd_f64 |
Extracts a float64 value from first vector element of an __m512d. It does so in the most efficient manner possible in the context used. |
MOVSD/VMOVSD |
variable | definition |
---|---|
k | writemask used as a selector |
a | first source vector element |
b | second source vector element |
src | source element to use based on writemask result |
round | Rounding control values; these can be one of the following (along with the sae suppress all exceptions flag):
|
_mm512_cvt_roundpd_ps
extern __m256 __cdecl _mm512_cvt_roundpd_ps(__m512d a, int round);
Converts float64 elements in a to float32 elements, and stores the result.
_mm512_mask_cvt_roundpd_ps
extern __m256 __cdecl _mm512_mask_cvt_roundpd_ps(__m256 src, __mmask8 k, __m512d a, int round);
Converts float64 elements in a to float32 elements, and stores the result using writemask k (elements are copied from src when the corresponding mask bit is not set).
_mm512_maskz_cvt_roundpd_ps
extern __m256 __cdecl _mm512_maskz_cvt_roundpd_ps(__mmask8 k, __m512d a, int round);
Converts float64 elements in a to float32 elements, and stores the result using zeromask k (elements are zeroed out when the corresponding mask bit is not set).
_mm512_cvtpd_ps
extern __m256 __cdecl _mm512_cvt_pd_ps(__m512d a);
Converts float64 elements in a to float32 elements, and stores the result.
_mm512_mask_cvtpd_ps
extern __m256 __cdecl _mm512_mask_cvt_pd_ps(__m256 src, __mmask8 k, __m512d a);
Converts float64 elements in a to float32 elements, and stores the result using writemask k (elements are copied from src when the corresponding mask bit is not set).
_mm512_maskz_cvtpd_ps
extern __m256 __cdecl _mm512_maskz_cvt_pd_ps(__mmask8 k, __m512d a);
Converts float64 elements in a to float32 elements, and stores the result using zeromask k (elements are zeroed out when the corresponding mask bit is not set).
_mm512_cvt_roundpd_epi32
extern __m512i __cdecl _mm512_cvt_roundpd_epi32(__m512d a, int round);
Converts float64 elements in a to int32 elements, and stores the results.
Pass __MM_FROUND_NO_EXC to sae to suppress all exceptions.
_mm512_mask_cvt_roundpd_epi32
extern __m512i __cdecl _mm512_mask_cvt_roundpd_epi32(__m256i src, __mmask8 k, __m512d a, int round);
Converts float64 elements in a to int32 elements, and stores the result using writemask k (elements are copied from src when the corresponding mask bit is not set).
Pass __MM_FROUND_NO_EXC to sae to suppress all exceptions.
_mm512_maskz_cvt_roundpd_epi32
extern __m512i __cdecl _mm512_maskz_cvt_roundpd_epi32(__mmask8 k, __m512d a, int round);
Converts float64 elements in a to int32 elements, and stores the result using zeromask k (elements are zeroed out when the corresponding mask bit is not set).
Pass __MM_FROUND_NO_EXC to sae to suppress all exceptions.
_mm512_cvtpd_epi32
extern __m512i __cdecl _mm512_cvtpd_epi32(__m512d a);
Converts float64 elements in a int32 elements, and stores the result.
_mm512_mask_cvtpd_epi32
extern __m512i __cdecl _mm512_mask_cvtpd_epi32(__m256i src, __mmask8 k, __m512d a);
Converts float64 elements in a to int32 elements, and stores the result using writemask k (elements are copied from src when the corresponding mask bit is not set).
_mm512_maskz_cvtpd_epi32
extern __m512i __cdecl _mm512_maskz_cvtpd_epi32(__mmask8 k, __m512d a);
Converts float64 elements in a to int32 elements, and stores the result using zeromask k (elements are zeroed out when the corresponding mask bit is not set).
_mm512_cvtt_roundpd_epi32
extern __m512i __cdecl _mm512_cvtt_roundpd_epi32(__m512d a, int round);
Converts float32 elements in a to int32 elements, and stores the results.
Pass __MM_FROUND_NO_EXC to sae to suppress all exceptions.
_mm512_mask_cvtt_roundpd_epi32
extern __m512i __cdecl _mm512_mask_cvtt_roundpd_epi32(__m256i src, __mmask8 k, __m512d a, int round);
Converts float32 elements in a to int32 elements, and stores the result using writemask k (elements are copied from src when the corresponding mask bit is not set).
Pass __MM_FROUND_NO_EXC to sae to suppress all exceptions.
_mm512_maskz_cvtt_roundpd_epi32
extern __m512i __cdecl _mm512_maskz_cvtt_roundpd_epi32(__mmask8 k, __m512d a, int round);
Converts float32 elements in a to int32 elements, and stores the result using zeromask k (elements are zeroed out when the corresponding mask bit is not set).
Pass __MM_FROUND_NO_EXC to sae to suppress all exceptions.
_mm512_cvttpd_epi32
extern __m512i __cdecl _mm512_cvttpd_epi32(__m512d a);
Converts float64 elements in a int32 elements, and stores the result.
_mm512_mask_cvttpd_epi32
extern __m512i __cdecl _mm512_mask_cvttpd_epi32(__m256i src, __mmask8 k, __m512d a);
Converts float64 elements in a to int32 elements, and stores the result using writemask k (elements are copied from src when the corresponding mask bit is not set).
_mm512_maskz_cvttpd_epi32
extern __m512i __cdecl _mm512_maskz_cvttpd_epi32(__mmask8 k, __m512d a);
Converts float64 elements in a to int32 elements, and stores the result using zeromask k (elements are zeroed out when the corresponding mask bit is not set).
_mm512_cvt_roundpd_epu32
extern __m512i __cdecl _mm512_cvt_roundpd_epu32(__m512 a, int round);
Converts float64 elements in a to int32 elements, and stores the results.
Pass __MM_FROUND_NO_EXC to sae to suppress all exceptions.
_mm512_mask_cvt_roundpd_epu32
extern __m512i __cdecl _mm512_mask_cvt_roundpd_epu32(__m256i src, __mmask16 k, __m512 a, int round);
Converts float64 elements in a to int32 elements, and stores the result using writemask k (elements are copied from src when the corresponding mask bit is not set).
Pass __MM_FROUND_NO_EXC to sae to suppress all exceptions.
_mm512_maskz_cvt_roundpd_epu32
extern __m512i __cdecl _mm512_maskz_cvt_roundpd_epu32(__mmask16 k, __m512 a, int round);
Converts float64 elements in a to int32 elements, and stores the result using zeromask k (elements are zeroed out when the corresponding mask bit is not set).
Pass __MM_FROUND_NO_EXC to sae to suppress all exceptions.
_mm512_cvtpd_epu32
extern __m512i __cdecl _mm512_cvtpd_epu32(__m512 a);
Converts float64 elements in a int32 elements, and stores the result.
_mm512_mask_cvtpd_epu32
extern __m512i __cdecl _mm512_mask_cvtpd_epu32(__m256i src, __mmask16 k, __m512 a);
Converts float64 elements in a to int32 elements, and stores the result using writemask k (elements are copied from src when the corresponding mask bit is not set).
_mm512_maskz_cvtpd_epu32
extern __m512i __cdecl _mm512_maskz_cvtpd_epu32(__mmask16 k, __m512 a);
Converts float64 elements in a to int32 elements, and stores the result using zeromask k (elements are zeroed out when the corresponding mask bit is not set).
_mm512_cvtt_roundpd_epu32
extern __m512i __cdecl _mm512_cvtt_roundpd_epu32(__m512 a, int round);
Converts float64 elements in a to int32 elements, and stores the results.
Pass __MM_FROUND_NO_EXC to sae to suppress all exceptions.
_mm512_mask_cvtt_roundpd_epu32
extern __m512i __cdecl _mm512_mask_cvtt_roundpd_epu32(__m256i src, __mmask16 k, __m512 a, int round);
Converts float64 elements in a to int32 elements, and stores the result using writemask k (elements are copied from src when the corresponding mask bit is not set).
Pass __MM_FROUND_NO_EXC to sae to suppress all exceptions.
_mm512_maskz_cvtt_roundpd_epu32
extern __m512i __cdecl _mm512_maskz_cvtt_roundpd_epu32(__mmask16 k, __m512 a, int round);
Converts float64 elements in a to int32 elements, and stores the result using zeromask k (elements are zeroed out when the corresponding mask bit is not set).
Pass __MM_FROUND_NO_EXC to sae to suppress all exceptions.
_mm512_cvttpd_epu32
extern __m512i __cdecl _mm512_cvttpd_epu32(__m512 a);
Converts float64 elements in a int32 elements, and stores the result.
_mm512_mask_cvttpd_epu32
extern __m512i __cdecl _mm512_mask_cvttpd_epu32(__m256i src, __mmask16 k, __m512 a);
Converts float64 elements in a to int32 elements, and stores the result using writemask k (elements are copied from src when the corresponding mask bit is not set).
_mm512_maskz_cvttpd_epu32
extern __m512i __cdecl _mm512_maskz_cvttpd_epu32(__mmask16 k, __m512 a);
Converts float64 elements in a to int32 elements, and stores the result using zeromask k (elements are zeroed out when the corresponding mask bit is not set).
_mm512_cvtph_ps
extern __m512 __cdecl _mm512_cvtph_ps(__m256i a);
Converts packed half-precision (16-bit) floating-point elements in a to float32 elements, and stores the results.
_mm512_mask_cvtph_ps
extern __m512 __cdecl _mm512_mask_cvtph_ps(__m512 src, __mmask16 k, __m256i a);
Converts packed half-precision (16-bit) floating-point elements in a to float32 elements, and stores the result using writemask k (elements are copied from src when the corresponding mask bit is not set).
_mm512_maskz_cvtph_ps
extern __m512 __cdecl _mm512_maskz_cvtph_ps(__mmask16 k, __m256i a);
Converts packed half-precision (16-bit) floating-point elements in a to float32 elements, and stores the result using zeromask k (elements are zeroed out when the corresponding mask bit is not set).
_mm512_cvt_roundph_ps
extern __m512 __cdecl _mm512_cvt_roundph_ps(__m256i a, int round);
Converts packed half-precision (16-bit) floating-point elements in a to float32 elements, and stores the result.
Pass __MM_FROUND_NO_EXC to sae to suppress all exceptions.
_mm512_mask_cvt_roundph_ps
extern __m512 __cdecl _mm512_mask_cvt_roundph_ps(__m512 src, __mmask16 k, __m256i a, int round);
Converts packed half-precision (16-bit) floating-point elements in a to float32 elements, and stores the result using writemask k (elements are copied from src when the corresponding mask bit is not set).
Pass __MM_FROUND_NO_EXC to sae to suppress all exceptions.
_mm512_maskz_cvt_roundph_ps
extern __m512 __cdecl _mm512_maskz_cvt_roundph_ps(__mmask16 k, __m256i a, int round);
Converts packed half-precision (16-bit) floating-point elements in a to float32 elements, and stores the result using zeromask k (elements are zeroed out when the corresponding mask bit is not set).
Pass __MM_FROUND_NO_EXC to sae to suppress all exceptions.
_mm512_cvt_roundps_ph
extern __m256i __cdecl _mm512_cvt_roundps_ph(__m512 a, int round);
Converts float32 elements in a to packed half-precision (16-bit) floating-point elements, and stores the results.
Pass __MM_FROUND_NO_EXC to sae to suppress all exceptions.
_mm512_mask_cvt_roundps_ph
extern __m256i __cdecl _mm512_mask_cvt_roundps_ph(__m256i src, __mmask16 k, __m512 a, int round);
Converts float32 elements in a to packed half-precision (16-bit) floating-point elements, and stores the result using writemask k (elements are copied from src when the corresponding mask bit is not set).
Pass __MM_FROUND_NO_EXC to sae to suppress all exceptions.
_mm512_maskz_cvt_roundps_ph
extern __m256i __cdecl _mm512_maskz_cvt_roundps_ph(__mmask16 k, __m512 a, int round);
Converts float32 elements in a to packed half-precision (16-bit) floating-point elements, and stores the result using zeromask k (elements are zeroed out when the corresponding mask bit is not set).
Pass __MM_FROUND_NO_EXC to sae to suppress all exceptions.
_mm512_cvtph_ps
extern __m256i __cdecl _mm512_cvtps_ph(__m512 a);
Converts packed half-precision (16-bit) floating-point elements in a to float32 elements, and stores the results.
_mm512_mask_cvtph_ps
extern __m256i __cdecl _mm512_mask_cvtps_ph(__m256i src, __mmask16 k, __m512 a);
Converts packed half-precision (16-bit) floating-point elements in a to float32 elements, and stores the result using writemask k (elements are copied from src when the corresponding mask bit is not set).
_mm512_maskz_cvtph_ps
extern __m256i __cdecl _mm512_maskz_cvtps_ph(__mmask16 k, __m512 a);
Converts packed half-precision (16-bit) floating-point elements in a to float32 elements, and stores the result using zeromask k (elements are zeroed out when the corresponding mask bit is not set).
_mm512_cvt_roundps_pd
extern __m512d __cdecl _mm512_cvt_roundps_pd(__m256 a, int round);
Converts float32 elements in a to float64 elements, and stores the results.
Pass __MM_FROUND_NO_EXC to sae to suppress all exceptions.
_mm512_mask_cvt_roundps_pd
extern __m512d __cdecl _mm512_mask_cvt_roundps_pd(__m512d src, __mmask8 k, __m256 a, int round);
Converts float32 elements in a to float64 elements, and stores the result using writemask k (elements are copied from src when the corresponding mask bit is not set).
Pass __MM_FROUND_NO_EXC to sae to suppress all exceptions.
_mm512_maskz_cvt_roundps_pd
extern __m512d __cdecl _mm512_maskz_cvt_roundps_pd(__mmask8 k, __m256 a, int round);
Converts float32 elements in a to float64 elements, and stores the result using zeromask k (elements are zeroed out when the corresponding mask bit is not set).
Pass __MM_FROUND_NO_EXC to sae to suppress all exceptions.
_mm512_cvtps_pd
extern __m512d __cdecl _mm512_cvt_ps_pd(__m256 a);
Converts float32 elements in a to float64 elements, and stores the result.
_mm512_mask_cvtps_pd
extern __m512d __cdecl _mm512_mask_cvt_ps_pd(__m512d src, __mmask8 k, __m256 a);
Converts float32 elements in a to float64 elements, and stores the result using writemask k (elements are copied from src when the corresponding mask bit is not set).
_mm512_maskz_cvtps_pd
extern __m512d __cdecl _mm512_maskz_cvt_ps_pd(__mmask8 k, __m256 a);
Converts float32 elements in a to float64 elements, and stores the result using zeromask k (elements are zeroed out when the corresponding mask bit is not set).
_mm512_cvt_roundps_epi32
extern __m512i __cdecl _mm512_cvt_roundps_epi32(__m512 a, int round);
Converts float32 elements in a to int32 elements, and stores the results.
Pass __MM_FROUND_NO_EXC to sae to suppress all exceptions.
_mm512_mask_cvt_roundps_epi32
extern __m512i __cdecl _mm512_mask_cvt_roundps_epi32(__m512i src, __mmask16 k, __m512 a, int round);
Converts float32 elements in a to int32 elements, and stores the result using writemask k (elements are copied from src when the corresponding mask bit is not set).
Pass __MM_FROUND_NO_EXC to sae to suppress all exceptions.
_mm512_maskz_cvt_roundps_epi32
extern __m512i __cdecl _mm512_maskz_cvt_roundps_epi32(__mmask16 k, __m512 a, int round);
Converts float32 elements in a to int32 elements, and stores the result using zeromask k (elements are zeroed out when the corresponding mask bit is not set).
Pass __MM_FROUND_NO_EXC to sae to suppress all exceptions.
_mm512_cvtps_epi32
extern __m512i __cdecl _mm512_cvtps_epi32(__m512 a);
Converts float32 elements in a int32 elements, and stores the result.
_mm512_mask_cvtps_epi32
extern __m512i __cdecl _mm512_mask_cvtps_epi32(__m512i src, __mmask16 k, __m512 a);
Converts float32 elements in a to int32 elements, and stores the result using writemask k (elements are copied from src when the corresponding mask bit is not set).
_mm512_maskz_cvtps_epi32
extern __m512i __cdecl _mm512_maskz_cvtps_epi32(__mmask16 k, __m512 a);
Converts float32 elements in a to int32 elements, and stores the result using zeromask k (elements are zeroed out when the corresponding mask bit is not set).
_mm512_cvtt_roundps_epi32
extern __m512i __cdecl _mm512_cvtt_roundps_epi32(__m512 a, int round);
Converts float32 elements in a to int32 elements, and stores the results.
Pass __MM_FROUND_NO_EXC to sae to suppress all exceptions.
_mm512_mask_cvtt_roundps_epi32
extern __m512i __cdecl _mm512_mask_cvtt_roundps_epi32(__m512i src, __mmask16 k, __m512 a, int round);
Converts float32 elements in a to int32 elements, and stores the result using writemask k (elements are copied from src when the corresponding mask bit is not set).
Pass __MM_FROUND_NO_EXC to sae to suppress all exceptions.
_mm512_maskz_cvtt_roundps_epi32
extern __m512i __cdecl _mm512_maskz_cvtt_roundps_epi32(__mmask16 k, __m512 a, int round);
Converts float32 elements in a to int32 elements, and stores the result using zeromask k (elements are zeroed out when the corresponding mask bit is not set).
Pass __MM_FROUND_NO_EXC to sae to suppress all exceptions.
_mm512_cvttps_epi32
extern __m512i __cdecl _mm512_cvttps_epi32(__m512 a);
Converts float32 elements in a int32 elements, and stores the result.
_mm512_mask_cvttps_epi32
extern __m512i __cdecl _mm512_mask_cvttps_epi32(__m512i src, __mmask16 k, __m512 a);
Converts float32 elements in a to int32 elements, and stores the result using writemask k (elements are copied from src when the corresponding mask bit is not set).
_mm512_maskz_cvttps_epi32
extern __m512i __cdecl _mm512_maskz_cvttps_epi32(__mmask16 k, __m512 a);
Converts float32 elements in a to int32 elements, and stores the result using zeromask k (elements are zeroed out when the corresponding mask bit is not set).
_mm512_cvt_roundps_epu32
extern __m512i __cdecl _mm512_cvt_roundps_epu32(__m512 a, int round);
Converts float32 elements in a to int32 elements, and stores the results.
Pass __MM_FROUND_NO_EXC to sae to suppress all exceptions.
_mm512_mask_cvt_roundps_epu32
extern __m512i __cdecl _mm512_mask_cvt_roundps_epu32(__m512i src, __mmask16 k, __m512 a, int round);
Converts float32 elements in a to int32 elements, and stores the result using writemask k (elements are copied from src when the corresponding mask bit is not set).
Pass __MM_FROUND_NO_EXC to sae to suppress all exceptions.
_mm512_maskz_cvt_roundps_epu32
extern __m512i __cdecl _mm512_maskz_cvt_roundps_epu32(__mmask16 k, __m512 a, int round);
Converts float32 elements in a to int32 elements, and stores the result using zeromask k (elements are zeroed out when the corresponding mask bit is not set).
Pass __MM_FROUND_NO_EXC to sae to suppress all exceptions.
_mm512_cvtps_epu32
extern __m512i __cdecl _mm512_cvtps_epu32(__m512 a);
Converts float32 elements in a int32 elements, and stores the result.
_mm512_mask_cvtps_epu32
extern __m512i __cdecl _mm512_mask_cvtps_epu32(__m512i src, __mmask16 k, __m512 a);
Converts float32 elements in a to int32 elements, and stores the result using writemask k (elements are copied from src when the corresponding mask bit is not set).
_mm512_maskz_cvtps_epu32
extern __m512i __cdecl _mm512_maskz_cvtps_epu32(__mmask16 k, __m512 a);
Converts float32 elements in a to int32 elements, and stores the result using zeromask k (elements are zeroed out when the corresponding mask bit is not set).
_mm512_cvtt_roundps_epu32
extern __m512i __cdecl _mm512_cvtt_roundps_epu32(__m512 a, int round);
Converts float32 elements in a to int32 elements, and stores the results.
Pass __MM_FROUND_NO_EXC to sae to suppress all exceptions.
_mm512_mask_cvtt_roundps_epu32
extern __m512i __cdecl _mm512_mask_cvtt_roundps_epu32(__m512i src, __mmask16 k, __m512 a, int round);
Converts float32 elements in a to int32 elements, and stores the result using writemask k (elements are copied from src when the corresponding mask bit is not set).
Pass __MM_FROUND_NO_EXC to sae to suppress all exceptions.
_mm512_maskz_cvtt_roundps_epu32
extern __m512i __cdecl _mm512_maskz_cvtt_roundps_epu32(__mmask16 k, __m512 a, int round);
Converts float32 elements in a to int32 elements, and stores the result using zeromask k (elements are zeroed out when the corresponding mask bit is not set).
Pass __MM_FROUND_NO_EXC to sae to suppress all exceptions.
_mm512_cvttps_epu32
extern __m512i __cdecl _mm512_cvttps_epu32(__m512 a);
Converts float32 elements in a int32 elements, and stores the result.
_mm512_mask_cvttps_epu32
extern __m512i __cdecl _mm512_mask_cvttps_epu32(__m512i src, __mmask16 k, __m512 a);
Converts float32 elements in a to int32 elements, and stores the result using writemask k (elements are copied from src when the corresponding mask bit is not set).
_mm512_maskz_cvttps_epu32
extern __m512i __cdecl _mm512_maskz_cvttps_epu32(__mmask16 k, __m512 a);
Converts float32 elements in a to int32 elements, and stores the result using zeromask k (elements are zeroed out when the corresponding mask bit is not set).
_mm_cvt_roundss_sd
extern __m128d __cdecl _mm_cvt_roundss_sd(__m128d a, __m128 b, int round);
Converts the lower float32 element in b to a float64 element, stores the result in the lower destination element, and copies the upper element from a to the upper destination element .
_mm_mask_cvt_roundss_sd
extern __m128d __cdecl _mm_mask_cvt_roundss_sd(__m128d src, __mmask8 k, __m128d a, __m128 b, int round);
Converts the lower float32 element in b to a float64 element, stores the result in the lower destination element using writemask k (the element is copied from src when mask bit 0 is not set), and copy the upper element from a to the upper destination element.
_mm_maskz_cvt_roundss_sd
extern __m128d __cdecl _mm_maskz_cvt_roundss_sd(__mmask8 k, __m128d a, __m128 b, int round);
Converts the lower float32 element in b to a float64 element, store the result in the lower destination element using zeromask k (the element is zeroed out when mask bit 0 is not set), and copy the upper element from a to the upper destination element.
_mm_mask_cvtss_sd
extern __m128d __cdecl _mm_mask_cvt_ss_sd(__m128d src, __mmask8 k, __m128d a, __m128 b);
Converts the lower float32 element in b to a float64 element, stores the result in the lower destination element using writemask k (the element is copied from src when mask bit 0 is not set), and copy the upper element from a to the upper destination element.
_mm_maskz_cvtss_sd
extern __m128d __cdecl _mm_maskz_cvt_ss_sd(__mmask8 k, __m128d a, __m128 b);
Converts the lower float32 element in b to a float64 element, stores the result in the lower destination element using zeromask k (the element is zeroed out when mask bit 0 is not set), and copy the upper element from a to the upper destination element.
_mm_cvt_roundsd_ss
extern __m128 __cdecl _mm_cvt_roundsd_ss(__m128 a, __m128d b, int round);
Converts float64 elements in b to a single-precision (64-bit) floating-point elements, stores the result in the lower destination element, and copies the upper element from a to the upper destination element .
_mm_mask_cvt_roundsd_ss
extern __m128 __cdecl _mm_mask_cvt_roundsd_ss(__m128 src, __mmask8 k, __m128 a, __m128d b, int round);
Converts float64 elements in b to a single-precision (64-bit) floating-point elements, stores the result in the lower destination element using writemask k (the element is copied from src when mask bit 0 is not set), and copy the upper element from a to the upper destination element.
_mm_maskz_cvt_roundsd_ss
extern __m128 __cdecl _mm_maskz_cvt_roundsd_ss(__mmask8 k, __m128 a, __m128d b, int round);
Converts float64 elements in b to a single-precision (64-bit) floating-point elements, the result in the lower destination element using zeromask k (the element is zeroed out when mask bit 0 is not set), and copy the upper element from a to the upper destination element.
_mm_mask_cvtsd_ss
extern __m128 __cdecl _mm_mask_cvt_sd_ss(__m128 src, __mmask8 k, __m128 a, __m128d b);
Converts float64 elements in b to a single-precision (64-bit) floating-point elements, stores the result in the lower destination element using writemask k (the element is copied from src when mask bit 0 is not set), and copy the upper element from a to the upper destination element.
_mm_maskz_cvtsd_ss
extern __m128 __cdecl _mm_maskz_cvt_sd_ss(__mmask8 k, __m128 a, __m128d b);
Converts float64 elements in b to a single-precision (64-bit) floating-point elements, stores the result in the lower destination element using zeromask k (the element is zeroed out when mask bit 0 is not set), and copy the upper element from a to the upper destination element.
_mm_cvt_roundsd_i32 / _mm_cvt_roundsd_si32
extern int __cdecl _mm_cvt_roundsd_i32(__m128d a, int round); extern int __cdecl _mm_cvt_roundsd_si32(__m128d a, int round);
_mm_cvt_sd_i32 / _mm_cvt_sd_si32
extern __int64 __cdecl _mm_cvt_sd_i32(__m128d); extern __int64 __cdecl _mm_cvt_sd_i64(__m128d);
_mm_cvt_roundsd_i64 / _mm_cvt_roundsd_si64
extern __int64 __cdecl _mm_cvt_roundsd_i64(__m128d, int round); extern __int64 __cdecl _mm_cvt_roundsd_si64(__m128d, int round);
_mm_cvti64 / _mm_cvtsd_si64
extern __m128d __cdecl _mm_cvt_i64_sd(__m128d a, __int64); extern __m128d __cdecl _mm_cvt_si64_sd(__m128d a, __int64);
_mm_cvt_roundsd_u32 / _mm_cvt_roundsd_u64
extern unsigned int __cdecl _mm_cvt_roundsd_u32(__m128d a, int round); extern unsigned __int64 __cdecl _mm_cvt_roundsd_u64(__m128d a, int round);
_mm_cvt_sd_u32 / _mm_cvt_sd_u64
extern unsigned int __cdecl _mm_cvt_sd_u32(__m128d a); extern unsigned __int64 __cdecl _mm_cvt_sd_u64(__m128d a);
_mm_cvt_roundsd_i32 / _mm_cvt_roundsd_si32
extern int __cdecl _mm_cvt_roundsd_i32(__m128d a, int round); extern int __cdecl _mm_cvt_roundsd_si32(__m128d a, int round);
_mm_cvtt_sd_i32 / _mm_cvtt_sd_si32
extern __int64 __cdecl _mm_cvtt_sd_i32(__m128d); extern __int64 __cdecl _mm_cvtt_sd_i64(__m128d);
_mm_cvtt_roundsd_i64 / _mm_cvtt_roundsd_si64
extern __int64 __cdecl _mm_cvtt_roundsd_i64(__m128d, int round); extern __int64 __cdecl _mm_cvtt_roundsd_si64(__m128d, int round);
_mm_cvtti64 / _mm_cvttsd_si64
extern __m128d __cdecl _mm_cvtt_i64_sd(__m128d a, __int64); extern __m128d __cdecl _mm_cvtt_si64_sd(__m128d a, __int64);
_mm_cvtt_roundsd_u32 / _mm_cvtt_roundsd_u64
extern unsigned int __cdecl _mm_cvtt_roundsd_u32(__m128d a, int round); extern unsigned __int64 __cdecl _mm_cvtt_roundsd_u64(__m128d a, int round);
_mm_cvtt_sd_u32 / _mm_cvtt_sd_u64
extern unsigned int __cdecl _mm_cvtt_sd_u32(__m128d a); extern unsigned __int64 __cdecl _mm_cvtt_sd_u64(__m128d a);
_mm_cvt_roundss_i32 / _mm_cvt_roundss_si32
extern int __cdecl _mm_cvt_roundss_i32(__m128d a, int round); extern int __cdecl _mm_cvt_roundss_si32(__m128d a, int round);
_mm_cvt_ss_i32 / _mm_cvt_ss_si32
extern __int64 __cdecl _mm_cvt_ss_i32(__m128d); extern __int64 __cdecl _mm_cvt_ss_i64(__m128d);
_mm_cvt_roundss_i64 / _mm_cvt_roundss_si64
extern __int64 __cdecl _mm_cvt_roundss_i64(__m128d, int round); extern __int64 __cdecl _mm_cvt_roundss_si64(__m128d, int round);
_mm_cvti64 / _mm_cvtss_si64
extern __m128d __cdecl _mm_cvt_i64_sd(__m128d a, __int64); extern __m128d __cdecl _mm_cvt_si64_sd(__m128d a, __int64);
_mm_cvt_roundss_u32 / _mm_cvt_roundss_u64
extern unsigned int __cdecl _mm_cvt_roundss_u32(__m128d a, int round); extern unsigned __int64 __cdecl _mm_cvt_roundss_u64(__m128d a, int round);
_mm_cvt_ss_u32 / _mm_cvt_ss_u64
extern unsigned int __cdecl _mm_cvt_ss_u32(__m128d a); extern unsigned __int64 __cdecl _mm_cvt_ss_u64(__m128d a);
_mm_cvt_roundss_i32 / _mm_cvt_roundss_si32
extern int __cdecl _mm_cvt_roundss_i32(__m128d a, int round); extern int __cdecl _mm_cvt_roundss_si32(__m128d a, int round);
_mm_cvtt_ss_i32 / _mm_cvtt_ss_si32
extern __int64 __cdecl _mm_cvtt_ss_i32(__m128d); extern __int64 __cdecl _mm_cvtt_ss_i64(__m128d);
_mm_cvtt_roundss_i64 / _mm_cvtt_roundss_si64
extern __int64 __cdecl _mm_cvtt_roundss_i64(__m128d, int round); extern __int64 __cdecl _mm_cvtt_roundss_si64(__m128d, int round);
_mm_cvtti64 / _mm_cvttss_si64
extern __m128d __cdecl _mm_cvtt_i64_sd(__m128d a, __int64); extern __m128d __cdecl _mm_cvtt_si64_sd(__m128d a, __int64);
_mm_cvtt_roundss_u32 / _mm_cvtt_roundss_u64
extern unsigned int __cdecl _mm_cvtt_roundss_u32(__m128d a, int round); extern unsigned __int64 __cdecl _mm_cvtt_roundss_u64(__m128d a, int round);
_mm_cvtt_ss_u32 / _mm_cvtt_ss_u64
extern unsigned int __cdecl _mm_cvtt_ss_u32(__m128d a); extern unsigned __int64 __cdecl _mm_cvtt_ss_u64(__m128d a);
_mm512_cvtss_f32
float _mm512_cvtss_f32(__m512 a);
_mm512_cvtsd_f64
double _mm512_cvtsd_f64(__m512d a);