MSVC cvt intrinsics

llama-patch-enable-fma-msvc
anzz1 3 years ago committed by GitHub
parent 82654f1f5a
commit 6ceb761499
No known key found for this signature in database
GPG Key ID: 4AEE18F83AFDEB23

@ -168,8 +168,13 @@ typedef double ggml_float;
#ifdef __F16C__
// Scalar FP16 <-> FP32 conversion macros, with a compiler-specific spelling.
// When _MSC_VER is defined the conversions are composed from 128-bit vector
// intrinsics; otherwise the scalar _cvtsh_ss/_cvtss_sh intrinsics are used.
// NOTE(review): presumably MSVC does not provide _cvtsh_ss/_cvtss_sh, hence
// the separate branch -- confirm against the MSVC intrinsics list.
#ifdef _MSC_VER
// x -> low lane of an __m128i -> vector half-to-float convert -> read lane 0 as float.
#define GGML_COMPUTE_FP16_TO_FP32(x) _mm_cvtss_f32(_mm_cvtph_ps(_mm_cvtsi32_si128(x)))
// x -> low lane of an __m128 -> vector float-to-half convert (immediate 0) -> read 16-bit lane 0.
// The immediate 0 matches the second argument passed to _cvtss_sh in the #else branch.
#define GGML_COMPUTE_FP32_TO_FP16(x) _mm_extract_epi16(_mm_cvtps_ph(_mm_set_ss(x), 0), 0)
#else
// Non-MSVC compilers: call the scalar conversion intrinsics directly.
#define GGML_COMPUTE_FP16_TO_FP32(x) _cvtsh_ss(x)
#define GGML_COMPUTE_FP32_TO_FP16(x) _cvtss_sh(x, 0)
#endif
#else

Loading…
Cancel
Save