//! Run-time feature detection for Aarch64 on Windows. use crate::detect::{Feature, cache}; /// Try to read the features using IsProcessorFeaturePresent. pub(crate) fn detect_features() -> cache::Initializer { type DWORD = u32; type BOOL = i32; const FALSE: BOOL = 0; // The following Microsoft documents isn't updated for aarch64. // https://docs.microsoft.com/en-us/windows/win32/api/processthreadsapi/nf-processthreadsapi-isprocessorfeaturepresent // These are defined in winnt.h of Windows SDK const PF_ARM_VFP_32_REGISTERS_AVAILABLE: u32 = 18; const PF_ARM_NEON_INSTRUCTIONS_AVAILABLE: u32 = 19; const PF_ARM_V8_CRYPTO_INSTRUCTIONS_AVAILABLE: u32 = 30; const PF_ARM_V8_CRC32_INSTRUCTIONS_AVAILABLE: u32 = 31; const PF_ARM_V81_ATOMIC_INSTRUCTIONS_AVAILABLE: u32 = 34; const PF_ARM_V82_DP_INSTRUCTIONS_AVAILABLE: u32 = 43; const PF_ARM_V83_JSCVT_INSTRUCTIONS_AVAILABLE: u32 = 44; const PF_ARM_V83_LRCPC_INSTRUCTIONS_AVAILABLE: u32 = 45; const PF_ARM_SVE_INSTRUCTIONS_AVAILABLE: u32 = 46; const PF_ARM_SVE2_INSTRUCTIONS_AVAILABLE: u32 = 47; const PF_ARM_SVE2_1_INSTRUCTIONS_AVAILABLE: u32 = 48; const PF_ARM_SVE_AES_INSTRUCTIONS_AVAILABLE: u32 = 49; const PF_ARM_SVE_PMULL128_INSTRUCTIONS_AVAILABLE: u32 = 50; const PF_ARM_SVE_BITPERM_INSTRUCTIONS_AVAILABLE: u32 = 51; // const PF_ARM_SVE_BF16_INSTRUCTIONS_AVAILABLE: u32 = 52; // const PF_ARM_SVE_EBF16_INSTRUCTIONS_AVAILABLE: u32 = 53; const PF_ARM_SVE_B16B16_INSTRUCTIONS_AVAILABLE: u32 = 54; const PF_ARM_SVE_SHA3_INSTRUCTIONS_AVAILABLE: u32 = 55; const PF_ARM_SVE_SM4_INSTRUCTIONS_AVAILABLE: u32 = 56; // const PF_ARM_SVE_I8MM_INSTRUCTIONS_AVAILABLE: u32 = 57; // const PF_ARM_SVE_F32MM_INSTRUCTIONS_AVAILABLE: u32 = 58; // const PF_ARM_SVE_F64MM_INSTRUCTIONS_AVAILABLE: u32 = 59; unsafe extern "system" { fn IsProcessorFeaturePresent(ProcessorFeature: DWORD) -> BOOL; } let mut value = cache::Initializer::default(); { let mut enable_feature = |f, enable| { if enable { value.set(f as u32); } }; // Some features may be supported on current CPU, // but no way to detect it by OS API. // Also, we require unsafe block for the extern "system" calls. unsafe { enable_feature( Feature::fp, IsProcessorFeaturePresent(PF_ARM_VFP_32_REGISTERS_AVAILABLE) != FALSE, ); enable_feature( Feature::asimd, IsProcessorFeaturePresent(PF_ARM_NEON_INSTRUCTIONS_AVAILABLE) != FALSE, ); enable_feature( Feature::crc, IsProcessorFeaturePresent(PF_ARM_V8_CRC32_INSTRUCTIONS_AVAILABLE) != FALSE, ); enable_feature( Feature::lse, IsProcessorFeaturePresent(PF_ARM_V81_ATOMIC_INSTRUCTIONS_AVAILABLE) != FALSE, ); enable_feature( Feature::dotprod, IsProcessorFeaturePresent(PF_ARM_V82_DP_INSTRUCTIONS_AVAILABLE) != FALSE, ); enable_feature( Feature::jsconv, IsProcessorFeaturePresent(PF_ARM_V83_JSCVT_INSTRUCTIONS_AVAILABLE) != FALSE, ); enable_feature( Feature::rcpc, IsProcessorFeaturePresent(PF_ARM_V83_LRCPC_INSTRUCTIONS_AVAILABLE) != FALSE, ); enable_feature( Feature::sve, IsProcessorFeaturePresent(PF_ARM_SVE_INSTRUCTIONS_AVAILABLE) != FALSE, ); enable_feature( Feature::sve2, IsProcessorFeaturePresent(PF_ARM_SVE2_INSTRUCTIONS_AVAILABLE) != FALSE, ); enable_feature( Feature::sve2p1, IsProcessorFeaturePresent(PF_ARM_SVE2_1_INSTRUCTIONS_AVAILABLE) != FALSE, ); enable_feature( Feature::sve2_aes, IsProcessorFeaturePresent(PF_ARM_SVE_AES_INSTRUCTIONS_AVAILABLE) != FALSE && IsProcessorFeaturePresent(PF_ARM_SVE_PMULL128_INSTRUCTIONS_AVAILABLE) != FALSE, ); enable_feature( Feature::sve2_bitperm, IsProcessorFeaturePresent(PF_ARM_SVE_BITPERM_INSTRUCTIONS_AVAILABLE) != FALSE, ); enable_feature( Feature::sve_b16b16, IsProcessorFeaturePresent(PF_ARM_SVE_B16B16_INSTRUCTIONS_AVAILABLE) != FALSE, ); enable_feature( Feature::sve2_sha3, IsProcessorFeaturePresent(PF_ARM_SVE_SHA3_INSTRUCTIONS_AVAILABLE) != FALSE, ); enable_feature( Feature::sve2_sm4, IsProcessorFeaturePresent(PF_ARM_SVE_SM4_INSTRUCTIONS_AVAILABLE) != FALSE, ); // PF_ARM_V8_CRYPTO_INSTRUCTIONS_AVAILABLE means aes, sha1, sha2 and // pmull support let crypto = IsProcessorFeaturePresent(PF_ARM_V8_CRYPTO_INSTRUCTIONS_AVAILABLE) != FALSE; enable_feature(Feature::aes, crypto); enable_feature(Feature::pmull, crypto); enable_feature(Feature::sha2, crypto); } } value }