| // Copyright 2018 The Go Authors. All rights reserved. |
| // Use of this source code is governed by a BSD-style |
| // license that can be found in the LICENSE file. |
| |
| // Package cpu implements processor feature detection for |
| // various CPU architectures. |
| package cpu |
| |
| import ( |
| "os" |
| "strings" |
| ) |
| |
| // Initialized reports whether the CPU features were initialized. |
| // |
| // For some GOOS/GOARCH combinations initialization of the CPU features depends |
| // on reading an operating specific file, e.g. /proc/self/auxv on linux/arm |
| // Initialized will report false if reading the file fails. |
| var Initialized bool |
| |
| // CacheLinePad is used to pad structs to avoid false sharing. |
| type CacheLinePad struct{ _ [cacheLineSize]byte } |
| |
| // X86 contains the supported CPU features of the |
| // current X86/AMD64 platform. If the current platform |
| // is not X86/AMD64 then all feature flags are false. |
| // |
| // X86 is padded to avoid false sharing. Further the HasAVX |
| // and HasAVX2 are only set if the OS supports XMM and YMM |
| // registers in addition to the CPUID feature bit being set. |
| var X86 struct { |
| _ CacheLinePad |
| HasAES bool // AES hardware implementation (AES NI) |
| HasADX bool // Multi-precision add-carry instruction extensions |
| HasAVX bool // Advanced vector extension |
| HasAVX2 bool // Advanced vector extension 2 |
| HasAVX512 bool // Advanced vector extension 512 |
| HasAVX512F bool // Advanced vector extension 512 Foundation Instructions |
| HasAVX512CD bool // Advanced vector extension 512 Conflict Detection Instructions |
| HasAVX512ER bool // Advanced vector extension 512 Exponential and Reciprocal Instructions |
| HasAVX512PF bool // Advanced vector extension 512 Prefetch Instructions |
| HasAVX512VL bool // Advanced vector extension 512 Vector Length Extensions |
| HasAVX512BW bool // Advanced vector extension 512 Byte and Word Instructions |
| HasAVX512DQ bool // Advanced vector extension 512 Doubleword and Quadword Instructions |
| HasAVX512IFMA bool // Advanced vector extension 512 Integer Fused Multiply Add |
| HasAVX512VBMI bool // Advanced vector extension 512 Vector Byte Manipulation Instructions |
| HasAVX5124VNNIW bool // Advanced vector extension 512 Vector Neural Network Instructions Word variable precision |
| HasAVX5124FMAPS bool // Advanced vector extension 512 Fused Multiply Accumulation Packed Single precision |
| HasAVX512VPOPCNTDQ bool // Advanced vector extension 512 Double and quad word population count instructions |
| HasAVX512VPCLMULQDQ bool // Advanced vector extension 512 Vector carry-less multiply operations |
| HasAVX512VNNI bool // Advanced vector extension 512 Vector Neural Network Instructions |
| HasAVX512GFNI bool // Advanced vector extension 512 Galois field New Instructions |
| HasAVX512VAES bool // Advanced vector extension 512 Vector AES instructions |
| HasAVX512VBMI2 bool // Advanced vector extension 512 Vector Byte Manipulation Instructions 2 |
| HasAVX512BITALG bool // Advanced vector extension 512 Bit Algorithms |
| HasAVX512BF16 bool // Advanced vector extension 512 BFloat16 Instructions |
| HasAMXTile bool // Advanced Matrix Extension Tile instructions |
| HasAMXInt8 bool // Advanced Matrix Extension Int8 instructions |
| HasAMXBF16 bool // Advanced Matrix Extension BFloat16 instructions |
| HasBMI1 bool // Bit manipulation instruction set 1 |
| HasBMI2 bool // Bit manipulation instruction set 2 |
| HasCX16 bool // Compare and exchange 16 Bytes |
| HasERMS bool // Enhanced REP for MOVSB and STOSB |
| HasFMA bool // Fused-multiply-add instructions |
| HasOSXSAVE bool // OS supports XSAVE/XRESTOR for saving/restoring XMM registers. |
| HasPCLMULQDQ bool // PCLMULQDQ instruction - most often used for AES-GCM |
| HasPOPCNT bool // Hamming weight instruction POPCNT. |
| HasRDRAND bool // RDRAND instruction (on-chip random number generator) |
| HasRDSEED bool // RDSEED instruction (on-chip random number generator) |
| HasSSE2 bool // Streaming SIMD extension 2 (always available on amd64) |
| HasSSE3 bool // Streaming SIMD extension 3 |
| HasSSSE3 bool // Supplemental streaming SIMD extension 3 |
| HasSSE41 bool // Streaming SIMD extension 4 and 4.1 |
| HasSSE42 bool // Streaming SIMD extension 4 and 4.2 |
| _ CacheLinePad |
| } |
| |
| // ARM64 contains the supported CPU features of the |
| // current ARMv8(aarch64) platform. If the current platform |
| // is not arm64 then all feature flags are false. |
| var ARM64 struct { |
| _ CacheLinePad |
| HasFP bool // Floating-point instruction set (always available) |
| HasASIMD bool // Advanced SIMD (always available) |
| HasEVTSTRM bool // Event stream support |
| HasAES bool // AES hardware implementation |
| HasPMULL bool // Polynomial multiplication instruction set |
| HasSHA1 bool // SHA1 hardware implementation |
| HasSHA2 bool // SHA2 hardware implementation |
| HasCRC32 bool // CRC32 hardware implementation |
| HasATOMICS bool // Atomic memory operation instruction set |
| HasFPHP bool // Half precision floating-point instruction set |
| HasASIMDHP bool // Advanced SIMD half precision instruction set |
| HasCPUID bool // CPUID identification scheme registers |
| HasASIMDRDM bool // Rounding double multiply add/subtract instruction set |
| HasJSCVT bool // Javascript conversion from floating-point to integer |
| HasFCMA bool // Floating-point multiplication and addition of complex numbers |
| HasLRCPC bool // Release Consistent processor consistent support |
| HasDCPOP bool // Persistent memory support |
| HasSHA3 bool // SHA3 hardware implementation |
| HasSM3 bool // SM3 hardware implementation |
| HasSM4 bool // SM4 hardware implementation |
| HasASIMDDP bool // Advanced SIMD double precision instruction set |
| HasSHA512 bool // SHA512 hardware implementation |
| HasSVE bool // Scalable Vector Extensions |
| HasSVE2 bool // Scalable Vector Extensions 2 |
| HasASIMDFHM bool // Advanced SIMD multiplication FP16 to FP32 |
| HasDIT bool // Data Independent Timing support |
| HasI8MM bool // Advanced SIMD Int8 matrix multiplication instructions |
| _ CacheLinePad |
| } |
| |
| // ARM contains the supported CPU features of the current ARM (32-bit) platform. |
| // All feature flags are false if: |
| // 1. the current platform is not arm, or |
| // 2. the current operating system is not Linux. |
| var ARM struct { |
| _ CacheLinePad |
| HasSWP bool // SWP instruction support |
| HasHALF bool // Half-word load and store support |
| HasTHUMB bool // ARM Thumb instruction set |
| Has26BIT bool // Address space limited to 26-bits |
| HasFASTMUL bool // 32-bit operand, 64-bit result multiplication support |
| HasFPA bool // Floating point arithmetic support |
| HasVFP bool // Vector floating point support |
| HasEDSP bool // DSP Extensions support |
| HasJAVA bool // Java instruction set |
| HasIWMMXT bool // Intel Wireless MMX technology support |
| HasCRUNCH bool // MaverickCrunch context switching and handling |
| HasTHUMBEE bool // Thumb EE instruction set |
| HasNEON bool // NEON instruction set |
| HasVFPv3 bool // Vector floating point version 3 support |
| HasVFPv3D16 bool // Vector floating point version 3 D8-D15 |
| HasTLS bool // Thread local storage support |
| HasVFPv4 bool // Vector floating point version 4 support |
| HasIDIVA bool // Integer divide instruction support in ARM mode |
| HasIDIVT bool // Integer divide instruction support in Thumb mode |
| HasVFPD32 bool // Vector floating point version 3 D15-D31 |
| HasLPAE bool // Large Physical Address Extensions |
| HasEVTSTRM bool // Event stream support |
| HasAES bool // AES hardware implementation |
| HasPMULL bool // Polynomial multiplication instruction set |
| HasSHA1 bool // SHA1 hardware implementation |
| HasSHA2 bool // SHA2 hardware implementation |
| HasCRC32 bool // CRC32 hardware implementation |
| _ CacheLinePad |
| } |
| |
| // MIPS64X contains the supported CPU features of the current mips64/mips64le |
| // platforms. If the current platform is not mips64/mips64le or the current |
| // operating system is not Linux then all feature flags are false. |
| var MIPS64X struct { |
| _ CacheLinePad |
| HasMSA bool // MIPS SIMD architecture |
| _ CacheLinePad |
| } |
| |
| // PPC64 contains the supported CPU features of the current ppc64/ppc64le platforms. |
| // If the current platform is not ppc64/ppc64le then all feature flags are false. |
| // |
| // For ppc64/ppc64le, it is safe to check only for ISA level starting on ISA v3.00, |
| // since there are no optional categories. There are some exceptions that also |
| // require kernel support to work (DARN, SCV), so there are feature bits for |
| // those as well. The struct is padded to avoid false sharing. |
| var PPC64 struct { |
| _ CacheLinePad |
| HasDARN bool // Hardware random number generator (requires kernel enablement) |
| HasSCV bool // Syscall vectored (requires kernel enablement) |
| IsPOWER8 bool // ISA v2.07 (POWER8) |
| IsPOWER9 bool // ISA v3.00 (POWER9), implies IsPOWER8 |
| _ CacheLinePad |
| } |
| |
| // S390X contains the supported CPU features of the current IBM Z |
| // (s390x) platform. If the current platform is not IBM Z then all |
| // feature flags are false. |
| // |
| // S390X is padded to avoid false sharing. Further HasVX is only set |
| // if the OS supports vector registers in addition to the STFLE |
| // feature bit being set. |
| var S390X struct { |
| _ CacheLinePad |
| HasZARCH bool // z/Architecture mode is active [mandatory] |
| HasSTFLE bool // store facility list extended |
| HasLDISP bool // long (20-bit) displacements |
| HasEIMM bool // 32-bit immediates |
| HasDFP bool // decimal floating point |
| HasETF3EH bool // ETF-3 enhanced |
| HasMSA bool // message security assist (CPACF) |
| HasAES bool // KM-AES{128,192,256} functions |
| HasAESCBC bool // KMC-AES{128,192,256} functions |
| HasAESCTR bool // KMCTR-AES{128,192,256} functions |
| HasAESGCM bool // KMA-GCM-AES{128,192,256} functions |
| HasGHASH bool // KIMD-GHASH function |
| HasSHA1 bool // K{I,L}MD-SHA-1 functions |
| HasSHA256 bool // K{I,L}MD-SHA-256 functions |
| HasSHA512 bool // K{I,L}MD-SHA-512 functions |
| HasSHA3 bool // K{I,L}MD-SHA3-{224,256,384,512} and K{I,L}MD-SHAKE-{128,256} functions |
| HasVX bool // vector facility |
| HasVXE bool // vector-enhancements facility 1 |
| _ CacheLinePad |
| } |
| |
| // RISCV64 contains the supported CPU features and performance characteristics for riscv64 |
| // platforms. The booleans in RISCV64, with the exception of HasFastMisaligned, indicate |
| // the presence of RISC-V extensions. |
| // |
| // It is safe to assume that all the RV64G extensions are supported and so they are omitted from |
| // this structure. As riscv64 Go programs require at least RV64G, the code that populates |
| // this structure cannot run successfully if some of the RV64G extensions are missing. |
| // The struct is padded to avoid false sharing. |
| var RISCV64 struct { |
| _ CacheLinePad |
| HasFastMisaligned bool // Fast misaligned accesses |
| HasC bool // Compressed instruction-set extension |
| HasV bool // Vector extension compatible with RVV 1.0 |
| HasZba bool // Address generation instructions extension |
| HasZbb bool // Basic bit-manipulation extension |
| HasZbs bool // Single-bit instructions extension |
| _ CacheLinePad |
| } |
| |
| func init() { |
| archInit() |
| initOptions() |
| processOptions() |
| } |
| |
| // options contains the cpu debug options that can be used in GODEBUG. |
| // Options are arch dependent and are added by the arch specific initOptions functions. |
| // Features that are mandatory for the specific GOARCH should have the Required field set |
| // (e.g. SSE2 on amd64). |
| var options []option |
| |
| // Option names should be lower case. e.g. avx instead of AVX. |
| type option struct { |
| Name string |
| Feature *bool |
| Specified bool // whether feature value was specified in GODEBUG |
| Enable bool // whether feature should be enabled |
| Required bool // whether feature is mandatory and can not be disabled |
| } |
| |
| func processOptions() { |
| env := os.Getenv("GODEBUG") |
| field: |
| for env != "" { |
| field := "" |
| i := strings.IndexByte(env, ',') |
| if i < 0 { |
| field, env = env, "" |
| } else { |
| field, env = env[:i], env[i+1:] |
| } |
| if len(field) < 4 || field[:4] != "cpu." { |
| continue |
| } |
| i = strings.IndexByte(field, '=') |
| if i < 0 { |
| print("GODEBUG sys/cpu: no value specified for \"", field, "\"\n") |
| continue |
| } |
| key, value := field[4:i], field[i+1:] // e.g. "SSE2", "on" |
| |
| var enable bool |
| switch value { |
| case "on": |
| enable = true |
| case "off": |
| enable = false |
| default: |
| print("GODEBUG sys/cpu: value \"", value, "\" not supported for cpu option \"", key, "\"\n") |
| continue field |
| } |
| |
| if key == "all" { |
| for i := range options { |
| options[i].Specified = true |
| options[i].Enable = enable || options[i].Required |
| } |
| continue field |
| } |
| |
| for i := range options { |
| if options[i].Name == key { |
| options[i].Specified = true |
| options[i].Enable = enable |
| continue field |
| } |
| } |
| |
| print("GODEBUG sys/cpu: unknown cpu feature \"", key, "\"\n") |
| } |
| |
| for _, o := range options { |
| if !o.Specified { |
| continue |
| } |
| |
| if o.Enable && !*o.Feature { |
| print("GODEBUG sys/cpu: can not enable \"", o.Name, "\", missing CPU support\n") |
| continue |
| } |
| |
| if !o.Enable && o.Required { |
| print("GODEBUG sys/cpu: can not disable \"", o.Name, "\", required CPU feature\n") |
| continue |
| } |
| |
| *o.Feature = o.Enable |
| } |
| } |