| 123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290 | // Copyright 2018 The Go Authors. All rights reserved.// Use of this source code is governed by a BSD-style// license that can be found in the LICENSE file.// Package cpu implements processor feature detection for// various CPU architectures.package cpuimport (	"os"	"strings")// Initialized reports whether the CPU features were initialized.//// For some GOOS/GOARCH combinations initialization of the CPU features depends// on reading an operating specific file, e.g. /proc/self/auxv on linux/arm// Initialized will report false if reading the file fails.var Initialized bool// CacheLinePad is used to pad structs to avoid false sharing.type CacheLinePad struct{ _ [cacheLineSize]byte }// X86 contains the supported CPU features of the// current X86/AMD64 platform. If the current platform// is not X86/AMD64 then all feature flags are false.//// X86 is padded to avoid false sharing. Further the HasAVX// and HasAVX2 are only set if the OS supports XMM and YMM// registers in addition to the CPUID feature bit being set.var X86 struct {	_                   CacheLinePad	HasAES              bool // AES hardware implementation (AES NI)	HasADX              bool // Multi-precision add-carry instruction extensions	HasAVX              bool // Advanced vector extension	HasAVX2             bool // Advanced vector extension 2	HasAVX512           bool // Advanced vector extension 512	HasAVX512F          bool // Advanced vector extension 512 Foundation Instructions	HasAVX512CD         bool // Advanced vector extension 512 Conflict Detection Instructions	HasAVX512ER         bool // Advanced vector extension 512 Exponential and Reciprocal Instructions	HasAVX512PF         bool // Advanced vector extension 512 Prefetch Instructions	HasAVX512VL         bool // Advanced vector extension 512 Vector Length Extensions	HasAVX512BW         bool // Advanced vector extension 512 Byte and Word Instructions	HasAVX512DQ         bool // Advanced vector extension 512 Doubleword and Quadword Instructions	HasAVX512IFMA       bool // Advanced vector extension 512 Integer Fused Multiply Add	HasAVX512VBMI       bool // Advanced vector extension 512 Vector Byte Manipulation Instructions	HasAVX5124VNNIW     bool // Advanced vector extension 512 Vector Neural Network Instructions Word variable precision	HasAVX5124FMAPS     bool // Advanced vector extension 512 Fused Multiply Accumulation Packed Single precision	HasAVX512VPOPCNTDQ  bool // Advanced vector extension 512 Double and quad word population count instructions	HasAVX512VPCLMULQDQ bool // Advanced vector extension 512 Vector carry-less multiply operations	HasAVX512VNNI       bool // Advanced vector extension 512 Vector Neural Network Instructions	HasAVX512GFNI       bool // Advanced vector extension 512 Galois field New Instructions	HasAVX512VAES       bool // Advanced vector extension 512 Vector AES instructions	HasAVX512VBMI2      bool // Advanced vector extension 512 Vector Byte Manipulation Instructions 2	HasAVX512BITALG     bool // Advanced vector extension 512 Bit Algorithms	HasAVX512BF16       bool // Advanced vector extension 512 BFloat16 Instructions	HasAMXTile          bool // Advanced Matrix Extension Tile instructions	HasAMXInt8          bool // Advanced Matrix Extension Int8 instructions	HasAMXBF16          bool // Advanced Matrix Extension BFloat16 instructions	HasBMI1             bool // Bit manipulation instruction set 1	HasBMI2             bool // Bit manipulation instruction set 2	HasCX16             bool // Compare and exchange 16 Bytes	HasERMS             bool // Enhanced REP for MOVSB and STOSB	HasFMA              bool // Fused-multiply-add instructions	HasOSXSAVE          bool // OS supports XSAVE/XRESTOR for saving/restoring XMM registers.	HasPCLMULQDQ        bool // PCLMULQDQ instruction - most often used for AES-GCM	HasPOPCNT           bool // Hamming weight instruction POPCNT.	HasRDRAND           bool // RDRAND instruction (on-chip random number generator)	HasRDSEED           bool // RDSEED instruction (on-chip random number generator)	HasSSE2             bool // Streaming SIMD extension 2 (always available on amd64)	HasSSE3             bool // Streaming SIMD extension 3	HasSSSE3            bool // Supplemental streaming SIMD extension 3	HasSSE41            bool // Streaming SIMD extension 4 and 4.1	HasSSE42            bool // Streaming SIMD extension 4 and 4.2	_                   CacheLinePad}// ARM64 contains the supported CPU features of the// current ARMv8(aarch64) platform. If the current platform// is not arm64 then all feature flags are false.var ARM64 struct {	_           CacheLinePad	HasFP       bool // Floating-point instruction set (always available)	HasASIMD    bool // Advanced SIMD (always available)	HasEVTSTRM  bool // Event stream support	HasAES      bool // AES hardware implementation	HasPMULL    bool // Polynomial multiplication instruction set	HasSHA1     bool // SHA1 hardware implementation	HasSHA2     bool // SHA2 hardware implementation	HasCRC32    bool // CRC32 hardware implementation	HasATOMICS  bool // Atomic memory operation instruction set	HasFPHP     bool // Half precision floating-point instruction set	HasASIMDHP  bool // Advanced SIMD half precision instruction set	HasCPUID    bool // CPUID identification scheme registers	HasASIMDRDM bool // Rounding double multiply add/subtract instruction set	HasJSCVT    bool // Javascript conversion from floating-point to integer	HasFCMA     bool // Floating-point multiplication and addition of complex numbers	HasLRCPC    bool // Release Consistent processor consistent support	HasDCPOP    bool // Persistent memory support	HasSHA3     bool // SHA3 hardware implementation	HasSM3      bool // SM3 hardware implementation	HasSM4      bool // SM4 hardware implementation	HasASIMDDP  bool // Advanced SIMD double precision instruction set	HasSHA512   bool // SHA512 hardware implementation	HasSVE      bool // Scalable Vector Extensions	HasASIMDFHM bool // Advanced SIMD multiplication FP16 to FP32	_           CacheLinePad}// ARM contains the supported CPU features of the current ARM (32-bit) platform.// All feature flags are false if://  1. the current platform is not arm, or//  2. the current operating system is not Linux.var ARM struct {	_           CacheLinePad	HasSWP      bool // SWP instruction support	HasHALF     bool // Half-word load and store support	HasTHUMB    bool // ARM Thumb instruction set	Has26BIT    bool // Address space limited to 26-bits	HasFASTMUL  bool // 32-bit operand, 64-bit result multiplication support	HasFPA      bool // Floating point arithmetic support	HasVFP      bool // Vector floating point support	HasEDSP     bool // DSP Extensions support	HasJAVA     bool // Java instruction set	HasIWMMXT   bool // Intel Wireless MMX technology support	HasCRUNCH   bool // MaverickCrunch context switching and handling	HasTHUMBEE  bool // Thumb EE instruction set	HasNEON     bool // NEON instruction set	HasVFPv3    bool // Vector floating point version 3 support	HasVFPv3D16 bool // Vector floating point version 3 D8-D15	HasTLS      bool // Thread local storage support	HasVFPv4    bool // Vector floating point version 4 support	HasIDIVA    bool // Integer divide instruction support in ARM mode	HasIDIVT    bool // Integer divide instruction support in Thumb mode	HasVFPD32   bool // Vector floating point version 3 D15-D31	HasLPAE     bool // Large Physical Address Extensions	HasEVTSTRM  bool // Event stream support	HasAES      bool // AES hardware implementation	HasPMULL    bool // Polynomial multiplication instruction set	HasSHA1     bool // SHA1 hardware implementation	HasSHA2     bool // SHA2 hardware implementation	HasCRC32    bool // CRC32 hardware implementation	_           CacheLinePad}// MIPS64X contains the supported CPU features of the current mips64/mips64le// platforms. If the current platform is not mips64/mips64le or the current// operating system is not Linux then all feature flags are false.var MIPS64X struct {	_      CacheLinePad	HasMSA bool // MIPS SIMD architecture	_      CacheLinePad}// PPC64 contains the supported CPU features of the current ppc64/ppc64le platforms.// If the current platform is not ppc64/ppc64le then all feature flags are false.//// For ppc64/ppc64le, it is safe to check only for ISA level starting on ISA v3.00,// since there are no optional categories. There are some exceptions that also// require kernel support to work (DARN, SCV), so there are feature bits for// those as well. The struct is padded to avoid false sharing.var PPC64 struct {	_        CacheLinePad	HasDARN  bool // Hardware random number generator (requires kernel enablement)	HasSCV   bool // Syscall vectored (requires kernel enablement)	IsPOWER8 bool // ISA v2.07 (POWER8)	IsPOWER9 bool // ISA v3.00 (POWER9), implies IsPOWER8	_        CacheLinePad}// S390X contains the supported CPU features of the current IBM Z// (s390x) platform. If the current platform is not IBM Z then all// feature flags are false.//// S390X is padded to avoid false sharing. Further HasVX is only set// if the OS supports vector registers in addition to the STFLE// feature bit being set.var S390X struct {	_         CacheLinePad	HasZARCH  bool // z/Architecture mode is active [mandatory]	HasSTFLE  bool // store facility list extended	HasLDISP  bool // long (20-bit) displacements	HasEIMM   bool // 32-bit immediates	HasDFP    bool // decimal floating point	HasETF3EH bool // ETF-3 enhanced	HasMSA    bool // message security assist (CPACF)	HasAES    bool // KM-AES{128,192,256} functions	HasAESCBC bool // KMC-AES{128,192,256} functions	HasAESCTR bool // KMCTR-AES{128,192,256} functions	HasAESGCM bool // KMA-GCM-AES{128,192,256} functions	HasGHASH  bool // KIMD-GHASH function	HasSHA1   bool // K{I,L}MD-SHA-1 functions	HasSHA256 bool // K{I,L}MD-SHA-256 functions	HasSHA512 bool // K{I,L}MD-SHA-512 functions	HasSHA3   bool // K{I,L}MD-SHA3-{224,256,384,512} and K{I,L}MD-SHAKE-{128,256} functions	HasVX     bool // vector facility	HasVXE    bool // vector-enhancements facility 1	_         CacheLinePad}func init() {	archInit()	initOptions()	processOptions()}// options contains the cpu debug options that can be used in GODEBUG.// Options are arch dependent and are added by the arch specific initOptions functions.// Features that are mandatory for the specific GOARCH should have the Required field set// (e.g. SSE2 on amd64).var options []option// Option names should be lower case. e.g. avx instead of AVX.type option struct {	Name      string	Feature   *bool	Specified bool // whether feature value was specified in GODEBUG	Enable    bool // whether feature should be enabled	Required  bool // whether feature is mandatory and can not be disabled}func processOptions() {	env := os.Getenv("GODEBUG")field:	for env != "" {		field := ""		i := strings.IndexByte(env, ',')		if i < 0 {			field, env = env, ""		} else {			field, env = env[:i], env[i+1:]		}		if len(field) < 4 || field[:4] != "cpu." {			continue		}		i = strings.IndexByte(field, '=')		if i < 0 {			print("GODEBUG sys/cpu: no value specified for \"", field, "\"\n")			continue		}		key, value := field[4:i], field[i+1:] // e.g. "SSE2", "on"		var enable bool		switch value {		case "on":			enable = true		case "off":			enable = false		default:			print("GODEBUG sys/cpu: value \"", value, "\" not supported for cpu option \"", key, "\"\n")			continue field		}		if key == "all" {			for i := range options {				options[i].Specified = true				options[i].Enable = enable || options[i].Required			}			continue field		}		for i := range options {			if options[i].Name == key {				options[i].Specified = true				options[i].Enable = enable				continue field			}		}		print("GODEBUG sys/cpu: unknown cpu feature \"", key, "\"\n")	}	for _, o := range options {		if !o.Specified {			continue		}		if o.Enable && !*o.Feature {			print("GODEBUG sys/cpu: can not enable \"", o.Name, "\", missing CPU support\n")			continue		}		if !o.Enable && o.Required {			print("GODEBUG sys/cpu: can not disable \"", o.Name, "\", required CPU feature\n")			continue		}		*o.Feature = o.Enable	}}
 |