Skip to content

Commit

Permalink
cpu: add support for AVX-VNNI and IFMA detection
Browse files Browse the repository at this point in the history
Added detection for x86 AVX-VNNI (VEX-coded Vector Neural Network
Instructions) and AVX-IFMA (VEX-coded Integer Fused Multiply Add),
including both the base VNNI set and the Int8 extention.

Fixes golang/go#71142

Change-Id: I9e8d18b2e8bf81d5d4313a4a47fdf731fb3d44dd
GitHub-Last-Rev: 32ea443
GitHub-Pull-Request: #242
Reviewed-on: https://go-review.googlesource.com/c/sys/+/641155
LUCI-TryBot-Result: Go LUCI <golang-scoped@luci-project-accounts.iam.gserviceaccount.com>
Reviewed-by: Michael Pratt <mpratt@google.com>
Auto-Submit: Ian Lance Taylor <iant@google.com>
Reviewed-by: Ian Lance Taylor <iant@google.com>
  • Loading branch information
Grigorii Khvatskii authored and gopherbot committed Jan 10, 2025
1 parent 1c14dca commit c756214
Show file tree
Hide file tree
Showing 3 changed files with 54 additions and 4 deletions.
3 changes: 3 additions & 0 deletions cpu/cpu.go
Original file line number Diff line number Diff line change
Expand Up @@ -72,6 +72,9 @@ var X86 struct {
HasSSSE3 bool // Supplemental streaming SIMD extension 3
HasSSE41 bool // Streaming SIMD extension 4 and 4.1
HasSSE42 bool // Streaming SIMD extension 4 and 4.2
HasAVXIFMA bool // Advanced vector extension Integer Fused Multiply Add
HasAVXVNNI bool // Advanced vector extension Vector Neural Network Instructions
HasAVXVNNIInt8 bool // Advanced vector extension Vector Neural Network Int8 instructions
_ CacheLinePad
}

Expand Down
34 changes: 34 additions & 0 deletions cpu/cpu_test.go
Original file line number Diff line number Diff line change
Expand Up @@ -41,6 +41,40 @@ func TestAVX512HasAVX2AndAVX(t *testing.T) {
}
}

func TestAVX512BF16HasAVX512(t *testing.T) {
if runtime.GOARCH == "amd64" {
if cpu.X86.HasAVX512BF16 && !cpu.X86.HasAVX512 {
t.Fatal("HasAVX512 expected true, got false")
}
}
}

func TestAVXVNNIHasAVX(t *testing.T) {
if cpu.X86.HasAVXVNNI && !cpu.X86.HasAVX {
t.Fatal("HasAVX expected true, got false")
}
}

func TestAVXIFMAHasAVXVNNIAndAVX(t *testing.T) {
if cpu.X86.HasAVXIFMA && !cpu.X86.HasAVX {
t.Fatal("HasAVX expected true, got false")
}

if cpu.X86.HasAVXIFMA && !cpu.X86.HasAVXVNNI {
t.Fatal("HasAVXVNNI expected true, got false")
}
}

func TestAVXVNNIInt8HasAVXVNNIAndAVX(t *testing.T) {
if cpu.X86.HasAVXVNNIInt8 && !cpu.X86.HasAVXVNNI {
t.Fatal("HasAVXVNNI expected true, got false")
}

if cpu.X86.HasAVXVNNIInt8 && !cpu.X86.HasAVX {
t.Fatal("HasAVX expected true, got false")
}
}

func TestARM64minimalFeatures(t *testing.T) {
if runtime.GOARCH != "arm64" || runtime.GOOS == "ios" {
return
Expand Down
21 changes: 17 additions & 4 deletions cpu/cpu_x86.go
Original file line number Diff line number Diff line change
Expand Up @@ -53,6 +53,9 @@ func initOptions() {
{Name: "sse41", Feature: &X86.HasSSE41},
{Name: "sse42", Feature: &X86.HasSSE42},
{Name: "ssse3", Feature: &X86.HasSSSE3},
{Name: "avxifma", Feature: &X86.HasAVXIFMA},
{Name: "avxvnni", Feature: &X86.HasAVXVNNI},
{Name: "avxvnniint8", Feature: &X86.HasAVXVNNIInt8},

// These capabilities should always be enabled on amd64:
{Name: "sse2", Feature: &X86.HasSSE2, Required: runtime.GOARCH == "amd64"},
Expand Down Expand Up @@ -106,7 +109,7 @@ func archInit() {
return
}

_, ebx7, ecx7, edx7 := cpuid(7, 0)
eax7, ebx7, ecx7, edx7 := cpuid(7, 0)
X86.HasBMI1 = isSet(3, ebx7)
X86.HasAVX2 = isSet(5, ebx7) && osSupportsAVX
X86.HasBMI2 = isSet(8, ebx7)
Expand Down Expand Up @@ -134,14 +137,24 @@ func archInit() {
X86.HasAVX512VAES = isSet(9, ecx7)
X86.HasAVX512VBMI2 = isSet(6, ecx7)
X86.HasAVX512BITALG = isSet(12, ecx7)

eax71, _, _, _ := cpuid(7, 1)
X86.HasAVX512BF16 = isSet(5, eax71)
}

X86.HasAMXTile = isSet(24, edx7)
X86.HasAMXInt8 = isSet(25, edx7)
X86.HasAMXBF16 = isSet(22, edx7)

// These features depend on the second level of extended features.
if eax7 >= 1 {
eax71, _, _, edx71 := cpuid(7, 1)
if X86.HasAVX512 {
X86.HasAVX512BF16 = isSet(5, eax71)
}
if X86.HasAVX {
X86.HasAVXIFMA = isSet(23, eax71)
X86.HasAVXVNNI = isSet(4, eax71)
X86.HasAVXVNNIInt8 = isSet(4, edx71)
}
}
}

func isSet(bitpos uint, value uint32) bool {
Expand Down

0 comments on commit c756214

Please sign in to comment.