116 lines
4.1 KiB
Diff
116 lines
4.1 KiB
Diff
|
|
From 98f5dbc3fd8390728401528786ac94b39f0581ee Mon Sep 17 00:00:00 2001
|
||
|
|
From: Jing Liu <jing2.liu@intel.com>
|
||
|
|
Date: Wed, 16 Feb 2022 22:04:28 -0800
|
||
|
|
Subject: [PATCH 03/10] x86: Add AMX XTILECFG and XTILEDATA components
|
||
|
|
|
||
|
|
from mainline-v7.0.0-rc0
|
||
|
|
commit 1f16764f7d4515bfd5e4ae0aae814fa280a7d0c8
|
||
|
|
category: feature
|
||
|
|
feature: SPR AMX support for Qemu
|
||
|
|
bugzilla: https://gitee.com/openeuler/intel-qemu/issues/I5VHOB
|
||
|
|
|
||
|
|
Intel-SIG: commit 1f16764f7d45 ("x86: Add AMX XTILECFG and XTILEDATA components")
|
||
|
|
|
||
|
|
-------------------------------------------------------------
|
||
|
|
|
||
|
|
x86: Add AMX XTILECFG and XTILEDATA components
|
||
|
|
|
||
|
|
The AMX TILECFG register and the TMMx tile data registers are
|
||
|
|
saved/restored via XSAVE, respectively in state component 17
|
||
|
|
(64 bytes) and state component 18 (8192 bytes).
|
||
|
|
|
||
|
|
Add AMX feature bits to x86_ext_save_areas array to set
|
||
|
|
up AMX components. Add structs that define the layout of
|
||
|
|
AMX XSAVE areas and use QEMU_BUILD_BUG_ON to validate the
|
||
|
|
structs sizes.
|
||
|
|
|
||
|
|
Signed-off-by: Jing Liu <jing2.liu@intel.com>
|
||
|
|
Signed-off-by: Yang Zhong <yang.zhong@intel.com>
|
||
|
|
Message-Id: <20220217060434.52460-3-yang.zhong@intel.com>
|
||
|
|
Signed-off-by: Paolo Bonzini <pbonzini@redhat.com>
|
||
|
|
Signed-off-by: Jason Zeng <jason.zeng@intel.com>
|
||
|
|
---
|
||
|
|
target/i386/cpu.c | 8 ++++++++
|
||
|
|
target/i386/cpu.h | 18 +++++++++++++++++-
|
||
|
|
2 files changed, 25 insertions(+), 1 deletion(-)
|
||
|
|
|
||
|
|
diff --git a/target/i386/cpu.c b/target/i386/cpu.c
|
||
|
|
index 532ca45015..31d63be081 100644
|
||
|
|
--- a/target/i386/cpu.c
|
||
|
|
+++ b/target/i386/cpu.c
|
||
|
|
@@ -1401,6 +1401,14 @@ ExtSaveArea x86_ext_save_areas[XSAVE_STATE_AREA_COUNT] = {
|
||
|
|
[XSTATE_PKRU_BIT] =
|
||
|
|
{ .feature = FEAT_7_0_ECX, .bits = CPUID_7_0_ECX_PKU,
|
||
|
|
.size = sizeof(XSavePKRU) },
|
||
|
|
+ [XSTATE_XTILE_CFG_BIT] = {
|
||
|
|
+ .feature = FEAT_7_0_EDX, .bits = CPUID_7_0_EDX_AMX_TILE,
|
||
|
|
+ .size = sizeof(XSaveXTILECFG),
|
||
|
|
+ },
|
||
|
|
+ [XSTATE_XTILE_DATA_BIT] = {
|
||
|
|
+ .feature = FEAT_7_0_EDX, .bits = CPUID_7_0_EDX_AMX_TILE,
|
||
|
|
+ .size = sizeof(XSaveXTILEDATA)
|
||
|
|
+ },
|
||
|
|
};
|
||
|
|
|
||
|
|
static uint32_t xsave_area_size(uint64_t mask)
|
||
|
|
diff --git a/target/i386/cpu.h b/target/i386/cpu.h
|
||
|
|
index 52330d1112..cc431b1d76 100644
|
||
|
|
--- a/target/i386/cpu.h
|
||
|
|
+++ b/target/i386/cpu.h
|
||
|
|
@@ -538,6 +538,8 @@ typedef enum X86Seg {
|
||
|
|
#define XSTATE_ZMM_Hi256_BIT 6
|
||
|
|
#define XSTATE_Hi16_ZMM_BIT 7
|
||
|
|
#define XSTATE_PKRU_BIT 9
|
||
|
|
+#define XSTATE_XTILE_CFG_BIT 17
|
||
|
|
+#define XSTATE_XTILE_DATA_BIT 18
|
||
|
|
|
||
|
|
#define XSTATE_FP_MASK (1ULL << XSTATE_FP_BIT)
|
||
|
|
#define XSTATE_SSE_MASK (1ULL << XSTATE_SSE_BIT)
|
||
|
|
@@ -846,6 +848,8 @@ typedef uint64_t FeatureWordArray[FEATURE_WORDS];
|
||
|
|
#define CPUID_7_0_EDX_TSX_LDTRK (1U << 16)
|
||
|
|
/* AVX512_FP16 instruction */
|
||
|
|
#define CPUID_7_0_EDX_AVX512_FP16 (1U << 23)
|
||
|
|
+/* AMX tile (two-dimensional register) */
|
||
|
|
+#define CPUID_7_0_EDX_AMX_TILE (1U << 24)
|
||
|
|
/* Speculation Control */
|
||
|
|
#define CPUID_7_0_EDX_SPEC_CTRL (1U << 26)
|
||
|
|
/* Single Thread Indirect Branch Predictors */
|
||
|
|
@@ -1349,6 +1353,16 @@ typedef struct XSavePKRU {
|
||
|
|
uint32_t padding;
|
||
|
|
} XSavePKRU;
|
||
|
|
|
||
|
|
+/* Ext. save area 17: AMX XTILECFG state */
|
||
|
|
+typedef struct XSaveXTILECFG {
|
||
|
|
+ uint8_t xtilecfg[64];
|
||
|
|
+} XSaveXTILECFG;
|
||
|
|
+
|
||
|
|
+/* Ext. save area 18: AMX XTILEDATA state */
|
||
|
|
+typedef struct XSaveXTILEDATA {
|
||
|
|
+ uint8_t xtiledata[8][1024];
|
||
|
|
+} XSaveXTILEDATA;
|
||
|
|
+
|
||
|
|
QEMU_BUILD_BUG_ON(sizeof(XSaveAVX) != 0x100);
|
||
|
|
QEMU_BUILD_BUG_ON(sizeof(XSaveBNDREG) != 0x40);
|
||
|
|
QEMU_BUILD_BUG_ON(sizeof(XSaveBNDCSR) != 0x40);
|
||
|
|
@@ -1356,6 +1370,8 @@ QEMU_BUILD_BUG_ON(sizeof(XSaveOpmask) != 0x40);
|
||
|
|
QEMU_BUILD_BUG_ON(sizeof(XSaveZMM_Hi256) != 0x200);
|
||
|
|
QEMU_BUILD_BUG_ON(sizeof(XSaveHi16_ZMM) != 0x400);
|
||
|
|
QEMU_BUILD_BUG_ON(sizeof(XSavePKRU) != 0x8);
|
||
|
|
+QEMU_BUILD_BUG_ON(sizeof(XSaveXTILECFG) != 0x40);
|
||
|
|
+QEMU_BUILD_BUG_ON(sizeof(XSaveXTILEDATA) != 0x2000);
|
||
|
|
|
||
|
|
typedef struct ExtSaveArea {
|
||
|
|
uint32_t feature, bits;
|
||
|
|
@@ -1363,7 +1379,7 @@ typedef struct ExtSaveArea {
|
||
|
|
uint32_t ecx;
|
||
|
|
} ExtSaveArea;
|
||
|
|
|
||
|
|
-#define XSAVE_STATE_AREA_COUNT (XSTATE_PKRU_BIT + 1)
|
||
|
|
+#define XSAVE_STATE_AREA_COUNT (XSTATE_XTILE_DATA_BIT + 1)
|
||
|
|
|
||
|
|
extern ExtSaveArea x86_ext_save_areas[XSAVE_STATE_AREA_COUNT];
|
||
|
|
|
||
|
|
--
|
||
|
|
2.27.0
|
||
|
|
|