@@ -73,6 +73,7 @@ TARGETS += user
TARGETS += vDSO
TARGETS += vm
TARGETS += x86
+TARGETS += xsave
TARGETS += zram
#Please keep the TARGETS list alphabetically sorted
# Run "make quicktest=1 run_tests" or
new file mode 100644
@@ -0,0 +1,2 @@
+# SPDX-License-Identifier: GPL-2.0-only
+xsave_instruction
new file mode 100644
@@ -0,0 +1,6 @@
+# SPDX-License-Identifier: GPL-2.0-only
+# -mxsave: the test sources call the _xsave*/_xrstor* compiler intrinsics.
+CFLAGS := -g -Wall -mxsave -O2
+
+# Single test binary, built from xsave_instruction.c.
+TEST_GEN_PROGS := xsave_instruction
+
+# Pull in the common selftest build and run rules.
+include ../lib.mk
new file mode 100644
@@ -0,0 +1,246 @@
+/* SPDX-License-Identifier: GPL-2.0 */
+
+#include <stdio.h>
+#include <stdint.h>
+#include <stdlib.h>
+#include <x86intrin.h>
+#include <string.h>
+#include <signal.h>
+#include <unistd.h>
+#include "../kselftest.h"
+
+/* Select the XSAVE/XRSTOR intrinsics that match the build's word size. */
+#ifdef __i386__
+#define XSAVE _xsave
+#define XRSTOR _xrstor
+#else
+#define XSAVE _xsave64
+#define XRSTOR _xrstor64
+#endif
+
+/* All-ones feature mask handed to XSAVE/XRSTOR by the tests. */
+#define SAVE_MASK 0xffffffffffffffff
+
+/* Outcome codes produced by the buffer checkers and read by check_result(). */
+enum {
+	RESULT_PASS = 0,
+	RESULT_FAIL = 1,
+	RESULT_ERROR = 3,
+};
+
+/* Expectation given to check_xsave_buf(): should the two images differ? */
+enum {
+	CHANGE = 10,
+	NO_CHANGE = 11,
+};
+
+/*
+ * Execute the CPUID instruction.
+ *
+ * On entry *eax and *ecx provide the values placed in EAX and ECX (the asm
+ * ties them to the corresponding output operands). On return *eax, *ebx,
+ * *ecx and *edx hold the EAX/EBX/ECX/EDX results; the incoming *ebx and
+ * *edx values are not passed to the instruction.
+ *
+ * Copied from Linux kernel
+ */
+static inline void native_cpuid(unsigned int *eax, unsigned int *ebx,
+ unsigned int *ecx, unsigned int *edx)
+{
+ /* ecx is often an input as well as an output. */
+ asm volatile("cpuid"
+ : "=a" (*eax),
+ "=b" (*ebx),
+ "=c" (*ecx),
+ "=d" (*edx)
+ : "0" (*eax), "2" (*ecx)
+ : "memory");
+}
+
+/*
+ * Abort the whole test run because of a setup problem.
+ *
+ * @reason: text describing what went wrong; it is printed as-is.
+ *
+ * A setup failure is not an individual test result, and certainly not an
+ * "expected failure", so no XFAIL result is recorded. The run is ended
+ * through ksft_exit_fail_msg(), which prints the reason and exits with
+ * the kselftest failure status.
+ */
+void execution_failed(const char *reason)
+{
+	ksft_exit_fail_msg("%s", reason);
+}
+
+/*
+ * Run CPUID with EAX = 0x0d and ECX = 0 and return the value it leaves in
+ * ECX. The caller uses this value as the XSAVE buffer size in bytes.
+ */
+int get_xsave_size(void)
+{
+	enum { REG_EAX, REG_EBX, REG_ECX, REG_EDX, REG_COUNT };
+	unsigned int regs[REG_COUNT] = { [REG_EAX] = 0x0d };
+
+	native_cpuid(&regs[REG_EAX], &regs[REG_EBX],
+		     &regs[REG_ECX], &regs[REG_EDX]);
+
+	return (int)regs[REG_ECX];
+}
+
+/*
+ * Hex-dump the first @size bytes of @buf to stdout: a size banner first,
+ * then one line per 16 bytes, each prefixed with the row's offset.
+ */
+void dump_buffer(unsigned char *buf, int size)
+{
+	int row = 0;
+
+	printf("xsave size = %d (%03xh)\n", size, size);
+
+	while (row < size) {
+		int row_end = row + 16;
+		int pos;
+
+		/* The last row may be shorter than 16 bytes. */
+		if (row_end > size)
+			row_end = size;
+
+		printf("%04x: ", row);
+		for (pos = row; pos < row_end; pos++)
+			printf("%02x ", buf[pos]);
+		printf("\n");
+
+		row = row + 16;
+	}
+}
+
+/*
+ * Print one row of up to 16 bytes, beginning at offset @start and never
+ * reaching past @size, first from @buf0 and then from @buf1, in the form
+ * "<offset>: <buf0 bytes> -> <buf1 bytes>".
+ */
+void show_part_buf(unsigned char *buf0, unsigned char *buf1, int start,
+		   int size)
+{
+	unsigned char *sides[2] = { buf0, buf1 };
+	int side, pos;
+
+	printf("%04x: ", start);
+	for (side = 0; side < 2; side++) {
+		for (pos = start; pos < start + 16 && pos < size; pos++)
+			printf("%02x ", sides[side][pos]);
+
+		/* Separator after the first buffer, newline after the second. */
+		if (side == 0)
+			printf(" -> ");
+		else
+			printf("\n");
+	}
+}
+
+/*
+ * Compare @buf0 and @buf1 over @size bytes in rows of 16 bytes, printing
+ * every row that differs via show_part_buf().
+ *
+ * Rows starting at offsets 416..511 are skipped.
+ *
+ * Returns RESULT_PASS when no compared row differs, RESULT_FAIL otherwise.
+ */
+int show_buf_diff(unsigned char *buf0, unsigned char *buf1, int size)
+{
+	int status = RESULT_PASS;
+	int row;
+
+	for (row = 0; row < size; row += 16) {
+		int len = size - row;
+
+		/* SDM "XSAVE Area": XSAVE feature set does not use bytes 511:416 */
+		if (row >= 416 && row <= 511)
+			continue;
+
+		/* The final row may hold fewer than 16 bytes. */
+		if (len > 16)
+			len = 16;
+
+		if (memcmp(buf0 + row, buf1 + row, len) == 0)
+			continue;
+
+		show_part_buf(buf0, buf1, row, size);
+		status = RESULT_FAIL;
+	}
+
+	return status;
+}
+
+/*
+ * Verify that buffer offsets 528..575 are zero in both @buf0 and @buf1.
+ *
+ * SDM "Form of XRSTOR": bytes 63:16 of the XSAVE header should be 0; this
+ * function checks them at those buffer offsets. The range is walked in
+ * rows of 16 bytes; for each row, the first non-zero byte found (in either
+ * buffer) is reported, the row is printed, and the scan moves on to the
+ * next row. Offsets at or beyond @size are not examined.
+ *
+ * Returns RESULT_PASS if every examined byte is zero, else RESULT_FAIL.
+ */
+int check_xsave_reserved_header(unsigned char *buf0,
+		unsigned char *buf1, int size, const char *test_name)
+{
+	const int resv_first = 528, resv_end = 576;
+	int verdict = RESULT_PASS;
+	int row, pos;
+
+	for (row = resv_first; row < resv_end; row += 16) {
+		for (pos = row; pos < row + 16; pos++) {
+			if (pos >= size)
+				break;
+			if (!buf0[pos] && !buf1[pos])
+				continue;
+
+			ksft_print_msg("%s FAIL: buf0[%d]:%d or buf1[%d]:%d not 0\n",
+				       test_name, pos, buf0[pos], pos, buf1[pos]);
+			show_part_buf(buf0, buf1, row, size);
+			verdict = RESULT_FAIL;
+			break;
+		}
+	}
+
+	return verdict;
+}
+
+/*
+ * Check two XSAVE images against an expectation.
+ *
+ * @buf0, @buf1: the two XSAVE images to compare.
+ * @size:        number of bytes to compare.
+ * @test_name:   prefix for diagnostic messages.
+ * @change:      CHANGE if the images are expected to differ, NO_CHANGE if
+ *               they are expected to be identical.
+ *
+ * The reserved XSAVE header bytes are checked in every case.
+ *
+ * Returns RESULT_PASS when both the content check and the reserved-header
+ * check pass. Otherwise returns the content-check result if that one did
+ * not pass (RESULT_FAIL, or RESULT_ERROR for an invalid @change), else the
+ * reserved-header result. No test result is recorded here: the caller
+ * reports the returned code through check_result().
+ */
+int check_xsave_buf(unsigned char *buf0, unsigned char *buf1,
+		int size, const char *test_name, int change)
+{
+	int result_buf = RESULT_ERROR, result_resv_header;
+	int differs = 0;
+
+	switch (change) {
+	case CHANGE:
+	case NO_CHANGE:
+		/* Compare once, so differing rows are dumped only once. */
+		differs = (show_buf_diff(buf0, buf1, size) != RESULT_PASS);
+
+		if (change == CHANGE && !differs) {
+			ksft_print_msg("%s FAIL: xsave content was same\n", test_name);
+			result_buf = RESULT_FAIL;
+		} else if (change == NO_CHANGE && differs) {
+			ksft_print_msg("%s FAIL: xsave content changed\n", test_name);
+			result_buf = RESULT_FAIL;
+		} else {
+			result_buf = RESULT_PASS;
+		}
+		break;
+	default:
+		/* Only a diagnostic: the result is recorded by the caller. */
+		ksft_print_msg("%s ERROR: invalid change:%d\n", test_name,
+			       change);
+		break;
+	}
+
+	result_resv_header = check_xsave_reserved_header(buf0, buf1, size,
+							 test_name);
+
+	/* Keep RESULT_ERROR distinguishable instead of folding it to 1. */
+	if (result_buf != RESULT_PASS)
+		return result_buf;
+
+	return result_resv_header;
+}
+
+/*
+ * Record the outcome of one test case with the kselftest framework.
+ *
+ * @result:    RESULT_PASS, RESULT_FAIL or RESULT_ERROR.
+ * @test_name: name printed in the result line.
+ *
+ * RESULT_PASS is recorded as a pass; RESULT_FAIL and RESULT_ERROR are both
+ * recorded as failures. Any other value is recorded as an error together
+ * with the unexpected code.
+ */
+void check_result(int result, const char *test_name)
+{
+	switch (result) {
+	case RESULT_PASS:
+		ksft_test_result_pass("%s PASS\n", test_name);
+		break;
+	case RESULT_FAIL:
+		ksft_test_result_fail("%s FAIL\n", test_name);
+		break;
+	case RESULT_ERROR:
+		ksft_test_result_fail("%s ERROR\n", test_name);
+		break;
+	default:
+		/* result is an int code, so print it as a number, not a char. */
+		ksft_test_result_error("%s ERROR: invalid result:%d\n",
+				       test_name, result);
+		break;
+	}
+}
+
+/*
+ * Load known, distinct values into the x87 register stack and the YMM
+ * registers so that a subsequent XSAVE image contains non-trivial data.
+ *
+ * YMM0-YMM7 are always written; YMM8-YMM15 are written only when not
+ * building for i386.
+ *
+ * NOTE(review): the vbroadcastss instructions are executed without any
+ * capability check in this function -- confirm that the test only runs
+ * on CPUs that support them.
+ */
+void populate_fpu_regs(void)
+{
+ uint32_t ui32;
+ uint64_t ui64;
+
+ ui32 = 1;
+ ui64 = 0xBAB00500FAB7;
+
+ /*
+ * Initialize FPU and push different values onto FPU register stack.
+ * The integer bit patterns are loaded as floating-point operands
+ * (fldl takes the 64-bit variable, flds the 32-bit one).
+ *
+ * NOTE(review): nine loads follow finit. If the x87 stack holds eight
+ * entries, as it is usually documented, the last push overflows it --
+ * confirm that this is intended.
+ */
+ asm volatile ("finit");
+ asm volatile ("fldl %0" : : "m" (ui64));
+ asm volatile ("flds %0" : : "m" (ui32));
+ ui64 += 0x93ABE13;
+ asm volatile ("fldl %0" : : "m" (ui64));
+ ui64 += 0x93;
+ asm volatile ("fldl %0" : : "m" (ui64));
+ asm volatile ("flds %0" : : "m" (ui32));
+ asm volatile ("fldl %0" : : "m" (ui64));
+ ui64 -= 0x21;
+ asm volatile ("fldl %0" : : "m" (ui64));
+ asm volatile ("flds %0" : : "m" (ui32));
+ asm volatile ("fldl %0" : : "m" (ui64));
+
+ /* Broadcast a different 32-bit value into each YMM register: */
+ asm volatile ("vbroadcastss %0, %%ymm0" : : "m" (ui32));
+ ui32 = 0xFAFBABAF;
+ asm volatile ("vbroadcastss %0, %%ymm1" : : "m" (ui32));
+ ui32 -= 0xA;
+ asm volatile ("vbroadcastss %0, %%ymm2" : : "m" (ui32));
+ ui32 -= 0xB;
+ asm volatile ("vbroadcastss %0, %%ymm3" : : "m" (ui32));
+ ui32 -= 0x3;
+ asm volatile ("vbroadcastss %0, %%ymm4" : : "m" (ui32));
+ ui32 += 0xA;
+ asm volatile ("vbroadcastss %0, %%ymm5" : : "m" (ui32));
+ ui32 -= 0x7;
+ asm volatile ("vbroadcastss %0, %%ymm6" : : "m" (ui32));
+ ui32 -= 0xABABA;
+ asm volatile ("vbroadcastss %0, %%ymm7" : : "m" (ui32));
+
+ /* YMM8-YMM15 are only touched in non-i386 builds. */
+ #ifndef __i386__
+ ui32 += 0xF7;
+ asm volatile ("vbroadcastss %0, %%ymm8" : : "m" (ui32));
+ ui32 -= 0x7;
+ asm volatile ("vbroadcastss %0, %%ymm9" : : "m" (ui32));
+ ui32 += 0x2;
+ asm volatile ("vbroadcastss %0, %%ymm10" : : "m" (ui32));
+ ui32 += 0xD;
+ asm volatile ("vbroadcastss %0, %%ymm11" : : "m" (ui32));
+ ui32 -= 0x4;
+ asm volatile ("vbroadcastss %0, %%ymm12" : : "m" (ui32));
+ ui32 -= 0xDD;
+ asm volatile ("vbroadcastss %0, %%ymm13" : : "m" (ui32));
+ ui32 -= 0xABD;
+ asm volatile ("vbroadcastss %0, %%ymm14" : : "m" (ui32));
+ /*
+ * NOTE(review): 0xBEBABF456 does not fit in 32 bits; the sum is
+ * truncated when it is stored back into the uint32_t variable.
+ */
+ ui32 += 0xBEBABF456;
+ asm volatile ("vbroadcastss %0, %%ymm15" : : "m" (ui32));
+ #endif
+}
new file mode 100644
@@ -0,0 +1,83 @@
+// SPDX-License-Identifier: GPL-2.0-only
+/*
+ * Test kernel support for XSAVE-managed features.
+ */
+
+#include <stdio.h>
+#include <stdint.h>
+#include <stdlib.h>
+#include <x86intrin.h>
+#include <string.h>
+#include <signal.h>
+#include <unistd.h>
+
+#include "../kselftest.h"
+#include "xsave_common.h"
+
+static unsigned char *xsave_buf0, *xsave_buf1;
+
+/*
+ * Broadcast the 32-bit value @ui32 into register YMM0.
+ *
+ * NOTE(review): the asm statement lists no clobbers, so the compiler is
+ * not told that YMM0 changes -- confirm this is acceptable here.
+ */
+static void set_ymm0_reg(uint32_t ui32)
+{
+ asm volatile ("vbroadcastss %0, %%ymm0" : : "m" (ui32));
+}
+
+/*
+ * Capture the current state into xsave_buf0 with XSAVE and hex-dump
+ * @xsave_size bytes of it, as an aid when debugging failures.
+ */
+static void dump_xsave_content(int xsave_size)
+{
+	unsigned char *image = xsave_buf0;
+
+	XSAVE(image, SAVE_MASK);
+	dump_buffer(image, xsave_size);
+	ksft_print_msg("Entire contents of XSAVE is as above\n");
+}
+
+/*
+ * Test: changing YMM0 between two XSAVEs must show up in the saved images.
+ *
+ * YMM0 is set, the state is saved to xsave_buf0, YMM0 is set to another
+ * value and the state is saved to xsave_buf1. The two images are then
+ * expected to differ (CHANGE) and the outcome is recorded.
+ */
+static void test_xsave_ymm_change(int xsave_size)
+{
+	const char *name = "xsave test after ymm change";
+	const uint32_t first_val = 0x1234, second_val = 0x5678;
+	int verdict;
+
+	/* Set/save, then modify/save; nothing else runs in between. */
+	set_ymm0_reg(first_val);
+	XSAVE(xsave_buf0, SAVE_MASK);
+	set_ymm0_reg(second_val);
+	XSAVE(xsave_buf1, SAVE_MASK);
+
+	verdict = check_xsave_buf(xsave_buf0, xsave_buf1, xsave_size, name,
+				  CHANGE);
+	check_result(verdict, name);
+}
+
+/*
+ * Test: an XSAVE / XRSTOR / XSAVE round trip must leave the image intact.
+ *
+ * The state is saved to xsave_buf0, restored from that same buffer and
+ * saved again to xsave_buf1. The two images are expected to be identical
+ * (NO_CHANGE) and the outcome is recorded.
+ */
+static void test_xsave_xrstor(int xsave_size)
+{
+	const char *name = "xsave after xrstor test";
+	int verdict;
+
+	/* Save, restore what was just saved, save again. */
+	XSAVE(xsave_buf0, SAVE_MASK);
+	XRSTOR(xsave_buf0, SAVE_MASK);
+	XSAVE(xsave_buf1, SAVE_MASK);
+
+	verdict = check_xsave_buf(xsave_buf0, xsave_buf1, xsave_size, name,
+				  NO_CHANGE);
+	check_result(verdict, name);
+}
+
+/*
+ * Test entry point: allocate two XSAVE buffers, load known values into the
+ * FPU/YMM registers, dump the initial XSAVE image and run the two test
+ * cases. The process exits through ksft_exit(), passing when no test
+ * failure was counted.
+ */
+int main(void)
+{
+	size_t alloc_size;
+	int xsave_size;
+
+	ksft_print_header();
+	ksft_set_plan(2);
+
+	xsave_size = get_xsave_size();
+
+	/*
+	 * SDM XSAVE: misalignment to a 64-byte boundary will result in #GP.
+	 * aligned_alloc() expects the size to be a multiple of the
+	 * alignment, so round the allocation up to the next 64 bytes.
+	 */
+	alloc_size = ((size_t)xsave_size + 63) & ~(size_t)63;
+
+	xsave_buf0 = aligned_alloc(64, alloc_size);
+	if (!xsave_buf0)
+		execution_failed("aligned_alloc xsave_buf0 failed\n");
+	xsave_buf1 = aligned_alloc(64, alloc_size);
+	if (!xsave_buf1)
+		execution_failed("aligned_alloc xsave_buf1 failed\n");
+
+	/*
+	 * aligned_alloc() returns uninitialized memory. The checkers expect
+	 * bytes 63:16 of the XSAVE header to be zero, and XRSTOR reads the
+	 * header from the buffer, so start from zeroed buffers instead of
+	 * stale heap contents.
+	 */
+	memset(xsave_buf0, 0, alloc_size);
+	memset(xsave_buf1, 0, alloc_size);
+
+	populate_fpu_regs();
+	/* Show the entire contents of xsave for issue debug */
+	dump_xsave_content(xsave_size);
+
+	test_xsave_ymm_change(xsave_size);
+	test_xsave_xrstor(xsave_size);
+
+	ksft_exit(!ksft_get_fail_cnt());
+}
The XSAVE feature set supports saving and restoring state components, and it is used for process context switching. XSAVE state components include the FPU-related x87 state, SSE state, AVX state, etc. This test case verifies the basic behavior of XSAVE/XRSTOR in user space: it displays the contents of the XSAVE area, checks that the XSAVE contents change after a register is modified, and checks that, when the xstate of a process on the x86 platform is unchanged, the XSAVE contents before and after XRSTOR are the same. This is the most basic test of XSAVE functionality. Signed-off-by: Pengfei Xu <pengfei.xu@intel.com> Reported-by: kernel test robot <lkp@intel.com> # compile issues during review --- tools/testing/selftests/Makefile | 1 + tools/testing/selftests/xsave/.gitignore | 2 + tools/testing/selftests/xsave/Makefile | 6 + tools/testing/selftests/xsave/xsave_common.h | 246 ++++++++++++++++++ .../selftests/xsave/xsave_instruction.c | 83 ++++++ 5 files changed, 338 insertions(+) create mode 100644 tools/testing/selftests/xsave/.gitignore create mode 100644 tools/testing/selftests/xsave/Makefile create mode 100644 tools/testing/selftests/xsave/xsave_common.h create mode 100644 tools/testing/selftests/xsave/xsave_instruction.c