xref: /linux/tools/testing/selftests/x86/amx.c (revision bb9ae1a66c85eeb626864efd812c62026e126ec0)
1 // SPDX-License-Identifier: GPL-2.0
2 
3 #define _GNU_SOURCE
4 #include <err.h>
5 #include <errno.h>
6 #include <pthread.h>
7 #include <setjmp.h>
8 #include <stdio.h>
9 #include <string.h>
10 #include <stdbool.h>
11 #include <unistd.h>
12 #include <x86intrin.h>
13 
14 #include <sys/auxv.h>
15 #include <sys/mman.h>
16 #include <sys/shm.h>
17 #include <sys/ptrace.h>
18 #include <sys/syscall.h>
19 #include <sys/wait.h>
20 #include <sys/uio.h>
21 
22 #include "../kselftest.h" /* For __cpuid_count() */
23 
24 #ifndef __x86_64__
25 # error This test is 64-bit only
26 #endif
27 
28 #define XSAVE_HDR_OFFSET	512
29 #define XSAVE_HDR_SIZE		64
30 
31 struct xsave_buffer {
32 	union {
33 		struct {
34 			char legacy[XSAVE_HDR_OFFSET];
35 			char header[XSAVE_HDR_SIZE];
36 			char extended[0];
37 		};
38 		char bytes[0];
39 	};
40 };
41 
42 static inline void xsave(struct xsave_buffer *xbuf, uint64_t rfbm)
43 {
44 	uint32_t rfbm_lo = rfbm;
45 	uint32_t rfbm_hi = rfbm >> 32;
46 
47 	asm volatile("xsave (%%rdi)"
48 		     : : "D" (xbuf), "a" (rfbm_lo), "d" (rfbm_hi)
49 		     : "memory");
50 }
51 
52 static inline void xrstor(struct xsave_buffer *xbuf, uint64_t rfbm)
53 {
54 	uint32_t rfbm_lo = rfbm;
55 	uint32_t rfbm_hi = rfbm >> 32;
56 
57 	asm volatile("xrstor (%%rdi)"
58 		     : : "D" (xbuf), "a" (rfbm_lo), "d" (rfbm_hi));
59 }
60 
61 /* err() exits and will not return */
62 #define fatal_error(msg, ...)	err(1, "[FAIL]\t" msg, ##__VA_ARGS__)
63 
64 static void sethandler(int sig, void (*handler)(int, siginfo_t *, void *),
65 		       int flags)
66 {
67 	struct sigaction sa;
68 
69 	memset(&sa, 0, sizeof(sa));
70 	sa.sa_sigaction = handler;
71 	sa.sa_flags = SA_SIGINFO | flags;
72 	sigemptyset(&sa.sa_mask);
73 	if (sigaction(sig, &sa, 0))
74 		fatal_error("sigaction");
75 }
76 
77 static void clearhandler(int sig)
78 {
79 	struct sigaction sa;
80 
81 	memset(&sa, 0, sizeof(sa));
82 	sa.sa_handler = SIG_DFL;
83 	sigemptyset(&sa.sa_mask);
84 	if (sigaction(sig, &sa, 0))
85 		fatal_error("sigaction");
86 }
87 
88 #define XFEATURE_XTILECFG	17
89 #define XFEATURE_XTILEDATA	18
90 #define XFEATURE_MASK_XTILECFG	(1 << XFEATURE_XTILECFG)
91 #define XFEATURE_MASK_XTILEDATA	(1 << XFEATURE_XTILEDATA)
92 #define XFEATURE_MASK_XTILE	(XFEATURE_MASK_XTILECFG | XFEATURE_MASK_XTILEDATA)
93 
94 #define CPUID_LEAF1_ECX_XSAVE_MASK	(1 << 26)
95 #define CPUID_LEAF1_ECX_OSXSAVE_MASK	(1 << 27)
96 
97 static uint32_t xbuf_size;
98 
99 static struct {
100 	uint32_t xbuf_offset;
101 	uint32_t size;
102 } xtiledata;
103 
104 #define CPUID_LEAF_XSTATE		0xd
105 #define CPUID_SUBLEAF_XSTATE_USER	0x0
106 #define TILE_CPUID			0x1d
107 #define TILE_PALETTE_ID			0x1
108 
109 static void check_cpuid_xtiledata(void)
110 {
111 	uint32_t eax, ebx, ecx, edx;
112 
113 	__cpuid_count(CPUID_LEAF_XSTATE, CPUID_SUBLEAF_XSTATE_USER,
114 		      eax, ebx, ecx, edx);
115 
116 	/*
117 	 * EBX enumerates the size (in bytes) required by the XSAVE
118 	 * instruction for an XSAVE area containing all the user state
119 	 * components corresponding to bits currently set in XCR0.
120 	 *
121 	 * Stash that off so it can be used to allocate buffers later.
122 	 */
123 	xbuf_size = ebx;
124 
125 	__cpuid_count(CPUID_LEAF_XSTATE, XFEATURE_XTILEDATA,
126 		      eax, ebx, ecx, edx);
127 	/*
128 	 * eax: XTILEDATA state component size
129 	 * ebx: XTILEDATA state component offset in user buffer
130 	 */
131 	if (!eax || !ebx)
132 		fatal_error("xstate cpuid: invalid tile data size/offset: %d/%d",
133 				eax, ebx);
134 
135 	xtiledata.size	      = eax;
136 	xtiledata.xbuf_offset = ebx;
137 }
138 
139 /* The helpers for managing XSAVE buffer and tile states: */
140 
141 struct xsave_buffer *alloc_xbuf(void)
142 {
143 	struct xsave_buffer *xbuf;
144 
145 	/* XSAVE buffer should be 64B-aligned. */
146 	xbuf = aligned_alloc(64, xbuf_size);
147 	if (!xbuf)
148 		fatal_error("aligned_alloc()");
149 	return xbuf;
150 }
151 
152 static inline void clear_xstate_header(struct xsave_buffer *buffer)
153 {
154 	memset(&buffer->header, 0, sizeof(buffer->header));
155 }
156 
157 static inline void set_xstatebv(struct xsave_buffer *buffer, uint64_t bv)
158 {
159 	/* XSTATE_BV is at the beginning of the header: */
160 	*(uint64_t *)(&buffer->header) = bv;
161 }
162 
163 static void set_rand_tiledata(struct xsave_buffer *xbuf)
164 {
165 	int *ptr = (int *)&xbuf->bytes[xtiledata.xbuf_offset];
166 	int data;
167 	int i;
168 
169 	/*
170 	 * Ensure that 'data' is never 0.  This ensures that
171 	 * the registers are never in their initial configuration
172 	 * and thus never tracked as being in the init state.
173 	 */
174 	data = rand() | 1;
175 
176 	for (i = 0; i < xtiledata.size / sizeof(int); i++, ptr++)
177 		*ptr = data;
178 }
179 
180 struct xsave_buffer *stashed_xsave;
181 
182 static void init_stashed_xsave(void)
183 {
184 	stashed_xsave = alloc_xbuf();
185 	if (!stashed_xsave)
186 		fatal_error("failed to allocate stashed_xsave\n");
187 	clear_xstate_header(stashed_xsave);
188 }
189 
190 static void free_stashed_xsave(void)
191 {
192 	free(stashed_xsave);
193 }
194 
195 /* See 'struct _fpx_sw_bytes' at sigcontext.h */
196 #define SW_BYTES_OFFSET		464
197 /* N.B. The struct's field name varies so read from the offset. */
198 #define SW_BYTES_BV_OFFSET	(SW_BYTES_OFFSET + 8)
199 
200 static inline struct _fpx_sw_bytes *get_fpx_sw_bytes(void *buffer)
201 {
202 	return (struct _fpx_sw_bytes *)(buffer + SW_BYTES_OFFSET);
203 }
204 
205 static inline uint64_t get_fpx_sw_bytes_features(void *buffer)
206 {
207 	return *(uint64_t *)(buffer + SW_BYTES_BV_OFFSET);
208 }
209 
210 /* Work around printf() being unsafe in signals: */
211 #define SIGNAL_BUF_LEN 1000
212 char signal_message_buffer[SIGNAL_BUF_LEN];
213 void sig_print(char *msg)
214 {
215 	int left = SIGNAL_BUF_LEN - strlen(signal_message_buffer) - 1;
216 
217 	strncat(signal_message_buffer, msg, left);
218 }
219 
220 static volatile bool noperm_signaled;
221 static int noperm_errs;
222 /*
223  * Signal handler for when AMX is used but
224  * permission has not been obtained.
225  */
226 static void handle_noperm(int sig, siginfo_t *si, void *ctx_void)
227 {
228 	ucontext_t *ctx = (ucontext_t *)ctx_void;
229 	void *xbuf = ctx->uc_mcontext.fpregs;
230 	struct _fpx_sw_bytes *sw_bytes;
231 	uint64_t features;
232 
233 	/* Reset the signal message buffer: */
234 	signal_message_buffer[0] = '\0';
235 	sig_print("\tAt SIGILL handler,\n");
236 
237 	if (si->si_code != ILL_ILLOPC) {
238 		noperm_errs++;
239 		sig_print("[FAIL]\tInvalid signal code.\n");
240 	} else {
241 		sig_print("[OK]\tValid signal code (ILL_ILLOPC).\n");
242 	}
243 
244 	sw_bytes = get_fpx_sw_bytes(xbuf);
245 	/*
246 	 * Without permission, the signal XSAVE buffer should not
247 	 * have room for AMX register state (aka. xtiledata).
248 	 * Check that the size does not overlap with where xtiledata
249 	 * will reside.
250 	 *
251 	 * This also implies that no state components *PAST*
252 	 * XTILEDATA (features >=19) can be present in the buffer.
253 	 */
254 	if (sw_bytes->xstate_size <= xtiledata.xbuf_offset) {
255 		sig_print("[OK]\tValid xstate size\n");
256 	} else {
257 		noperm_errs++;
258 		sig_print("[FAIL]\tInvalid xstate size\n");
259 	}
260 
261 	features = get_fpx_sw_bytes_features(xbuf);
262 	/*
263 	 * Without permission, the XTILEDATA feature
264 	 * bit should not be set.
265 	 */
266 	if ((features & XFEATURE_MASK_XTILEDATA) == 0) {
267 		sig_print("[OK]\tValid xstate mask\n");
268 	} else {
269 		noperm_errs++;
270 		sig_print("[FAIL]\tInvalid xstate mask\n");
271 	}
272 
273 	noperm_signaled = true;
274 	ctx->uc_mcontext.gregs[REG_RIP] += 3; /* Skip the faulting XRSTOR */
275 }
276 
277 /* Return true if XRSTOR is successful; otherwise, false. */
278 static inline bool xrstor_safe(struct xsave_buffer *xbuf, uint64_t mask)
279 {
280 	noperm_signaled = false;
281 	xrstor(xbuf, mask);
282 
283 	/* Print any messages produced by the signal code: */
284 	printf("%s", signal_message_buffer);
285 	/*
286 	 * Reset the buffer to make sure any future printing
287 	 * only outputs new messages:
288 	 */
289 	signal_message_buffer[0] = '\0';
290 
291 	if (noperm_errs)
292 		fatal_error("saw %d errors in noperm signal handler\n", noperm_errs);
293 
294 	return !noperm_signaled;
295 }
296 
297 /*
298  * Use XRSTOR to populate the XTILEDATA registers with
299  * random data.
300  *
301  * Return true if successful; otherwise, false.
302  */
303 static inline bool load_rand_tiledata(struct xsave_buffer *xbuf)
304 {
305 	clear_xstate_header(xbuf);
306 	set_xstatebv(xbuf, XFEATURE_MASK_XTILEDATA);
307 	set_rand_tiledata(xbuf);
308 	return xrstor_safe(xbuf, XFEATURE_MASK_XTILEDATA);
309 }
310 
311 /* Return XTILEDATA to its initial configuration. */
312 static inline void init_xtiledata(void)
313 {
314 	clear_xstate_header(stashed_xsave);
315 	xrstor_safe(stashed_xsave, XFEATURE_MASK_XTILEDATA);
316 }
317 
318 enum expected_result { FAIL_EXPECTED, SUCCESS_EXPECTED };
319 
320 /* arch_prctl() and sigaltstack() test */
321 
322 #define ARCH_GET_XCOMP_SUPP	0x1021
323 #define ARCH_GET_XCOMP_PERM	0x1022
324 #define ARCH_REQ_XCOMP_PERM	0x1023
325 
326 static void req_xtiledata_perm(void)
327 {
328 	syscall(SYS_arch_prctl, ARCH_REQ_XCOMP_PERM, XFEATURE_XTILEDATA);
329 }
330 
331 static void validate_req_xcomp_perm(enum expected_result exp)
332 {
333 	unsigned long bitmask, expected_bitmask;
334 	long rc;
335 
336 	rc = syscall(SYS_arch_prctl, ARCH_GET_XCOMP_PERM, &bitmask);
337 	if (rc) {
338 		fatal_error("prctl(ARCH_GET_XCOMP_PERM) error: %ld", rc);
339 	} else if (!(bitmask & XFEATURE_MASK_XTILECFG)) {
340 		fatal_error("ARCH_GET_XCOMP_PERM returns XFEATURE_XTILECFG off.");
341 	}
342 
343 	rc = syscall(SYS_arch_prctl, ARCH_REQ_XCOMP_PERM, XFEATURE_XTILEDATA);
344 	if (exp == FAIL_EXPECTED) {
345 		if (rc) {
346 			printf("[OK]\tARCH_REQ_XCOMP_PERM saw expected failure..\n");
347 			return;
348 		}
349 
350 		fatal_error("ARCH_REQ_XCOMP_PERM saw unexpected success.\n");
351 	} else if (rc) {
352 		fatal_error("ARCH_REQ_XCOMP_PERM saw unexpected failure.\n");
353 	}
354 
355 	expected_bitmask = bitmask | XFEATURE_MASK_XTILEDATA;
356 
357 	rc = syscall(SYS_arch_prctl, ARCH_GET_XCOMP_PERM, &bitmask);
358 	if (rc) {
359 		fatal_error("prctl(ARCH_GET_XCOMP_PERM) error: %ld", rc);
360 	} else if (bitmask != expected_bitmask) {
361 		fatal_error("ARCH_REQ_XCOMP_PERM set a wrong bitmask: %lx, expected: %lx.\n",
362 			    bitmask, expected_bitmask);
363 	} else {
364 		printf("\tARCH_REQ_XCOMP_PERM is successful.\n");
365 	}
366 }
367 
368 static void validate_xcomp_perm(enum expected_result exp)
369 {
370 	bool load_success = load_rand_tiledata(stashed_xsave);
371 
372 	if (exp == FAIL_EXPECTED) {
373 		if (load_success) {
374 			noperm_errs++;
375 			printf("[FAIL]\tLoad tiledata succeeded.\n");
376 		} else {
377 			printf("[OK]\tLoad tiledata failed.\n");
378 		}
379 	} else if (exp == SUCCESS_EXPECTED) {
380 		if (load_success) {
381 			printf("[OK]\tLoad tiledata succeeded.\n");
382 		} else {
383 			noperm_errs++;
384 			printf("[FAIL]\tLoad tiledata failed.\n");
385 		}
386 	}
387 }
388 
389 #ifndef AT_MINSIGSTKSZ
390 #  define AT_MINSIGSTKSZ	51
391 #endif
392 
393 static void *alloc_altstack(unsigned int size)
394 {
395 	void *altstack;
396 
397 	altstack = mmap(NULL, size, PROT_READ | PROT_WRITE,
398 			MAP_PRIVATE | MAP_ANONYMOUS | MAP_STACK, -1, 0);
399 
400 	if (altstack == MAP_FAILED)
401 		fatal_error("mmap() for altstack");
402 
403 	return altstack;
404 }
405 
406 static void setup_altstack(void *addr, unsigned long size, enum expected_result exp)
407 {
408 	stack_t ss;
409 	int rc;
410 
411 	memset(&ss, 0, sizeof(ss));
412 	ss.ss_size = size;
413 	ss.ss_sp = addr;
414 
415 	rc = sigaltstack(&ss, NULL);
416 
417 	if (exp == FAIL_EXPECTED) {
418 		if (rc) {
419 			printf("[OK]\tsigaltstack() failed.\n");
420 		} else {
421 			fatal_error("sigaltstack() succeeded unexpectedly.\n");
422 		}
423 	} else if (rc) {
424 		fatal_error("sigaltstack()");
425 	}
426 }
427 
428 static void test_dynamic_sigaltstack(void)
429 {
430 	unsigned int small_size, enough_size;
431 	unsigned long minsigstksz;
432 	void *altstack;
433 
434 	minsigstksz = getauxval(AT_MINSIGSTKSZ);
435 	printf("\tAT_MINSIGSTKSZ = %lu\n", minsigstksz);
436 	/*
437 	 * getauxval() itself can return 0 for failure or
438 	 * success.  But, in this case, AT_MINSIGSTKSZ
439 	 * will always return a >=0 value if implemented.
440 	 * Just check for 0.
441 	 */
442 	if (minsigstksz == 0) {
443 		printf("no support for AT_MINSIGSTKSZ, skipping sigaltstack tests\n");
444 		return;
445 	}
446 
447 	enough_size = minsigstksz * 2;
448 
449 	altstack = alloc_altstack(enough_size);
450 	printf("\tAllocate memory for altstack (%u bytes).\n", enough_size);
451 
452 	/*
453 	 * Try setup_altstack() with a size which can not fit
454 	 * XTILEDATA.  ARCH_REQ_XCOMP_PERM should fail.
455 	 */
456 	small_size = minsigstksz - xtiledata.size;
457 	printf("\tAfter sigaltstack() with small size (%u bytes).\n", small_size);
458 	setup_altstack(altstack, small_size, SUCCESS_EXPECTED);
459 	validate_req_xcomp_perm(FAIL_EXPECTED);
460 
461 	/*
462 	 * Try setup_altstack() with a size derived from
463 	 * AT_MINSIGSTKSZ.  It should be more than large enough
464 	 * and thus ARCH_REQ_XCOMP_PERM should succeed.
465 	 */
466 	printf("\tAfter sigaltstack() with enough size (%u bytes).\n", enough_size);
467 	setup_altstack(altstack, enough_size, SUCCESS_EXPECTED);
468 	validate_req_xcomp_perm(SUCCESS_EXPECTED);
469 
470 	/*
471 	 * Try to coerce setup_altstack() to again accept a
472 	 * too-small altstack.  This ensures that big-enough
473 	 * sigaltstacks can not shrink to a too-small value
474 	 * once XTILEDATA permission is established.
475 	 */
476 	printf("\tThen, sigaltstack() with small size (%u bytes).\n", small_size);
477 	setup_altstack(altstack, small_size, FAIL_EXPECTED);
478 }
479 
480 static void test_dynamic_state(void)
481 {
482 	pid_t parent, child, grandchild;
483 
484 	parent = fork();
485 	if (parent < 0) {
486 		/* fork() failed */
487 		fatal_error("fork");
488 	} else if (parent > 0) {
489 		int status;
490 		/* fork() succeeded.  Now in the parent. */
491 
492 		wait(&status);
493 		if (!WIFEXITED(status) || WEXITSTATUS(status))
494 			fatal_error("arch_prctl test parent exit");
495 		return;
496 	}
497 	/* fork() succeeded.  Now in the child . */
498 
499 	printf("[RUN]\tCheck ARCH_REQ_XCOMP_PERM around process fork() and sigaltack() test.\n");
500 
501 	printf("\tFork a child.\n");
502 	child = fork();
503 	if (child < 0) {
504 		fatal_error("fork");
505 	} else if (child > 0) {
506 		int status;
507 
508 		wait(&status);
509 		if (!WIFEXITED(status) || WEXITSTATUS(status))
510 			fatal_error("arch_prctl test child exit");
511 		_exit(0);
512 	}
513 
514 	/*
515 	 * The permission request should fail without an
516 	 * XTILEDATA-compatible signal stack
517 	 */
518 	printf("\tTest XCOMP_PERM at child.\n");
519 	validate_xcomp_perm(FAIL_EXPECTED);
520 
521 	/*
522 	 * Set up an XTILEDATA-compatible signal stack and
523 	 * also obtain permission to populate XTILEDATA.
524 	 */
525 	printf("\tTest dynamic sigaltstack at child:\n");
526 	test_dynamic_sigaltstack();
527 
528 	/* Ensure that XTILEDATA can be populated. */
529 	printf("\tTest XCOMP_PERM again at child.\n");
530 	validate_xcomp_perm(SUCCESS_EXPECTED);
531 
532 	printf("\tFork a grandchild.\n");
533 	grandchild = fork();
534 	if (grandchild < 0) {
535 		/* fork() failed */
536 		fatal_error("fork");
537 	} else if (!grandchild) {
538 		/* fork() succeeded.  Now in the (grand)child. */
539 		printf("\tTest XCOMP_PERM at grandchild.\n");
540 
541 		/*
542 		 * Ensure that the grandchild inherited
543 		 * permission and a compatible sigaltstack:
544 		 */
545 		validate_xcomp_perm(SUCCESS_EXPECTED);
546 	} else {
547 		int status;
548 		/* fork() succeeded.  Now in the parent. */
549 
550 		wait(&status);
551 		if (!WIFEXITED(status) || WEXITSTATUS(status))
552 			fatal_error("fork test grandchild");
553 	}
554 
555 	_exit(0);
556 }
557 
558 static inline int __compare_tiledata_state(struct xsave_buffer *xbuf1, struct xsave_buffer *xbuf2)
559 {
560 	return memcmp(&xbuf1->bytes[xtiledata.xbuf_offset],
561 		      &xbuf2->bytes[xtiledata.xbuf_offset],
562 		      xtiledata.size);
563 }
564 
565 /*
566  * Save current register state and compare it to @xbuf1.'
567  *
568  * Returns false if @xbuf1 matches the registers.
569  * Returns true  if @xbuf1 differs from the registers.
570  */
571 static inline bool __validate_tiledata_regs(struct xsave_buffer *xbuf1)
572 {
573 	struct xsave_buffer *xbuf2;
574 	int ret;
575 
576 	xbuf2 = alloc_xbuf();
577 	if (!xbuf2)
578 		fatal_error("failed to allocate XSAVE buffer\n");
579 
580 	xsave(xbuf2, XFEATURE_MASK_XTILEDATA);
581 	ret = __compare_tiledata_state(xbuf1, xbuf2);
582 
583 	free(xbuf2);
584 
585 	if (ret == 0)
586 		return false;
587 	return true;
588 }
589 
590 static inline void validate_tiledata_regs_same(struct xsave_buffer *xbuf)
591 {
592 	int ret = __validate_tiledata_regs(xbuf);
593 
594 	if (ret != 0)
595 		fatal_error("TILEDATA registers changed");
596 }
597 
598 static inline void validate_tiledata_regs_changed(struct xsave_buffer *xbuf)
599 {
600 	int ret = __validate_tiledata_regs(xbuf);
601 
602 	if (ret == 0)
603 		fatal_error("TILEDATA registers did not change");
604 }
605 
606 /* tiledata inheritance test */
607 
608 static void test_fork(void)
609 {
610 	pid_t child, grandchild;
611 
612 	child = fork();
613 	if (child < 0) {
614 		/* fork() failed */
615 		fatal_error("fork");
616 	} else if (child > 0) {
617 		/* fork() succeeded.  Now in the parent. */
618 		int status;
619 
620 		wait(&status);
621 		if (!WIFEXITED(status) || WEXITSTATUS(status))
622 			fatal_error("fork test child");
623 		return;
624 	}
625 	/* fork() succeeded.  Now in the child. */
626 	printf("[RUN]\tCheck tile data inheritance.\n\tBefore fork(), load tiledata\n");
627 
628 	load_rand_tiledata(stashed_xsave);
629 
630 	grandchild = fork();
631 	if (grandchild < 0) {
632 		/* fork() failed */
633 		fatal_error("fork");
634 	} else if (grandchild > 0) {
635 		/* fork() succeeded.  Still in the first child. */
636 		int status;
637 
638 		wait(&status);
639 		if (!WIFEXITED(status) || WEXITSTATUS(status))
640 			fatal_error("fork test grand child");
641 		_exit(0);
642 	}
643 	/* fork() succeeded.  Now in the (grand)child. */
644 
645 	/*
646 	 * TILEDATA registers are not preserved across fork().
647 	 * Ensure that their value has changed:
648 	 */
649 	validate_tiledata_regs_changed(stashed_xsave);
650 
651 	_exit(0);
652 }
653 
654 /* Context switching test */
655 
656 static struct _ctxtswtest_cfg {
657 	unsigned int iterations;
658 	unsigned int num_threads;
659 } ctxtswtest_config;
660 
661 struct futex_info {
662 	pthread_t thread;
663 	int nr;
664 	pthread_mutex_t mutex;
665 	struct futex_info *next;
666 };
667 
668 static void *check_tiledata(void *info)
669 {
670 	struct futex_info *finfo = (struct futex_info *)info;
671 	struct xsave_buffer *xbuf;
672 	int i;
673 
674 	xbuf = alloc_xbuf();
675 	if (!xbuf)
676 		fatal_error("unable to allocate XSAVE buffer");
677 
678 	/*
679 	 * Load random data into 'xbuf' and then restore
680 	 * it to the tile registers themselves.
681 	 */
682 	load_rand_tiledata(xbuf);
683 	for (i = 0; i < ctxtswtest_config.iterations; i++) {
684 		pthread_mutex_lock(&finfo->mutex);
685 
686 		/*
687 		 * Ensure the register values have not
688 		 * diverged from those recorded in 'xbuf'.
689 		 */
690 		validate_tiledata_regs_same(xbuf);
691 
692 		/* Load new, random values into xbuf and registers */
693 		load_rand_tiledata(xbuf);
694 
695 		/*
696 		 * The last thread's last unlock will be for
697 		 * thread 0's mutex.  However, thread 0 will
698 		 * have already exited the loop and the mutex
699 		 * will already be unlocked.
700 		 *
701 		 * Because this is not an ERRORCHECK mutex,
702 		 * that inconsistency will be silently ignored.
703 		 */
704 		pthread_mutex_unlock(&finfo->next->mutex);
705 	}
706 
707 	free(xbuf);
708 	/*
709 	 * Return this thread's finfo, which is
710 	 * a unique value for this thread.
711 	 */
712 	return finfo;
713 }
714 
715 static int create_threads(int num, struct futex_info *finfo)
716 {
717 	int i;
718 
719 	for (i = 0; i < num; i++) {
720 		int next_nr;
721 
722 		finfo[i].nr = i;
723 		/*
724 		 * Thread 'i' will wait on this mutex to
725 		 * be unlocked.  Lock it immediately after
726 		 * initialization:
727 		 */
728 		pthread_mutex_init(&finfo[i].mutex, NULL);
729 		pthread_mutex_lock(&finfo[i].mutex);
730 
731 		next_nr = (i + 1) % num;
732 		finfo[i].next = &finfo[next_nr];
733 
734 		if (pthread_create(&finfo[i].thread, NULL, check_tiledata, &finfo[i]))
735 			fatal_error("pthread_create()");
736 	}
737 	return 0;
738 }
739 
740 static void affinitize_cpu0(void)
741 {
742 	cpu_set_t cpuset;
743 
744 	CPU_ZERO(&cpuset);
745 	CPU_SET(0, &cpuset);
746 
747 	if (sched_setaffinity(0, sizeof(cpuset), &cpuset) != 0)
748 		fatal_error("sched_setaffinity to CPU 0");
749 }
750 
751 static void test_context_switch(void)
752 {
753 	struct futex_info *finfo;
754 	int i;
755 
756 	/* Affinitize to one CPU to force context switches */
757 	affinitize_cpu0();
758 
759 	req_xtiledata_perm();
760 
761 	printf("[RUN]\tCheck tiledata context switches, %d iterations, %d threads.\n",
762 	       ctxtswtest_config.iterations,
763 	       ctxtswtest_config.num_threads);
764 
765 
766 	finfo = malloc(sizeof(*finfo) * ctxtswtest_config.num_threads);
767 	if (!finfo)
768 		fatal_error("malloc()");
769 
770 	create_threads(ctxtswtest_config.num_threads, finfo);
771 
772 	/*
773 	 * This thread wakes up thread 0
774 	 * Thread 0 will wake up 1
775 	 * Thread 1 will wake up 2
776 	 * ...
777 	 * the last thread will wake up 0
778 	 *
779 	 * ... this will repeat for the configured
780 	 * number of iterations.
781 	 */
782 	pthread_mutex_unlock(&finfo[0].mutex);
783 
784 	/* Wait for all the threads to finish: */
785 	for (i = 0; i < ctxtswtest_config.num_threads; i++) {
786 		void *thread_retval;
787 		int rc;
788 
789 		rc = pthread_join(finfo[i].thread, &thread_retval);
790 
791 		if (rc)
792 			fatal_error("pthread_join() failed for thread %d err: %d\n",
793 					i, rc);
794 
795 		if (thread_retval != &finfo[i])
796 			fatal_error("unexpected thread retval for thread %d: %p\n",
797 					i, thread_retval);
798 
799 	}
800 
801 	printf("[OK]\tNo incorrect case was found.\n");
802 
803 	free(finfo);
804 }
805 
806 /* Ptrace test */
807 
808 /*
809  * Make sure the ptracee has the expanded kernel buffer on the first
810  * use. Then, initialize the state before performing the state
811  * injection from the ptracer.
812  */
813 static inline void ptracee_firstuse_tiledata(void)
814 {
815 	load_rand_tiledata(stashed_xsave);
816 	init_xtiledata();
817 }
818 
819 /*
820  * Ptracer injects the randomized tile data state. It also reads
821  * before and after that, which will execute the kernel's state copy
822  * functions. So, the tester is advised to double-check any emitted
823  * kernel messages.
824  */
825 static void ptracer_inject_tiledata(pid_t target)
826 {
827 	struct xsave_buffer *xbuf;
828 	struct iovec iov;
829 
830 	xbuf = alloc_xbuf();
831 	if (!xbuf)
832 		fatal_error("unable to allocate XSAVE buffer");
833 
834 	printf("\tRead the init'ed tiledata via ptrace().\n");
835 
836 	iov.iov_base = xbuf;
837 	iov.iov_len = xbuf_size;
838 
839 	memset(stashed_xsave, 0, xbuf_size);
840 
841 	if (ptrace(PTRACE_GETREGSET, target, (uint32_t)NT_X86_XSTATE, &iov))
842 		fatal_error("PTRACE_GETREGSET");
843 
844 	if (!__compare_tiledata_state(stashed_xsave, xbuf))
845 		printf("[OK]\tThe init'ed tiledata was read from ptracee.\n");
846 	else
847 		printf("[FAIL]\tThe init'ed tiledata was not read from ptracee.\n");
848 
849 	printf("\tInject tiledata via ptrace().\n");
850 
851 	load_rand_tiledata(xbuf);
852 
853 	memcpy(&stashed_xsave->bytes[xtiledata.xbuf_offset],
854 	       &xbuf->bytes[xtiledata.xbuf_offset],
855 	       xtiledata.size);
856 
857 	if (ptrace(PTRACE_SETREGSET, target, (uint32_t)NT_X86_XSTATE, &iov))
858 		fatal_error("PTRACE_SETREGSET");
859 
860 	if (ptrace(PTRACE_GETREGSET, target, (uint32_t)NT_X86_XSTATE, &iov))
861 		fatal_error("PTRACE_GETREGSET");
862 
863 	if (!__compare_tiledata_state(stashed_xsave, xbuf))
864 		printf("[OK]\tTiledata was correctly written to ptracee.\n");
865 	else
866 		printf("[FAIL]\tTiledata was not correctly written to ptracee.\n");
867 }
868 
869 static void test_ptrace(void)
870 {
871 	pid_t child;
872 	int status;
873 
874 	child = fork();
875 	if (child < 0) {
876 		err(1, "fork");
877 	} else if (!child) {
878 		if (ptrace(PTRACE_TRACEME, 0, NULL, NULL))
879 			err(1, "PTRACE_TRACEME");
880 
881 		ptracee_firstuse_tiledata();
882 
883 		raise(SIGTRAP);
884 		_exit(0);
885 	}
886 
887 	do {
888 		wait(&status);
889 	} while (WSTOPSIG(status) != SIGTRAP);
890 
891 	ptracer_inject_tiledata(child);
892 
893 	ptrace(PTRACE_DETACH, child, NULL, NULL);
894 	wait(&status);
895 	if (!WIFEXITED(status) || WEXITSTATUS(status))
896 		err(1, "ptrace test");
897 }
898 
899 int main(void)
900 {
901 	unsigned long features;
902 	long rc;
903 
904 	rc = syscall(SYS_arch_prctl, ARCH_GET_XCOMP_SUPP, &features);
905 	if (rc || (features & XFEATURE_MASK_XTILE) != XFEATURE_MASK_XTILE) {
906 		ksft_print_msg("no AMX support\n");
907 		return KSFT_SKIP;
908 	}
909 
910 	check_cpuid_xtiledata();
911 
912 	init_stashed_xsave();
913 	sethandler(SIGILL, handle_noperm, 0);
914 
915 	test_dynamic_state();
916 
917 	/* Request permission for the following tests */
918 	req_xtiledata_perm();
919 
920 	test_fork();
921 
922 	ctxtswtest_config.iterations = 10;
923 	ctxtswtest_config.num_threads = 5;
924 	test_context_switch();
925 
926 	test_ptrace();
927 
928 	clearhandler(SIGILL);
929 	free_stashed_xsave();
930 
931 	return 0;
932 }
933