xref: /freebsd/lib/libc/amd64/amd64_archlevel.h (revision a8089ea5aee578e08acab2438e82fc9a9ae50ed8)
1 /*-
2  * Copyright (c) 2023 The FreeBSD Foundation
3  *
4  * This software was developed by Robert Clausecker <fuz@FreeBSD.org>
5  * under sponsorship from the FreeBSD Foundation.
6  *
7  * Redistribution and use in source and binary forms, with or without
8  * modification, are permitted provided that the following conditions
9  * are met:
10  * 1. Redistributions of source code must retain the above copyright
11  *    notice, this list of conditions and the following disclaimer.
12  * 2. Redistributions in binary form must reproduce the above copyright
13  *    notice, this list of conditions and the following disclaimer in the
14  *    documentation and/or other materials provided with the distribution.
15  *
16  * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ''AS IS'' AND
17  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
18  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
19  * ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
20  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
21  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
22  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
23  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
24  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
25  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
26  * SUCH DAMAGE
27  */
28 
29 /* must be macros so they can be accessed from assembly */
/*
 * Architecture levels.  The values are consecutive integers from 0 up to
 * X86_64_MAX; the per-function tables declared further down in this file
 * hold X86_64_MAX + 1 32-bit entries (presumably one slot per level,
 * indexed by these values -- confirm against __archlevel_resolve).
 * X86_64_UNDEFINED lies outside that range.
 */
30 #define X86_64_SCALAR    0 /* disable SIMD optimisations */
31 #define	X86_64_BASELINE  1 /* CMOV, CX8, FPU, FXSR, MMX, OSFXSR, SSE, SSE2 */
32 #define	X86_64_V2        2 /* CMPXCHG16B, LAHF-SAHF, POPCNT, SSE3, SSSE3, SSE4_1, SSE4_2 */
33 #define	X86_64_V3        3 /* AVX, AVX2, BMI1, BMI2, F16C, FMA, LZCNT, MOVBE, OSXSAVE */
34 #define	X86_64_V4        4 /* AVX512F, AVX512BW, AVX512CD, AVX512DQ, AVX512VL */
35 
36 #define	X86_64_MAX       X86_64_V4 /* highest supported architecture level */
37 #define	X86_64_UNDEFINED -1 /* architecture level not set yet */
38 
39 #ifndef __ASSEMBLER__
40 #include <dlfcn.h>
41 
/*
 * Common back end of the resolver stubs emitted by ARCHRESOLVE().  A stub
 * jumps here with its own first four integer arguments left untouched and
 * with the address of the function's func_funcs table (X86_64_MAX + 1
 * 32-bit offsets) as the fifth argument.
 *
 * NOTE(review): presumably returns the implementation selected from that
 * table; the definition is not in this file -- confirm there.
 * NOTE(review): u_int and int32_t are used here but only <dlfcn.h> is
 * included; assumes the includer has already pulled in <sys/types.h> --
 * confirm.
 */
42 dlfunc_t	__archlevel_resolve(u_int, u_int, u_int, u_int,
43 		    int32_t[X86_64_MAX + 1]) __hidden;
44 #else
45 #include <machine/asm.h>
46 
/*
 * ARCHRESOLVE(func): publish func as a GNU indirect function.
 *
 * The public symbol func is made global, typed @gnu_indirect_function and
 * set equal to the stub func_resolver, which is emitted right here via
 * ARCHENTRY/ARCHEND.  The stub only loads the address of func_funcs into
 * %r8 (RIP-relative) and then jumps -- not calls -- to
 * __archlevel_resolve, so all other registers reach it exactly as the
 * stub received them and its return goes straight back to the stub's
 * caller.
 *
 * The func_funcs label itself is not defined by this macro; see
 * ARCHFUNCS().
 */
47 #define ARCHRESOLVE(func) \
48 	.globl CNAME(func); \
49 	.type CNAME(func), @gnu_indirect_function; \
50 	.set CNAME(func), __CONCAT(func,_resolver); \
51 	ARCHENTRY(func, resolver); \
52 	lea __CONCAT(func,_funcs)(%rip), %r8; \
53 	jmp CNAME(__archlevel_resolve); \
54 	ARCHEND(func, resolver)
55 
56 /*
57  * The func_funcs array stores the location of the implementations
58  * as the distance from the func_funcs array to the function.  Due
59  * to compiling for the medium code model, a 32 bit integer suffices
60  * to hold the distance.
61  *
62  * Doing it this way both saves storage and avoids giving rtld
63  * relocations to process at load time.
64  */
/*
 * ARCHFUNCS(func): emit the resolver stub for func (ARCHRESOLVE), then
 * switch to .rodata, apply .align 4 and define the label func_funcs.
 *
 * The macro ends with the assembler still in .rodata, positioned at the
 * first table slot.  The table entries are expected to follow as
 * ARCHFUNC()/NOARCHFUNC lines and to be closed by ENDARCHFUNCS(func),
 * which measures the table from the func_funcs label defined here.
 */
65 #define ARCHFUNCS(func) \
66 	ARCHRESOLVE(func); \
67 	.section .rodata; \
68 	.align 4; \
69 	__CONCAT(func,_funcs):
70 
/*
 * NOARCHFUNC: one 4-byte table entry holding 0.  This is the same value
 * that the zero padding added by ENDARCHFUNCS() leaves in unused slots.
 * NOTE(review): presumably __archlevel_resolve reads 0 as "no
 * implementation at this level" -- confirm in its definition.
 */
71 #define NOARCHFUNC \
72 	.4byte 0
73 
/*
 * ARCHFUNC(func, level): one 4-byte table entry holding the distance from
 * the start of the table (label func_funcs) to the implementation whose
 * label is func_level, i.e. the name ARCHENTRY(func, level) defines.
 */
74 #define ARCHFUNC(func, level) \
75 	.4byte __CONCAT(__CONCAT(func,_),level) - __CONCAT(func,_funcs)
76 
/*
 * ENDARCHFUNCS(func): close the func_funcs table.
 *
 * (. - func_funcs) is the number of bytes emitted since the table label,
 * so the .zero directive appends however many zero bytes are still
 * missing to reach 4 * (X86_64_MAX + 1) bytes, i.e. X86_64_MAX + 1
 * entries of 4 bytes.  The .size directive then records the resulting
 * length as the size of the func_funcs symbol.
 */
77 #define ENDARCHFUNCS(func) \
78 	.zero 4*(X86_64_MAX+1)-(.-__CONCAT(func,_funcs)); \
79 	.size __CONCAT(func,_funcs), .-__CONCAT(func,_funcs)
80 
/*
 * ARCHENTRY(func, level): open the function whose label is func_level.
 *
 * Expands _START_ENTRY (from <machine/asm.h>; presumably selects the text
 * section and aligns the entry point -- confirm there), marks func_level
 * as an @function symbol, defines the label and starts a CFI procedure.
 * No .globl is emitted here, so this macro by itself does not export the
 * label.  Must be paired with ARCHEND(func, level).
 */
81 #define ARCHENTRY(func, level) \
82 	_START_ENTRY; \
83 	.type __CONCAT(__CONCAT(func,_),level), @function; \
84 	__CONCAT(__CONCAT(func,_),level):; \
85 	.cfi_startproc
86 
/*
 * ARCHEND(func, level): close the function opened by
 * ARCHENTRY(func, level) by handing its label func_level to END() from
 * <machine/asm.h>.
 * NOTE(review): END() presumably ends the CFI procedure started by
 * ARCHENTRY and sets the symbol size -- confirm in <machine/asm.h>.
 */
87 #define ARCHEND(func, level) \
88 	END(__CONCAT(__CONCAT(func,_),level))
89 
90 #endif  /* __ASSEMBLER__ */
91