xref: /linux/tools/arch/x86/include/asm/amd/ibs.h (revision 7c7f9dd1ea3fc6b175b7227bb473dc883b925548)
1c1ab4ce3SIngo Molnar /* SPDX-License-Identifier: GPL-2.0 */
2*bb6b4143SArnaldo Carvalho de Melo #ifndef _ASM_X86_AMD_IBS_H
3*bb6b4143SArnaldo Carvalho de Melo #define _ASM_X86_AMD_IBS_H
4*bb6b4143SArnaldo Carvalho de Melo 
5c1ab4ce3SIngo Molnar /*
6c1ab4ce3SIngo Molnar  * From PPR Vol 1 for AMD Family 19h Model 01h B1
7c1ab4ce3SIngo Molnar  * 55898 Rev 0.35 - Feb 5, 2021
8c1ab4ce3SIngo Molnar  */
9c1ab4ce3SIngo Molnar 
10c1ab4ce3SIngo Molnar #include "../msr-index.h"
11c1ab4ce3SIngo Molnar 
12c1ab4ce3SIngo Molnar /* IBS_OP_DATA2 DataSrc */
13c1ab4ce3SIngo Molnar #define IBS_DATA_SRC_LOC_CACHE			 2
14c1ab4ce3SIngo Molnar #define IBS_DATA_SRC_DRAM			 3
15c1ab4ce3SIngo Molnar #define IBS_DATA_SRC_REM_CACHE			 4
16c1ab4ce3SIngo Molnar #define IBS_DATA_SRC_IO				 7
17c1ab4ce3SIngo Molnar 
18c1ab4ce3SIngo Molnar /* IBS_OP_DATA2 DataSrc Extension */
19c1ab4ce3SIngo Molnar #define IBS_DATA_SRC_EXT_LOC_CACHE		 1
20c1ab4ce3SIngo Molnar #define IBS_DATA_SRC_EXT_NEAR_CCX_CACHE		 2
21c1ab4ce3SIngo Molnar #define IBS_DATA_SRC_EXT_DRAM			 3
22c1ab4ce3SIngo Molnar #define IBS_DATA_SRC_EXT_FAR_CCX_CACHE		 5
23c1ab4ce3SIngo Molnar #define IBS_DATA_SRC_EXT_PMEM			 6
24c1ab4ce3SIngo Molnar #define IBS_DATA_SRC_EXT_IO			 7
25c1ab4ce3SIngo Molnar #define IBS_DATA_SRC_EXT_EXT_MEM		 8
26c1ab4ce3SIngo Molnar #define IBS_DATA_SRC_EXT_PEER_AGENT_MEM		12
27c1ab4ce3SIngo Molnar 
28c1ab4ce3SIngo Molnar /*
29c1ab4ce3SIngo Molnar  * IBS Hardware MSRs
30c1ab4ce3SIngo Molnar  */
31c1ab4ce3SIngo Molnar 
32c1ab4ce3SIngo Molnar /* MSR 0xc0011030: IBS Fetch Control */
33c1ab4ce3SIngo Molnar union ibs_fetch_ctl {
34c1ab4ce3SIngo Molnar 	__u64 val;
35c1ab4ce3SIngo Molnar 	struct {
36c1ab4ce3SIngo Molnar 		__u64	fetch_maxcnt:16,/* 0-15: instruction fetch max. count */
37c1ab4ce3SIngo Molnar 			fetch_cnt:16,	/* 16-31: instruction fetch count */
38c1ab4ce3SIngo Molnar 			fetch_lat:16,	/* 32-47: instruction fetch latency */
39c1ab4ce3SIngo Molnar 			fetch_en:1,	/* 48: instruction fetch enable */
40c1ab4ce3SIngo Molnar 			fetch_val:1,	/* 49: instruction fetch valid */
41c1ab4ce3SIngo Molnar 			fetch_comp:1,	/* 50: instruction fetch complete */
42c1ab4ce3SIngo Molnar 			ic_miss:1,	/* 51: i-cache miss */
43c1ab4ce3SIngo Molnar 			phy_addr_valid:1,/* 52: physical address valid */
44c1ab4ce3SIngo Molnar 			l1tlb_pgsz:2,	/* 53-54: i-cache L1TLB page size
45c1ab4ce3SIngo Molnar 					 *	  (needs IbsPhyAddrValid) */
46c1ab4ce3SIngo Molnar 			l1tlb_miss:1,	/* 55: i-cache fetch missed in L1TLB */
47c1ab4ce3SIngo Molnar 			l2tlb_miss:1,	/* 56: i-cache fetch missed in L2TLB */
48c1ab4ce3SIngo Molnar 			rand_en:1,	/* 57: random tagging enable */
49c1ab4ce3SIngo Molnar 			fetch_l2_miss:1,/* 58: L2 miss for sampled fetch
50c1ab4ce3SIngo Molnar 					 *      (needs IbsFetchComp) */
51c1ab4ce3SIngo Molnar 			l3_miss_only:1,	/* 59: Collect L3 miss samples only */
52c1ab4ce3SIngo Molnar 			fetch_oc_miss:1,/* 60: Op cache miss for the sampled fetch */
53c1ab4ce3SIngo Molnar 			fetch_l3_miss:1,/* 61: L3 cache miss for the sampled fetch */
54c1ab4ce3SIngo Molnar 			reserved:2;	/* 62-63: reserved */
55c1ab4ce3SIngo Molnar 	};
56c1ab4ce3SIngo Molnar };
57c1ab4ce3SIngo Molnar 
58c1ab4ce3SIngo Molnar /* MSR 0xc0011033: IBS Execution Control */
59c1ab4ce3SIngo Molnar union ibs_op_ctl {
60c1ab4ce3SIngo Molnar 	__u64 val;
61c1ab4ce3SIngo Molnar 	struct {
62c1ab4ce3SIngo Molnar 		__u64	opmaxcnt:16,	/* 0-15: periodic op max. count */
63c1ab4ce3SIngo Molnar 			l3_miss_only:1,	/* 16: Collect L3 miss samples only */
64c1ab4ce3SIngo Molnar 			op_en:1,	/* 17: op sampling enable */
65c1ab4ce3SIngo Molnar 			op_val:1,	/* 18: op sample valid */
66c1ab4ce3SIngo Molnar 			cnt_ctl:1,	/* 19: periodic op counter control */
67c1ab4ce3SIngo Molnar 			opmaxcnt_ext:7,	/* 20-26: upper 7 bits of periodic op maximum count */
68c1ab4ce3SIngo Molnar 			reserved0:5,	/* 27-31: reserved */
69c1ab4ce3SIngo Molnar 			opcurcnt:27,	/* 32-58: periodic op counter current count */
70c1ab4ce3SIngo Molnar 			ldlat_thrsh:4,	/* 59-62: Load Latency threshold */
71c1ab4ce3SIngo Molnar 			ldlat_en:1;	/* 63: Load Latency enabled */
72c1ab4ce3SIngo Molnar 	};
73c1ab4ce3SIngo Molnar };
74c1ab4ce3SIngo Molnar 
75c1ab4ce3SIngo Molnar /* MSR 0xc0011035: IBS Op Data 1 */
76c1ab4ce3SIngo Molnar union ibs_op_data {
77c1ab4ce3SIngo Molnar 	__u64 val;
78c1ab4ce3SIngo Molnar 	struct {
79c1ab4ce3SIngo Molnar 		__u64	comp_to_ret_ctr:16,	/* 0-15: op completion to retire count */
80c1ab4ce3SIngo Molnar 			tag_to_ret_ctr:16,	/* 15-31: op tag to retire count */
81c1ab4ce3SIngo Molnar 			reserved1:2,		/* 32-33: reserved */
82c1ab4ce3SIngo Molnar 			op_return:1,		/* 34: return op */
83c1ab4ce3SIngo Molnar 			op_brn_taken:1,		/* 35: taken branch op */
84c1ab4ce3SIngo Molnar 			op_brn_misp:1,		/* 36: mispredicted branch op */
85c1ab4ce3SIngo Molnar 			op_brn_ret:1,		/* 37: branch op retired */
86c1ab4ce3SIngo Molnar 			op_rip_invalid:1,	/* 38: RIP is invalid */
87c1ab4ce3SIngo Molnar 			op_brn_fuse:1,		/* 39: fused branch op */
88c1ab4ce3SIngo Molnar 			op_microcode:1,		/* 40: microcode op */
89c1ab4ce3SIngo Molnar 			reserved2:23;		/* 41-63: reserved */
90c1ab4ce3SIngo Molnar 	};
91c1ab4ce3SIngo Molnar };
92c1ab4ce3SIngo Molnar 
93c1ab4ce3SIngo Molnar /* MSR 0xc0011036: IBS Op Data 2 */
94c1ab4ce3SIngo Molnar union ibs_op_data2 {
95c1ab4ce3SIngo Molnar 	__u64 val;
96c1ab4ce3SIngo Molnar 	struct {
97c1ab4ce3SIngo Molnar 		__u64	data_src_lo:3,	/* 0-2: data source low */
98c1ab4ce3SIngo Molnar 			reserved0:1,	/* 3: reserved */
99c1ab4ce3SIngo Molnar 			rmt_node:1,	/* 4: destination node */
100c1ab4ce3SIngo Molnar 			cache_hit_st:1,	/* 5: cache hit state */
101c1ab4ce3SIngo Molnar 			data_src_hi:2,	/* 6-7: data source high */
102c1ab4ce3SIngo Molnar 			reserved1:56;	/* 8-63: reserved */
103c1ab4ce3SIngo Molnar 	};
104c1ab4ce3SIngo Molnar };
105c1ab4ce3SIngo Molnar 
106c1ab4ce3SIngo Molnar /* MSR 0xc0011037: IBS Op Data 3 */
107c1ab4ce3SIngo Molnar union ibs_op_data3 {
108c1ab4ce3SIngo Molnar 	__u64 val;
109c1ab4ce3SIngo Molnar 	struct {
110c1ab4ce3SIngo Molnar 		__u64	ld_op:1,			/* 0: load op */
111c1ab4ce3SIngo Molnar 			st_op:1,			/* 1: store op */
112c1ab4ce3SIngo Molnar 			dc_l1tlb_miss:1,		/* 2: data cache L1TLB miss */
113c1ab4ce3SIngo Molnar 			dc_l2tlb_miss:1,		/* 3: data cache L2TLB hit in 2M page */
114c1ab4ce3SIngo Molnar 			dc_l1tlb_hit_2m:1,		/* 4: data cache L1TLB hit in 2M page */
115c1ab4ce3SIngo Molnar 			dc_l1tlb_hit_1g:1,		/* 5: data cache L1TLB hit in 1G page */
116c1ab4ce3SIngo Molnar 			dc_l2tlb_hit_2m:1,		/* 6: data cache L2TLB hit in 2M page */
117c1ab4ce3SIngo Molnar 			dc_miss:1,			/* 7: data cache miss */
118c1ab4ce3SIngo Molnar 			dc_mis_acc:1,			/* 8: misaligned access */
119c1ab4ce3SIngo Molnar 			reserved:4,			/* 9-12: reserved */
120c1ab4ce3SIngo Molnar 			dc_wc_mem_acc:1,		/* 13: write combining memory access */
121c1ab4ce3SIngo Molnar 			dc_uc_mem_acc:1,		/* 14: uncacheable memory access */
122c1ab4ce3SIngo Molnar 			dc_locked_op:1,			/* 15: locked operation */
123c1ab4ce3SIngo Molnar 			dc_miss_no_mab_alloc:1,		/* 16: DC miss with no MAB allocated */
124c1ab4ce3SIngo Molnar 			dc_lin_addr_valid:1,		/* 17: data cache linear address valid */
125c1ab4ce3SIngo Molnar 			dc_phy_addr_valid:1,		/* 18: data cache physical address valid */
126c1ab4ce3SIngo Molnar 			dc_l2_tlb_hit_1g:1,		/* 19: data cache L2 hit in 1GB page */
127c1ab4ce3SIngo Molnar 			l2_miss:1,			/* 20: L2 cache miss */
128c1ab4ce3SIngo Molnar 			sw_pf:1,			/* 21: software prefetch */
129c1ab4ce3SIngo Molnar 			op_mem_width:4,			/* 22-25: load/store size in bytes */
130c1ab4ce3SIngo Molnar 			op_dc_miss_open_mem_reqs:6,	/* 26-31: outstanding mem reqs on DC fill */
131c1ab4ce3SIngo Molnar 			dc_miss_lat:16,			/* 32-47: data cache miss latency */
132c1ab4ce3SIngo Molnar 			tlb_refill_lat:16;		/* 48-63: L1 TLB refill latency */
133c1ab4ce3SIngo Molnar 	};
134c1ab4ce3SIngo Molnar };
135c1ab4ce3SIngo Molnar 
136c1ab4ce3SIngo Molnar /* MSR 0xc001103c: IBS Fetch Control Extended */
137c1ab4ce3SIngo Molnar union ic_ibs_extd_ctl {
138c1ab4ce3SIngo Molnar 	__u64 val;
139c1ab4ce3SIngo Molnar 	struct {
140c1ab4ce3SIngo Molnar 		__u64	itlb_refill_lat:16,	/* 0-15: ITLB Refill latency for sampled fetch */
141c1ab4ce3SIngo Molnar 			reserved:48;		/* 16-63: reserved */
142c1ab4ce3SIngo Molnar 	};
143c1ab4ce3SIngo Molnar };
144c1ab4ce3SIngo Molnar 
145c1ab4ce3SIngo Molnar /*
146c1ab4ce3SIngo Molnar  * IBS driver related
147c1ab4ce3SIngo Molnar  */
148c1ab4ce3SIngo Molnar 
149c1ab4ce3SIngo Molnar struct perf_ibs_data {
150c1ab4ce3SIngo Molnar 	u32		size;
151c1ab4ce3SIngo Molnar 	union {
152c1ab4ce3SIngo Molnar 		u32	data[0];	/* data buffer starts here */
153c1ab4ce3SIngo Molnar 		u32	caps;
154c1ab4ce3SIngo Molnar 	};
155c1ab4ce3SIngo Molnar 	u64		regs[MSR_AMD64_IBS_REG_COUNT_MAX];
156c1ab4ce3SIngo Molnar };
157*bb6b4143SArnaldo Carvalho de Melo 
158*bb6b4143SArnaldo Carvalho de Melo #endif /* _ASM_X86_AMD_IBS_H */
159