1 /* SPDX-License-Identifier: GPL-2.0 */
2 /*
3  * From PPR Vol 1 for AMD Family 19h Model 01h B1
4  * 55898 Rev 0.35 - Feb 5, 2021
5  */
6 
7 #include "msr-index.h"
8 
/*
 * IBS_OP_DATA2 DataSrc
 *
 * Data source encodings for the IBS Op Data 2 register (see
 * union ibs_op_data2). Every value listed here fits in three bits, which is
 * the width of the data_src_lo field of that union.
 */
#define IBS_DATA_SRC_LOC_CACHE			 2
#define IBS_DATA_SRC_DRAM			 3
#define IBS_DATA_SRC_REM_CACHE			 4
#define IBS_DATA_SRC_IO				 7
14 
/*
 * IBS_OP_DATA2 DataSrc Extension
 *
 * Extended data source encodings. Values such as 8 and 12 do not fit in the
 * three-bit data_src_lo field of union ibs_op_data2, so they cannot be
 * carried by that field alone.
 * NOTE(review): presumably the extended value is assembled from data_src_hi
 * and data_src_lo together - confirm against the PPR and the consumers of
 * these macros.
 */
#define IBS_DATA_SRC_EXT_LOC_CACHE		 1
#define IBS_DATA_SRC_EXT_NEAR_CCX_CACHE		 2
#define IBS_DATA_SRC_EXT_DRAM			 3
#define IBS_DATA_SRC_EXT_FAR_CCX_CACHE		 5
#define IBS_DATA_SRC_EXT_PMEM			 6
#define IBS_DATA_SRC_EXT_IO			 7
#define IBS_DATA_SRC_EXT_EXT_MEM		 8
#define IBS_DATA_SRC_EXT_PEER_AGENT_MEM		12
24 
25 /*
26  * IBS Hardware MSRs
27  */
28 
29 /* MSR 0xc0011030: IBS Fetch Control */
30 union ibs_fetch_ctl {
31 	__u64 val;
32 	struct {
33 		__u64	fetch_maxcnt:16,/* 0-15: instruction fetch max. count */
34 			fetch_cnt:16,	/* 16-31: instruction fetch count */
35 			fetch_lat:16,	/* 32-47: instruction fetch latency */
36 			fetch_en:1,	/* 48: instruction fetch enable */
37 			fetch_val:1,	/* 49: instruction fetch valid */
38 			fetch_comp:1,	/* 50: instruction fetch complete */
39 			ic_miss:1,	/* 51: i-cache miss */
40 			phy_addr_valid:1,/* 52: physical address valid */
41 			l1tlb_pgsz:2,	/* 53-54: i-cache L1TLB page size
42 					 *	  (needs IbsPhyAddrValid) */
43 			l1tlb_miss:1,	/* 55: i-cache fetch missed in L1TLB */
44 			l2tlb_miss:1,	/* 56: i-cache fetch missed in L2TLB */
45 			rand_en:1,	/* 57: random tagging enable */
46 			fetch_l2_miss:1,/* 58: L2 miss for sampled fetch
47 					 *      (needs IbsFetchComp) */
48 			l3_miss_only:1,	/* 59: Collect L3 miss samples only */
49 			fetch_oc_miss:1,/* 60: Op cache miss for the sampled fetch */
50 			fetch_l3_miss:1,/* 61: L3 cache miss for the sampled fetch */
51 			reserved:2;	/* 62-63: reserved */
52 	};
53 };
54 
55 /* MSR 0xc0011033: IBS Execution Control */
56 union ibs_op_ctl {
57 	__u64 val;
58 	struct {
59 		__u64	opmaxcnt:16,	/* 0-15: periodic op max. count */
60 			l3_miss_only:1,	/* 16: Collect L3 miss samples only */
61 			op_en:1,	/* 17: op sampling enable */
62 			op_val:1,	/* 18: op sample valid */
63 			cnt_ctl:1,	/* 19: periodic op counter control */
64 			opmaxcnt_ext:7,	/* 20-26: upper 7 bits of periodic op maximum count */
65 			reserved0:5,	/* 27-31: reserved */
66 			opcurcnt:27,	/* 32-58: periodic op counter current count */
67 			ldlat_thrsh:4,	/* 59-62: Load Latency threshold */
68 			ldlat_en:1;	/* 63: Load Latency enabled */
69 	};
70 };
71 
72 /* MSR 0xc0011035: IBS Op Data 1 */
73 union ibs_op_data {
74 	__u64 val;
75 	struct {
76 		__u64	comp_to_ret_ctr:16,	/* 0-15: op completion to retire count */
77 			tag_to_ret_ctr:16,	/* 15-31: op tag to retire count */
78 			reserved1:2,		/* 32-33: reserved */
79 			op_return:1,		/* 34: return op */
80 			op_brn_taken:1,		/* 35: taken branch op */
81 			op_brn_misp:1,		/* 36: mispredicted branch op */
82 			op_brn_ret:1,		/* 37: branch op retired */
83 			op_rip_invalid:1,	/* 38: RIP is invalid */
84 			op_brn_fuse:1,		/* 39: fused branch op */
85 			op_microcode:1,		/* 40: microcode op */
86 			reserved2:23;		/* 41-63: reserved */
87 	};
88 };
89 
90 /* MSR 0xc0011036: IBS Op Data 2 */
91 union ibs_op_data2 {
92 	__u64 val;
93 	struct {
94 		__u64	data_src_lo:3,	/* 0-2: data source low */
95 			reserved0:1,	/* 3: reserved */
96 			rmt_node:1,	/* 4: destination node */
97 			cache_hit_st:1,	/* 5: cache hit state */
98 			data_src_hi:2,	/* 6-7: data source high */
99 			reserved1:56;	/* 8-63: reserved */
100 	};
101 };
102 
103 /* MSR 0xc0011037: IBS Op Data 3 */
104 union ibs_op_data3 {
105 	__u64 val;
106 	struct {
107 		__u64	ld_op:1,			/* 0: load op */
108 			st_op:1,			/* 1: store op */
109 			dc_l1tlb_miss:1,		/* 2: data cache L1TLB miss */
110 			dc_l2tlb_miss:1,		/* 3: data cache L2TLB hit in 2M page */
111 			dc_l1tlb_hit_2m:1,		/* 4: data cache L1TLB hit in 2M page */
112 			dc_l1tlb_hit_1g:1,		/* 5: data cache L1TLB hit in 1G page */
113 			dc_l2tlb_hit_2m:1,		/* 6: data cache L2TLB hit in 2M page */
114 			dc_miss:1,			/* 7: data cache miss */
115 			dc_mis_acc:1,			/* 8: misaligned access */
116 			reserved:4,			/* 9-12: reserved */
117 			dc_wc_mem_acc:1,		/* 13: write combining memory access */
118 			dc_uc_mem_acc:1,		/* 14: uncacheable memory access */
119 			dc_locked_op:1,			/* 15: locked operation */
120 			dc_miss_no_mab_alloc:1,		/* 16: DC miss with no MAB allocated */
121 			dc_lin_addr_valid:1,		/* 17: data cache linear address valid */
122 			dc_phy_addr_valid:1,		/* 18: data cache physical address valid */
123 			dc_l2_tlb_hit_1g:1,		/* 19: data cache L2 hit in 1GB page */
124 			l2_miss:1,			/* 20: L2 cache miss */
125 			sw_pf:1,			/* 21: software prefetch */
126 			op_mem_width:4,			/* 22-25: load/store size in bytes */
127 			op_dc_miss_open_mem_reqs:6,	/* 26-31: outstanding mem reqs on DC fill */
128 			dc_miss_lat:16,			/* 32-47: data cache miss latency */
129 			tlb_refill_lat:16;		/* 48-63: L1 TLB refill latency */
130 	};
131 };
132 
133 /* MSR 0xc001103c: IBS Fetch Control Extended */
134 union ic_ibs_extd_ctl {
135 	__u64 val;
136 	struct {
137 		__u64	itlb_refill_lat:16,	/* 0-15: ITLB Refill latency for sampled fetch */
138 			reserved:48;		/* 16-63: reserved */
139 	};
140 };
141 
142 /*
143  * IBS driver related
144  */
145 
/*
 * Container for one set of IBS data: a size word, a 32-bit slot that can be
 * viewed either as 'caps' or as the start of a u32 data buffer, and an array
 * of 64-bit register values.
 *
 * NOTE(review): the unit of 'size' (bytes vs. words) and which MSR ends up in
 * which regs[] slot are not visible in this header - confirm against the
 * code that fills this struct.
 */
struct perf_ibs_data {
	u32		size;
	/*
	 * data[] is a zero-length array, so it occupies no storage of its own
	 * and shares its offset with 'caps'; it only marks where the u32 view
	 * of the buffer begins.
	 */
	union {
		u32	data[0];	/* data buffer starts here */
		u32	caps;
	};
	/*
	 * One 64-bit slot per register, sized by MSR_AMD64_IBS_REG_COUNT_MAX
	 * (not defined in this file; presumably provided by msr-index.h).
	 */
	u64		regs[MSR_AMD64_IBS_REG_COUNT_MAX];
};
154