Blame view

arch/x86/kernel/cpu/perf_event_p4.c 42.8 KB
a072738e0   Cyrill Gorcunov   perf, x86: Implem...
1
  /*
0d2eb44f6   Lucas De Marchi   x86: Fix common m...
2
   * Netburst Performance Events (P4, old Xeon)
a072738e0   Cyrill Gorcunov   perf, x86: Implem...
3
4
5
6
7
8
   *
   *  Copyright (C) 2010 Parallels, Inc., Cyrill Gorcunov <gorcunov@openvz.org>
   *  Copyright (C) 2010 Intel Corporation, Lin Ming <ming.m.lin@intel.com>
   *
   *  For licencing details see kernel-base/COPYING
   */
de0428a7a   Kevin Winchester   x86, perf: Clean ...
9
  #include <linux/perf_event.h>
a072738e0   Cyrill Gorcunov   perf, x86: Implem...
10
11
  
  #include <asm/perf_event_p4.h>
de0428a7a   Kevin Winchester   x86, perf: Clean ...
12
13
14
15
  #include <asm/hardirq.h>
  #include <asm/apic.h>
  
  #include "perf_event.h"
a072738e0   Cyrill Gorcunov   perf, x86: Implem...
16

d814f3010   Cyrill Gorcunov   x86, perf: Add ra...
17
  #define P4_CNTR_LIMIT 3
a072738e0   Cyrill Gorcunov   perf, x86: Implem...
18
19
20
  /*
   * array indices: 0,1 - HT threads, used with HT enabled cpu
   */
d814f3010   Cyrill Gorcunov   x86, perf: Add ra...
21
22
23
  struct p4_event_bind {
  	unsigned int opcode;			/* Event code and ESCR selector */
  	unsigned int escr_msr[2];		/* ESCR MSR for this event */
c9cf4a019   Cyrill Gorcunov   perf, x86, Pentiu...
24
25
  	unsigned int escr_emask;		/* valid ESCR EventMask bits */
  	unsigned int shared;			/* event is shared across threads */
1ff3d7d79   Cyrill Gorcunov   x86, perf: P4 PMU...
26
  	char cntr[2][P4_CNTR_LIMIT];		/* counter index (offset), -1 on abscence */
a072738e0   Cyrill Gorcunov   perf, x86: Implem...
27
  };
39ef13a4a   Cyrill Gorcunov   perf, x86: P4 PMU...
28
  struct p4_pebs_bind {
d814f3010   Cyrill Gorcunov   x86, perf: Add ra...
29
30
  	unsigned int metric_pebs;
  	unsigned int metric_vert;
a072738e0   Cyrill Gorcunov   perf, x86: Implem...
31
  };
39ef13a4a   Cyrill Gorcunov   perf, x86: P4 PMU...
32
33
34
35
36
  /* it sets P4_PEBS_ENABLE_UOP_TAG as well */
  #define P4_GEN_PEBS_BIND(name, pebs, vert)			\
  	[P4_PEBS_METRIC__##name] = {				\
  		.metric_pebs = pebs | P4_PEBS_ENABLE_UOP_TAG,	\
  		.metric_vert = vert,				\
d814f3010   Cyrill Gorcunov   x86, perf: Add ra...
37
  	}
39ef13a4a   Cyrill Gorcunov   perf, x86: P4 PMU...
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
  /*
   * note we have P4_PEBS_ENABLE_UOP_TAG always set here
   *
   * it's needed for mapping P4_PEBS_CONFIG_METRIC_MASK bits of
   * event configuration to find out which values are to be
   * written into MSR_IA32_PEBS_ENABLE and MSR_P4_PEBS_MATRIX_VERT
   * resgisters
   */
  static struct p4_pebs_bind p4_pebs_bind_map[] = {
  	P4_GEN_PEBS_BIND(1stl_cache_load_miss_retired,	0x0000001, 0x0000001),
  	P4_GEN_PEBS_BIND(2ndl_cache_load_miss_retired,	0x0000002, 0x0000001),
  	P4_GEN_PEBS_BIND(dtlb_load_miss_retired,	0x0000004, 0x0000001),
  	P4_GEN_PEBS_BIND(dtlb_store_miss_retired,	0x0000004, 0x0000002),
  	P4_GEN_PEBS_BIND(dtlb_all_miss_retired,		0x0000004, 0x0000003),
  	P4_GEN_PEBS_BIND(tagged_mispred_branch,		0x0018000, 0x0000010),
  	P4_GEN_PEBS_BIND(mob_load_replay_retired,	0x0000200, 0x0000001),
  	P4_GEN_PEBS_BIND(split_load_retired,		0x0000400, 0x0000001),
  	P4_GEN_PEBS_BIND(split_store_retired,		0x0000400, 0x0000002),
d814f3010   Cyrill Gorcunov   x86, perf: Add ra...
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
  };
  
  /*
   * Note that we don't use CCCR1 here, there is an
   * exception for P4_BSQ_ALLOCATION but we just have
   * no workaround
   *
   * consider this binding as resources which particular
   * event may borrow, it doesn't contain EventMask,
   * Tags and friends -- they are left to a caller
   */
  static struct p4_event_bind p4_event_bind_map[] = {
  	[P4_EVENT_TC_DELIVER_MODE] = {
  		.opcode		= P4_OPCODE(P4_EVENT_TC_DELIVER_MODE),
  		.escr_msr	= { MSR_P4_TC_ESCR0, MSR_P4_TC_ESCR1 },
c9cf4a019   Cyrill Gorcunov   perf, x86, Pentiu...
71
72
73
74
75
76
77
78
79
  		.escr_emask	=
  			P4_ESCR_EMASK_BIT(P4_EVENT_TC_DELIVER_MODE, DD)			|
  			P4_ESCR_EMASK_BIT(P4_EVENT_TC_DELIVER_MODE, DB)			|
  			P4_ESCR_EMASK_BIT(P4_EVENT_TC_DELIVER_MODE, DI)			|
  			P4_ESCR_EMASK_BIT(P4_EVENT_TC_DELIVER_MODE, BD)			|
  			P4_ESCR_EMASK_BIT(P4_EVENT_TC_DELIVER_MODE, BB)			|
  			P4_ESCR_EMASK_BIT(P4_EVENT_TC_DELIVER_MODE, BI)			|
  			P4_ESCR_EMASK_BIT(P4_EVENT_TC_DELIVER_MODE, ID),
  		.shared		= 1,
d814f3010   Cyrill Gorcunov   x86, perf: Add ra...
80
81
82
83
84
  		.cntr		= { {4, 5, -1}, {6, 7, -1} },
  	},
  	[P4_EVENT_BPU_FETCH_REQUEST] = {
  		.opcode		= P4_OPCODE(P4_EVENT_BPU_FETCH_REQUEST),
  		.escr_msr	= { MSR_P4_BPU_ESCR0, MSR_P4_BPU_ESCR1 },
c9cf4a019   Cyrill Gorcunov   perf, x86, Pentiu...
85
86
  		.escr_emask	=
  			P4_ESCR_EMASK_BIT(P4_EVENT_BPU_FETCH_REQUEST, TCMISS),
d814f3010   Cyrill Gorcunov   x86, perf: Add ra...
87
88
89
90
91
  		.cntr		= { {0, -1, -1}, {2, -1, -1} },
  	},
  	[P4_EVENT_ITLB_REFERENCE] = {
  		.opcode		= P4_OPCODE(P4_EVENT_ITLB_REFERENCE),
  		.escr_msr	= { MSR_P4_ITLB_ESCR0, MSR_P4_ITLB_ESCR1 },
c9cf4a019   Cyrill Gorcunov   perf, x86, Pentiu...
92
93
94
95
  		.escr_emask	=
  			P4_ESCR_EMASK_BIT(P4_EVENT_ITLB_REFERENCE, HIT)			|
  			P4_ESCR_EMASK_BIT(P4_EVENT_ITLB_REFERENCE, MISS)		|
  			P4_ESCR_EMASK_BIT(P4_EVENT_ITLB_REFERENCE, HIT_UK),
d814f3010   Cyrill Gorcunov   x86, perf: Add ra...
96
97
98
99
100
  		.cntr		= { {0, -1, -1}, {2, -1, -1} },
  	},
  	[P4_EVENT_MEMORY_CANCEL] = {
  		.opcode		= P4_OPCODE(P4_EVENT_MEMORY_CANCEL),
  		.escr_msr	= { MSR_P4_DAC_ESCR0, MSR_P4_DAC_ESCR1 },
c9cf4a019   Cyrill Gorcunov   perf, x86, Pentiu...
101
102
103
  		.escr_emask	=
  			P4_ESCR_EMASK_BIT(P4_EVENT_MEMORY_CANCEL, ST_RB_FULL)		|
  			P4_ESCR_EMASK_BIT(P4_EVENT_MEMORY_CANCEL, 64K_CONF),
d814f3010   Cyrill Gorcunov   x86, perf: Add ra...
104
105
106
107
108
  		.cntr		= { {8, 9, -1}, {10, 11, -1} },
  	},
  	[P4_EVENT_MEMORY_COMPLETE] = {
  		.opcode		= P4_OPCODE(P4_EVENT_MEMORY_COMPLETE),
  		.escr_msr	= { MSR_P4_SAAT_ESCR0 , MSR_P4_SAAT_ESCR1 },
c9cf4a019   Cyrill Gorcunov   perf, x86, Pentiu...
109
110
111
  		.escr_emask	=
  			P4_ESCR_EMASK_BIT(P4_EVENT_MEMORY_COMPLETE, LSC)		|
  			P4_ESCR_EMASK_BIT(P4_EVENT_MEMORY_COMPLETE, SSC),
d814f3010   Cyrill Gorcunov   x86, perf: Add ra...
112
113
114
115
116
  		.cntr		= { {8, 9, -1}, {10, 11, -1} },
  	},
  	[P4_EVENT_LOAD_PORT_REPLAY] = {
  		.opcode		= P4_OPCODE(P4_EVENT_LOAD_PORT_REPLAY),
  		.escr_msr	= { MSR_P4_SAAT_ESCR0, MSR_P4_SAAT_ESCR1 },
c9cf4a019   Cyrill Gorcunov   perf, x86, Pentiu...
117
118
  		.escr_emask	=
  			P4_ESCR_EMASK_BIT(P4_EVENT_LOAD_PORT_REPLAY, SPLIT_LD),
d814f3010   Cyrill Gorcunov   x86, perf: Add ra...
119
120
121
122
123
  		.cntr		= { {8, 9, -1}, {10, 11, -1} },
  	},
  	[P4_EVENT_STORE_PORT_REPLAY] = {
  		.opcode		= P4_OPCODE(P4_EVENT_STORE_PORT_REPLAY),
  		.escr_msr	= { MSR_P4_SAAT_ESCR0 ,  MSR_P4_SAAT_ESCR1 },
c9cf4a019   Cyrill Gorcunov   perf, x86, Pentiu...
124
125
  		.escr_emask	=
  			P4_ESCR_EMASK_BIT(P4_EVENT_STORE_PORT_REPLAY, SPLIT_ST),
d814f3010   Cyrill Gorcunov   x86, perf: Add ra...
126
127
128
129
130
  		.cntr		= { {8, 9, -1}, {10, 11, -1} },
  	},
  	[P4_EVENT_MOB_LOAD_REPLAY] = {
  		.opcode		= P4_OPCODE(P4_EVENT_MOB_LOAD_REPLAY),
  		.escr_msr	= { MSR_P4_MOB_ESCR0, MSR_P4_MOB_ESCR1 },
c9cf4a019   Cyrill Gorcunov   perf, x86, Pentiu...
131
132
133
134
135
  		.escr_emask	=
  			P4_ESCR_EMASK_BIT(P4_EVENT_MOB_LOAD_REPLAY, NO_STA)		|
  			P4_ESCR_EMASK_BIT(P4_EVENT_MOB_LOAD_REPLAY, NO_STD)		|
  			P4_ESCR_EMASK_BIT(P4_EVENT_MOB_LOAD_REPLAY, PARTIAL_DATA)	|
  			P4_ESCR_EMASK_BIT(P4_EVENT_MOB_LOAD_REPLAY, UNALGN_ADDR),
d814f3010   Cyrill Gorcunov   x86, perf: Add ra...
136
137
138
139
140
  		.cntr		= { {0, -1, -1}, {2, -1, -1} },
  	},
  	[P4_EVENT_PAGE_WALK_TYPE] = {
  		.opcode		= P4_OPCODE(P4_EVENT_PAGE_WALK_TYPE),
  		.escr_msr	= { MSR_P4_PMH_ESCR0, MSR_P4_PMH_ESCR1 },
c9cf4a019   Cyrill Gorcunov   perf, x86, Pentiu...
141
142
143
144
  		.escr_emask	=
  			P4_ESCR_EMASK_BIT(P4_EVENT_PAGE_WALK_TYPE, DTMISS)		|
  			P4_ESCR_EMASK_BIT(P4_EVENT_PAGE_WALK_TYPE, ITMISS),
  		.shared		= 1,
d814f3010   Cyrill Gorcunov   x86, perf: Add ra...
145
146
147
148
149
  		.cntr		= { {0, -1, -1}, {2, -1, -1} },
  	},
  	[P4_EVENT_BSQ_CACHE_REFERENCE] = {
  		.opcode		= P4_OPCODE(P4_EVENT_BSQ_CACHE_REFERENCE),
  		.escr_msr	= { MSR_P4_BSU_ESCR0, MSR_P4_BSU_ESCR1 },
c9cf4a019   Cyrill Gorcunov   perf, x86, Pentiu...
150
151
152
153
154
155
156
157
158
159
  		.escr_emask	=
  			P4_ESCR_EMASK_BIT(P4_EVENT_BSQ_CACHE_REFERENCE, RD_2ndL_HITS)	|
  			P4_ESCR_EMASK_BIT(P4_EVENT_BSQ_CACHE_REFERENCE, RD_2ndL_HITE)	|
  			P4_ESCR_EMASK_BIT(P4_EVENT_BSQ_CACHE_REFERENCE, RD_2ndL_HITM)	|
  			P4_ESCR_EMASK_BIT(P4_EVENT_BSQ_CACHE_REFERENCE, RD_3rdL_HITS)	|
  			P4_ESCR_EMASK_BIT(P4_EVENT_BSQ_CACHE_REFERENCE, RD_3rdL_HITE)	|
  			P4_ESCR_EMASK_BIT(P4_EVENT_BSQ_CACHE_REFERENCE, RD_3rdL_HITM)	|
  			P4_ESCR_EMASK_BIT(P4_EVENT_BSQ_CACHE_REFERENCE, RD_2ndL_MISS)	|
  			P4_ESCR_EMASK_BIT(P4_EVENT_BSQ_CACHE_REFERENCE, RD_3rdL_MISS)	|
  			P4_ESCR_EMASK_BIT(P4_EVENT_BSQ_CACHE_REFERENCE, WR_2ndL_MISS),
d814f3010   Cyrill Gorcunov   x86, perf: Add ra...
160
161
162
163
164
  		.cntr		= { {0, -1, -1}, {2, -1, -1} },
  	},
  	[P4_EVENT_IOQ_ALLOCATION] = {
  		.opcode		= P4_OPCODE(P4_EVENT_IOQ_ALLOCATION),
  		.escr_msr	= { MSR_P4_FSB_ESCR0, MSR_P4_FSB_ESCR1 },
c9cf4a019   Cyrill Gorcunov   perf, x86, Pentiu...
165
166
167
168
169
170
171
172
173
174
175
176
  		.escr_emask	=
  			P4_ESCR_EMASK_BIT(P4_EVENT_IOQ_ALLOCATION, DEFAULT)		|
  			P4_ESCR_EMASK_BIT(P4_EVENT_IOQ_ALLOCATION, ALL_READ)		|
  			P4_ESCR_EMASK_BIT(P4_EVENT_IOQ_ALLOCATION, ALL_WRITE)		|
  			P4_ESCR_EMASK_BIT(P4_EVENT_IOQ_ALLOCATION, MEM_UC)		|
  			P4_ESCR_EMASK_BIT(P4_EVENT_IOQ_ALLOCATION, MEM_WC)		|
  			P4_ESCR_EMASK_BIT(P4_EVENT_IOQ_ALLOCATION, MEM_WT)		|
  			P4_ESCR_EMASK_BIT(P4_EVENT_IOQ_ALLOCATION, MEM_WP)		|
  			P4_ESCR_EMASK_BIT(P4_EVENT_IOQ_ALLOCATION, MEM_WB)		|
  			P4_ESCR_EMASK_BIT(P4_EVENT_IOQ_ALLOCATION, OWN)			|
  			P4_ESCR_EMASK_BIT(P4_EVENT_IOQ_ALLOCATION, OTHER)		|
  			P4_ESCR_EMASK_BIT(P4_EVENT_IOQ_ALLOCATION, PREFETCH),
d814f3010   Cyrill Gorcunov   x86, perf: Add ra...
177
178
179
180
181
  		.cntr		= { {0, -1, -1}, {2, -1, -1} },
  	},
  	[P4_EVENT_IOQ_ACTIVE_ENTRIES] = {	/* shared ESCR */
  		.opcode		= P4_OPCODE(P4_EVENT_IOQ_ACTIVE_ENTRIES),
  		.escr_msr	= { MSR_P4_FSB_ESCR1,  MSR_P4_FSB_ESCR1 },
c9cf4a019   Cyrill Gorcunov   perf, x86, Pentiu...
182
183
184
185
186
187
188
189
190
191
192
193
  		.escr_emask	=
  			P4_ESCR_EMASK_BIT(P4_EVENT_IOQ_ACTIVE_ENTRIES, DEFAULT)		|
  			P4_ESCR_EMASK_BIT(P4_EVENT_IOQ_ACTIVE_ENTRIES, ALL_READ)	|
  			P4_ESCR_EMASK_BIT(P4_EVENT_IOQ_ACTIVE_ENTRIES, ALL_WRITE)	|
  			P4_ESCR_EMASK_BIT(P4_EVENT_IOQ_ACTIVE_ENTRIES, MEM_UC)		|
  			P4_ESCR_EMASK_BIT(P4_EVENT_IOQ_ACTIVE_ENTRIES, MEM_WC)		|
  			P4_ESCR_EMASK_BIT(P4_EVENT_IOQ_ACTIVE_ENTRIES, MEM_WT)		|
  			P4_ESCR_EMASK_BIT(P4_EVENT_IOQ_ACTIVE_ENTRIES, MEM_WP)		|
  			P4_ESCR_EMASK_BIT(P4_EVENT_IOQ_ACTIVE_ENTRIES, MEM_WB)		|
  			P4_ESCR_EMASK_BIT(P4_EVENT_IOQ_ACTIVE_ENTRIES, OWN)		|
  			P4_ESCR_EMASK_BIT(P4_EVENT_IOQ_ACTIVE_ENTRIES, OTHER)		|
  			P4_ESCR_EMASK_BIT(P4_EVENT_IOQ_ACTIVE_ENTRIES, PREFETCH),
d814f3010   Cyrill Gorcunov   x86, perf: Add ra...
194
195
196
197
198
  		.cntr		= { {2, -1, -1}, {3, -1, -1} },
  	},
  	[P4_EVENT_FSB_DATA_ACTIVITY] = {
  		.opcode		= P4_OPCODE(P4_EVENT_FSB_DATA_ACTIVITY),
  		.escr_msr	= { MSR_P4_FSB_ESCR0, MSR_P4_FSB_ESCR1 },
c9cf4a019   Cyrill Gorcunov   perf, x86, Pentiu...
199
200
201
202
203
204
205
206
  		.escr_emask	=
  			P4_ESCR_EMASK_BIT(P4_EVENT_FSB_DATA_ACTIVITY, DRDY_DRV)		|
  			P4_ESCR_EMASK_BIT(P4_EVENT_FSB_DATA_ACTIVITY, DRDY_OWN)		|
  			P4_ESCR_EMASK_BIT(P4_EVENT_FSB_DATA_ACTIVITY, DRDY_OTHER)	|
  			P4_ESCR_EMASK_BIT(P4_EVENT_FSB_DATA_ACTIVITY, DBSY_DRV)		|
  			P4_ESCR_EMASK_BIT(P4_EVENT_FSB_DATA_ACTIVITY, DBSY_OWN)		|
  			P4_ESCR_EMASK_BIT(P4_EVENT_FSB_DATA_ACTIVITY, DBSY_OTHER),
  		.shared		= 1,
d814f3010   Cyrill Gorcunov   x86, perf: Add ra...
207
208
209
210
211
  		.cntr		= { {0, -1, -1}, {2, -1, -1} },
  	},
  	[P4_EVENT_BSQ_ALLOCATION] = {		/* shared ESCR, broken CCCR1 */
  		.opcode		= P4_OPCODE(P4_EVENT_BSQ_ALLOCATION),
  		.escr_msr	= { MSR_P4_BSU_ESCR0, MSR_P4_BSU_ESCR0 },
c9cf4a019   Cyrill Gorcunov   perf, x86, Pentiu...
212
213
214
215
216
217
218
219
220
221
222
223
224
225
  		.escr_emask	=
  			P4_ESCR_EMASK_BIT(P4_EVENT_BSQ_ALLOCATION, REQ_TYPE0)		|
  			P4_ESCR_EMASK_BIT(P4_EVENT_BSQ_ALLOCATION, REQ_TYPE1)		|
  			P4_ESCR_EMASK_BIT(P4_EVENT_BSQ_ALLOCATION, REQ_LEN0)		|
  			P4_ESCR_EMASK_BIT(P4_EVENT_BSQ_ALLOCATION, REQ_LEN1)		|
  			P4_ESCR_EMASK_BIT(P4_EVENT_BSQ_ALLOCATION, REQ_IO_TYPE)		|
  			P4_ESCR_EMASK_BIT(P4_EVENT_BSQ_ALLOCATION, REQ_LOCK_TYPE)	|
  			P4_ESCR_EMASK_BIT(P4_EVENT_BSQ_ALLOCATION, REQ_CACHE_TYPE)	|
  			P4_ESCR_EMASK_BIT(P4_EVENT_BSQ_ALLOCATION, REQ_SPLIT_TYPE)	|
  			P4_ESCR_EMASK_BIT(P4_EVENT_BSQ_ALLOCATION, REQ_DEM_TYPE)	|
  			P4_ESCR_EMASK_BIT(P4_EVENT_BSQ_ALLOCATION, REQ_ORD_TYPE)	|
  			P4_ESCR_EMASK_BIT(P4_EVENT_BSQ_ALLOCATION, MEM_TYPE0)		|
  			P4_ESCR_EMASK_BIT(P4_EVENT_BSQ_ALLOCATION, MEM_TYPE1)		|
  			P4_ESCR_EMASK_BIT(P4_EVENT_BSQ_ALLOCATION, MEM_TYPE2),
d814f3010   Cyrill Gorcunov   x86, perf: Add ra...
226
227
228
229
230
  		.cntr		= { {0, -1, -1}, {1, -1, -1} },
  	},
  	[P4_EVENT_BSQ_ACTIVE_ENTRIES] = {	/* shared ESCR */
  		.opcode		= P4_OPCODE(P4_EVENT_BSQ_ACTIVE_ENTRIES),
  		.escr_msr	= { MSR_P4_BSU_ESCR1 , MSR_P4_BSU_ESCR1 },
c9cf4a019   Cyrill Gorcunov   perf, x86, Pentiu...
231
232
233
234
235
236
237
238
239
240
241
242
243
244
  		.escr_emask	=
  			P4_ESCR_EMASK_BIT(P4_EVENT_BSQ_ACTIVE_ENTRIES, REQ_TYPE0)	|
  			P4_ESCR_EMASK_BIT(P4_EVENT_BSQ_ACTIVE_ENTRIES, REQ_TYPE1)	|
  			P4_ESCR_EMASK_BIT(P4_EVENT_BSQ_ACTIVE_ENTRIES, REQ_LEN0)	|
  			P4_ESCR_EMASK_BIT(P4_EVENT_BSQ_ACTIVE_ENTRIES, REQ_LEN1)	|
  			P4_ESCR_EMASK_BIT(P4_EVENT_BSQ_ACTIVE_ENTRIES, REQ_IO_TYPE)	|
  			P4_ESCR_EMASK_BIT(P4_EVENT_BSQ_ACTIVE_ENTRIES, REQ_LOCK_TYPE)	|
  			P4_ESCR_EMASK_BIT(P4_EVENT_BSQ_ACTIVE_ENTRIES, REQ_CACHE_TYPE)	|
  			P4_ESCR_EMASK_BIT(P4_EVENT_BSQ_ACTIVE_ENTRIES, REQ_SPLIT_TYPE)	|
  			P4_ESCR_EMASK_BIT(P4_EVENT_BSQ_ACTIVE_ENTRIES, REQ_DEM_TYPE)	|
  			P4_ESCR_EMASK_BIT(P4_EVENT_BSQ_ACTIVE_ENTRIES, REQ_ORD_TYPE)	|
  			P4_ESCR_EMASK_BIT(P4_EVENT_BSQ_ACTIVE_ENTRIES, MEM_TYPE0)	|
  			P4_ESCR_EMASK_BIT(P4_EVENT_BSQ_ACTIVE_ENTRIES, MEM_TYPE1)	|
  			P4_ESCR_EMASK_BIT(P4_EVENT_BSQ_ACTIVE_ENTRIES, MEM_TYPE2),
d814f3010   Cyrill Gorcunov   x86, perf: Add ra...
245
246
247
248
249
  		.cntr		= { {2, -1, -1}, {3, -1, -1} },
  	},
  	[P4_EVENT_SSE_INPUT_ASSIST] = {
  		.opcode		= P4_OPCODE(P4_EVENT_SSE_INPUT_ASSIST),
  		.escr_msr	= { MSR_P4_FIRM_ESCR0, MSR_P4_FIRM_ESCR1 },
c9cf4a019   Cyrill Gorcunov   perf, x86, Pentiu...
250
251
252
  		.escr_emask	=
  			P4_ESCR_EMASK_BIT(P4_EVENT_SSE_INPUT_ASSIST, ALL),
  		.shared		= 1,
d814f3010   Cyrill Gorcunov   x86, perf: Add ra...
253
254
255
256
257
  		.cntr		= { {8, 9, -1}, {10, 11, -1} },
  	},
  	[P4_EVENT_PACKED_SP_UOP] = {
  		.opcode		= P4_OPCODE(P4_EVENT_PACKED_SP_UOP),
  		.escr_msr	= { MSR_P4_FIRM_ESCR0, MSR_P4_FIRM_ESCR1 },
c9cf4a019   Cyrill Gorcunov   perf, x86, Pentiu...
258
259
260
  		.escr_emask	=
  			P4_ESCR_EMASK_BIT(P4_EVENT_PACKED_SP_UOP, ALL),
  		.shared		= 1,
d814f3010   Cyrill Gorcunov   x86, perf: Add ra...
261
262
263
264
265
  		.cntr		= { {8, 9, -1}, {10, 11, -1} },
  	},
  	[P4_EVENT_PACKED_DP_UOP] = {
  		.opcode		= P4_OPCODE(P4_EVENT_PACKED_DP_UOP),
  		.escr_msr	= { MSR_P4_FIRM_ESCR0, MSR_P4_FIRM_ESCR1 },
c9cf4a019   Cyrill Gorcunov   perf, x86, Pentiu...
266
267
268
  		.escr_emask	=
  			P4_ESCR_EMASK_BIT(P4_EVENT_PACKED_DP_UOP, ALL),
  		.shared		= 1,
d814f3010   Cyrill Gorcunov   x86, perf: Add ra...
269
270
271
272
273
  		.cntr		= { {8, 9, -1}, {10, 11, -1} },
  	},
  	[P4_EVENT_SCALAR_SP_UOP] = {
  		.opcode		= P4_OPCODE(P4_EVENT_SCALAR_SP_UOP),
  		.escr_msr	= { MSR_P4_FIRM_ESCR0, MSR_P4_FIRM_ESCR1 },
c9cf4a019   Cyrill Gorcunov   perf, x86, Pentiu...
274
275
276
  		.escr_emask	=
  			P4_ESCR_EMASK_BIT(P4_EVENT_SCALAR_SP_UOP, ALL),
  		.shared		= 1,
d814f3010   Cyrill Gorcunov   x86, perf: Add ra...
277
278
279
280
281
  		.cntr		= { {8, 9, -1}, {10, 11, -1} },
  	},
  	[P4_EVENT_SCALAR_DP_UOP] = {
  		.opcode		= P4_OPCODE(P4_EVENT_SCALAR_DP_UOP),
  		.escr_msr	= { MSR_P4_FIRM_ESCR0, MSR_P4_FIRM_ESCR1 },
c9cf4a019   Cyrill Gorcunov   perf, x86, Pentiu...
282
283
284
  		.escr_emask	=
  			P4_ESCR_EMASK_BIT(P4_EVENT_SCALAR_DP_UOP, ALL),
  		.shared		= 1,
d814f3010   Cyrill Gorcunov   x86, perf: Add ra...
285
286
287
288
289
  		.cntr		= { {8, 9, -1}, {10, 11, -1} },
  	},
  	[P4_EVENT_64BIT_MMX_UOP] = {
  		.opcode		= P4_OPCODE(P4_EVENT_64BIT_MMX_UOP),
  		.escr_msr	= { MSR_P4_FIRM_ESCR0, MSR_P4_FIRM_ESCR1 },
c9cf4a019   Cyrill Gorcunov   perf, x86, Pentiu...
290
291
292
  		.escr_emask	=
  			P4_ESCR_EMASK_BIT(P4_EVENT_64BIT_MMX_UOP, ALL),
  		.shared		= 1,
d814f3010   Cyrill Gorcunov   x86, perf: Add ra...
293
294
295
296
297
  		.cntr		= { {8, 9, -1}, {10, 11, -1} },
  	},
  	[P4_EVENT_128BIT_MMX_UOP] = {
  		.opcode		= P4_OPCODE(P4_EVENT_128BIT_MMX_UOP),
  		.escr_msr	= { MSR_P4_FIRM_ESCR0, MSR_P4_FIRM_ESCR1 },
c9cf4a019   Cyrill Gorcunov   perf, x86, Pentiu...
298
299
300
  		.escr_emask	=
  			P4_ESCR_EMASK_BIT(P4_EVENT_128BIT_MMX_UOP, ALL),
  		.shared		= 1,
d814f3010   Cyrill Gorcunov   x86, perf: Add ra...
301
302
303
304
305
  		.cntr		= { {8, 9, -1}, {10, 11, -1} },
  	},
  	[P4_EVENT_X87_FP_UOP] = {
  		.opcode		= P4_OPCODE(P4_EVENT_X87_FP_UOP),
  		.escr_msr	= { MSR_P4_FIRM_ESCR0, MSR_P4_FIRM_ESCR1 },
c9cf4a019   Cyrill Gorcunov   perf, x86, Pentiu...
306
307
308
  		.escr_emask	=
  			P4_ESCR_EMASK_BIT(P4_EVENT_X87_FP_UOP, ALL),
  		.shared		= 1,
d814f3010   Cyrill Gorcunov   x86, perf: Add ra...
309
310
311
312
313
  		.cntr		= { {8, 9, -1}, {10, 11, -1} },
  	},
  	[P4_EVENT_TC_MISC] = {
  		.opcode		= P4_OPCODE(P4_EVENT_TC_MISC),
  		.escr_msr	= { MSR_P4_TC_ESCR0, MSR_P4_TC_ESCR1 },
c9cf4a019   Cyrill Gorcunov   perf, x86, Pentiu...
314
315
  		.escr_emask	=
  			P4_ESCR_EMASK_BIT(P4_EVENT_TC_MISC, FLUSH),
d814f3010   Cyrill Gorcunov   x86, perf: Add ra...
316
317
318
319
320
  		.cntr		= { {4, 5, -1}, {6, 7, -1} },
  	},
  	[P4_EVENT_GLOBAL_POWER_EVENTS] = {
  		.opcode		= P4_OPCODE(P4_EVENT_GLOBAL_POWER_EVENTS),
  		.escr_msr	= { MSR_P4_FSB_ESCR0, MSR_P4_FSB_ESCR1 },
c9cf4a019   Cyrill Gorcunov   perf, x86, Pentiu...
321
322
  		.escr_emask	=
  			P4_ESCR_EMASK_BIT(P4_EVENT_GLOBAL_POWER_EVENTS, RUNNING),
d814f3010   Cyrill Gorcunov   x86, perf: Add ra...
323
324
325
326
327
  		.cntr		= { {0, -1, -1}, {2, -1, -1} },
  	},
  	[P4_EVENT_TC_MS_XFER] = {
  		.opcode		= P4_OPCODE(P4_EVENT_TC_MS_XFER),
  		.escr_msr	= { MSR_P4_MS_ESCR0, MSR_P4_MS_ESCR1 },
c9cf4a019   Cyrill Gorcunov   perf, x86, Pentiu...
328
329
  		.escr_emask	=
  			P4_ESCR_EMASK_BIT(P4_EVENT_TC_MS_XFER, CISC),
d814f3010   Cyrill Gorcunov   x86, perf: Add ra...
330
331
332
333
334
  		.cntr		= { {4, 5, -1}, {6, 7, -1} },
  	},
  	[P4_EVENT_UOP_QUEUE_WRITES] = {
  		.opcode		= P4_OPCODE(P4_EVENT_UOP_QUEUE_WRITES),
  		.escr_msr	= { MSR_P4_MS_ESCR0, MSR_P4_MS_ESCR1 },
c9cf4a019   Cyrill Gorcunov   perf, x86, Pentiu...
335
336
337
338
  		.escr_emask	=
  			P4_ESCR_EMASK_BIT(P4_EVENT_UOP_QUEUE_WRITES, FROM_TC_BUILD)	|
  			P4_ESCR_EMASK_BIT(P4_EVENT_UOP_QUEUE_WRITES, FROM_TC_DELIVER)	|
  			P4_ESCR_EMASK_BIT(P4_EVENT_UOP_QUEUE_WRITES, FROM_ROM),
d814f3010   Cyrill Gorcunov   x86, perf: Add ra...
339
340
341
342
343
  		.cntr		= { {4, 5, -1}, {6, 7, -1} },
  	},
  	[P4_EVENT_RETIRED_MISPRED_BRANCH_TYPE] = {
  		.opcode		= P4_OPCODE(P4_EVENT_RETIRED_MISPRED_BRANCH_TYPE),
  		.escr_msr	= { MSR_P4_TBPU_ESCR0 , MSR_P4_TBPU_ESCR0 },
c9cf4a019   Cyrill Gorcunov   perf, x86, Pentiu...
344
345
346
347
348
  		.escr_emask	=
  			P4_ESCR_EMASK_BIT(P4_EVENT_RETIRED_MISPRED_BRANCH_TYPE, CONDITIONAL)	|
  			P4_ESCR_EMASK_BIT(P4_EVENT_RETIRED_MISPRED_BRANCH_TYPE, CALL)		|
  			P4_ESCR_EMASK_BIT(P4_EVENT_RETIRED_MISPRED_BRANCH_TYPE, RETURN)		|
  			P4_ESCR_EMASK_BIT(P4_EVENT_RETIRED_MISPRED_BRANCH_TYPE, INDIRECT),
d814f3010   Cyrill Gorcunov   x86, perf: Add ra...
349
350
351
352
353
  		.cntr		= { {4, 5, -1}, {6, 7, -1} },
  	},
  	[P4_EVENT_RETIRED_BRANCH_TYPE] = {
  		.opcode		= P4_OPCODE(P4_EVENT_RETIRED_BRANCH_TYPE),
  		.escr_msr	= { MSR_P4_TBPU_ESCR0 , MSR_P4_TBPU_ESCR1 },
c9cf4a019   Cyrill Gorcunov   perf, x86, Pentiu...
354
355
356
357
358
  		.escr_emask	=
  			P4_ESCR_EMASK_BIT(P4_EVENT_RETIRED_BRANCH_TYPE, CONDITIONAL)	|
  			P4_ESCR_EMASK_BIT(P4_EVENT_RETIRED_BRANCH_TYPE, CALL)		|
  			P4_ESCR_EMASK_BIT(P4_EVENT_RETIRED_BRANCH_TYPE, RETURN)		|
  			P4_ESCR_EMASK_BIT(P4_EVENT_RETIRED_BRANCH_TYPE, INDIRECT),
d814f3010   Cyrill Gorcunov   x86, perf: Add ra...
359
360
361
362
363
  		.cntr		= { {4, 5, -1}, {6, 7, -1} },
  	},
  	[P4_EVENT_RESOURCE_STALL] = {
  		.opcode		= P4_OPCODE(P4_EVENT_RESOURCE_STALL),
  		.escr_msr	= { MSR_P4_ALF_ESCR0, MSR_P4_ALF_ESCR1 },
c9cf4a019   Cyrill Gorcunov   perf, x86, Pentiu...
364
365
  		.escr_emask	=
  			P4_ESCR_EMASK_BIT(P4_EVENT_RESOURCE_STALL, SBFULL),
d814f3010   Cyrill Gorcunov   x86, perf: Add ra...
366
367
368
369
370
  		.cntr		= { {12, 13, 16}, {14, 15, 17} },
  	},
  	[P4_EVENT_WC_BUFFER] = {
  		.opcode		= P4_OPCODE(P4_EVENT_WC_BUFFER),
  		.escr_msr	= { MSR_P4_DAC_ESCR0, MSR_P4_DAC_ESCR1 },
c9cf4a019   Cyrill Gorcunov   perf, x86, Pentiu...
371
372
373
374
  		.escr_emask	=
  			P4_ESCR_EMASK_BIT(P4_EVENT_WC_BUFFER, WCB_EVICTS)		|
  			P4_ESCR_EMASK_BIT(P4_EVENT_WC_BUFFER, WCB_FULL_EVICTS),
  		.shared		= 1,
d814f3010   Cyrill Gorcunov   x86, perf: Add ra...
375
376
377
378
379
  		.cntr		= { {8, 9, -1}, {10, 11, -1} },
  	},
  	[P4_EVENT_B2B_CYCLES] = {
  		.opcode		= P4_OPCODE(P4_EVENT_B2B_CYCLES),
  		.escr_msr	= { MSR_P4_FSB_ESCR0, MSR_P4_FSB_ESCR1 },
c9cf4a019   Cyrill Gorcunov   perf, x86, Pentiu...
380
  		.escr_emask	= 0,
d814f3010   Cyrill Gorcunov   x86, perf: Add ra...
381
382
383
384
385
  		.cntr		= { {0, -1, -1}, {2, -1, -1} },
  	},
  	[P4_EVENT_BNR] = {
  		.opcode		= P4_OPCODE(P4_EVENT_BNR),
  		.escr_msr	= { MSR_P4_FSB_ESCR0, MSR_P4_FSB_ESCR1 },
c9cf4a019   Cyrill Gorcunov   perf, x86, Pentiu...
386
  		.escr_emask	= 0,
d814f3010   Cyrill Gorcunov   x86, perf: Add ra...
387
388
389
390
391
  		.cntr		= { {0, -1, -1}, {2, -1, -1} },
  	},
  	[P4_EVENT_SNOOP] = {
  		.opcode		= P4_OPCODE(P4_EVENT_SNOOP),
  		.escr_msr	= { MSR_P4_FSB_ESCR0, MSR_P4_FSB_ESCR1 },
c9cf4a019   Cyrill Gorcunov   perf, x86, Pentiu...
392
  		.escr_emask	= 0,
d814f3010   Cyrill Gorcunov   x86, perf: Add ra...
393
394
395
396
397
  		.cntr		= { {0, -1, -1}, {2, -1, -1} },
  	},
  	[P4_EVENT_RESPONSE] = {
  		.opcode		= P4_OPCODE(P4_EVENT_RESPONSE),
  		.escr_msr	= { MSR_P4_FSB_ESCR0, MSR_P4_FSB_ESCR1 },
c9cf4a019   Cyrill Gorcunov   perf, x86, Pentiu...
398
  		.escr_emask	= 0,
d814f3010   Cyrill Gorcunov   x86, perf: Add ra...
399
400
401
402
403
  		.cntr		= { {0, -1, -1}, {2, -1, -1} },
  	},
  	[P4_EVENT_FRONT_END_EVENT] = {
  		.opcode		= P4_OPCODE(P4_EVENT_FRONT_END_EVENT),
  		.escr_msr	= { MSR_P4_CRU_ESCR2, MSR_P4_CRU_ESCR3 },
c9cf4a019   Cyrill Gorcunov   perf, x86, Pentiu...
404
405
406
  		.escr_emask	=
  			P4_ESCR_EMASK_BIT(P4_EVENT_FRONT_END_EVENT, NBOGUS)		|
  			P4_ESCR_EMASK_BIT(P4_EVENT_FRONT_END_EVENT, BOGUS),
d814f3010   Cyrill Gorcunov   x86, perf: Add ra...
407
408
409
410
411
  		.cntr		= { {12, 13, 16}, {14, 15, 17} },
  	},
  	[P4_EVENT_EXECUTION_EVENT] = {
  		.opcode		= P4_OPCODE(P4_EVENT_EXECUTION_EVENT),
  		.escr_msr	= { MSR_P4_CRU_ESCR2, MSR_P4_CRU_ESCR3 },
c9cf4a019   Cyrill Gorcunov   perf, x86, Pentiu...
412
413
414
415
416
417
418
419
420
  		.escr_emask	=
  			P4_ESCR_EMASK_BIT(P4_EVENT_EXECUTION_EVENT, NBOGUS0)		|
  			P4_ESCR_EMASK_BIT(P4_EVENT_EXECUTION_EVENT, NBOGUS1)		|
  			P4_ESCR_EMASK_BIT(P4_EVENT_EXECUTION_EVENT, NBOGUS2)		|
  			P4_ESCR_EMASK_BIT(P4_EVENT_EXECUTION_EVENT, NBOGUS3)		|
  			P4_ESCR_EMASK_BIT(P4_EVENT_EXECUTION_EVENT, BOGUS0)		|
  			P4_ESCR_EMASK_BIT(P4_EVENT_EXECUTION_EVENT, BOGUS1)		|
  			P4_ESCR_EMASK_BIT(P4_EVENT_EXECUTION_EVENT, BOGUS2)		|
  			P4_ESCR_EMASK_BIT(P4_EVENT_EXECUTION_EVENT, BOGUS3),
d814f3010   Cyrill Gorcunov   x86, perf: Add ra...
421
422
423
424
425
  		.cntr		= { {12, 13, 16}, {14, 15, 17} },
  	},
  	[P4_EVENT_REPLAY_EVENT] = {
  		.opcode		= P4_OPCODE(P4_EVENT_REPLAY_EVENT),
  		.escr_msr	= { MSR_P4_CRU_ESCR2, MSR_P4_CRU_ESCR3 },
c9cf4a019   Cyrill Gorcunov   perf, x86, Pentiu...
426
427
428
  		.escr_emask	=
  			P4_ESCR_EMASK_BIT(P4_EVENT_REPLAY_EVENT, NBOGUS)		|
  			P4_ESCR_EMASK_BIT(P4_EVENT_REPLAY_EVENT, BOGUS),
d814f3010   Cyrill Gorcunov   x86, perf: Add ra...
429
430
431
432
433
  		.cntr		= { {12, 13, 16}, {14, 15, 17} },
  	},
  	[P4_EVENT_INSTR_RETIRED] = {
  		.opcode		= P4_OPCODE(P4_EVENT_INSTR_RETIRED),
  		.escr_msr	= { MSR_P4_CRU_ESCR0, MSR_P4_CRU_ESCR1 },
c9cf4a019   Cyrill Gorcunov   perf, x86, Pentiu...
434
435
436
437
438
  		.escr_emask	=
  			P4_ESCR_EMASK_BIT(P4_EVENT_INSTR_RETIRED, NBOGUSNTAG)		|
  			P4_ESCR_EMASK_BIT(P4_EVENT_INSTR_RETIRED, NBOGUSTAG)		|
  			P4_ESCR_EMASK_BIT(P4_EVENT_INSTR_RETIRED, BOGUSNTAG)		|
  			P4_ESCR_EMASK_BIT(P4_EVENT_INSTR_RETIRED, BOGUSTAG),
d814f3010   Cyrill Gorcunov   x86, perf: Add ra...
439
440
441
442
443
  		.cntr		= { {12, 13, 16}, {14, 15, 17} },
  	},
  	[P4_EVENT_UOPS_RETIRED] = {
  		.opcode		= P4_OPCODE(P4_EVENT_UOPS_RETIRED),
  		.escr_msr	= { MSR_P4_CRU_ESCR0, MSR_P4_CRU_ESCR1 },
c9cf4a019   Cyrill Gorcunov   perf, x86, Pentiu...
444
445
446
  		.escr_emask	=
  			P4_ESCR_EMASK_BIT(P4_EVENT_UOPS_RETIRED, NBOGUS)		|
  			P4_ESCR_EMASK_BIT(P4_EVENT_UOPS_RETIRED, BOGUS),
d814f3010   Cyrill Gorcunov   x86, perf: Add ra...
447
448
449
450
451
  		.cntr		= { {12, 13, 16}, {14, 15, 17} },
  	},
  	[P4_EVENT_UOP_TYPE] = {
  		.opcode		= P4_OPCODE(P4_EVENT_UOP_TYPE),
  		.escr_msr	= { MSR_P4_RAT_ESCR0, MSR_P4_RAT_ESCR1 },
c9cf4a019   Cyrill Gorcunov   perf, x86, Pentiu...
452
453
454
  		.escr_emask	=
  			P4_ESCR_EMASK_BIT(P4_EVENT_UOP_TYPE, TAGLOADS)			|
  			P4_ESCR_EMASK_BIT(P4_EVENT_UOP_TYPE, TAGSTORES),
d814f3010   Cyrill Gorcunov   x86, perf: Add ra...
455
456
457
458
459
  		.cntr		= { {12, 13, 16}, {14, 15, 17} },
  	},
  	[P4_EVENT_BRANCH_RETIRED] = {
  		.opcode		= P4_OPCODE(P4_EVENT_BRANCH_RETIRED),
  		.escr_msr	= { MSR_P4_CRU_ESCR2, MSR_P4_CRU_ESCR3 },
c9cf4a019   Cyrill Gorcunov   perf, x86, Pentiu...
460
461
462
463
464
  		.escr_emask	=
  			P4_ESCR_EMASK_BIT(P4_EVENT_BRANCH_RETIRED, MMNP)		|
  			P4_ESCR_EMASK_BIT(P4_EVENT_BRANCH_RETIRED, MMNM)		|
  			P4_ESCR_EMASK_BIT(P4_EVENT_BRANCH_RETIRED, MMTP)		|
  			P4_ESCR_EMASK_BIT(P4_EVENT_BRANCH_RETIRED, MMTM),
d814f3010   Cyrill Gorcunov   x86, perf: Add ra...
465
466
467
468
469
  		.cntr		= { {12, 13, 16}, {14, 15, 17} },
  	},
  	[P4_EVENT_MISPRED_BRANCH_RETIRED] = {
  		.opcode		= P4_OPCODE(P4_EVENT_MISPRED_BRANCH_RETIRED),
  		.escr_msr	= { MSR_P4_CRU_ESCR0, MSR_P4_CRU_ESCR1 },
c9cf4a019   Cyrill Gorcunov   perf, x86, Pentiu...
470
  		.escr_emask	=
1d321881a   Cyrill Gorcunov   perf, x86: P4 PMU...
471
  			P4_ESCR_EMASK_BIT(P4_EVENT_MISPRED_BRANCH_RETIRED, NBOGUS),
d814f3010   Cyrill Gorcunov   x86, perf: Add ra...
472
473
474
475
476
  		.cntr		= { {12, 13, 16}, {14, 15, 17} },
  	},
  	[P4_EVENT_X87_ASSIST] = {
  		.opcode		= P4_OPCODE(P4_EVENT_X87_ASSIST),
  		.escr_msr	= { MSR_P4_CRU_ESCR2, MSR_P4_CRU_ESCR3 },
c9cf4a019   Cyrill Gorcunov   perf, x86, Pentiu...
477
478
479
480
481
482
  		.escr_emask	=
  			P4_ESCR_EMASK_BIT(P4_EVENT_X87_ASSIST, FPSU)			|
  			P4_ESCR_EMASK_BIT(P4_EVENT_X87_ASSIST, FPSO)			|
  			P4_ESCR_EMASK_BIT(P4_EVENT_X87_ASSIST, POAO)			|
  			P4_ESCR_EMASK_BIT(P4_EVENT_X87_ASSIST, POAU)			|
  			P4_ESCR_EMASK_BIT(P4_EVENT_X87_ASSIST, PREA),
d814f3010   Cyrill Gorcunov   x86, perf: Add ra...
483
484
485
486
487
  		.cntr		= { {12, 13, 16}, {14, 15, 17} },
  	},
  	[P4_EVENT_MACHINE_CLEAR] = {
  		.opcode		= P4_OPCODE(P4_EVENT_MACHINE_CLEAR),
  		.escr_msr	= { MSR_P4_CRU_ESCR2, MSR_P4_CRU_ESCR3 },
c9cf4a019   Cyrill Gorcunov   perf, x86, Pentiu...
488
489
490
491
  		.escr_emask	=
  			P4_ESCR_EMASK_BIT(P4_EVENT_MACHINE_CLEAR, CLEAR)		|
  			P4_ESCR_EMASK_BIT(P4_EVENT_MACHINE_CLEAR, MOCLEAR)		|
  			P4_ESCR_EMASK_BIT(P4_EVENT_MACHINE_CLEAR, SMCLEAR),
d814f3010   Cyrill Gorcunov   x86, perf: Add ra...
492
493
494
495
496
  		.cntr		= { {12, 13, 16}, {14, 15, 17} },
  	},
  	[P4_EVENT_INSTR_COMPLETED] = {
  		.opcode		= P4_OPCODE(P4_EVENT_INSTR_COMPLETED),
  		.escr_msr	= { MSR_P4_CRU_ESCR0, MSR_P4_CRU_ESCR1 },
c9cf4a019   Cyrill Gorcunov   perf, x86, Pentiu...
497
498
499
  		.escr_emask	=
  			P4_ESCR_EMASK_BIT(P4_EVENT_INSTR_COMPLETED, NBOGUS)		|
  			P4_ESCR_EMASK_BIT(P4_EVENT_INSTR_COMPLETED, BOGUS),
d814f3010   Cyrill Gorcunov   x86, perf: Add ra...
500
501
502
  		.cntr		= { {12, 13, 16}, {14, 15, 17} },
  	},
  };
a072738e0   Cyrill Gorcunov   perf, x86: Implem...
503

39ef13a4a   Cyrill Gorcunov   perf, x86: P4 PMU...
504
  #define P4_GEN_CACHE_EVENT(event, bit, metric)				  \
d814f3010   Cyrill Gorcunov   x86, perf: Add ra...
505
506
  	p4_config_pack_escr(P4_ESCR_EVENT(event)			| \
  			    P4_ESCR_EMASK_BIT(event, bit))		| \
39ef13a4a   Cyrill Gorcunov   perf, x86: P4 PMU...
507
  	p4_config_pack_cccr(metric					| \
d814f3010   Cyrill Gorcunov   x86, perf: Add ra...
508
  			    P4_CCCR_ESEL(P4_OPCODE_ESEL(P4_OPCODE(event))))
cb7d6b505   Lin Ming   perf, x86: Add ca...
509

caaa8be3b   Peter Zijlstra   perf, x86: Fix __...
510
  static __initconst const u64 p4_hw_cache_event_ids
cb7d6b505   Lin Ming   perf, x86: Add ca...
511
512
513
514
515
516
517
  				[PERF_COUNT_HW_CACHE_MAX]
  				[PERF_COUNT_HW_CACHE_OP_MAX]
  				[PERF_COUNT_HW_CACHE_RESULT_MAX] =
  {
   [ C(L1D ) ] = {
  	[ C(OP_READ) ] = {
  		[ C(RESULT_ACCESS) ] = 0x0,
d814f3010   Cyrill Gorcunov   x86, perf: Add ra...
518
  		[ C(RESULT_MISS)   ] = P4_GEN_CACHE_EVENT(P4_EVENT_REPLAY_EVENT, NBOGUS,
39ef13a4a   Cyrill Gorcunov   perf, x86: P4 PMU...
519
  						P4_PEBS_METRIC__1stl_cache_load_miss_retired),
cb7d6b505   Lin Ming   perf, x86: Add ca...
520
521
522
523
524
  	},
   },
   [ C(LL  ) ] = {
  	[ C(OP_READ) ] = {
  		[ C(RESULT_ACCESS) ] = 0x0,
d814f3010   Cyrill Gorcunov   x86, perf: Add ra...
525
  		[ C(RESULT_MISS)   ] = P4_GEN_CACHE_EVENT(P4_EVENT_REPLAY_EVENT, NBOGUS,
39ef13a4a   Cyrill Gorcunov   perf, x86: P4 PMU...
526
  						P4_PEBS_METRIC__2ndl_cache_load_miss_retired),
cb7d6b505   Lin Ming   perf, x86: Add ca...
527
  	},
d814f3010   Cyrill Gorcunov   x86, perf: Add ra...
528
  },
cb7d6b505   Lin Ming   perf, x86: Add ca...
529
530
531
   [ C(DTLB) ] = {
  	[ C(OP_READ) ] = {
  		[ C(RESULT_ACCESS) ] = 0x0,
d814f3010   Cyrill Gorcunov   x86, perf: Add ra...
532
  		[ C(RESULT_MISS)   ] = P4_GEN_CACHE_EVENT(P4_EVENT_REPLAY_EVENT, NBOGUS,
39ef13a4a   Cyrill Gorcunov   perf, x86: P4 PMU...
533
  						P4_PEBS_METRIC__dtlb_load_miss_retired),
cb7d6b505   Lin Ming   perf, x86: Add ca...
534
535
536
  	},
  	[ C(OP_WRITE) ] = {
  		[ C(RESULT_ACCESS) ] = 0x0,
d814f3010   Cyrill Gorcunov   x86, perf: Add ra...
537
  		[ C(RESULT_MISS)   ] = P4_GEN_CACHE_EVENT(P4_EVENT_REPLAY_EVENT, NBOGUS,
39ef13a4a   Cyrill Gorcunov   perf, x86: P4 PMU...
538
  						P4_PEBS_METRIC__dtlb_store_miss_retired),
cb7d6b505   Lin Ming   perf, x86: Add ca...
539
540
541
542
  	},
   },
   [ C(ITLB) ] = {
  	[ C(OP_READ) ] = {
d814f3010   Cyrill Gorcunov   x86, perf: Add ra...
543
  		[ C(RESULT_ACCESS) ] = P4_GEN_CACHE_EVENT(P4_EVENT_ITLB_REFERENCE, HIT,
39ef13a4a   Cyrill Gorcunov   perf, x86: P4 PMU...
544
  						P4_PEBS_METRIC__none),
d814f3010   Cyrill Gorcunov   x86, perf: Add ra...
545
  		[ C(RESULT_MISS)   ] = P4_GEN_CACHE_EVENT(P4_EVENT_ITLB_REFERENCE, MISS,
39ef13a4a   Cyrill Gorcunov   perf, x86: P4 PMU...
546
  						P4_PEBS_METRIC__none),
cb7d6b505   Lin Ming   perf, x86: Add ca...
547
548
549
550
551
552
553
554
555
556
  	},
  	[ C(OP_WRITE) ] = {
  		[ C(RESULT_ACCESS) ] = -1,
  		[ C(RESULT_MISS)   ] = -1,
  	},
  	[ C(OP_PREFETCH) ] = {
  		[ C(RESULT_ACCESS) ] = -1,
  		[ C(RESULT_MISS)   ] = -1,
  	},
   },
89d6c0b5b   Peter Zijlstra   perf, arch: Add g...
557
558
559
560
561
562
563
564
565
566
567
568
569
570
   [ C(NODE) ] = {
  	[ C(OP_READ) ] = {
  		[ C(RESULT_ACCESS) ] = -1,
  		[ C(RESULT_MISS)   ] = -1,
  	},
  	[ C(OP_WRITE) ] = {
  		[ C(RESULT_ACCESS) ] = -1,
  		[ C(RESULT_MISS)   ] = -1,
  	},
  	[ C(OP_PREFETCH) ] = {
  		[ C(RESULT_ACCESS) ] = -1,
  		[ C(RESULT_MISS)   ] = -1,
  	},
   },
cb7d6b505   Lin Ming   perf, x86: Add ca...
571
  };
f91298709   Cyrill Gorcunov   perf, x86: P4 PMU...
572
  /*
f53173e47   Cyrill Gorcunov   x86, perf: P4 PMU...
573
574
575
576
   * Because of Netburst being quite restricted in how many
   * identical events may run simultaneously, we introduce event aliases,
   * ie the different events which have the same functionality but
   * utilize non-intersected resources (ESCR/CCCR/counter registers).
f91298709   Cyrill Gorcunov   perf, x86: P4 PMU...
577
   *
f53173e47   Cyrill Gorcunov   x86, perf: P4 PMU...
578
579
   * This allow us to relax restrictions a bit and run two or more
   * identical events together.
f91298709   Cyrill Gorcunov   perf, x86: P4 PMU...
580
   *
f53173e47   Cyrill Gorcunov   x86, perf: P4 PMU...
581
582
583
   * Never set any custom internal bits such as P4_CONFIG_HT,
   * P4_CONFIG_ALIASABLE or bits for P4_PEBS_METRIC, they are
   * either up to date automatically or not applicable at all.
f91298709   Cyrill Gorcunov   perf, x86: P4 PMU...
584
585
   */
  struct p4_event_alias {
f53173e47   Cyrill Gorcunov   x86, perf: P4 PMU...
586
587
  	u64 original;
  	u64 alternative;
f91298709   Cyrill Gorcunov   perf, x86: P4 PMU...
588
589
590
  } p4_event_aliases[] = {
  	{
  		/*
f53173e47   Cyrill Gorcunov   x86, perf: P4 PMU...
591
592
593
594
595
  		 * Non-halted cycles can be substituted with non-sleeping cycles (see
  		 * Intel SDM Vol3b for details). We need this alias to be able
  		 * to run nmi-watchdog and 'perf top' (or any other user space tool
  		 * which is interested in running PERF_COUNT_HW_CPU_CYCLES)
  		 * simultaneously.
f91298709   Cyrill Gorcunov   perf, x86: P4 PMU...
596
  		 */
f53173e47   Cyrill Gorcunov   x86, perf: P4 PMU...
597
  	.original	=
f91298709   Cyrill Gorcunov   perf, x86: P4 PMU...
598
599
  		p4_config_pack_escr(P4_ESCR_EVENT(P4_EVENT_GLOBAL_POWER_EVENTS)		|
  				    P4_ESCR_EMASK_BIT(P4_EVENT_GLOBAL_POWER_EVENTS, RUNNING)),
f53173e47   Cyrill Gorcunov   x86, perf: P4 PMU...
600
  	.alternative	=
f91298709   Cyrill Gorcunov   perf, x86: P4 PMU...
601
602
603
604
605
606
607
608
609
610
611
612
613
614
615
616
617
618
619
620
  		p4_config_pack_escr(P4_ESCR_EVENT(P4_EVENT_EXECUTION_EVENT)		|
  				    P4_ESCR_EMASK_BIT(P4_EVENT_EXECUTION_EVENT, NBOGUS0)|
  				    P4_ESCR_EMASK_BIT(P4_EVENT_EXECUTION_EVENT, NBOGUS1)|
  				    P4_ESCR_EMASK_BIT(P4_EVENT_EXECUTION_EVENT, NBOGUS2)|
  				    P4_ESCR_EMASK_BIT(P4_EVENT_EXECUTION_EVENT, NBOGUS3)|
  				    P4_ESCR_EMASK_BIT(P4_EVENT_EXECUTION_EVENT, BOGUS0)	|
  				    P4_ESCR_EMASK_BIT(P4_EVENT_EXECUTION_EVENT, BOGUS1)	|
  				    P4_ESCR_EMASK_BIT(P4_EVENT_EXECUTION_EVENT, BOGUS2)	|
  				    P4_ESCR_EMASK_BIT(P4_EVENT_EXECUTION_EVENT, BOGUS3))|
  		p4_config_pack_cccr(P4_CCCR_THRESHOLD(15) | P4_CCCR_COMPLEMENT		|
  				    P4_CCCR_COMPARE),
  	},
  };
  
  static u64 p4_get_alias_event(u64 config)
  {
  	u64 config_match;
  	int i;
  
  	/*
f53173e47   Cyrill Gorcunov   x86, perf: P4 PMU...
621
622
623
  	 * Only event with special mark is allowed,
  	 * we're to be sure it didn't come as malformed
  	 * RAW event.
f91298709   Cyrill Gorcunov   perf, x86: P4 PMU...
624
625
626
627
628
  	 */
  	if (!(config & P4_CONFIG_ALIASABLE))
  		return 0;
  
  	config_match = config & P4_CONFIG_EVENT_ALIAS_MASK;
f91298709   Cyrill Gorcunov   perf, x86: P4 PMU...
629
  	for (i = 0; i < ARRAY_SIZE(p4_event_aliases); i++) {
f53173e47   Cyrill Gorcunov   x86, perf: P4 PMU...
630
631
  		if (config_match == p4_event_aliases[i].original) {
  			config_match = p4_event_aliases[i].alternative;
f91298709   Cyrill Gorcunov   perf, x86: P4 PMU...
632
  			break;
f53173e47   Cyrill Gorcunov   x86, perf: P4 PMU...
633
634
  		} else if (config_match == p4_event_aliases[i].alternative) {
  			config_match = p4_event_aliases[i].original;
f91298709   Cyrill Gorcunov   perf, x86: P4 PMU...
635
636
637
638
639
640
  			break;
  		}
  	}
  
  	if (i >= ARRAY_SIZE(p4_event_aliases))
  		return 0;
f53173e47   Cyrill Gorcunov   x86, perf: P4 PMU...
641
  	return config_match | (config & P4_CONFIG_EVENT_ALIAS_IMMUTABLE_BITS);
f91298709   Cyrill Gorcunov   perf, x86: P4 PMU...
642
  }
d814f3010   Cyrill Gorcunov   x86, perf: Add ra...
643
644
645
646
  static u64 p4_general_events[PERF_COUNT_HW_MAX] = {
    /* non-halted CPU clocks */
    [PERF_COUNT_HW_CPU_CYCLES] =
  	p4_config_pack_escr(P4_ESCR_EVENT(P4_EVENT_GLOBAL_POWER_EVENTS)		|
f91298709   Cyrill Gorcunov   perf, x86: P4 PMU...
647
648
  		P4_ESCR_EMASK_BIT(P4_EVENT_GLOBAL_POWER_EVENTS, RUNNING))	|
  		P4_CONFIG_ALIASABLE,
d814f3010   Cyrill Gorcunov   x86, perf: Add ra...
649
650
651
652
653
654
655
656
657
658
659
660
661
662
663
664
665
666
667
668
669
670
671
672
673
674
675
676
677
678
679
680
681
682
683
684
685
686
687
688
689
690
691
692
693
694
  
    /*
     * retired instructions
     * in a sake of simplicity we don't use the FSB tagging
     */
    [PERF_COUNT_HW_INSTRUCTIONS] =
  	p4_config_pack_escr(P4_ESCR_EVENT(P4_EVENT_INSTR_RETIRED)		|
  		P4_ESCR_EMASK_BIT(P4_EVENT_INSTR_RETIRED, NBOGUSNTAG)		|
  		P4_ESCR_EMASK_BIT(P4_EVENT_INSTR_RETIRED, BOGUSNTAG)),
  
    /* cache hits */
    [PERF_COUNT_HW_CACHE_REFERENCES] =
  	p4_config_pack_escr(P4_ESCR_EVENT(P4_EVENT_BSQ_CACHE_REFERENCE)		|
  		P4_ESCR_EMASK_BIT(P4_EVENT_BSQ_CACHE_REFERENCE, RD_2ndL_HITS)	|
  		P4_ESCR_EMASK_BIT(P4_EVENT_BSQ_CACHE_REFERENCE, RD_2ndL_HITE)	|
  		P4_ESCR_EMASK_BIT(P4_EVENT_BSQ_CACHE_REFERENCE, RD_2ndL_HITM)	|
  		P4_ESCR_EMASK_BIT(P4_EVENT_BSQ_CACHE_REFERENCE, RD_3rdL_HITS)	|
  		P4_ESCR_EMASK_BIT(P4_EVENT_BSQ_CACHE_REFERENCE, RD_3rdL_HITE)	|
  		P4_ESCR_EMASK_BIT(P4_EVENT_BSQ_CACHE_REFERENCE, RD_3rdL_HITM)),
  
    /* cache misses */
    [PERF_COUNT_HW_CACHE_MISSES] =
  	p4_config_pack_escr(P4_ESCR_EVENT(P4_EVENT_BSQ_CACHE_REFERENCE)		|
  		P4_ESCR_EMASK_BIT(P4_EVENT_BSQ_CACHE_REFERENCE, RD_2ndL_MISS)	|
  		P4_ESCR_EMASK_BIT(P4_EVENT_BSQ_CACHE_REFERENCE, RD_3rdL_MISS)	|
  		P4_ESCR_EMASK_BIT(P4_EVENT_BSQ_CACHE_REFERENCE, WR_2ndL_MISS)),
  
    /* branch instructions retired */
    [PERF_COUNT_HW_BRANCH_INSTRUCTIONS] =
  	p4_config_pack_escr(P4_ESCR_EVENT(P4_EVENT_RETIRED_BRANCH_TYPE)		|
  		P4_ESCR_EMASK_BIT(P4_EVENT_RETIRED_BRANCH_TYPE, CONDITIONAL)	|
  		P4_ESCR_EMASK_BIT(P4_EVENT_RETIRED_BRANCH_TYPE, CALL)		|
  		P4_ESCR_EMASK_BIT(P4_EVENT_RETIRED_BRANCH_TYPE, RETURN)		|
  		P4_ESCR_EMASK_BIT(P4_EVENT_RETIRED_BRANCH_TYPE, INDIRECT)),
  
    /* mispredicted branches retired */
    [PERF_COUNT_HW_BRANCH_MISSES]	=
  	p4_config_pack_escr(P4_ESCR_EVENT(P4_EVENT_MISPRED_BRANCH_RETIRED)	|
  		P4_ESCR_EMASK_BIT(P4_EVENT_MISPRED_BRANCH_RETIRED, NBOGUS)),
  
    /* bus ready clocks (cpu is driving #DRDY_DRV\#DRDY_OWN):  */
    [PERF_COUNT_HW_BUS_CYCLES] =
  	p4_config_pack_escr(P4_ESCR_EVENT(P4_EVENT_FSB_DATA_ACTIVITY)		|
  		P4_ESCR_EMASK_BIT(P4_EVENT_FSB_DATA_ACTIVITY, DRDY_DRV)		|
  		P4_ESCR_EMASK_BIT(P4_EVENT_FSB_DATA_ACTIVITY, DRDY_OWN))	|
  	p4_config_pack_cccr(P4_CCCR_EDGE | P4_CCCR_COMPARE),
a072738e0   Cyrill Gorcunov   perf, x86: Implem...
695
  };
d814f3010   Cyrill Gorcunov   x86, perf: Add ra...
696
697
698
699
700
701
702
703
704
705
  static struct p4_event_bind *p4_config_get_bind(u64 config)
  {
  	unsigned int evnt = p4_config_unpack_event(config);
  	struct p4_event_bind *bind = NULL;
  
  	if (evnt < ARRAY_SIZE(p4_event_bind_map))
  		bind = &p4_event_bind_map[evnt];
  
  	return bind;
  }
a072738e0   Cyrill Gorcunov   perf, x86: Implem...
706
707
  static u64 p4_pmu_event_map(int hw_event)
  {
d814f3010   Cyrill Gorcunov   x86, perf: Add ra...
708
709
  	struct p4_event_bind *bind;
  	unsigned int esel;
a072738e0   Cyrill Gorcunov   perf, x86: Implem...
710
  	u64 config;
d814f3010   Cyrill Gorcunov   x86, perf: Add ra...
711
712
713
714
  	config = p4_general_events[hw_event];
  	bind = p4_config_get_bind(config);
  	esel = P4_OPCODE_ESEL(bind->opcode);
  	config |= p4_config_pack_cccr(P4_CCCR_ESEL(esel));
a072738e0   Cyrill Gorcunov   perf, x86: Implem...
715

a072738e0   Cyrill Gorcunov   perf, x86: Implem...
716
717
  	return config;
  }
c9cf4a019   Cyrill Gorcunov   perf, x86, Pentiu...
718
719
720
721
722
723
724
725
726
727
728
729
730
731
732
733
734
735
  /* check cpu model specifics */
  static bool p4_event_match_cpu_model(unsigned int event_idx)
  {
  	/* INSTR_COMPLETED event only exist for model 3, 4, 6 (Prescott) */
  	if (event_idx == P4_EVENT_INSTR_COMPLETED) {
  		if (boot_cpu_data.x86_model != 3 &&
  			boot_cpu_data.x86_model != 4 &&
  			boot_cpu_data.x86_model != 6)
  			return false;
  	}
  
  	/*
  	 * For info
  	 * - IQ_ESCR0, IQ_ESCR1 only for models 1 and 2
  	 */
  
  	return true;
  }
39ef13a4a   Cyrill Gorcunov   perf, x86: P4 PMU...
736
737
  static int p4_validate_raw_event(struct perf_event *event)
  {
c9cf4a019   Cyrill Gorcunov   perf, x86, Pentiu...
738
  	unsigned int v, emask;
39ef13a4a   Cyrill Gorcunov   perf, x86: P4 PMU...
739

c9cf4a019   Cyrill Gorcunov   perf, x86, Pentiu...
740
  	/* User data may have out-of-bound event index */
39ef13a4a   Cyrill Gorcunov   perf, x86: P4 PMU...
741
  	v = p4_config_unpack_event(event->attr.config);
c9cf4a019   Cyrill Gorcunov   perf, x86, Pentiu...
742
743
744
745
746
  	if (v >= ARRAY_SIZE(p4_event_bind_map))
  		return -EINVAL;
  
  	/* It may be unsupported: */
  	if (!p4_event_match_cpu_model(v))
39ef13a4a   Cyrill Gorcunov   perf, x86: P4 PMU...
747
  		return -EINVAL;
c9cf4a019   Cyrill Gorcunov   perf, x86, Pentiu...
748
749
750
751
752
753
754
755
756
757
758
759
760
761
  
  	/*
  	 * NOTE: P4_CCCR_THREAD_ANY has not the same meaning as
  	 * in Architectural Performance Monitoring, it means not
  	 * on _which_ logical cpu to count but rather _when_, ie it
  	 * depends on logical cpu state -- count event if one cpu active,
  	 * none, both or any, so we just allow user to pass any value
  	 * desired.
  	 *
  	 * In turn we always set Tx_OS/Tx_USR bits bound to logical
  	 * cpu without their propagation to another cpu
  	 */
  
  	/*
0d2eb44f6   Lucas De Marchi   x86: Fix common m...
762
  	 * if an event is shared across the logical threads
c9cf4a019   Cyrill Gorcunov   perf, x86, Pentiu...
763
764
  	 * the user needs special permissions to be able to use it
  	 */
d038b12c6   Stephane Eranian   perf: Fix Pentium...
765
  	if (p4_ht_active() && p4_event_bind_map[v].shared) {
c9cf4a019   Cyrill Gorcunov   perf, x86, Pentiu...
766
767
  		if (perf_paranoid_cpu() && !capable(CAP_SYS_ADMIN))
  			return -EACCES;
39ef13a4a   Cyrill Gorcunov   perf, x86: P4 PMU...
768
  	}
c9cf4a019   Cyrill Gorcunov   perf, x86, Pentiu...
769
770
771
772
  	/* ESCR EventMask bits may be invalid */
  	emask = p4_config_unpack_escr(event->attr.config) & P4_ESCR_EVENTMASK_MASK;
  	if (emask & ~p4_event_bind_map[v].escr_emask)
  		return -EINVAL;
39ef13a4a   Cyrill Gorcunov   perf, x86: P4 PMU...
773
  	/*
c9cf4a019   Cyrill Gorcunov   perf, x86, Pentiu...
774
  	 * it may have some invalid PEBS bits
39ef13a4a   Cyrill Gorcunov   perf, x86: P4 PMU...
775
  	 */
c9cf4a019   Cyrill Gorcunov   perf, x86, Pentiu...
776
  	if (p4_config_pebs_has(event->attr.config, P4_PEBS_CONFIG_ENABLE))
39ef13a4a   Cyrill Gorcunov   perf, x86: P4 PMU...
777
  		return -EINVAL;
c9cf4a019   Cyrill Gorcunov   perf, x86, Pentiu...
778

39ef13a4a   Cyrill Gorcunov   perf, x86: P4 PMU...
779
  	v = p4_config_unpack_metric(event->attr.config);
c9cf4a019   Cyrill Gorcunov   perf, x86, Pentiu...
780
  	if (v >= ARRAY_SIZE(p4_pebs_bind_map))
39ef13a4a   Cyrill Gorcunov   perf, x86: P4 PMU...
781
  		return -EINVAL;
39ef13a4a   Cyrill Gorcunov   perf, x86: P4 PMU...
782
783
784
  
  	return 0;
  }
b4cdc5c26   Peter Zijlstra   perf, x86: Fix up...
785
  static int p4_hw_config(struct perf_event *event)
a072738e0   Cyrill Gorcunov   perf, x86: Implem...
786
  {
137351e0f   Cyrill Gorcunov   x86, perf: P4 PMU...
787
788
  	int cpu = get_cpu();
  	int rc = 0;
d814f3010   Cyrill Gorcunov   x86, perf: Add ra...
789
  	u32 escr, cccr;
a072738e0   Cyrill Gorcunov   perf, x86: Implem...
790
791
792
793
794
795
  
  	/*
  	 * the reason we use cpu that early is that: if we get scheduled
  	 * first time on the same cpu -- we will not need swap thread
  	 * specific flags in config (and will save some cpu cycles)
  	 */
d814f3010   Cyrill Gorcunov   x86, perf: Add ra...
796
  	cccr = p4_default_cccr_conf(cpu);
b4cdc5c26   Peter Zijlstra   perf, x86: Fix up...
797
798
799
800
  	escr = p4_default_escr_conf(cpu, event->attr.exclude_kernel,
  					 event->attr.exclude_user);
  	event->hw.config = p4_config_pack_escr(escr) |
  			   p4_config_pack_cccr(cccr);
a072738e0   Cyrill Gorcunov   perf, x86: Implem...
801

cb7d6b505   Lin Ming   perf, x86: Add ca...
802
  	if (p4_ht_active() && p4_ht_thread(cpu))
b4cdc5c26   Peter Zijlstra   perf, x86: Fix up...
803
  		event->hw.config = p4_set_ht_bit(event->hw.config);
de902d967   Cyrill Gorcunov   x86, perf: P4 PMU...
804
  	if (event->attr.type == PERF_TYPE_RAW) {
d038b12c6   Stephane Eranian   perf: Fix Pentium...
805
806
  		struct p4_event_bind *bind;
  		unsigned int esel;
c9cf4a019   Cyrill Gorcunov   perf, x86, Pentiu...
807
808
809
810
811
  		/*
  		 * Clear bits we reserve to be managed by kernel itself
  		 * and never allowed from a user space
  		 */
  		 event->attr.config &= P4_CONFIG_MASK;
39ef13a4a   Cyrill Gorcunov   perf, x86: P4 PMU...
812
813
  		rc = p4_validate_raw_event(event);
  		if (rc)
c7993165e   Cyrill Gorcunov   x86, perf: P4 PMU...
814
  			goto out;
c7993165e   Cyrill Gorcunov   x86, perf: P4 PMU...
815

de902d967   Cyrill Gorcunov   x86, perf: P4 PMU...
816
  		/*
39ef13a4a   Cyrill Gorcunov   perf, x86: P4 PMU...
817
818
  		 * Note that for RAW events we allow user to use P4_CCCR_RESERVED
  		 * bits since we keep additional info here (for cache events and etc)
de902d967   Cyrill Gorcunov   x86, perf: P4 PMU...
819
  		 */
c9cf4a019   Cyrill Gorcunov   perf, x86, Pentiu...
820
  		event->hw.config |= event->attr.config;
d038b12c6   Stephane Eranian   perf: Fix Pentium...
821
822
823
824
825
826
827
  		bind = p4_config_get_bind(event->attr.config);
  		if (!bind) {
  			rc = -EINVAL;
  			goto out;
  		}
  		esel = P4_OPCODE_ESEL(bind->opcode);
  		event->hw.config |= p4_config_pack_cccr(P4_CCCR_ESEL(esel));
de902d967   Cyrill Gorcunov   x86, perf: P4 PMU...
828
  	}
cb7d6b505   Lin Ming   perf, x86: Add ca...
829

137351e0f   Cyrill Gorcunov   x86, perf: P4 PMU...
830
  	rc = x86_setup_perfctr(event);
c7993165e   Cyrill Gorcunov   x86, perf: P4 PMU...
831
  out:
137351e0f   Cyrill Gorcunov   x86, perf: P4 PMU...
832
  	put_cpu();
137351e0f   Cyrill Gorcunov   x86, perf: P4 PMU...
833
  	return rc;
a072738e0   Cyrill Gorcunov   perf, x86: Implem...
834
  }
0db1a7bc0   Cyrill Gorcunov   perf, x86: P4 PMU...
835
  static inline int p4_pmu_clear_cccr_ovf(struct hw_perf_event *hwc)
a072738e0   Cyrill Gorcunov   perf, x86: Implem...
836
  {
047a3772f   Cyrill Gorcunov   perf, x86: P4 PMU...
837
  	u64 v;
a072738e0   Cyrill Gorcunov   perf, x86: Implem...
838

047a3772f   Cyrill Gorcunov   perf, x86: P4 PMU...
839
  	/* an official way for overflow indication */
73d6e5220   Robert Richter   perf, x86: Store ...
840
  	rdmsrl(hwc->config_base, v);
047a3772f   Cyrill Gorcunov   perf, x86: P4 PMU...
841
  	if (v & P4_CCCR_OVF) {
73d6e5220   Robert Richter   perf, x86: Store ...
842
  		wrmsrl(hwc->config_base, v & ~P4_CCCR_OVF);
047a3772f   Cyrill Gorcunov   perf, x86: P4 PMU...
843
  		return 1;
a072738e0   Cyrill Gorcunov   perf, x86: Implem...
844
  	}
0db1a7bc0   Cyrill Gorcunov   perf, x86: P4 PMU...
845

7d44ec193   Cyrill Gorcunov   perf, x86: P4 PMU...
846
847
848
849
850
851
852
  	/*
  	 * In some circumstances the overflow might issue an NMI but did
  	 * not set P4_CCCR_OVF bit. Because a counter holds a negative value
  	 * we simply check for high bit being set, if it's cleared it means
  	 * the counter has reached zero value and continued counting before
  	 * real NMI signal was received:
  	 */
242214f9c   Don Zickus   perf, x86: P4 PMU...
853
  	rdmsrl(hwc->event_base, v);
7d44ec193   Cyrill Gorcunov   perf, x86: P4 PMU...
854
  	if (!(v & ARCH_P4_UNFLAGGED_BIT))
047a3772f   Cyrill Gorcunov   perf, x86: P4 PMU...
855
856
857
  		return 1;
  
  	return 0;
a072738e0   Cyrill Gorcunov   perf, x86: Implem...
858
  }
39ef13a4a   Cyrill Gorcunov   perf, x86: P4 PMU...
859
860
861
862
863
864
865
  static void p4_pmu_disable_pebs(void)
  {
  	/*
  	 * FIXME
  	 *
  	 * It's still allowed that two threads setup same cache
  	 * events so we can't simply clear metrics until we knew
0d2eb44f6   Lucas De Marchi   x86: Fix common m...
866
  	 * no one is depending on us, so we need kind of counter
39ef13a4a   Cyrill Gorcunov   perf, x86: P4 PMU...
867
868
869
870
871
  	 * for "ReplayEvent" users.
  	 *
  	 * What is more complex -- RAW events, if user (for some
  	 * reason) will pass some cache event metric with improper
  	 * event opcode -- it's fine from hardware point of view
0d2eb44f6   Lucas De Marchi   x86: Fix common m...
872
  	 * but completely nonsense from "meaning" of such action.
39ef13a4a   Cyrill Gorcunov   perf, x86: P4 PMU...
873
874
875
876
877
878
879
880
  	 *
  	 * So at moment let leave metrics turned on forever -- it's
  	 * ok for now but need to be revisited!
  	 *
  	 * (void)checking_wrmsrl(MSR_IA32_PEBS_ENABLE, (u64)0);
  	 * (void)checking_wrmsrl(MSR_P4_PEBS_MATRIX_VERT, (u64)0);
  	 */
  }
a072738e0   Cyrill Gorcunov   perf, x86: Implem...
881
882
883
884
885
886
887
888
889
  static inline void p4_pmu_disable_event(struct perf_event *event)
  {
  	struct hw_perf_event *hwc = &event->hw;
  
  	/*
  	 * If event gets disabled while counter is in overflowed
  	 * state we need to clear P4_CCCR_OVF, otherwise interrupt get
  	 * asserted again and again
  	 */
73d6e5220   Robert Richter   perf, x86: Store ...
890
  	(void)checking_wrmsrl(hwc->config_base,
a072738e0   Cyrill Gorcunov   perf, x86: Implem...
891
  		(u64)(p4_config_unpack_cccr(hwc->config)) &
d814f3010   Cyrill Gorcunov   x86, perf: Add ra...
892
  			~P4_CCCR_ENABLE & ~P4_CCCR_OVF & ~P4_CCCR_RESERVED);
a072738e0   Cyrill Gorcunov   perf, x86: Implem...
893
894
895
896
897
898
  }
  
  static void p4_pmu_disable_all(void)
  {
  	struct cpu_hw_events *cpuc = &__get_cpu_var(cpu_hw_events);
  	int idx;
948b1bb89   Robert Richter   perf, x86: Undo s...
899
  	for (idx = 0; idx < x86_pmu.num_counters; idx++) {
a072738e0   Cyrill Gorcunov   perf, x86: Implem...
900
901
902
903
904
  		struct perf_event *event = cpuc->events[idx];
  		if (!test_bit(idx, cpuc->active_mask))
  			continue;
  		p4_pmu_disable_event(event);
  	}
39ef13a4a   Cyrill Gorcunov   perf, x86: P4 PMU...
905
906
907
908
909
910
911
912
913
914
915
916
917
918
919
920
921
922
923
924
  
  	p4_pmu_disable_pebs();
  }
  
  /* configuration must be valid */
  static void p4_pmu_enable_pebs(u64 config)
  {
  	struct p4_pebs_bind *bind;
  	unsigned int idx;
  
  	BUILD_BUG_ON(P4_PEBS_METRIC__max > P4_PEBS_CONFIG_METRIC_MASK);
  
  	idx = p4_config_unpack_metric(config);
  	if (idx == P4_PEBS_METRIC__none)
  		return;
  
  	bind = &p4_pebs_bind_map[idx];
  
  	(void)checking_wrmsrl(MSR_IA32_PEBS_ENABLE,	(u64)bind->metric_pebs);
  	(void)checking_wrmsrl(MSR_P4_PEBS_MATRIX_VERT,	(u64)bind->metric_vert);
a072738e0   Cyrill Gorcunov   perf, x86: Implem...
925
926
927
928
929
930
931
  }
  
  static void p4_pmu_enable_event(struct perf_event *event)
  {
  	struct hw_perf_event *hwc = &event->hw;
  	int thread = p4_ht_config_thread(hwc->config);
  	u64 escr_conf = p4_config_unpack_escr(p4_clear_ht_bit(hwc->config));
d814f3010   Cyrill Gorcunov   x86, perf: Add ra...
932
  	unsigned int idx = p4_config_unpack_event(hwc->config);
d814f3010   Cyrill Gorcunov   x86, perf: Add ra...
933
  	struct p4_event_bind *bind;
d814f3010   Cyrill Gorcunov   x86, perf: Add ra...
934
  	u64 escr_addr, cccr;
a072738e0   Cyrill Gorcunov   perf, x86: Implem...
935

d814f3010   Cyrill Gorcunov   x86, perf: Add ra...
936
937
  	bind = &p4_event_bind_map[idx];
  	escr_addr = (u64)bind->escr_msr[thread];
a072738e0   Cyrill Gorcunov   perf, x86: Implem...
938
939
940
941
942
943
944
  
  	/*
  	 * - we dont support cascaded counters yet
  	 * - and counter 1 is broken (erratum)
  	 */
  	WARN_ON_ONCE(p4_is_event_cascaded(hwc->config));
  	WARN_ON_ONCE(hwc->idx == 1);
d814f3010   Cyrill Gorcunov   x86, perf: Add ra...
945
946
947
948
949
950
951
  	/* we need a real Event value */
  	escr_conf &= ~P4_ESCR_EVENT_MASK;
  	escr_conf |= P4_ESCR_EVENT(P4_OPCODE_EVNT(bind->opcode));
  
  	cccr = p4_config_unpack_cccr(hwc->config);
  
  	/*
39ef13a4a   Cyrill Gorcunov   perf, x86: P4 PMU...
952
953
  	 * it could be Cache event so we need to write metrics
  	 * into additional MSRs
d814f3010   Cyrill Gorcunov   x86, perf: Add ra...
954
  	 */
39ef13a4a   Cyrill Gorcunov   perf, x86: P4 PMU...
955
  	p4_pmu_enable_pebs(hwc->config);
d814f3010   Cyrill Gorcunov   x86, perf: Add ra...
956
957
  
  	(void)checking_wrmsrl(escr_addr, escr_conf);
73d6e5220   Robert Richter   perf, x86: Store ...
958
  	(void)checking_wrmsrl(hwc->config_base,
d814f3010   Cyrill Gorcunov   x86, perf: Add ra...
959
  				(cccr & ~P4_CCCR_RESERVED) | P4_CCCR_ENABLE);
a072738e0   Cyrill Gorcunov   perf, x86: Implem...
960
  }
11164cd4f   Peter Zijlstra   perf, x86: Add Ne...
961
  static void p4_pmu_enable_all(int added)
a072738e0   Cyrill Gorcunov   perf, x86: Implem...
962
963
964
  {
  	struct cpu_hw_events *cpuc = &__get_cpu_var(cpu_hw_events);
  	int idx;
948b1bb89   Robert Richter   perf, x86: Undo s...
965
  	for (idx = 0; idx < x86_pmu.num_counters; idx++) {
a072738e0   Cyrill Gorcunov   perf, x86: Implem...
966
967
968
969
970
971
972
973
974
975
976
977
978
979
980
  		struct perf_event *event = cpuc->events[idx];
  		if (!test_bit(idx, cpuc->active_mask))
  			continue;
  		p4_pmu_enable_event(event);
  	}
  }
  
  static int p4_pmu_handle_irq(struct pt_regs *regs)
  {
  	struct perf_sample_data data;
  	struct cpu_hw_events *cpuc;
  	struct perf_event *event;
  	struct hw_perf_event *hwc;
  	int idx, handled = 0;
  	u64 val;
103b39348   Cyrill Gorcunov   perf, x86: P4 PMU...
981
  	perf_sample_data_init(&data, 0);
a072738e0   Cyrill Gorcunov   perf, x86: Implem...
982
983
  
  	cpuc = &__get_cpu_var(cpu_hw_events);
948b1bb89   Robert Richter   perf, x86: Undo s...
984
  	for (idx = 0; idx < x86_pmu.num_counters; idx++) {
1c250d709   Cyrill Gorcunov   perf, x86: P4 PMU...
985
  		int overflow;
a072738e0   Cyrill Gorcunov   perf, x86: Implem...
986

03e22198d   Cyrill Gorcunov   perf, x86: Handle...
987
988
989
990
  		if (!test_bit(idx, cpuc->active_mask)) {
  			/* catch in-flight IRQs */
  			if (__test_and_clear_bit(idx, cpuc->running))
  				handled++;
a072738e0   Cyrill Gorcunov   perf, x86: Implem...
991
  			continue;
03e22198d   Cyrill Gorcunov   perf, x86: Handle...
992
  		}
a072738e0   Cyrill Gorcunov   perf, x86: Implem...
993
994
995
996
997
  
  		event = cpuc->events[idx];
  		hwc = &event->hw;
  
  		WARN_ON_ONCE(hwc->idx != idx);
0db1a7bc0   Cyrill Gorcunov   perf, x86: P4 PMU...
998
  		/* it might be unflagged overflow */
1c250d709   Cyrill Gorcunov   perf, x86: P4 PMU...
999
  		overflow = p4_pmu_clear_cccr_ovf(hwc);
a072738e0   Cyrill Gorcunov   perf, x86: Implem...
1000
1001
  
  		val = x86_perf_event_update(event);
1c250d709   Cyrill Gorcunov   perf, x86: P4 PMU...
1002
  		if (!overflow && (val & (1ULL << (x86_pmu.cntval_bits - 1))))
a072738e0   Cyrill Gorcunov   perf, x86: Implem...
1003
  			continue;
1c250d709   Cyrill Gorcunov   perf, x86: P4 PMU...
1004
  		handled += overflow;
0db1a7bc0   Cyrill Gorcunov   perf, x86: P4 PMU...
1005
1006
  		/* event overflow for sure */
  		data.period = event->hw.last_period;
a072738e0   Cyrill Gorcunov   perf, x86: Implem...
1007
1008
1009
  
  		if (!x86_perf_event_set_period(event))
  			continue;
a8b0ca17b   Peter Zijlstra   perf: Remove the ...
1010
  		if (perf_event_overflow(event, &data, regs))
1ea5a6afd   Cyrill Gorcunov   perf, x86: P4 PMU...
1011
  			x86_pmu_stop(event, 0);
a072738e0   Cyrill Gorcunov   perf, x86: Implem...
1012
  	}
2bce5daca   Don Zickus   perf, x86, nmi: M...
1013
  	if (handled)
a072738e0   Cyrill Gorcunov   perf, x86: Implem...
1014
  		inc_irq_stat(apic_perf_irqs);
2bce5daca   Don Zickus   perf, x86, nmi: M...
1015
1016
1017
1018
1019
1020
1021
1022
1023
1024
1025
1026
  
  	/*
  	 * When dealing with the unmasking of the LVTPC on P4 perf hw, it has
  	 * been observed that the OVF bit flag has to be cleared first _before_
  	 * the LVTPC can be unmasked.
  	 *
  	 * The reason is the NMI line will continue to be asserted while the OVF
  	 * bit is set.  This causes a second NMI to generate if the LVTPC is
  	 * unmasked before the OVF bit is cleared, leading to unknown NMI
  	 * messages.
  	 */
  	apic_write(APIC_LVTPC, APIC_DM_NMI);
a072738e0   Cyrill Gorcunov   perf, x86: Implem...
1027

de725dec9   Peter Zijlstra   perf, x86: Fix ha...
1028
  	return handled;
a072738e0   Cyrill Gorcunov   perf, x86: Implem...
1029
1030
1031
1032
1033
1034
1035
1036
1037
1038
1039
1040
1041
1042
1043
1044
1045
1046
1047
1048
1049
1050
1051
1052
1053
1054
1055
  }
  
  /*
   * swap thread specific fields according to a thread
   * we are going to run on
   */
  static void p4_pmu_swap_config_ts(struct hw_perf_event *hwc, int cpu)
  {
  	u32 escr, cccr;
  
  	/*
  	 * we either lucky and continue on same cpu or no HT support
  	 */
  	if (!p4_should_swap_ts(hwc->config, cpu))
  		return;
  
  	/*
  	 * the event is migrated from an another logical
  	 * cpu, so we need to swap thread specific flags
  	 */
  
  	escr = p4_config_unpack_escr(hwc->config);
  	cccr = p4_config_unpack_cccr(hwc->config);
  
  	if (p4_ht_thread(cpu)) {
  		cccr &= ~P4_CCCR_OVF_PMI_T0;
  		cccr |= P4_CCCR_OVF_PMI_T1;
d814f3010   Cyrill Gorcunov   x86, perf: Add ra...
1056
1057
1058
  		if (escr & P4_ESCR_T0_OS) {
  			escr &= ~P4_ESCR_T0_OS;
  			escr |= P4_ESCR_T1_OS;
a072738e0   Cyrill Gorcunov   perf, x86: Implem...
1059
  		}
d814f3010   Cyrill Gorcunov   x86, perf: Add ra...
1060
1061
1062
  		if (escr & P4_ESCR_T0_USR) {
  			escr &= ~P4_ESCR_T0_USR;
  			escr |= P4_ESCR_T1_USR;
a072738e0   Cyrill Gorcunov   perf, x86: Implem...
1063
1064
1065
1066
1067
1068
1069
  		}
  		hwc->config  = p4_config_pack_escr(escr);
  		hwc->config |= p4_config_pack_cccr(cccr);
  		hwc->config |= P4_CONFIG_HT;
  	} else {
  		cccr &= ~P4_CCCR_OVF_PMI_T1;
  		cccr |= P4_CCCR_OVF_PMI_T0;
d814f3010   Cyrill Gorcunov   x86, perf: Add ra...
1070
1071
1072
  		if (escr & P4_ESCR_T1_OS) {
  			escr &= ~P4_ESCR_T1_OS;
  			escr |= P4_ESCR_T0_OS;
a072738e0   Cyrill Gorcunov   perf, x86: Implem...
1073
  		}
d814f3010   Cyrill Gorcunov   x86, perf: Add ra...
1074
1075
1076
  		if (escr & P4_ESCR_T1_USR) {
  			escr &= ~P4_ESCR_T1_USR;
  			escr |= P4_ESCR_T0_USR;
a072738e0   Cyrill Gorcunov   perf, x86: Implem...
1077
1078
1079
1080
1081
1082
  		}
  		hwc->config  = p4_config_pack_escr(escr);
  		hwc->config |= p4_config_pack_cccr(cccr);
  		hwc->config &= ~P4_CONFIG_HT;
  	}
  }
720019908   Cyrill Gorcunov   x86, perf: P4 PMU...
1083
1084
  /*
   * ESCR address hashing is tricky, ESCRs are not sequential
623aab896   Cyrill Gorcunov   perf, x86: P4 PMU...
1085
   * in memory but all starts from MSR_P4_BSU_ESCR0 (0x03a0) and
720019908   Cyrill Gorcunov   x86, perf: P4 PMU...
1086
1087
1088
1089
1090
1091
1092
1093
1094
1095
1096
1097
1098
1099
1100
1101
1102
1103
1104
1105
1106
1107
1108
1109
1110
1111
1112
1113
1114
1115
1116
1117
1118
1119
1120
1121
1122
1123
1124
1125
1126
1127
1128
1129
1130
1131
1132
1133
1134
1135
1136
1137
1138
1139
1140
1141
1142
1143
   * the metric between any ESCRs is laid in range [0xa0,0xe1]
   *
   * so we make ~70% filled hashtable
   */
  
  #define P4_ESCR_MSR_BASE		0x000003a0
  #define P4_ESCR_MSR_MAX			0x000003e1
  #define P4_ESCR_MSR_TABLE_SIZE		(P4_ESCR_MSR_MAX - P4_ESCR_MSR_BASE + 1)
  #define P4_ESCR_MSR_IDX(msr)		(msr - P4_ESCR_MSR_BASE)
  #define P4_ESCR_MSR_TABLE_ENTRY(msr)	[P4_ESCR_MSR_IDX(msr)] = msr
  
  static const unsigned int p4_escr_table[P4_ESCR_MSR_TABLE_SIZE] = {
  	P4_ESCR_MSR_TABLE_ENTRY(MSR_P4_ALF_ESCR0),
  	P4_ESCR_MSR_TABLE_ENTRY(MSR_P4_ALF_ESCR1),
  	P4_ESCR_MSR_TABLE_ENTRY(MSR_P4_BPU_ESCR0),
  	P4_ESCR_MSR_TABLE_ENTRY(MSR_P4_BPU_ESCR1),
  	P4_ESCR_MSR_TABLE_ENTRY(MSR_P4_BSU_ESCR0),
  	P4_ESCR_MSR_TABLE_ENTRY(MSR_P4_BSU_ESCR1),
  	P4_ESCR_MSR_TABLE_ENTRY(MSR_P4_CRU_ESCR0),
  	P4_ESCR_MSR_TABLE_ENTRY(MSR_P4_CRU_ESCR1),
  	P4_ESCR_MSR_TABLE_ENTRY(MSR_P4_CRU_ESCR2),
  	P4_ESCR_MSR_TABLE_ENTRY(MSR_P4_CRU_ESCR3),
  	P4_ESCR_MSR_TABLE_ENTRY(MSR_P4_CRU_ESCR4),
  	P4_ESCR_MSR_TABLE_ENTRY(MSR_P4_CRU_ESCR5),
  	P4_ESCR_MSR_TABLE_ENTRY(MSR_P4_DAC_ESCR0),
  	P4_ESCR_MSR_TABLE_ENTRY(MSR_P4_DAC_ESCR1),
  	P4_ESCR_MSR_TABLE_ENTRY(MSR_P4_FIRM_ESCR0),
  	P4_ESCR_MSR_TABLE_ENTRY(MSR_P4_FIRM_ESCR1),
  	P4_ESCR_MSR_TABLE_ENTRY(MSR_P4_FLAME_ESCR0),
  	P4_ESCR_MSR_TABLE_ENTRY(MSR_P4_FLAME_ESCR1),
  	P4_ESCR_MSR_TABLE_ENTRY(MSR_P4_FSB_ESCR0),
  	P4_ESCR_MSR_TABLE_ENTRY(MSR_P4_FSB_ESCR1),
  	P4_ESCR_MSR_TABLE_ENTRY(MSR_P4_IQ_ESCR0),
  	P4_ESCR_MSR_TABLE_ENTRY(MSR_P4_IQ_ESCR1),
  	P4_ESCR_MSR_TABLE_ENTRY(MSR_P4_IS_ESCR0),
  	P4_ESCR_MSR_TABLE_ENTRY(MSR_P4_IS_ESCR1),
  	P4_ESCR_MSR_TABLE_ENTRY(MSR_P4_ITLB_ESCR0),
  	P4_ESCR_MSR_TABLE_ENTRY(MSR_P4_ITLB_ESCR1),
  	P4_ESCR_MSR_TABLE_ENTRY(MSR_P4_IX_ESCR0),
  	P4_ESCR_MSR_TABLE_ENTRY(MSR_P4_IX_ESCR1),
  	P4_ESCR_MSR_TABLE_ENTRY(MSR_P4_MOB_ESCR0),
  	P4_ESCR_MSR_TABLE_ENTRY(MSR_P4_MOB_ESCR1),
  	P4_ESCR_MSR_TABLE_ENTRY(MSR_P4_MS_ESCR0),
  	P4_ESCR_MSR_TABLE_ENTRY(MSR_P4_MS_ESCR1),
  	P4_ESCR_MSR_TABLE_ENTRY(MSR_P4_PMH_ESCR0),
  	P4_ESCR_MSR_TABLE_ENTRY(MSR_P4_PMH_ESCR1),
  	P4_ESCR_MSR_TABLE_ENTRY(MSR_P4_RAT_ESCR0),
  	P4_ESCR_MSR_TABLE_ENTRY(MSR_P4_RAT_ESCR1),
  	P4_ESCR_MSR_TABLE_ENTRY(MSR_P4_SAAT_ESCR0),
  	P4_ESCR_MSR_TABLE_ENTRY(MSR_P4_SAAT_ESCR1),
  	P4_ESCR_MSR_TABLE_ENTRY(MSR_P4_SSU_ESCR0),
  	P4_ESCR_MSR_TABLE_ENTRY(MSR_P4_SSU_ESCR1),
  	P4_ESCR_MSR_TABLE_ENTRY(MSR_P4_TBPU_ESCR0),
  	P4_ESCR_MSR_TABLE_ENTRY(MSR_P4_TBPU_ESCR1),
  	P4_ESCR_MSR_TABLE_ENTRY(MSR_P4_TC_ESCR0),
  	P4_ESCR_MSR_TABLE_ENTRY(MSR_P4_TC_ESCR1),
  	P4_ESCR_MSR_TABLE_ENTRY(MSR_P4_U2L_ESCR0),
  	P4_ESCR_MSR_TABLE_ENTRY(MSR_P4_U2L_ESCR1),
a072738e0   Cyrill Gorcunov   perf, x86: Implem...
1144
1145
1146
1147
  };
  
  static int p4_get_escr_idx(unsigned int addr)
  {
720019908   Cyrill Gorcunov   x86, perf: P4 PMU...
1148
  	unsigned int idx = P4_ESCR_MSR_IDX(addr);
a072738e0   Cyrill Gorcunov   perf, x86: Implem...
1149

623aab896   Cyrill Gorcunov   perf, x86: P4 PMU...
1150
1151
1152
  	if (unlikely(idx >= P4_ESCR_MSR_TABLE_SIZE	||
  			!p4_escr_table[idx]		||
  			p4_escr_table[idx] != addr)) {
720019908   Cyrill Gorcunov   x86, perf: P4 PMU...
1153
1154
1155
  		WARN_ONCE(1, "P4 PMU: Wrong address passed: %x
  ", addr);
  		return -1;
a072738e0   Cyrill Gorcunov   perf, x86: Implem...
1156
  	}
720019908   Cyrill Gorcunov   x86, perf: P4 PMU...
1157
  	return idx;
a072738e0   Cyrill Gorcunov   perf, x86: Implem...
1158
  }
d814f3010   Cyrill Gorcunov   x86, perf: Add ra...
1159
1160
1161
  static int p4_next_cntr(int thread, unsigned long *used_mask,
  			struct p4_event_bind *bind)
  {
1ff3d7d79   Cyrill Gorcunov   x86, perf: P4 PMU...
1162
  	int i, j;
d814f3010   Cyrill Gorcunov   x86, perf: Add ra...
1163
1164
  
  	for (i = 0; i < P4_CNTR_LIMIT; i++) {
1ff3d7d79   Cyrill Gorcunov   x86, perf: P4 PMU...
1165
1166
  		j = bind->cntr[thread][i];
  		if (j != -1 && !test_bit(j, used_mask))
d814f3010   Cyrill Gorcunov   x86, perf: Add ra...
1167
1168
1169
1170
1171
  			return j;
  	}
  
  	return -1;
  }
a072738e0   Cyrill Gorcunov   perf, x86: Implem...
1172
1173
1174
  static int p4_pmu_schedule_events(struct cpu_hw_events *cpuc, int n, int *assign)
  {
  	unsigned long used_mask[BITS_TO_LONGS(X86_PMC_IDX_MAX)];
720019908   Cyrill Gorcunov   x86, perf: P4 PMU...
1175
  	unsigned long escr_mask[BITS_TO_LONGS(P4_ESCR_MSR_TABLE_SIZE)];
9d36dfcf2   Cyrill Gorcunov   perf, x86: P4_pmu...
1176
  	int cpu = smp_processor_id();
d814f3010   Cyrill Gorcunov   x86, perf: Add ra...
1177
1178
1179
1180
  	struct hw_perf_event *hwc;
  	struct p4_event_bind *bind;
  	unsigned int i, thread, num;
  	int cntr_idx, escr_idx;
f91298709   Cyrill Gorcunov   perf, x86: P4 PMU...
1181
1182
  	u64 config_alias;
  	int pass;
a072738e0   Cyrill Gorcunov   perf, x86: Implem...
1183
1184
  
  	bitmap_zero(used_mask, X86_PMC_IDX_MAX);
720019908   Cyrill Gorcunov   x86, perf: P4 PMU...
1185
  	bitmap_zero(escr_mask, P4_ESCR_MSR_TABLE_SIZE);
a072738e0   Cyrill Gorcunov   perf, x86: Implem...
1186

a072738e0   Cyrill Gorcunov   perf, x86: Implem...
1187
  	for (i = 0, num = n; i < n; i++, num--) {
d814f3010   Cyrill Gorcunov   x86, perf: Add ra...
1188

a072738e0   Cyrill Gorcunov   perf, x86: Implem...
1189
  		hwc = &cpuc->event_list[i]->hw;
a072738e0   Cyrill Gorcunov   perf, x86: Implem...
1190
  		thread = p4_ht_thread(cpu);
f91298709   Cyrill Gorcunov   perf, x86: P4 PMU...
1191
1192
1193
1194
  		pass = 0;
  
  again:
  		/*
f53173e47   Cyrill Gorcunov   x86, perf: P4 PMU...
1195
1196
1197
  		 * It's possible to hit a circular lock
  		 * between original and alternative events
  		 * if both are scheduled already.
f91298709   Cyrill Gorcunov   perf, x86: P4 PMU...
1198
1199
1200
  		 */
  		if (pass > 2)
  			goto done;
d814f3010   Cyrill Gorcunov   x86, perf: Add ra...
1201
1202
  		bind = p4_config_get_bind(hwc->config);
  		escr_idx = p4_get_escr_idx(bind->escr_msr[thread]);
720019908   Cyrill Gorcunov   x86, perf: P4 PMU...
1203
1204
  		if (unlikely(escr_idx == -1))
  			goto done;
a072738e0   Cyrill Gorcunov   perf, x86: Implem...
1205

a072738e0   Cyrill Gorcunov   perf, x86: Implem...
1206
  		if (hwc->idx != -1 && !p4_should_swap_ts(hwc->config, cpu)) {
d814f3010   Cyrill Gorcunov   x86, perf: Add ra...
1207
  			cntr_idx = hwc->idx;
a072738e0   Cyrill Gorcunov   perf, x86: Implem...
1208
1209
  			if (assign)
  				assign[i] = hwc->idx;
a072738e0   Cyrill Gorcunov   perf, x86: Implem...
1210
1211
  			goto reserve;
  		}
d814f3010   Cyrill Gorcunov   x86, perf: Add ra...
1212
  		cntr_idx = p4_next_cntr(thread, used_mask, bind);
f91298709   Cyrill Gorcunov   perf, x86: P4 PMU...
1213
1214
  		if (cntr_idx == -1 || test_bit(escr_idx, escr_mask)) {
  			/*
f53173e47   Cyrill Gorcunov   x86, perf: P4 PMU...
1215
  			 * Check whether an event alias is still available.
f91298709   Cyrill Gorcunov   perf, x86: P4 PMU...
1216
1217
1218
1219
1220
1221
1222
1223
  			 */
  			config_alias = p4_get_alias_event(hwc->config);
  			if (!config_alias)
  				goto done;
  			hwc->config = config_alias;
  			pass++;
  			goto again;
  		}
a072738e0   Cyrill Gorcunov   perf, x86: Implem...
1224

a072738e0   Cyrill Gorcunov   perf, x86: Implem...
1225
  		p4_pmu_swap_config_ts(hwc, cpu);
d814f3010   Cyrill Gorcunov   x86, perf: Add ra...
1226
1227
  		if (assign)
  			assign[i] = cntr_idx;
a072738e0   Cyrill Gorcunov   perf, x86: Implem...
1228
  reserve:
d814f3010   Cyrill Gorcunov   x86, perf: Add ra...
1229
  		set_bit(cntr_idx, used_mask);
a072738e0   Cyrill Gorcunov   perf, x86: Implem...
1230
1231
1232
1233
  		set_bit(escr_idx, escr_mask);
  	}
  
  done:
aa2bc1ade   Peter Zijlstra   perf: Don't use -...
1234
  	return num ? -EINVAL : 0;
a072738e0   Cyrill Gorcunov   perf, x86: Implem...
1235
  }
caaa8be3b   Peter Zijlstra   perf, x86: Fix __...
1236
  static __initconst const struct x86_pmu p4_pmu = {
a072738e0   Cyrill Gorcunov   perf, x86: Implem...
1237
1238
1239
1240
1241
1242
1243
1244
1245
  	.name			= "Netburst P4/Xeon",
  	.handle_irq		= p4_pmu_handle_irq,
  	.disable_all		= p4_pmu_disable_all,
  	.enable_all		= p4_pmu_enable_all,
  	.enable			= p4_pmu_enable_event,
  	.disable		= p4_pmu_disable_event,
  	.eventsel		= MSR_P4_BPU_CCCR0,
  	.perfctr		= MSR_P4_BPU_PERFCTR0,
  	.event_map		= p4_pmu_event_map,
d814f3010   Cyrill Gorcunov   x86, perf: Add ra...
1246
  	.max_events		= ARRAY_SIZE(p4_general_events),
a072738e0   Cyrill Gorcunov   perf, x86: Implem...
1247
1248
1249
1250
1251
1252
1253
  	.get_event_constraints	= x86_get_event_constraints,
  	/*
  	 * IF HT disabled we may need to use all
  	 * ARCH_P4_MAX_CCCR counters simulaneously
  	 * though leave it restricted at moment assuming
  	 * HT is on
  	 */
948b1bb89   Robert Richter   perf, x86: Undo s...
1254
  	.num_counters		= ARCH_P4_MAX_CCCR,
a072738e0   Cyrill Gorcunov   perf, x86: Implem...
1255
  	.apic			= 1,
047a3772f   Cyrill Gorcunov   perf, x86: P4 PMU...
1256
1257
1258
  	.cntval_bits		= ARCH_P4_CNTRVAL_BITS,
  	.cntval_mask		= ARCH_P4_CNTRVAL_MASK,
  	.max_period		= (1ULL << (ARCH_P4_CNTRVAL_BITS - 1)) - 1,
a072738e0   Cyrill Gorcunov   perf, x86: Implem...
1259
1260
  	.hw_config		= p4_hw_config,
  	.schedule_events	= p4_pmu_schedule_events,
68aa00ac0   Cyrill Gorcunov   perf, x86: Make a...
1261
1262
1263
1264
1265
1266
1267
1268
1269
  	/*
  	 * This handles erratum N15 in intel doc 249199-029,
  	 * the counter may not be updated correctly on write
  	 * so we need a second write operation to do the trick
  	 * (the official workaround didn't work)
  	 *
  	 * the former idea is taken from OProfile code
  	 */
  	.perfctr_second_write	= 1,
a072738e0   Cyrill Gorcunov   perf, x86: Implem...
1270
  };
de0428a7a   Kevin Winchester   x86, perf: Clean ...
1271
  __init int p4_pmu_init(void)
a072738e0   Cyrill Gorcunov   perf, x86: Implem...
1272
1273
  {
  	unsigned int low, high;
fa7b69475   Justin P. Mattock   perf events, x86,...
1274
  	/* If we get stripped -- indexing fails */
a072738e0   Cyrill Gorcunov   perf, x86: Implem...
1275
1276
1277
1278
1279
1280
1281
1282
  	BUILD_BUG_ON(ARCH_P4_MAX_CCCR > X86_PMC_MAX_GENERIC);
  
  	rdmsr(MSR_IA32_MISC_ENABLE, low, high);
  	if (!(low & (1 << 7))) {
  		pr_cont("unsupported Netburst CPU model %d ",
  			boot_cpu_data.x86_model);
  		return -ENODEV;
  	}
cb7d6b505   Lin Ming   perf, x86: Add ca...
1283
  	memcpy(hw_cache_event_ids, p4_hw_cache_event_ids,
d814f3010   Cyrill Gorcunov   x86, perf: Add ra...
1284
  		sizeof(hw_cache_event_ids));
cb7d6b505   Lin Ming   perf, x86: Add ca...
1285

a072738e0   Cyrill Gorcunov   perf, x86: Implem...
1286
1287
1288
1289
1290
1291
  	pr_cont("Netburst events, ");
  
  	x86_pmu = p4_pmu;
  
  	return 0;
  }