Loading...
Note: File does not exist in v3.1.
1// SPDX-License-Identifier: MIT
2/*
3 * Copyright © 2022 Intel Corporation
4 */
5
6#include "xe_wa.h"
7
8#include <drm/drm_managed.h>
9#include <kunit/visibility.h>
10#include <linux/compiler_types.h>
11
12#include <generated/xe_wa_oob.h>
13
14#include "regs/xe_engine_regs.h"
15#include "regs/xe_gt_regs.h"
16#include "regs/xe_regs.h"
17#include "xe_device_types.h"
18#include "xe_force_wake.h"
19#include "xe_gt.h"
20#include "xe_hw_engine_types.h"
21#include "xe_mmio.h"
22#include "xe_platform_types.h"
23#include "xe_rtp.h"
24#include "xe_step.h"
25
26/**
27 * DOC: Hardware workarounds
28 *
29 * Hardware workarounds are register programming documented to be executed in
30 * the driver that fall outside of the normal programming sequences for a
31 * platform. There are some basic categories of workarounds, depending on
32 * how/when they are applied:
33 *
34 * - LRC workarounds: workarounds that touch registers that are
35 * saved/restored to/from the HW context image. The list is emitted (via Load
36 * Register Immediate commands) once when initializing the device and saved in
37 * the default context. That default context is then used on every context
38 * creation to have a "primed golden context", i.e. a context image that
39 * already contains the changes needed to all the registers.
40 *
41 * - Engine workarounds: the list of these WAs is applied whenever the specific
42 * engine is reset. It's also possible that a set of engine classes share a
43 * common power domain and they are reset together. This happens on some
44 * platforms with render and compute engines. In this case (at least) one of
45 * them need to keeep the workaround programming: the approach taken in the
46 * driver is to tie those workarounds to the first compute/render engine that
47 * is registered. When executing with GuC submission, engine resets are
48 * outside of kernel driver control, hence the list of registers involved in
49 * written once, on engine initialization, and then passed to GuC, that
50 * saves/restores their values before/after the reset takes place. See
51 * ``drivers/gpu/drm/xe/xe_guc_ads.c`` for reference.
52 *
53 * - GT workarounds: the list of these WAs is applied whenever these registers
54 * revert to their default values: on GPU reset, suspend/resume [1]_, etc.
55 *
56 * - Register whitelist: some workarounds need to be implemented in userspace,
57 * but need to touch privileged registers. The whitelist in the kernel
58 * instructs the hardware to allow the access to happen. From the kernel side,
59 * this is just a special case of a MMIO workaround (as we write the list of
60 * these to/be-whitelisted registers to some special HW registers).
61 *
62 * - Workaround batchbuffers: buffers that get executed automatically by the
63 * hardware on every HW context restore. These buffers are created and
64 * programmed in the default context so the hardware always go through those
65 * programming sequences when switching contexts. The support for workaround
66 * batchbuffers is enabled these hardware mechanisms:
67 *
68 * #. INDIRECT_CTX: A batchbuffer and an offset are provided in the default
69 * context, pointing the hardware to jump to that location when that offset
70 * is reached in the context restore. Workaround batchbuffer in the driver
71 * currently uses this mechanism for all platforms.
72 *
73 * #. BB_PER_CTX_PTR: A batchbuffer is provided in the default context,
74 * pointing the hardware to a buffer to continue executing after the
75 * engine registers are restored in a context restore sequence. This is
76 * currently not used in the driver.
77 *
78 * - Other/OOB: There are WAs that, due to their nature, cannot be applied from
79 * a central place. Those are peppered around the rest of the code, as needed.
80 * Workarounds related to the display IP are the main example.
81 *
82 * .. [1] Technically, some registers are powercontext saved & restored, so they
83 * survive a suspend/resume. In practice, writing them again is not too
84 * costly and simplifies things, so it's the approach taken in the driver.
85 *
86 * .. note::
87 * Hardware workarounds in xe work the same way as in i915, with the
88 * difference of how they are maintained in the code. In xe it uses the
89 * xe_rtp infrastructure so the workarounds can be kept in tables, following
90 * a more declarative approach rather than procedural.
91 */
92
93#undef XE_REG_MCR
94#define XE_REG_MCR(...) XE_REG(__VA_ARGS__, .mcr = 1)
95
96__diag_push();
97__diag_ignore_all("-Woverride-init", "Allow field overrides in table");
98
99static const struct xe_rtp_entry_sr gt_was[] = {
100 { XE_RTP_NAME("14011060649"),
101 XE_RTP_RULES(MEDIA_VERSION_RANGE(1200, 1255),
102 ENGINE_CLASS(VIDEO_DECODE),
103 FUNC(xe_rtp_match_even_instance)),
104 XE_RTP_ACTIONS(SET(VDBOX_CGCTL3F10(0), IECPUNIT_CLKGATE_DIS)),
105 XE_RTP_ENTRY_FLAG(FOREACH_ENGINE),
106 },
107 { XE_RTP_NAME("14011059788"),
108 XE_RTP_RULES(GRAPHICS_VERSION_RANGE(1200, 1210)),
109 XE_RTP_ACTIONS(SET(DFR_RATIO_EN_AND_CHICKEN, DFR_DISABLE))
110 },
111 { XE_RTP_NAME("14015795083"),
112 XE_RTP_RULES(GRAPHICS_VERSION_RANGE(1200, 1260)),
113 XE_RTP_ACTIONS(CLR(MISCCPCTL, DOP_CLOCK_GATE_RENDER_ENABLE))
114 },
115
116 /* DG1 */
117
118 { XE_RTP_NAME("1409420604"),
119 XE_RTP_RULES(PLATFORM(DG1)),
120 XE_RTP_ACTIONS(SET(SUBSLICE_UNIT_LEVEL_CLKGATE2, CPSSUNIT_CLKGATE_DIS))
121 },
122 { XE_RTP_NAME("1408615072"),
123 XE_RTP_RULES(PLATFORM(DG1)),
124 XE_RTP_ACTIONS(SET(UNSLICE_UNIT_LEVEL_CLKGATE2, VSUNIT_CLKGATE2_DIS))
125 },
126
127 /* DG2 */
128
129 { XE_RTP_NAME("22010523718"),
130 XE_RTP_RULES(SUBPLATFORM(DG2, G10)),
131 XE_RTP_ACTIONS(SET(UNSLICE_UNIT_LEVEL_CLKGATE, CG3DDISCFEG_CLKGATE_DIS))
132 },
133 { XE_RTP_NAME("14011006942"),
134 XE_RTP_RULES(SUBPLATFORM(DG2, G10)),
135 XE_RTP_ACTIONS(SET(SUBSLICE_UNIT_LEVEL_CLKGATE, DSS_ROUTER_CLKGATE_DIS))
136 },
137 { XE_RTP_NAME("14014830051"),
138 XE_RTP_RULES(PLATFORM(DG2)),
139 XE_RTP_ACTIONS(CLR(SARB_CHICKEN1, COMP_CKN_IN))
140 },
141 { XE_RTP_NAME("18018781329"),
142 XE_RTP_RULES(PLATFORM(DG2)),
143 XE_RTP_ACTIONS(SET(RENDER_MOD_CTRL, FORCE_MISS_FTLB),
144 SET(COMP_MOD_CTRL, FORCE_MISS_FTLB),
145 SET(XEHP_VDBX_MOD_CTRL, FORCE_MISS_FTLB),
146 SET(XEHP_VEBX_MOD_CTRL, FORCE_MISS_FTLB))
147 },
148 { XE_RTP_NAME("1509235366"),
149 XE_RTP_RULES(PLATFORM(DG2)),
150 XE_RTP_ACTIONS(SET(XEHP_GAMCNTRL_CTRL,
151 INVALIDATION_BROADCAST_MODE_DIS |
152 GLOBAL_INVALIDATION_MODE))
153 },
154
155 /* PVC */
156
157 { XE_RTP_NAME("18018781329"),
158 XE_RTP_RULES(PLATFORM(PVC)),
159 XE_RTP_ACTIONS(SET(RENDER_MOD_CTRL, FORCE_MISS_FTLB),
160 SET(COMP_MOD_CTRL, FORCE_MISS_FTLB),
161 SET(XEHP_VDBX_MOD_CTRL, FORCE_MISS_FTLB),
162 SET(XEHP_VEBX_MOD_CTRL, FORCE_MISS_FTLB))
163 },
164 { XE_RTP_NAME("16016694945"),
165 XE_RTP_RULES(PLATFORM(PVC)),
166 XE_RTP_ACTIONS(SET(XEHPC_LNCFMISCCFGREG0, XEHPC_OVRLSCCC))
167 },
168
169 /* Xe_LPG */
170
171 { XE_RTP_NAME("14015795083"),
172 XE_RTP_RULES(GRAPHICS_VERSION_RANGE(1270, 1271), GRAPHICS_STEP(A0, B0)),
173 XE_RTP_ACTIONS(CLR(MISCCPCTL, DOP_CLOCK_GATE_RENDER_ENABLE))
174 },
175 { XE_RTP_NAME("14018575942"),
176 XE_RTP_RULES(GRAPHICS_VERSION_RANGE(1270, 1271)),
177 XE_RTP_ACTIONS(SET(COMP_MOD_CTRL, FORCE_MISS_FTLB))
178 },
179 { XE_RTP_NAME("22016670082"),
180 XE_RTP_RULES(GRAPHICS_VERSION_RANGE(1270, 1271)),
181 XE_RTP_ACTIONS(SET(SQCNT1, ENFORCE_RAR))
182 },
183
184 /* Xe_LPM+ */
185
186 { XE_RTP_NAME("16021867713"),
187 XE_RTP_RULES(MEDIA_VERSION(1300),
188 ENGINE_CLASS(VIDEO_DECODE)),
189 XE_RTP_ACTIONS(SET(VDBOX_CGCTL3F1C(0), MFXPIPE_CLKGATE_DIS)),
190 XE_RTP_ENTRY_FLAG(FOREACH_ENGINE),
191 },
192 { XE_RTP_NAME("22016670082"),
193 XE_RTP_RULES(MEDIA_VERSION(1300)),
194 XE_RTP_ACTIONS(SET(XELPMP_SQCNT1, ENFORCE_RAR))
195 },
196
197 /* Xe2_LPG */
198
199 { XE_RTP_NAME("16020975621"),
200 XE_RTP_RULES(GRAPHICS_VERSION(2004), GRAPHICS_STEP(A0, B0)),
201 XE_RTP_ACTIONS(SET(XEHP_SLICE_UNIT_LEVEL_CLKGATE, SBEUNIT_CLKGATE_DIS))
202 },
203 { XE_RTP_NAME("14018157293"),
204 XE_RTP_RULES(GRAPHICS_VERSION(2004), GRAPHICS_STEP(A0, B0)),
205 XE_RTP_ACTIONS(SET(XEHPC_L3CLOS_MASK(0), ~0),
206 SET(XEHPC_L3CLOS_MASK(1), ~0),
207 SET(XEHPC_L3CLOS_MASK(2), ~0),
208 SET(XEHPC_L3CLOS_MASK(3), ~0))
209 },
210
211 /* Xe2_LPM */
212
213 { XE_RTP_NAME("14017421178"),
214 XE_RTP_RULES(MEDIA_VERSION(2000),
215 ENGINE_CLASS(VIDEO_DECODE)),
216 XE_RTP_ACTIONS(SET(VDBOX_CGCTL3F10(0), IECPUNIT_CLKGATE_DIS)),
217 XE_RTP_ENTRY_FLAG(FOREACH_ENGINE),
218 },
219 { XE_RTP_NAME("16021867713"),
220 XE_RTP_RULES(MEDIA_VERSION(2000),
221 ENGINE_CLASS(VIDEO_DECODE)),
222 XE_RTP_ACTIONS(SET(VDBOX_CGCTL3F1C(0), MFXPIPE_CLKGATE_DIS)),
223 XE_RTP_ENTRY_FLAG(FOREACH_ENGINE),
224 },
225 { XE_RTP_NAME("14019449301"),
226 XE_RTP_RULES(MEDIA_VERSION(2000), ENGINE_CLASS(VIDEO_DECODE)),
227 XE_RTP_ACTIONS(SET(VDBOX_CGCTL3F08(0), CG3DDISHRS_CLKGATE_DIS)),
228 XE_RTP_ENTRY_FLAG(FOREACH_ENGINE),
229 },
230
231 {}
232};
233
234static const struct xe_rtp_entry_sr engine_was[] = {
235 { XE_RTP_NAME("22010931296, 18011464164, 14010919138"),
236 XE_RTP_RULES(GRAPHICS_VERSION(1200), ENGINE_CLASS(RENDER)),
237 XE_RTP_ACTIONS(SET(FF_THREAD_MODE(RENDER_RING_BASE),
238 FF_TESSELATION_DOP_GATE_DISABLE))
239 },
240 { XE_RTP_NAME("1409804808"),
241 XE_RTP_RULES(GRAPHICS_VERSION(1200),
242 ENGINE_CLASS(RENDER),
243 IS_INTEGRATED),
244 XE_RTP_ACTIONS(SET(ROW_CHICKEN2, PUSH_CONST_DEREF_HOLD_DIS))
245 },
246 { XE_RTP_NAME("14010229206, 1409085225"),
247 XE_RTP_RULES(GRAPHICS_VERSION(1200),
248 ENGINE_CLASS(RENDER),
249 IS_INTEGRATED),
250 XE_RTP_ACTIONS(SET(ROW_CHICKEN4, DISABLE_TDL_PUSH))
251 },
252 { XE_RTP_NAME("1606931601"),
253 XE_RTP_RULES(GRAPHICS_VERSION_RANGE(1200, 1210), ENGINE_CLASS(RENDER)),
254 XE_RTP_ACTIONS(SET(ROW_CHICKEN2, DISABLE_EARLY_READ))
255 },
256 { XE_RTP_NAME("14010826681, 1606700617, 22010271021, 18019627453"),
257 XE_RTP_RULES(GRAPHICS_VERSION_RANGE(1200, 1255), ENGINE_CLASS(RENDER)),
258 XE_RTP_ACTIONS(SET(CS_DEBUG_MODE1(RENDER_RING_BASE),
259 FF_DOP_CLOCK_GATE_DISABLE))
260 },
261 { XE_RTP_NAME("1406941453"),
262 XE_RTP_RULES(GRAPHICS_VERSION_RANGE(1200, 1210), ENGINE_CLASS(RENDER)),
263 XE_RTP_ACTIONS(SET(SAMPLER_MODE, ENABLE_SMALLPL))
264 },
265 { XE_RTP_NAME("FtrPerCtxtPreemptionGranularityControl"),
266 XE_RTP_RULES(GRAPHICS_VERSION_RANGE(1200, 1250), ENGINE_CLASS(RENDER)),
267 XE_RTP_ACTIONS(SET(FF_SLICE_CS_CHICKEN1(RENDER_RING_BASE),
268 FFSC_PERCTX_PREEMPT_CTRL))
269 },
270
271 /* TGL */
272
273 { XE_RTP_NAME("1607297627, 1607030317, 1607186500"),
274 XE_RTP_RULES(PLATFORM(TIGERLAKE), ENGINE_CLASS(RENDER)),
275 XE_RTP_ACTIONS(SET(RING_PSMI_CTL(RENDER_RING_BASE),
276 WAIT_FOR_EVENT_POWER_DOWN_DISABLE |
277 RC_SEMA_IDLE_MSG_DISABLE))
278 },
279
280 /* RKL */
281
282 { XE_RTP_NAME("1607297627, 1607030317, 1607186500"),
283 XE_RTP_RULES(PLATFORM(ROCKETLAKE), ENGINE_CLASS(RENDER)),
284 XE_RTP_ACTIONS(SET(RING_PSMI_CTL(RENDER_RING_BASE),
285 WAIT_FOR_EVENT_POWER_DOWN_DISABLE |
286 RC_SEMA_IDLE_MSG_DISABLE))
287 },
288
289 /* ADL-P */
290
291 { XE_RTP_NAME("1607297627, 1607030317, 1607186500"),
292 XE_RTP_RULES(PLATFORM(ALDERLAKE_P), ENGINE_CLASS(RENDER)),
293 XE_RTP_ACTIONS(SET(RING_PSMI_CTL(RENDER_RING_BASE),
294 WAIT_FOR_EVENT_POWER_DOWN_DISABLE |
295 RC_SEMA_IDLE_MSG_DISABLE))
296 },
297
298 /* DG2 */
299
300 { XE_RTP_NAME("22013037850"),
301 XE_RTP_RULES(PLATFORM(DG2), FUNC(xe_rtp_match_first_render_or_compute)),
302 XE_RTP_ACTIONS(SET(LSC_CHICKEN_BIT_0_UDW,
303 DISABLE_128B_EVICTION_COMMAND_UDW))
304 },
305 { XE_RTP_NAME("22014226127"),
306 XE_RTP_RULES(PLATFORM(DG2), FUNC(xe_rtp_match_first_render_or_compute)),
307 XE_RTP_ACTIONS(SET(LSC_CHICKEN_BIT_0, DISABLE_D8_D16_COASLESCE))
308 },
309 { XE_RTP_NAME("18017747507"),
310 XE_RTP_RULES(PLATFORM(DG2), FUNC(xe_rtp_match_first_render_or_compute)),
311 XE_RTP_ACTIONS(SET(VFG_PREEMPTION_CHICKEN,
312 POLYGON_TRIFAN_LINELOOP_DISABLE))
313 },
314 { XE_RTP_NAME("22012826095, 22013059131"),
315 XE_RTP_RULES(SUBPLATFORM(DG2, G11),
316 FUNC(xe_rtp_match_first_render_or_compute)),
317 XE_RTP_ACTIONS(FIELD_SET(LSC_CHICKEN_BIT_0_UDW,
318 MAXREQS_PER_BANK,
319 REG_FIELD_PREP(MAXREQS_PER_BANK, 2)))
320 },
321 { XE_RTP_NAME("22013059131"),
322 XE_RTP_RULES(SUBPLATFORM(DG2, G11),
323 FUNC(xe_rtp_match_first_render_or_compute)),
324 XE_RTP_ACTIONS(SET(LSC_CHICKEN_BIT_0, FORCE_1_SUB_MESSAGE_PER_FRAGMENT))
325 },
326 { XE_RTP_NAME("14015227452"),
327 XE_RTP_RULES(PLATFORM(DG2),
328 FUNC(xe_rtp_match_first_render_or_compute)),
329 XE_RTP_ACTIONS(SET(ROW_CHICKEN4, XEHP_DIS_BBL_SYSPIPE))
330 },
331 { XE_RTP_NAME("16015675438"),
332 XE_RTP_RULES(PLATFORM(DG2),
333 FUNC(xe_rtp_match_first_render_or_compute)),
334 XE_RTP_ACTIONS(SET(FF_SLICE_CS_CHICKEN2(RENDER_RING_BASE),
335 PERF_FIX_BALANCING_CFE_DISABLE))
336 },
337 { XE_RTP_NAME("18028616096"),
338 XE_RTP_RULES(PLATFORM(DG2),
339 FUNC(xe_rtp_match_first_render_or_compute)),
340 XE_RTP_ACTIONS(SET(LSC_CHICKEN_BIT_0_UDW, UGM_FRAGMENT_THRESHOLD_TO_3))
341 },
342 { XE_RTP_NAME("22015475538"),
343 XE_RTP_RULES(PLATFORM(DG2),
344 FUNC(xe_rtp_match_first_render_or_compute)),
345 XE_RTP_ACTIONS(SET(LSC_CHICKEN_BIT_0_UDW, DIS_CHAIN_2XSIMD8))
346 },
347 { XE_RTP_NAME("22012654132"),
348 XE_RTP_RULES(SUBPLATFORM(DG2, G11),
349 FUNC(xe_rtp_match_first_render_or_compute)),
350 XE_RTP_ACTIONS(SET(CACHE_MODE_SS, ENABLE_PREFETCH_INTO_IC,
351 /*
352 * Register can't be read back for verification on
353 * DG2 due to Wa_14012342262
354 */
355 .read_mask = 0))
356 },
357 { XE_RTP_NAME("1509727124"),
358 XE_RTP_RULES(PLATFORM(DG2), ENGINE_CLASS(RENDER)),
359 XE_RTP_ACTIONS(SET(SAMPLER_MODE, SC_DISABLE_POWER_OPTIMIZATION_EBB))
360 },
361 { XE_RTP_NAME("22012856258"),
362 XE_RTP_RULES(PLATFORM(DG2), ENGINE_CLASS(RENDER)),
363 XE_RTP_ACTIONS(SET(ROW_CHICKEN2, DISABLE_READ_SUPPRESSION))
364 },
365 { XE_RTP_NAME("22010960976, 14013347512"),
366 XE_RTP_RULES(PLATFORM(DG2), ENGINE_CLASS(RENDER)),
367 XE_RTP_ACTIONS(CLR(XEHP_HDC_CHICKEN0,
368 LSC_L1_FLUSH_CTL_3D_DATAPORT_FLUSH_EVENTS_MASK))
369 },
370 { XE_RTP_NAME("14015150844"),
371 XE_RTP_RULES(PLATFORM(DG2), FUNC(xe_rtp_match_first_render_or_compute)),
372 XE_RTP_ACTIONS(SET(XEHP_HDC_CHICKEN0, DIS_ATOMIC_CHAINING_TYPED_WRITES,
373 XE_RTP_NOCHECK))
374 },
375
376 /* PVC */
377
378 { XE_RTP_NAME("22014226127"),
379 XE_RTP_RULES(PLATFORM(PVC), FUNC(xe_rtp_match_first_render_or_compute)),
380 XE_RTP_ACTIONS(SET(LSC_CHICKEN_BIT_0, DISABLE_D8_D16_COASLESCE))
381 },
382 { XE_RTP_NAME("14015227452"),
383 XE_RTP_RULES(PLATFORM(PVC), FUNC(xe_rtp_match_first_render_or_compute)),
384 XE_RTP_ACTIONS(SET(ROW_CHICKEN4, XEHP_DIS_BBL_SYSPIPE))
385 },
386 { XE_RTP_NAME("16015675438"),
387 XE_RTP_RULES(PLATFORM(PVC), FUNC(xe_rtp_match_first_render_or_compute)),
388 XE_RTP_ACTIONS(SET(FF_SLICE_CS_CHICKEN2(RENDER_RING_BASE),
389 PERF_FIX_BALANCING_CFE_DISABLE))
390 },
391 { XE_RTP_NAME("14014999345"),
392 XE_RTP_RULES(PLATFORM(PVC), ENGINE_CLASS(COMPUTE),
393 GRAPHICS_STEP(B0, C0)),
394 XE_RTP_ACTIONS(SET(CACHE_MODE_SS, DISABLE_ECC))
395 },
396
397 /* Xe_LPG */
398
399 { XE_RTP_NAME("14017856879"),
400 XE_RTP_RULES(GRAPHICS_VERSION_RANGE(1270, 1271),
401 FUNC(xe_rtp_match_first_render_or_compute)),
402 XE_RTP_ACTIONS(SET(ROW_CHICKEN3, DIS_FIX_EOT1_FLUSH))
403 },
404 { XE_RTP_NAME("14015150844"),
405 XE_RTP_RULES(GRAPHICS_VERSION_RANGE(1270, 1271),
406 FUNC(xe_rtp_match_first_render_or_compute)),
407 XE_RTP_ACTIONS(SET(XEHP_HDC_CHICKEN0, DIS_ATOMIC_CHAINING_TYPED_WRITES,
408 XE_RTP_NOCHECK))
409 },
410
411 /* Xe2_LPG */
412
413 { XE_RTP_NAME("18032247524"),
414 XE_RTP_RULES(GRAPHICS_VERSION(2004),
415 FUNC(xe_rtp_match_first_render_or_compute)),
416 XE_RTP_ACTIONS(SET(LSC_CHICKEN_BIT_0, SEQUENTIAL_ACCESS_UPGRADE_DISABLE))
417 },
418 { XE_RTP_NAME("16018712365"),
419 XE_RTP_RULES(GRAPHICS_VERSION(2004), FUNC(xe_rtp_match_first_render_or_compute)),
420 XE_RTP_ACTIONS(SET(LSC_CHICKEN_BIT_0_UDW, XE2_ALLOC_DPA_STARVE_FIX_DIS))
421 },
422 { XE_RTP_NAME("14018957109"),
423 XE_RTP_RULES(GRAPHICS_VERSION(2004), GRAPHICS_STEP(A0, B0),
424 FUNC(xe_rtp_match_first_render_or_compute)),
425 XE_RTP_ACTIONS(SET(HALF_SLICE_CHICKEN5, DISABLE_SAMPLE_G_PERFORMANCE))
426 },
427 { XE_RTP_NAME("16021540221"),
428 XE_RTP_RULES(GRAPHICS_VERSION(2004), GRAPHICS_STEP(A0, B0),
429 FUNC(xe_rtp_match_first_render_or_compute)),
430 XE_RTP_ACTIONS(SET(ROW_CHICKEN4, DISABLE_TDL_PUSH))
431 },
432 { XE_RTP_NAME("14019322943"),
433 XE_RTP_RULES(GRAPHICS_VERSION(2004), GRAPHICS_STEP(A0, B0),
434 FUNC(xe_rtp_match_first_render_or_compute)),
435 XE_RTP_ACTIONS(SET(LSC_CHICKEN_BIT_0, TGM_WRITE_EOM_FORCE))
436 },
437 { XE_RTP_NAME("14018471104"),
438 XE_RTP_RULES(GRAPHICS_VERSION(2004), FUNC(xe_rtp_match_first_render_or_compute)),
439 XE_RTP_ACTIONS(SET(LSC_CHICKEN_BIT_0_UDW, ENABLE_SMP_LD_RENDER_SURFACE_CONTROL))
440 },
441 { XE_RTP_NAME("16018737384"),
442 XE_RTP_RULES(GRAPHICS_VERSION(2004), FUNC(xe_rtp_match_first_render_or_compute)),
443 XE_RTP_ACTIONS(SET(ROW_CHICKEN, EARLY_EOT_DIS))
444 },
445 /*
446 * These two workarounds are the same, just applying to different
447 * engines. Although Wa_18032095049 (for the RCS) isn't required on
448 * all steppings, disabling these reports has no impact for our
449 * driver or the GuC, so we go ahead and treat it the same as
450 * Wa_16021639441 which does apply to all steppings.
451 */
452 { XE_RTP_NAME("18032095049, 16021639441"),
453 XE_RTP_RULES(GRAPHICS_VERSION(2004)),
454 XE_RTP_ACTIONS(SET(CSFE_CHICKEN1(0),
455 GHWSP_CSB_REPORT_DIS |
456 PPHWSP_CSB_AND_TIMESTAMP_REPORT_DIS,
457 XE_RTP_ACTION_FLAG(ENGINE_BASE)))
458 },
459 { XE_RTP_NAME("16018610683"),
460 XE_RTP_RULES(GRAPHICS_VERSION(2004), FUNC(xe_rtp_match_first_render_or_compute)),
461 XE_RTP_ACTIONS(SET(TDL_TSL_CHICKEN, SLM_WMTP_RESTORE))
462 },
463 {}
464};
465
466static const struct xe_rtp_entry_sr lrc_was[] = {
467 { XE_RTP_NAME("1409342910, 14010698770, 14010443199, 1408979724, 1409178076, 1409207793, 1409217633, 1409252684, 1409347922, 1409142259"),
468 XE_RTP_RULES(GRAPHICS_VERSION_RANGE(1200, 1210)),
469 XE_RTP_ACTIONS(SET(COMMON_SLICE_CHICKEN3,
470 DISABLE_CPS_AWARE_COLOR_PIPE))
471 },
472 { XE_RTP_NAME("WaDisableGPGPUMidThreadPreemption"),
473 XE_RTP_RULES(GRAPHICS_VERSION_RANGE(1200, 1210)),
474 XE_RTP_ACTIONS(FIELD_SET(CS_CHICKEN1(RENDER_RING_BASE),
475 PREEMPT_GPGPU_LEVEL_MASK,
476 PREEMPT_GPGPU_THREAD_GROUP_LEVEL))
477 },
478 { XE_RTP_NAME("1806527549"),
479 XE_RTP_RULES(GRAPHICS_VERSION(1200)),
480 XE_RTP_ACTIONS(SET(HIZ_CHICKEN, HZ_DEPTH_TEST_LE_GE_OPT_DISABLE))
481 },
482 { XE_RTP_NAME("1606376872"),
483 XE_RTP_RULES(GRAPHICS_VERSION(1200)),
484 XE_RTP_ACTIONS(SET(COMMON_SLICE_CHICKEN4, DISABLE_TDC_LOAD_BALANCING_CALC))
485 },
486
487 /* DG1 */
488
489 { XE_RTP_NAME("1409044764"),
490 XE_RTP_RULES(PLATFORM(DG1)),
491 XE_RTP_ACTIONS(CLR(COMMON_SLICE_CHICKEN3,
492 DG1_FLOAT_POINT_BLEND_OPT_STRICT_MODE_EN))
493 },
494 { XE_RTP_NAME("22010493298"),
495 XE_RTP_RULES(PLATFORM(DG1)),
496 XE_RTP_ACTIONS(SET(HIZ_CHICKEN,
497 DG1_HZ_READ_SUPPRESSION_OPTIMIZATION_DISABLE))
498 },
499
500 /* DG2 */
501
502 { XE_RTP_NAME("16013271637"),
503 XE_RTP_RULES(PLATFORM(DG2)),
504 XE_RTP_ACTIONS(SET(XEHP_SLICE_COMMON_ECO_CHICKEN1,
505 MSC_MSAA_REODER_BUF_BYPASS_DISABLE))
506 },
507 { XE_RTP_NAME("14014947963"),
508 XE_RTP_RULES(PLATFORM(DG2)),
509 XE_RTP_ACTIONS(FIELD_SET(VF_PREEMPTION,
510 PREEMPTION_VERTEX_COUNT,
511 0x4000))
512 },
513 { XE_RTP_NAME("18018764978"),
514 XE_RTP_RULES(PLATFORM(DG2)),
515 XE_RTP_ACTIONS(SET(XEHP_PSS_MODE2,
516 SCOREBOARD_STALL_FLUSH_CONTROL))
517 },
518 { XE_RTP_NAME("18019271663"),
519 XE_RTP_RULES(PLATFORM(DG2)),
520 XE_RTP_ACTIONS(SET(CACHE_MODE_1, MSAA_OPTIMIZATION_REDUC_DISABLE))
521 },
522 { XE_RTP_NAME("14019877138"),
523 XE_RTP_RULES(PLATFORM(DG2)),
524 XE_RTP_ACTIONS(SET(XEHP_PSS_CHICKEN, FD_END_COLLECT))
525 },
526
527 /* PVC */
528
529 { XE_RTP_NAME("16017236439"),
530 XE_RTP_RULES(PLATFORM(PVC), ENGINE_CLASS(COPY),
531 FUNC(xe_rtp_match_even_instance)),
532 XE_RTP_ACTIONS(SET(BCS_SWCTRL(0),
533 BCS_SWCTRL_DISABLE_256B,
534 XE_RTP_ACTION_FLAG(ENGINE_BASE))),
535 },
536
537 /* Xe_LPG */
538
539 { XE_RTP_NAME("18019271663"),
540 XE_RTP_RULES(GRAPHICS_VERSION_RANGE(1270, 1271)),
541 XE_RTP_ACTIONS(SET(CACHE_MODE_1, MSAA_OPTIMIZATION_REDUC_DISABLE))
542 },
543 { XE_RTP_NAME("14019877138"),
544 XE_RTP_RULES(GRAPHICS_VERSION_RANGE(1270, 1271), ENGINE_CLASS(RENDER)),
545 XE_RTP_ACTIONS(SET(XEHP_PSS_CHICKEN, FD_END_COLLECT))
546 },
547
548 /* Xe2_LPG */
549
550 { XE_RTP_NAME("16020518922"),
551 XE_RTP_RULES(GRAPHICS_VERSION(2004), GRAPHICS_STEP(A0, B0),
552 ENGINE_CLASS(RENDER)),
553 XE_RTP_ACTIONS(SET(FF_MODE,
554 DIS_TE_AUTOSTRIP |
555 DIS_MESH_PARTIAL_AUTOSTRIP |
556 DIS_MESH_AUTOSTRIP),
557 SET(VFLSKPD,
558 DIS_PARTIAL_AUTOSTRIP |
559 DIS_AUTOSTRIP))
560 },
561 { XE_RTP_NAME("14019386621"),
562 XE_RTP_RULES(GRAPHICS_VERSION(2004), ENGINE_CLASS(RENDER)),
563 XE_RTP_ACTIONS(SET(VF_SCRATCHPAD, XE2_VFG_TED_CREDIT_INTERFACE_DISABLE))
564 },
565 { XE_RTP_NAME("14019877138"),
566 XE_RTP_RULES(GRAPHICS_VERSION(2004), ENGINE_CLASS(RENDER)),
567 XE_RTP_ACTIONS(SET(XEHP_PSS_CHICKEN, FD_END_COLLECT))
568 },
569 { XE_RTP_NAME("14020013138"),
570 XE_RTP_RULES(GRAPHICS_VERSION(2004), GRAPHICS_STEP(A0, B0),
571 ENGINE_CLASS(RENDER)),
572 XE_RTP_ACTIONS(SET(WM_CHICKEN3, HIZ_PLANE_COMPRESSION_DIS))
573 },
574 { XE_RTP_NAME("14019988906"),
575 XE_RTP_RULES(GRAPHICS_VERSION(2004), ENGINE_CLASS(RENDER)),
576 XE_RTP_ACTIONS(SET(XEHP_PSS_CHICKEN, FLSH_IGNORES_PSD))
577 },
578 { XE_RTP_NAME("16020183090"),
579 XE_RTP_RULES(GRAPHICS_VERSION(2004), GRAPHICS_STEP(A0, B0),
580 ENGINE_CLASS(RENDER)),
581 XE_RTP_ACTIONS(SET(INSTPM(RENDER_RING_BASE), ENABLE_SEMAPHORE_POLL_BIT))
582 },
583
584 {}
585};
586
587static __maybe_unused const struct xe_rtp_entry oob_was[] = {
588#include <generated/xe_wa_oob.c>
589 {}
590};
591
592static_assert(ARRAY_SIZE(oob_was) - 1 == _XE_WA_OOB_COUNT);
593
594__diag_pop();
595
596/**
597 * xe_wa_process_oob - process OOB workaround table
598 * @gt: GT instance to process workarounds for
599 *
600 * Process OOB workaround table for this platform, marking in @gt the
601 * workarounds that are active.
602 */
603void xe_wa_process_oob(struct xe_gt *gt)
604{
605 struct xe_rtp_process_ctx ctx = XE_RTP_PROCESS_CTX_INITIALIZER(gt);
606
607 xe_rtp_process_ctx_enable_active_tracking(&ctx, gt->wa_active.oob,
608 ARRAY_SIZE(oob_was));
609 xe_rtp_process(&ctx, oob_was);
610}
611
612/**
613 * xe_wa_process_gt - process GT workaround table
614 * @gt: GT instance to process workarounds for
615 *
616 * Process GT workaround table for this platform, saving in @gt all the
617 * workarounds that need to be applied at the GT level.
618 */
619void xe_wa_process_gt(struct xe_gt *gt)
620{
621 struct xe_rtp_process_ctx ctx = XE_RTP_PROCESS_CTX_INITIALIZER(gt);
622
623 xe_rtp_process_ctx_enable_active_tracking(&ctx, gt->wa_active.gt,
624 ARRAY_SIZE(gt_was));
625 xe_rtp_process_to_sr(&ctx, gt_was, >->reg_sr);
626}
627EXPORT_SYMBOL_IF_KUNIT(xe_wa_process_gt);
628
629/**
630 * xe_wa_process_engine - process engine workaround table
631 * @hwe: engine instance to process workarounds for
632 *
633 * Process engine workaround table for this platform, saving in @hwe all the
634 * workarounds that need to be applied at the engine level that match this
635 * engine.
636 */
637void xe_wa_process_engine(struct xe_hw_engine *hwe)
638{
639 struct xe_rtp_process_ctx ctx = XE_RTP_PROCESS_CTX_INITIALIZER(hwe);
640
641 xe_rtp_process_ctx_enable_active_tracking(&ctx, hwe->gt->wa_active.engine,
642 ARRAY_SIZE(engine_was));
643 xe_rtp_process_to_sr(&ctx, engine_was, &hwe->reg_sr);
644}
645
646/**
647 * xe_wa_process_lrc - process context workaround table
648 * @hwe: engine instance to process workarounds for
649 *
650 * Process context workaround table for this platform, saving in @hwe all the
651 * workarounds that need to be applied on context restore. These are workarounds
652 * touching registers that are part of the HW context image.
653 */
654void xe_wa_process_lrc(struct xe_hw_engine *hwe)
655{
656 struct xe_rtp_process_ctx ctx = XE_RTP_PROCESS_CTX_INITIALIZER(hwe);
657
658 xe_rtp_process_ctx_enable_active_tracking(&ctx, hwe->gt->wa_active.lrc,
659 ARRAY_SIZE(lrc_was));
660 xe_rtp_process_to_sr(&ctx, lrc_was, &hwe->reg_lrc);
661}
662
663/**
664 * xe_wa_init - initialize gt with workaround bookkeeping
665 * @gt: GT instance to initialize
666 *
667 * Returns 0 for success, negative error code otherwise.
668 */
669int xe_wa_init(struct xe_gt *gt)
670{
671 struct xe_device *xe = gt_to_xe(gt);
672 size_t n_oob, n_lrc, n_engine, n_gt, total;
673 unsigned long *p;
674
675 n_gt = BITS_TO_LONGS(ARRAY_SIZE(gt_was));
676 n_engine = BITS_TO_LONGS(ARRAY_SIZE(engine_was));
677 n_lrc = BITS_TO_LONGS(ARRAY_SIZE(lrc_was));
678 n_oob = BITS_TO_LONGS(ARRAY_SIZE(oob_was));
679 total = n_gt + n_engine + n_lrc + n_oob;
680
681 p = drmm_kzalloc(&xe->drm, sizeof(*p) * total, GFP_KERNEL);
682 if (!p)
683 return -ENOMEM;
684
685 gt->wa_active.gt = p;
686 p += n_gt;
687 gt->wa_active.engine = p;
688 p += n_engine;
689 gt->wa_active.lrc = p;
690 p += n_lrc;
691 gt->wa_active.oob = p;
692
693 return 0;
694}
695
696void xe_wa_dump(struct xe_gt *gt, struct drm_printer *p)
697{
698 size_t idx;
699
700 drm_printf(p, "GT Workarounds\n");
701 for_each_set_bit(idx, gt->wa_active.gt, ARRAY_SIZE(gt_was))
702 drm_printf_indent(p, 1, "%s\n", gt_was[idx].name);
703
704 drm_printf(p, "\nEngine Workarounds\n");
705 for_each_set_bit(idx, gt->wa_active.engine, ARRAY_SIZE(engine_was))
706 drm_printf_indent(p, 1, "%s\n", engine_was[idx].name);
707
708 drm_printf(p, "\nLRC Workarounds\n");
709 for_each_set_bit(idx, gt->wa_active.lrc, ARRAY_SIZE(lrc_was))
710 drm_printf_indent(p, 1, "%s\n", lrc_was[idx].name);
711
712 drm_printf(p, "\nOOB Workarounds\n");
713 for_each_set_bit(idx, gt->wa_active.oob, ARRAY_SIZE(oob_was))
714 if (oob_was[idx].name)
715 drm_printf_indent(p, 1, "%s\n", oob_was[idx].name);
716}
717
718/*
719 * Apply tile (non-GT, non-display) workarounds. Think very carefully before
720 * adding anything to this function; most workarounds should be implemented
721 * elsewhere. The programming here is primarily for sgunit/soc workarounds,
722 * which are relatively rare. Since the registers these workarounds target are
723 * outside the GT, they should only need to be applied once at device
724 * probe/resume; they will not lose their values on any kind of GT or engine
725 * reset.
726 *
727 * TODO: We may want to move this over to xe_rtp in the future once we have
728 * enough workarounds to justify the work.
729 */
730void xe_wa_apply_tile_workarounds(struct xe_tile *tile)
731{
732 struct xe_gt *mmio = tile->primary_gt;
733
734 if (XE_WA(mmio, 22010954014))
735 xe_mmio_rmw32(mmio, XEHP_CLOCK_GATE_DIS, 0, SGSI_SIDECLK_DIS);
736}