Loading...
Note: File does not exist in v5.4.
1// SPDX-License-Identifier: MIT
2/*
3 * Copyright © 2022 Intel Corporation
4 */
5
6#include "xe_tuning.h"
7
8#include <kunit/visibility.h>
9
10#include "regs/xe_gt_regs.h"
11#include "xe_gt_types.h"
12#include "xe_platform_types.h"
13#include "xe_rtp.h"
14
15#undef XE_REG_MCR
16#define XE_REG_MCR(...) XE_REG(__VA_ARGS__, .mcr = 1)
17
18static const struct xe_rtp_entry_sr gt_tunings[] = {
19 { XE_RTP_NAME("Tuning: Blend Fill Caching Optimization Disable"),
20 XE_RTP_RULES(PLATFORM(DG2)),
21 XE_RTP_ACTIONS(SET(XEHP_L3SCQREG7, BLEND_FILL_CACHING_OPT_DIS))
22 },
23 { XE_RTP_NAME("Tuning: 32B Access Enable"),
24 XE_RTP_RULES(PLATFORM(DG2)),
25 XE_RTP_ACTIONS(SET(XEHP_SQCM, EN_32B_ACCESS))
26 },
27
28 /* Xe2 */
29
30 { XE_RTP_NAME("Tuning: L3 cache"),
31 XE_RTP_RULES(GRAPHICS_VERSION_RANGE(2001, XE_RTP_END_VERSION_UNDEFINED)),
32 XE_RTP_ACTIONS(FIELD_SET(XEHP_L3SQCREG5, L3_PWM_TIMER_INIT_VAL_MASK,
33 REG_FIELD_PREP(L3_PWM_TIMER_INIT_VAL_MASK, 0x7f)))
34 },
35 { XE_RTP_NAME("Tuning: L3 cache - media"),
36 XE_RTP_RULES(MEDIA_VERSION_RANGE(2000, XE_RTP_END_VERSION_UNDEFINED)),
37 XE_RTP_ACTIONS(FIELD_SET(XE2LPM_L3SQCREG5, L3_PWM_TIMER_INIT_VAL_MASK,
38 REG_FIELD_PREP(L3_PWM_TIMER_INIT_VAL_MASK, 0x7f)))
39 },
40 { XE_RTP_NAME("Tuning: Compression Overfetch"),
41 XE_RTP_RULES(GRAPHICS_VERSION_RANGE(2001, XE_RTP_END_VERSION_UNDEFINED)),
42 XE_RTP_ACTIONS(CLR(CCCHKNREG1, ENCOMPPERFFIX),
43 SET(CCCHKNREG1, L3CMPCTRL))
44 },
45 { XE_RTP_NAME("Tuning: Compression Overfetch - media"),
46 XE_RTP_RULES(MEDIA_VERSION_RANGE(2000, XE_RTP_END_VERSION_UNDEFINED)),
47 XE_RTP_ACTIONS(CLR(XE2LPM_CCCHKNREG1, ENCOMPPERFFIX),
48 SET(XE2LPM_CCCHKNREG1, L3CMPCTRL))
49 },
50 { XE_RTP_NAME("Tuning: Enable compressible partial write overfetch in L3"),
51 XE_RTP_RULES(GRAPHICS_VERSION_RANGE(2001, XE_RTP_END_VERSION_UNDEFINED)),
52 XE_RTP_ACTIONS(SET(L3SQCREG3, COMPPWOVERFETCHEN))
53 },
54 { XE_RTP_NAME("Tuning: Enable compressible partial write overfetch in L3 - media"),
55 XE_RTP_RULES(MEDIA_VERSION_RANGE(2000, XE_RTP_END_VERSION_UNDEFINED)),
56 XE_RTP_ACTIONS(SET(XE2LPM_L3SQCREG3, COMPPWOVERFETCHEN))
57 },
58 { XE_RTP_NAME("Tuning: L2 Overfetch Compressible Only"),
59 XE_RTP_RULES(GRAPHICS_VERSION_RANGE(2001, XE_RTP_END_VERSION_UNDEFINED)),
60 XE_RTP_ACTIONS(SET(L3SQCREG2,
61 COMPMEMRD256BOVRFETCHEN))
62 },
63 { XE_RTP_NAME("Tuning: L2 Overfetch Compressible Only - media"),
64 XE_RTP_RULES(MEDIA_VERSION_RANGE(2000, XE_RTP_END_VERSION_UNDEFINED)),
65 XE_RTP_ACTIONS(SET(XE2LPM_L3SQCREG2,
66 COMPMEMRD256BOVRFETCHEN))
67 },
68 { XE_RTP_NAME("Tuning: Stateless compression control"),
69 XE_RTP_RULES(GRAPHICS_VERSION_RANGE(2001, XE_RTP_END_VERSION_UNDEFINED)),
70 XE_RTP_ACTIONS(FIELD_SET(STATELESS_COMPRESSION_CTRL, UNIFIED_COMPRESSION_FORMAT,
71 REG_FIELD_PREP(UNIFIED_COMPRESSION_FORMAT, 0)))
72 },
73 { XE_RTP_NAME("Tuning: Stateless compression control - media"),
74 XE_RTP_RULES(MEDIA_VERSION_RANGE(1301, XE_RTP_END_VERSION_UNDEFINED)),
75 XE_RTP_ACTIONS(FIELD_SET(STATELESS_COMPRESSION_CTRL, UNIFIED_COMPRESSION_FORMAT,
76 REG_FIELD_PREP(UNIFIED_COMPRESSION_FORMAT, 0)))
77 },
78 { XE_RTP_NAME("Tuning: L3 RW flush all Cache"),
79 XE_RTP_RULES(GRAPHICS_VERSION(2004)),
80 XE_RTP_ACTIONS(SET(SCRATCH3_LBCF, RWFLUSHALLEN))
81 },
82 { XE_RTP_NAME("Tuning: L3 RW flush all cache - media"),
83 XE_RTP_RULES(MEDIA_VERSION(2000)),
84 XE_RTP_ACTIONS(SET(XE2LPM_SCRATCH3_LBCF, RWFLUSHALLEN))
85 },
86
87 {}
88};
89
90static const struct xe_rtp_entry_sr engine_tunings[] = {
91 { XE_RTP_NAME("Tuning: Set Indirect State Override"),
92 XE_RTP_RULES(GRAPHICS_VERSION_RANGE(1200, 1274),
93 ENGINE_CLASS(RENDER)),
94 XE_RTP_ACTIONS(SET(SAMPLER_MODE, INDIRECT_STATE_BASE_ADDR_OVERRIDE))
95 },
96 {}
97};
98
99static const struct xe_rtp_entry_sr lrc_tunings[] = {
100 { XE_RTP_NAME("Tuning: ganged timer, also known as 16011163337"),
101 XE_RTP_RULES(GRAPHICS_VERSION_RANGE(1200, 1210), ENGINE_CLASS(RENDER)),
102 /* read verification is ignored due to 1608008084. */
103 XE_RTP_ACTIONS(FIELD_SET_NO_READ_MASK(FF_MODE2,
104 FF_MODE2_GS_TIMER_MASK,
105 FF_MODE2_GS_TIMER_224))
106 },
107
108 /* DG2 */
109
110 { XE_RTP_NAME("Tuning: L3 cache"),
111 XE_RTP_RULES(PLATFORM(DG2), ENGINE_CLASS(RENDER)),
112 XE_RTP_ACTIONS(FIELD_SET(XEHP_L3SQCREG5, L3_PWM_TIMER_INIT_VAL_MASK,
113 REG_FIELD_PREP(L3_PWM_TIMER_INIT_VAL_MASK, 0x7f)))
114 },
115 { XE_RTP_NAME("Tuning: TDS gang timer"),
116 XE_RTP_RULES(PLATFORM(DG2), ENGINE_CLASS(RENDER)),
117 /* read verification is ignored as in i915 - need to check enabling */
118 XE_RTP_ACTIONS(FIELD_SET_NO_READ_MASK(XEHP_FF_MODE2,
119 FF_MODE2_TDS_TIMER_MASK,
120 FF_MODE2_TDS_TIMER_128))
121 },
122 { XE_RTP_NAME("Tuning: TBIMR fast clip"),
123 XE_RTP_RULES(PLATFORM(DG2), ENGINE_CLASS(RENDER)),
124 XE_RTP_ACTIONS(SET(CHICKEN_RASTER_2, TBIMR_FAST_CLIP))
125 },
126
127 /* Xe_LPG */
128
129 { XE_RTP_NAME("Tuning: L3 cache"),
130 XE_RTP_RULES(GRAPHICS_VERSION_RANGE(1270, 1274), ENGINE_CLASS(RENDER)),
131 XE_RTP_ACTIONS(FIELD_SET(XEHP_L3SQCREG5, L3_PWM_TIMER_INIT_VAL_MASK,
132 REG_FIELD_PREP(L3_PWM_TIMER_INIT_VAL_MASK, 0x7f)))
133 },
134
135 /* Xe2_HPG */
136
137 { XE_RTP_NAME("Tuning: vs hit max value"),
138 XE_RTP_RULES(GRAPHICS_VERSION(2001), ENGINE_CLASS(RENDER)),
139 XE_RTP_ACTIONS(FIELD_SET(FF_MODE, VS_HIT_MAX_VALUE_MASK,
140 REG_FIELD_PREP(VS_HIT_MAX_VALUE_MASK, 0x3f)))
141 },
142
143 {}
144};
145
146void xe_tuning_process_gt(struct xe_gt *gt)
147{
148 struct xe_rtp_process_ctx ctx = XE_RTP_PROCESS_CTX_INITIALIZER(gt);
149
150 xe_rtp_process_to_sr(&ctx, gt_tunings, >->reg_sr);
151}
152EXPORT_SYMBOL_IF_KUNIT(xe_tuning_process_gt);
153
154void xe_tuning_process_engine(struct xe_hw_engine *hwe)
155{
156 struct xe_rtp_process_ctx ctx = XE_RTP_PROCESS_CTX_INITIALIZER(hwe);
157
158 xe_rtp_process_to_sr(&ctx, engine_tunings, &hwe->reg_sr);
159}
160EXPORT_SYMBOL_IF_KUNIT(xe_tuning_process_engine);
161
162/**
163 * xe_tuning_process_lrc - process lrc tunings
164 * @hwe: engine instance to process tunings for
165 *
166 * Process LRC table for this platform, saving in @hwe all the tunings that need
167 * to be applied on context restore. These are tunings touching registers that
168 * are part of the HW context image.
169 */
170void xe_tuning_process_lrc(struct xe_hw_engine *hwe)
171{
172 struct xe_rtp_process_ctx ctx = XE_RTP_PROCESS_CTX_INITIALIZER(hwe);
173
174 xe_rtp_process_to_sr(&ctx, lrc_tunings, &hwe->reg_lrc);
175}