Linux Audio

Check our new training course

Loading...
  1/* SPDX-License-Identifier: MIT */
  2/*
  3 * Copyright © 2019 Intel Corporation
  4 */
  5
  6#ifndef __INTEL_SSEU_H__
  7#define __INTEL_SSEU_H__
  8
  9#include <linux/types.h>
 10#include <linux/kernel.h>
 11
 12#include "i915_gem.h"
 13
 14struct drm_i915_private;
 15struct intel_gt;
 16struct drm_printer;
 17
 18/*
 19 * Maximum number of slices on older platforms.  Slices no longer exist
 20 * starting on Xe_HP ("gslices," "cslices," etc. are a different concept and
 21 * are not expressed through fusing).
 22 */
 23#define GEN_MAX_HSW_SLICES		3
 24
 25/*
 26 * Maximum number of subslices that can exist within a HSW-style slice.  This
 27 * is only relevant to pre-Xe_HP platforms (Xe_HP and beyond use the
 28 * I915_MAX_SS_FUSE_BITS value below).
 29 */
 30#define GEN_MAX_SS_PER_HSW_SLICE	8
 31
 32/*
 33 * Maximum number of 32-bit registers used by hardware to express the
 34 * enabled/disabled subslices.
 35 */
 36#define I915_MAX_SS_FUSE_REGS	2
 37#define I915_MAX_SS_FUSE_BITS	(I915_MAX_SS_FUSE_REGS * 32)
 38
 39/* Maximum number of EUs that can exist within a subslice or DSS. */
 40#define GEN_MAX_EUS_PER_SS		16
 41
 42#define SSEU_MAX(a, b)			((a) > (b) ? (a) : (b))
 43
 44/* The maximum number of bits needed to express each subslice/DSS independently */
 45#define GEN_SS_MASK_SIZE		SSEU_MAX(I915_MAX_SS_FUSE_BITS, \
 46						 GEN_MAX_HSW_SLICES * GEN_MAX_SS_PER_HSW_SLICE)
 47
 48#define GEN_SSEU_STRIDE(max_entries)	DIV_ROUND_UP(max_entries, BITS_PER_BYTE)
 49#define GEN_MAX_SUBSLICE_STRIDE		GEN_SSEU_STRIDE(GEN_SS_MASK_SIZE)
 50#define GEN_MAX_EU_STRIDE		GEN_SSEU_STRIDE(GEN_MAX_EUS_PER_SS)
 51
 52#define GEN_DSS_PER_GSLICE	4
 53#define GEN_DSS_PER_CSLICE	8
 54#define GEN_DSS_PER_MSLICE	8
 55
 56#define GEN_MAX_GSLICES		(I915_MAX_SS_FUSE_BITS / GEN_DSS_PER_GSLICE)
 57#define GEN_MAX_CSLICES		(I915_MAX_SS_FUSE_BITS / GEN_DSS_PER_CSLICE)
 58
 59typedef union {
 60	u8 hsw[GEN_MAX_HSW_SLICES];
 61
 62	/* Bitmap compatible with linux/bitmap.h; may exceed size of u64 */
 63	unsigned long xehp[BITS_TO_LONGS(I915_MAX_SS_FUSE_BITS)];
 64} intel_sseu_ss_mask_t;
 65
 66#define XEHP_BITMAP_BITS(mask)	((int)BITS_PER_TYPE(typeof(mask.xehp)))
 67
 68struct sseu_dev_info {
 69	u8 slice_mask;
 70	intel_sseu_ss_mask_t subslice_mask;
 71	intel_sseu_ss_mask_t geometry_subslice_mask;
 72	intel_sseu_ss_mask_t compute_subslice_mask;
 73	union {
 74		u16 hsw[GEN_MAX_HSW_SLICES][GEN_MAX_SS_PER_HSW_SLICE];
 75		u16 xehp[I915_MAX_SS_FUSE_BITS];
 76	} eu_mask;
 77
 78	u16 eu_total;
 79	u8 eu_per_subslice;
 80	u8 min_eu_in_pool;
 81	/* For each slice, which subslice(s) has(have) 7 EUs (bitfield)? */
 82	u8 subslice_7eu[3];
 83	u8 has_slice_pg:1;
 84	u8 has_subslice_pg:1;
 85	u8 has_eu_pg:1;
 86	/*
 87	 * For Xe_HP and beyond, the hardware no longer has traditional slices
 88	 * so we just report the entire DSS pool under a fake "slice 0."
 89	 */
 90	u8 has_xehp_dss:1;
 91
 92	/* Topology fields */
 93	u8 max_slices;
 94	u8 max_subslices;
 95	u8 max_eus_per_subslice;
 96};
 97
 98/*
 99 * Powergating configuration for a particular (context,engine).
100 */
101struct intel_sseu {
102	u8 slice_mask;
103	u8 subslice_mask;
104	u8 min_eus_per_subslice;
105	u8 max_eus_per_subslice;
106};
107
108static inline struct intel_sseu
109intel_sseu_from_device_info(const struct sseu_dev_info *sseu)
110{
111	struct intel_sseu value = {
112		.slice_mask = sseu->slice_mask,
113		.subslice_mask = sseu->subslice_mask.hsw[0],
114		.min_eus_per_subslice = sseu->max_eus_per_subslice,
115		.max_eus_per_subslice = sseu->max_eus_per_subslice,
116	};
117
118	return value;
119}
120
121static inline bool
122intel_sseu_has_subslice(const struct sseu_dev_info *sseu, int slice,
123			int subslice)
124{
125	if (slice >= sseu->max_slices ||
126	    subslice >= sseu->max_subslices)
127		return false;
128
129	if (sseu->has_xehp_dss)
130		return test_bit(subslice, sseu->subslice_mask.xehp);
131	else
132		return sseu->subslice_mask.hsw[slice] & BIT(subslice);
133}
134
135/*
136 * Used to obtain the index of the first DSS.  Can start searching from the
137 * beginning of a specific dss group (e.g., gslice, cslice, etc.) if
138 * groupsize and groupnum are non-zero.
139 */
140static inline unsigned int
141intel_sseu_find_first_xehp_dss(const struct sseu_dev_info *sseu, int groupsize,
142			       int groupnum)
143{
144	return find_next_bit(sseu->subslice_mask.xehp,
145			     XEHP_BITMAP_BITS(sseu->subslice_mask),
146			     groupnum * groupsize);
147}
148
149void intel_sseu_set_info(struct sseu_dev_info *sseu, u8 max_slices,
150			 u8 max_subslices, u8 max_eus_per_subslice);
151
152unsigned int
153intel_sseu_subslice_total(const struct sseu_dev_info *sseu);
154
155unsigned int
156intel_sseu_get_hsw_subslices(const struct sseu_dev_info *sseu, u8 slice);
157
158intel_sseu_ss_mask_t
159intel_sseu_get_compute_subslices(const struct sseu_dev_info *sseu);
160
161void intel_sseu_info_init(struct intel_gt *gt);
162
163u32 intel_sseu_make_rpcs(struct intel_gt *gt,
164			 const struct intel_sseu *req_sseu);
165
166void intel_sseu_dump(const struct sseu_dev_info *sseu, struct drm_printer *p);
167void intel_sseu_print_topology(struct drm_i915_private *i915,
168			       const struct sseu_dev_info *sseu,
169			       struct drm_printer *p);
170
171u16 intel_slicemask_from_xehp_dssmask(intel_sseu_ss_mask_t dss_mask, int dss_per_slice);
172
173int intel_sseu_copy_eumask_to_user(void __user *to,
174				   const struct sseu_dev_info *sseu);
175int intel_sseu_copy_ssmask_to_user(void __user *to,
176				   const struct sseu_dev_info *sseu);
177
178void intel_sseu_print_ss_info(const char *type,
179			      const struct sseu_dev_info *sseu,
180			      struct seq_file *m);
181
182#endif /* __INTEL_SSEU_H__ */