| 123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182 |
- /* SPDX-License-Identifier: MIT */
- /*
- * Copyright © 2019 Intel Corporation
- */
- #ifndef __INTEL_SSEU_H__
- #define __INTEL_SSEU_H__
- #include <linux/types.h>
- #include <linux/kernel.h>
- #include "i915_gem.h"
- struct drm_i915_private;
- struct intel_gt;
- struct drm_printer;
- /*
- * Maximum number of slices on older platforms. Slices no longer exist
- * starting on Xe_HP ("gslices," "cslices," etc. are a different concept and
- * are not expressed through fusing).
- */
- #define GEN_MAX_HSW_SLICES 3
- /*
- * Maximum number of subslices that can exist within a HSW-style slice. This
- * is only relevant to pre-Xe_HP platforms (Xe_HP and beyond use the
- * I915_MAX_SS_FUSE_BITS value below).
- */
- #define GEN_MAX_SS_PER_HSW_SLICE 8
- /*
- * Maximum number of 32-bit registers used by hardware to express the
- * enabled/disabled subslices.
- */
- #define I915_MAX_SS_FUSE_REGS 2
- #define I915_MAX_SS_FUSE_BITS (I915_MAX_SS_FUSE_REGS * 32)
- /* Maximum number of EUs that can exist within a subslice or DSS. */
- #define GEN_MAX_EUS_PER_SS 16
- #define SSEU_MAX(a, b) ((a) > (b) ? (a) : (b))
- /* The maximum number of bits needed to express each subslice/DSS independently */
- #define GEN_SS_MASK_SIZE SSEU_MAX(I915_MAX_SS_FUSE_BITS, \
- GEN_MAX_HSW_SLICES * GEN_MAX_SS_PER_HSW_SLICE)
- #define GEN_SSEU_STRIDE(max_entries) DIV_ROUND_UP(max_entries, BITS_PER_BYTE)
- #define GEN_MAX_SUBSLICE_STRIDE GEN_SSEU_STRIDE(GEN_SS_MASK_SIZE)
- #define GEN_MAX_EU_STRIDE GEN_SSEU_STRIDE(GEN_MAX_EUS_PER_SS)
- #define GEN_DSS_PER_GSLICE 4
- #define GEN_DSS_PER_CSLICE 8
- #define GEN_DSS_PER_MSLICE 8
- #define GEN_MAX_GSLICES (I915_MAX_SS_FUSE_BITS / GEN_DSS_PER_GSLICE)
- #define GEN_MAX_CSLICES (I915_MAX_SS_FUSE_BITS / GEN_DSS_PER_CSLICE)
- typedef union {
- u8 hsw[GEN_MAX_HSW_SLICES];
- /* Bitmap compatible with linux/bitmap.h; may exceed size of u64 */
- unsigned long xehp[BITS_TO_LONGS(I915_MAX_SS_FUSE_BITS)];
- } intel_sseu_ss_mask_t;
- #define XEHP_BITMAP_BITS(mask) ((int)BITS_PER_TYPE(typeof(mask.xehp)))
- struct sseu_dev_info {
- u8 slice_mask;
- intel_sseu_ss_mask_t subslice_mask;
- intel_sseu_ss_mask_t geometry_subslice_mask;
- intel_sseu_ss_mask_t compute_subslice_mask;
- union {
- u16 hsw[GEN_MAX_HSW_SLICES][GEN_MAX_SS_PER_HSW_SLICE];
- u16 xehp[I915_MAX_SS_FUSE_BITS];
- } eu_mask;
- u16 eu_total;
- u8 eu_per_subslice;
- u8 min_eu_in_pool;
- /* For each slice, which subslice(s) has(have) 7 EUs (bitfield)? */
- u8 subslice_7eu[3];
- u8 has_slice_pg:1;
- u8 has_subslice_pg:1;
- u8 has_eu_pg:1;
- /*
- * For Xe_HP and beyond, the hardware no longer has traditional slices
- * so we just report the entire DSS pool under a fake "slice 0."
- */
- u8 has_xehp_dss:1;
- /* Topology fields */
- u8 max_slices;
- u8 max_subslices;
- u8 max_eus_per_subslice;
- };
- /*
- * Powergating configuration for a particular (context,engine).
- */
- struct intel_sseu {
- u8 slice_mask;
- u8 subslice_mask;
- u8 min_eus_per_subslice;
- u8 max_eus_per_subslice;
- };
- static inline struct intel_sseu
- intel_sseu_from_device_info(const struct sseu_dev_info *sseu)
- {
- struct intel_sseu value = {
- .slice_mask = sseu->slice_mask,
- .subslice_mask = sseu->subslice_mask.hsw[0],
- .min_eus_per_subslice = sseu->max_eus_per_subslice,
- .max_eus_per_subslice = sseu->max_eus_per_subslice,
- };
- return value;
- }
- static inline bool
- intel_sseu_has_subslice(const struct sseu_dev_info *sseu, int slice,
- int subslice)
- {
- if (slice >= sseu->max_slices ||
- subslice >= sseu->max_subslices)
- return false;
- if (sseu->has_xehp_dss)
- return test_bit(subslice, sseu->subslice_mask.xehp);
- else
- return sseu->subslice_mask.hsw[slice] & BIT(subslice);
- }
- /*
- * Used to obtain the index of the first DSS. Can start searching from the
- * beginning of a specific dss group (e.g., gslice, cslice, etc.) if
- * groupsize and groupnum are non-zero.
- */
- static inline unsigned int
- intel_sseu_find_first_xehp_dss(const struct sseu_dev_info *sseu, int groupsize,
- int groupnum)
- {
- return find_next_bit(sseu->subslice_mask.xehp,
- XEHP_BITMAP_BITS(sseu->subslice_mask),
- groupnum * groupsize);
- }
- void intel_sseu_set_info(struct sseu_dev_info *sseu, u8 max_slices,
- u8 max_subslices, u8 max_eus_per_subslice);
- unsigned int
- intel_sseu_subslice_total(const struct sseu_dev_info *sseu);
- unsigned int
- intel_sseu_get_hsw_subslices(const struct sseu_dev_info *sseu, u8 slice);
- intel_sseu_ss_mask_t
- intel_sseu_get_compute_subslices(const struct sseu_dev_info *sseu);
- void intel_sseu_info_init(struct intel_gt *gt);
- u32 intel_sseu_make_rpcs(struct intel_gt *gt,
- const struct intel_sseu *req_sseu);
- void intel_sseu_dump(const struct sseu_dev_info *sseu, struct drm_printer *p);
- void intel_sseu_print_topology(struct drm_i915_private *i915,
- const struct sseu_dev_info *sseu,
- struct drm_printer *p);
- u16 intel_slicemask_from_xehp_dssmask(intel_sseu_ss_mask_t dss_mask, int dss_per_slice);
- int intel_sseu_copy_eumask_to_user(void __user *to,
- const struct sseu_dev_info *sseu);
- int intel_sseu_copy_ssmask_to_user(void __user *to,
- const struct sseu_dev_info *sseu);
- void intel_sseu_print_ss_info(const char *type,
- const struct sseu_dev_info *sseu,
- struct seq_file *m);
- #endif /* __INTEL_SSEU_H__ */
|