| 1 | /* SPDX-License-Identifier: MIT */ |
| 2 | /* |
| 3 | * Copyright © 2019 Intel Corporation |
| 4 | */ |
| 5 | |
| 6 | #ifndef __INTEL_SSEU_H__ |
| 7 | #define __INTEL_SSEU_H__ |
| 8 | |
| 9 | #include <linux/types.h> |
| 10 | #include <linux/kernel.h> |
| 11 | |
| 12 | #include "i915_gem.h" |
| 13 | |
| 14 | struct drm_i915_private; |
| 15 | struct intel_gt; |
| 16 | struct drm_printer; |
| 17 | |
| 18 | /* |
| 19 | * Maximum number of slices on older platforms. Slices no longer exist |
| 20 | * starting on Xe_HP ("gslices," "cslices," etc. are a different concept and |
| 21 | * are not expressed through fusing). |
| 22 | */ |
| 23 | #define GEN_MAX_HSW_SLICES 3 |
| 24 | |
| 25 | /* |
| 26 | * Maximum number of subslices that can exist within a HSW-style slice. This |
| 27 | * is only relevant to pre-Xe_HP platforms (Xe_HP and beyond use the |
| 28 | * I915_MAX_SS_FUSE_BITS value below). |
| 29 | */ |
| 30 | #define GEN_MAX_SS_PER_HSW_SLICE 8 |
| 31 | |
| 32 | /* |
| 33 | * Maximum number of 32-bit registers used by hardware to express the |
| 34 | * enabled/disabled subslices. |
| 35 | */ |
| 36 | #define I915_MAX_SS_FUSE_REGS 2 |
| 37 | #define I915_MAX_SS_FUSE_BITS (I915_MAX_SS_FUSE_REGS * 32) |
| 38 | |
| 39 | /* Maximum number of EUs that can exist within a subslice or DSS. */ |
| 40 | #define GEN_MAX_EUS_PER_SS 16 |
| 41 | |
| 42 | #define SSEU_MAX(a, b) ((a) > (b) ? (a) : (b)) |
| 43 | |
| 44 | /* The maximum number of bits needed to express each subslice/DSS independently */ |
| 45 | #define GEN_SS_MASK_SIZE SSEU_MAX(I915_MAX_SS_FUSE_BITS, \ |
| 46 | GEN_MAX_HSW_SLICES * GEN_MAX_SS_PER_HSW_SLICE) |
| 47 | |
| 48 | #define GEN_SSEU_STRIDE(max_entries) DIV_ROUND_UP(max_entries, BITS_PER_BYTE) |
| 49 | #define GEN_MAX_SUBSLICE_STRIDE GEN_SSEU_STRIDE(GEN_SS_MASK_SIZE) |
| 50 | #define GEN_MAX_EU_STRIDE GEN_SSEU_STRIDE(GEN_MAX_EUS_PER_SS) |
| 51 | |
| 52 | #define GEN_DSS_PER_GSLICE 4 |
| 53 | #define GEN_DSS_PER_CSLICE 8 |
| 54 | #define GEN_DSS_PER_MSLICE 8 |
| 55 | |
| 56 | #define GEN_MAX_GSLICES (I915_MAX_SS_FUSE_BITS / GEN_DSS_PER_GSLICE) |
| 57 | #define GEN_MAX_CSLICES (I915_MAX_SS_FUSE_BITS / GEN_DSS_PER_CSLICE) |
| 58 | |
| 59 | typedef union { |
| 60 | u8 hsw[GEN_MAX_HSW_SLICES]; |
| 61 | |
| 62 | /* Bitmap compatible with linux/bitmap.h; may exceed size of u64 */ |
| 63 | unsigned long xehp[BITS_TO_LONGS(I915_MAX_SS_FUSE_BITS)]; |
| 64 | } intel_sseu_ss_mask_t; |
| 65 | |
| 66 | #define XEHP_BITMAP_BITS(mask) ((int)BITS_PER_TYPE(typeof(mask.xehp))) |
| 67 | |
| 68 | struct sseu_dev_info { |
| 69 | u8 slice_mask; |
| 70 | intel_sseu_ss_mask_t subslice_mask; |
| 71 | intel_sseu_ss_mask_t geometry_subslice_mask; |
| 72 | intel_sseu_ss_mask_t compute_subslice_mask; |
| 73 | union { |
| 74 | u16 hsw[GEN_MAX_HSW_SLICES][GEN_MAX_SS_PER_HSW_SLICE]; |
| 75 | u16 xehp[I915_MAX_SS_FUSE_BITS]; |
| 76 | } eu_mask; |
| 77 | |
| 78 | u16 eu_total; |
| 79 | u8 eu_per_subslice; |
| 80 | u8 min_eu_in_pool; |
| 81 | /* For each slice, which subslice(s) has(have) 7 EUs (bitfield)? */ |
| 82 | u8 subslice_7eu[3]; |
| 83 | u8 has_slice_pg:1; |
| 84 | u8 has_subslice_pg:1; |
| 85 | u8 has_eu_pg:1; |
| 86 | /* |
| 87 | * For Xe_HP and beyond, the hardware no longer has traditional slices |
| 88 | * so we just report the entire DSS pool under a fake "slice 0." |
| 89 | */ |
| 90 | u8 has_xehp_dss:1; |
| 91 | |
| 92 | /* Topology fields */ |
| 93 | u8 max_slices; |
| 94 | u8 max_subslices; |
| 95 | u8 max_eus_per_subslice; |
| 96 | }; |
| 97 | |
| 98 | /* |
| 99 | * Powergating configuration for a particular (context,engine). |
| 100 | */ |
| 101 | struct intel_sseu { |
| 102 | u8 slice_mask; |
| 103 | u8 subslice_mask; |
| 104 | u8 min_eus_per_subslice; |
| 105 | u8 max_eus_per_subslice; |
| 106 | }; |
| 107 | |
| 108 | static inline struct intel_sseu |
| 109 | intel_sseu_from_device_info(const struct sseu_dev_info *sseu) |
| 110 | { |
| 111 | struct intel_sseu value = { |
| 112 | .slice_mask = sseu->slice_mask, |
| 113 | .subslice_mask = sseu->subslice_mask.hsw[0], |
| 114 | .min_eus_per_subslice = sseu->max_eus_per_subslice, |
| 115 | .max_eus_per_subslice = sseu->max_eus_per_subslice, |
| 116 | }; |
| 117 | |
| 118 | return value; |
| 119 | } |
| 120 | |
| 121 | static inline bool |
| 122 | intel_sseu_has_subslice(const struct sseu_dev_info *sseu, int slice, |
| 123 | int subslice) |
| 124 | { |
| 125 | if (slice >= sseu->max_slices || |
| 126 | subslice >= sseu->max_subslices) |
| 127 | return false; |
| 128 | |
| 129 | if (sseu->has_xehp_dss) |
| 130 | return test_bit(subslice, sseu->subslice_mask.xehp); |
| 131 | else |
| 132 | return sseu->subslice_mask.hsw[slice] & BIT(subslice); |
| 133 | } |
| 134 | |
| 135 | /* |
| 136 | * Used to obtain the index of the first DSS. Can start searching from the |
| 137 | * beginning of a specific dss group (e.g., gslice, cslice, etc.) if |
| 138 | * groupsize and groupnum are non-zero. |
| 139 | */ |
| 140 | static inline unsigned int |
| 141 | intel_sseu_find_first_xehp_dss(const struct sseu_dev_info *sseu, int groupsize, |
| 142 | int groupnum) |
| 143 | { |
| 144 | return find_next_bit(addr: sseu->subslice_mask.xehp, |
| 145 | XEHP_BITMAP_BITS(sseu->subslice_mask), |
| 146 | offset: groupnum * groupsize); |
| 147 | } |
| 148 | |
| 149 | void intel_sseu_set_info(struct sseu_dev_info *sseu, u8 max_slices, |
| 150 | u8 max_subslices, u8 max_eus_per_subslice); |
| 151 | |
| 152 | unsigned int |
| 153 | intel_sseu_subslice_total(const struct sseu_dev_info *sseu); |
| 154 | |
| 155 | unsigned int |
| 156 | intel_sseu_get_hsw_subslices(const struct sseu_dev_info *sseu, u8 slice); |
| 157 | |
| 158 | intel_sseu_ss_mask_t |
| 159 | intel_sseu_get_compute_subslices(const struct sseu_dev_info *sseu); |
| 160 | |
| 161 | void intel_sseu_info_init(struct intel_gt *gt); |
| 162 | |
| 163 | u32 intel_sseu_make_rpcs(struct intel_gt *gt, |
| 164 | const struct intel_sseu *req_sseu); |
| 165 | |
| 166 | void intel_sseu_dump(const struct sseu_dev_info *sseu, struct drm_printer *p); |
| 167 | void intel_sseu_print_topology(struct drm_i915_private *i915, |
| 168 | const struct sseu_dev_info *sseu, |
| 169 | struct drm_printer *p); |
| 170 | |
| 171 | u16 intel_slicemask_from_xehp_dssmask(intel_sseu_ss_mask_t dss_mask, int dss_per_slice); |
| 172 | |
| 173 | int intel_sseu_copy_eumask_to_user(void __user *to, |
| 174 | const struct sseu_dev_info *sseu); |
| 175 | int intel_sseu_copy_ssmask_to_user(void __user *to, |
| 176 | const struct sseu_dev_info *sseu); |
| 177 | |
| 178 | void intel_sseu_print_ss_info(const char *type, |
| 179 | const struct sseu_dev_info *sseu, |
| 180 | struct seq_file *m); |
| 181 | |
| 182 | #endif /* __INTEL_SSEU_H__ */ |
| 183 | |