[PATCH] drm/i915: Use per device iommu check
Robin Murphy
robin.murphy at arm.com
Thu Nov 25 11:47:37 UTC 2021
On 2021-11-25 10:42, Tvrtko Ursulin wrote:
> From: Tvrtko Ursulin <tvrtko.ursulin at intel.com>
>
> With both integrated and discrete Intel GPUs in a system, the current
> global check of intel_iommu_gfx_mapped, as done from intel_vtd_active(),
> may not be completely accurate.
>
> In this patch we add an i915 parameter to intel_vtd_active() in order to
> prepare it for multiple GPUs, and we also change the check away from the
> Intel-specific intel_iommu_gfx_mapped (a global exported by the Intel IOMMU
> driver) to probing for the presence of an IOMMU domain on a specific device
> using iommu_get_domain_for_dev().
FWIW the way you have it now is functionally equivalent to using
device_iommu_mapped(), which I think might be slightly clearer for the
current intent, but I don't have a particularly strong preference
(after all, this *was* the de-facto way of checking before
device_iommu_mapped() was introduced, and there are still other examples
of it around). So from the IOMMU perspective,
Acked-by: Robin Murphy <robin.murphy at arm.com>
Perhaps the AGP driver could also be tweaked and intel_iommu_gfx_mapped
cleaned away entirely, but I'll leave that for Baolu to think about :)
Cheers,
Robin.
> It was suggested to additionally check for the __IOMMU_DOMAIN_PAGING bit
> being present in the returned iommu domain; however, I opted not to do
> that at this point.
>
> Checking for this flag would detect whether the IOMMU is in address
> translation mode, with the assumption that this is the only relevant
> question. The downside is that in identity mapping (pass-through) mode the
> IOMMU hardware is still active, sitting on the communication path, just not
> doing address translation.
>
> My rationale was that, of the many intel_vtd_active() checks in our code
> base, while some are clearly about the performance impact of address
> translation, others may be about working around functional issues that
> arise when the IOMMU hardware is simply active. There may also be some
> performance impact in pass-through mode, but I have not specifically
> attempted to measure it.
>
> Therefore the safest option seems to be to keep intel_vtd_active()
> answering the question "is the IOMMU hardware active" for this device.
> If in the future we want to expand the set of questions to "is the IOMMU
> active and doing address translation", we can easily do that by adding a
> new helper to be called from the appropriate sites.
>
> v2:
> * Check for dmar translation specifically, not just iommu domain. (Baolu)
>
> v3:
> * Go back to plain "any domain" check for now, rewrite commit message.
>
> Signed-off-by: Tvrtko Ursulin <tvrtko.ursulin at intel.com>
> Cc: Lu Baolu <baolu.lu at linux.intel.com>
> Cc: Lucas De Marchi <lucas.demarchi at intel.com>
> Cc: Robin Murphy <robin.murphy at arm.com>
> ---
> drivers/gpu/drm/i915/display/intel_bw.c | 2 +-
> drivers/gpu/drm/i915/display/intel_display.c | 2 +-
> drivers/gpu/drm/i915/display/intel_fbc.c | 2 +-
> drivers/gpu/drm/i915/gem/i915_gem_stolen.c | 2 +-
> drivers/gpu/drm/i915/gem/i915_gemfs.c | 2 +-
> drivers/gpu/drm/i915/gt/intel_ggtt.c | 4 ++--
> drivers/gpu/drm/i915/i915_debugfs.c | 1 +
> drivers/gpu/drm/i915/i915_driver.c | 7 +++++++
> drivers/gpu/drm/i915/i915_drv.h | 13 +++++++------
> drivers/gpu/drm/i915/i915_gpu_error.c | 5 +----
> drivers/gpu/drm/i915/intel_device_info.c | 14 +-------------
> drivers/gpu/drm/i915/intel_pm.c | 2 +-
> 12 files changed, 25 insertions(+), 31 deletions(-)
>
> diff --git a/drivers/gpu/drm/i915/display/intel_bw.c b/drivers/gpu/drm/i915/display/intel_bw.c
> index abec394f6869..2da4aacc956b 100644
> --- a/drivers/gpu/drm/i915/display/intel_bw.c
> +++ b/drivers/gpu/drm/i915/display/intel_bw.c
> @@ -634,7 +634,7 @@ static unsigned int intel_bw_data_rate(struct drm_i915_private *dev_priv,
> for_each_pipe(dev_priv, pipe)
> data_rate += bw_state->data_rate[pipe];
>
> - if (DISPLAY_VER(dev_priv) >= 13 && intel_vtd_active())
> + if (DISPLAY_VER(dev_priv) >= 13 && intel_vtd_active(dev_priv))
> data_rate = data_rate * 105 / 100;
>
> return data_rate;
> diff --git a/drivers/gpu/drm/i915/display/intel_display.c b/drivers/gpu/drm/i915/display/intel_display.c
> index b2d51cd79d6c..1ef77ba7f645 100644
> --- a/drivers/gpu/drm/i915/display/intel_display.c
> +++ b/drivers/gpu/drm/i915/display/intel_display.c
> @@ -1293,7 +1293,7 @@ static bool needs_async_flip_vtd_wa(const struct intel_crtc_state *crtc_state)
> {
> struct drm_i915_private *i915 = to_i915(crtc_state->uapi.crtc->dev);
>
> - return crtc_state->uapi.async_flip && intel_vtd_active() &&
> + return crtc_state->uapi.async_flip && intel_vtd_active(i915) &&
> (DISPLAY_VER(i915) == 9 || IS_BROADWELL(i915) || IS_HASWELL(i915));
> }
>
> diff --git a/drivers/gpu/drm/i915/display/intel_fbc.c b/drivers/gpu/drm/i915/display/intel_fbc.c
> index d0c34bc3af6c..614e8697c068 100644
> --- a/drivers/gpu/drm/i915/display/intel_fbc.c
> +++ b/drivers/gpu/drm/i915/display/intel_fbc.c
> @@ -1677,7 +1677,7 @@ static int intel_sanitize_fbc_option(struct drm_i915_private *i915)
> static bool need_fbc_vtd_wa(struct drm_i915_private *i915)
> {
> /* WaFbcTurnOffFbcWhenHyperVisorIsUsed:skl,bxt */
> - if (intel_vtd_active() &&
> + if (intel_vtd_active(i915) &&
> (IS_SKYLAKE(i915) || IS_BROXTON(i915))) {
> drm_info(&i915->drm,
> "Disabling framebuffer compression (FBC) to prevent screen flicker with VT-d enabled\n");
> diff --git a/drivers/gpu/drm/i915/gem/i915_gem_stolen.c b/drivers/gpu/drm/i915/gem/i915_gem_stolen.c
> index ddd37ccb1362..cf100c0ea3b7 100644
> --- a/drivers/gpu/drm/i915/gem/i915_gem_stolen.c
> +++ b/drivers/gpu/drm/i915/gem/i915_gem_stolen.c
> @@ -399,7 +399,7 @@ static int i915_gem_init_stolen(struct intel_memory_region *mem)
> return 0;
> }
>
> - if (intel_vtd_active() && GRAPHICS_VER(i915) < 8) {
> + if (intel_vtd_active(i915) && GRAPHICS_VER(i915) < 8) {
> drm_notice(&i915->drm,
> "%s, disabling use of stolen memory\n",
> "DMAR active");
> diff --git a/drivers/gpu/drm/i915/gem/i915_gemfs.c b/drivers/gpu/drm/i915/gem/i915_gemfs.c
> index dbdbdc344d87..11cd66d183e6 100644
> --- a/drivers/gpu/drm/i915/gem/i915_gemfs.c
> +++ b/drivers/gpu/drm/i915/gem/i915_gemfs.c
> @@ -31,7 +31,7 @@ int i915_gemfs_init(struct drm_i915_private *i915)
> */
>
> opts = NULL;
> - if (intel_vtd_active()) {
> + if (intel_vtd_active(i915)) {
> if (IS_ENABLED(CONFIG_TRANSPARENT_HUGEPAGE)) {
> static char huge_opt[] = "huge=within_size"; /* r/w */
>
> diff --git a/drivers/gpu/drm/i915/gt/intel_ggtt.c b/drivers/gpu/drm/i915/gt/intel_ggtt.c
> index 555111c3bee5..110d3944f9a2 100644
> --- a/drivers/gpu/drm/i915/gt/intel_ggtt.c
> +++ b/drivers/gpu/drm/i915/gt/intel_ggtt.c
> @@ -106,7 +106,7 @@ static bool needs_idle_maps(struct drm_i915_private *i915)
> * Query intel_iommu to see if we need the workaround. Presumably that
> * was loaded first.
> */
> - if (!intel_vtd_active())
> + if (!intel_vtd_active(i915))
> return false;
>
> if (GRAPHICS_VER(i915) == 5 && IS_MOBILE(i915))
> @@ -1233,7 +1233,7 @@ int i915_ggtt_probe_hw(struct drm_i915_private *i915)
> if (ret)
> return ret;
>
> - if (intel_vtd_active())
> + if (intel_vtd_active(i915))
> drm_info(&i915->drm, "VT-d active for gfx access\n");
>
> return 0;
> diff --git a/drivers/gpu/drm/i915/i915_debugfs.c b/drivers/gpu/drm/i915/i915_debugfs.c
> index fe638b5da7c0..390d541f64ea 100644
> --- a/drivers/gpu/drm/i915/i915_debugfs.c
> +++ b/drivers/gpu/drm/i915/i915_debugfs.c
> @@ -65,6 +65,7 @@ static int i915_capabilities(struct seq_file *m, void *data)
>
> intel_device_info_print_static(INTEL_INFO(i915), &p);
> intel_device_info_print_runtime(RUNTIME_INFO(i915), &p);
> + i915_print_iommu_status(i915, &p);
> intel_gt_info_print(&i915->gt.info, &p);
> intel_driver_caps_print(&i915->caps, &p);
>
> diff --git a/drivers/gpu/drm/i915/i915_driver.c b/drivers/gpu/drm/i915/i915_driver.c
> index a13666627dad..bbc99fc5888f 100644
> --- a/drivers/gpu/drm/i915/i915_driver.c
> +++ b/drivers/gpu/drm/i915/i915_driver.c
> @@ -741,6 +741,12 @@ static void i915_driver_unregister(struct drm_i915_private *dev_priv)
> i915_gem_driver_unregister(dev_priv);
> }
>
> +void
> +i915_print_iommu_status(struct drm_i915_private *i915, struct drm_printer *p)
> +{
> + drm_printf(p, "iommu: %s\n", enableddisabled(intel_vtd_active(i915)));
> +}
> +
> static void i915_welcome_messages(struct drm_i915_private *dev_priv)
> {
> if (drm_debug_enabled(DRM_UT_DRIVER)) {
> @@ -756,6 +762,7 @@ static void i915_welcome_messages(struct drm_i915_private *dev_priv)
>
> intel_device_info_print_static(INTEL_INFO(dev_priv), &p);
> intel_device_info_print_runtime(RUNTIME_INFO(dev_priv), &p);
> + i915_print_iommu_status(dev_priv, &p);
> intel_gt_info_print(&dev_priv->gt.info, &p);
> }
>
> diff --git a/drivers/gpu/drm/i915/i915_drv.h b/drivers/gpu/drm/i915/i915_drv.h
> index 1bfadd9127fc..da3b32ae65e0 100644
> --- a/drivers/gpu/drm/i915/i915_drv.h
> +++ b/drivers/gpu/drm/i915/i915_drv.h
> @@ -1760,26 +1760,27 @@ static inline bool run_as_guest(void)
> #define HAS_D12_PLANE_MINIMIZATION(dev_priv) (IS_ROCKETLAKE(dev_priv) || \
> IS_ALDERLAKE_S(dev_priv))
>
> -static inline bool intel_vtd_active(void)
> +static inline bool intel_vtd_active(struct drm_i915_private *i915)
> {
> -#ifdef CONFIG_INTEL_IOMMU
> - if (intel_iommu_gfx_mapped)
> + if (iommu_get_domain_for_dev(i915->drm.dev))
> return true;
> -#endif
>
> /* Running as a guest, we assume the host is enforcing VT'd */
> return run_as_guest();
> }
>
> +void
> +i915_print_iommu_status(struct drm_i915_private *i915, struct drm_printer *p);
> +
> static inline bool intel_scanout_needs_vtd_wa(struct drm_i915_private *dev_priv)
> {
> - return GRAPHICS_VER(dev_priv) >= 6 && intel_vtd_active();
> + return GRAPHICS_VER(dev_priv) >= 6 && intel_vtd_active(dev_priv);
> }
>
> static inline bool
> intel_ggtt_update_needs_vtd_wa(struct drm_i915_private *i915)
> {
> - return IS_BROXTON(i915) && intel_vtd_active();
> + return IS_BROXTON(i915) && intel_vtd_active(i915);
> }
>
> static inline bool
> diff --git a/drivers/gpu/drm/i915/i915_gpu_error.c b/drivers/gpu/drm/i915/i915_gpu_error.c
> index 2a2d7643b551..3f39d6641894 100644
> --- a/drivers/gpu/drm/i915/i915_gpu_error.c
> +++ b/drivers/gpu/drm/i915/i915_gpu_error.c
> @@ -1750,10 +1750,7 @@ static void capture_gen(struct i915_gpu_coredump *error)
> error->wakelock = atomic_read(&i915->runtime_pm.wakeref_count);
> error->suspended = i915->runtime_pm.suspended;
>
> - error->iommu = -1;
> -#ifdef CONFIG_INTEL_IOMMU
> - error->iommu = intel_iommu_gfx_mapped;
> -#endif
> + error->iommu = intel_vtd_active(i915);
> error->reset_count = i915_reset_count(&i915->gpu_error);
> error->suspend_count = i915->suspend_count;
>
> diff --git a/drivers/gpu/drm/i915/intel_device_info.c b/drivers/gpu/drm/i915/intel_device_info.c
> index 6e6b317bc33c..e6605b5181a5 100644
> --- a/drivers/gpu/drm/i915/intel_device_info.c
> +++ b/drivers/gpu/drm/i915/intel_device_info.c
> @@ -83,17 +83,6 @@ const char *intel_platform_name(enum intel_platform platform)
> return platform_names[platform];
> }
>
> -static const char *iommu_name(void)
> -{
> - const char *msg = "n/a";
> -
> -#ifdef CONFIG_INTEL_IOMMU
> - msg = enableddisabled(intel_iommu_gfx_mapped);
> -#endif
> -
> - return msg;
> -}
> -
> void intel_device_info_print_static(const struct intel_device_info *info,
> struct drm_printer *p)
> {
> @@ -114,7 +103,6 @@ void intel_device_info_print_static(const struct intel_device_info *info,
> drm_printf(p, "display version: %u\n", info->display.ver);
>
> drm_printf(p, "gt: %d\n", info->gt);
> - drm_printf(p, "iommu: %s\n", iommu_name());
> drm_printf(p, "memory-regions: %x\n", info->memory_regions);
> drm_printf(p, "page-sizes: %x\n", info->page_sizes);
> drm_printf(p, "platform: %s\n", intel_platform_name(info->platform));
> @@ -374,7 +362,7 @@ void intel_device_info_runtime_init(struct drm_i915_private *dev_priv)
> info->display.has_dsc = 0;
> }
>
> - if (GRAPHICS_VER(dev_priv) == 6 && intel_vtd_active()) {
> + if (GRAPHICS_VER(dev_priv) == 6 && intel_vtd_active(dev_priv)) {
> drm_info(&dev_priv->drm,
> "Disabling ppGTT for VT-d support\n");
> info->ppgtt_type = INTEL_PPGTT_NONE;
> diff --git a/drivers/gpu/drm/i915/intel_pm.c b/drivers/gpu/drm/i915/intel_pm.c
> index 01fa3fac1b57..cff0f32bedc9 100644
> --- a/drivers/gpu/drm/i915/intel_pm.c
> +++ b/drivers/gpu/drm/i915/intel_pm.c
> @@ -98,7 +98,7 @@ static void gen9_init_clock_gating(struct drm_i915_private *dev_priv)
> * "Plane N strech max must be programmed to 11b (x1)
> * when Async flips are enabled on that plane."
> */
> - if (!IS_GEMINILAKE(dev_priv) && intel_vtd_active())
> + if (!IS_GEMINILAKE(dev_priv) && intel_vtd_active(dev_priv))
> intel_uncore_rmw(&dev_priv->uncore, CHICKEN_PIPESL_1(pipe),
> SKL_PLANE1_STRETCH_MAX_MASK, SKL_PLANE1_STRETCH_MAX_X1);
> }
>
More information about the dri-devel
mailing list