All of lore.kernel.org
 help / color / mirror / Atom feed
* [Intel-gfx] [PATCH] drm/i915/mtl: Add support for PM DEMAND
@ 2023-04-03  8:50 Mika Kahola
  2023-04-03  9:17 ` Jani Nikula
                   ` (6 more replies)
  0 siblings, 7 replies; 13+ messages in thread
From: Mika Kahola @ 2023-04-03  8:50 UTC (permalink / raw)
  To: intel-gfx; +Cc: Lucas De Marchi, Matt Roper

Display14 introduces a new way to instruct the PUnit with
power and bandwidth requirements of DE. Add the functionality
to program the registers and handle waits using interrupts.
The current wait time for timeouts is programmed for 10 msecs to
factor in the worst case scenarios. Changes made to use REG_BIT
for a register that we touched(GEN8_DE_MISC_IER _MMIO).

v2:
  - Removed repeated definition of dbuf, which has been moved to struct
    intel_display. (Gustavo)
  - s/dev_priv->dbuf/dev_priv->display.dbuf/ (Gustavo)

Bspec: 66451, 64636, 64602, 64603
Cc: Matt Atwood <matthew.s.atwood@intel.com>
Cc: Matt Roper <matthew.d.roper@intel.com>
Cc: Lucas De Marchi <lucas.demarchi@intel.com>
Cc: Gustavo Sousa <gustavo.sousa@intel.com>
Signed-off-by: José Roberto de Souza <jose.souza@intel.com>
Signed-off-by: Radhakrishna Sripada <radhakrishna.sripada@intel.com>
Signed-off-by: Mika Kahola <mika.kahola@intel.com>
---
 drivers/gpu/drm/i915/display/intel_bw.c       |   4 +-
 drivers/gpu/drm/i915/display/intel_bw.h       |   2 +
 drivers/gpu/drm/i915/display/intel_display.c  |  14 +
 .../drm/i915/display/intel_display_power.c    |   8 +
 drivers/gpu/drm/i915/i915_drv.h               |   6 +
 drivers/gpu/drm/i915/i915_irq.c               |  22 +-
 drivers/gpu/drm/i915/i915_reg.h               |  33 +-
 drivers/gpu/drm/i915/intel_pm.c               | 293 ++++++++++++++++++
 drivers/gpu/drm/i915/intel_pm.h               |  35 +++
 9 files changed, 412 insertions(+), 5 deletions(-)

diff --git a/drivers/gpu/drm/i915/display/intel_bw.c b/drivers/gpu/drm/i915/display/intel_bw.c
index 202321ffbe2a..87c20bf52123 100644
--- a/drivers/gpu/drm/i915/display/intel_bw.c
+++ b/drivers/gpu/drm/i915/display/intel_bw.c
@@ -746,8 +746,8 @@ static unsigned int intel_bw_num_active_planes(struct drm_i915_private *dev_priv
 	return num_active_planes;
 }
 
-static unsigned int intel_bw_data_rate(struct drm_i915_private *dev_priv,
-				       const struct intel_bw_state *bw_state)
+unsigned int intel_bw_data_rate(struct drm_i915_private *dev_priv,
+				const struct intel_bw_state *bw_state)
 {
 	unsigned int data_rate = 0;
 	enum pipe pipe;
diff --git a/drivers/gpu/drm/i915/display/intel_bw.h b/drivers/gpu/drm/i915/display/intel_bw.h
index f20292143745..17fc0b61db04 100644
--- a/drivers/gpu/drm/i915/display/intel_bw.h
+++ b/drivers/gpu/drm/i915/display/intel_bw.h
@@ -62,6 +62,8 @@ int intel_bw_init(struct drm_i915_private *dev_priv);
 int intel_bw_atomic_check(struct intel_atomic_state *state);
 void intel_bw_crtc_update(struct intel_bw_state *bw_state,
 			  const struct intel_crtc_state *crtc_state);
+unsigned int intel_bw_data_rate(struct drm_i915_private *dev_priv,
+				const struct intel_bw_state *bw_state);
 int icl_pcode_restrict_qgv_points(struct drm_i915_private *dev_priv,
 				  u32 points_mask);
 int intel_bw_calc_min_cdclk(struct intel_atomic_state *state,
diff --git a/drivers/gpu/drm/i915/display/intel_display.c b/drivers/gpu/drm/i915/display/intel_display.c
index b53a1d969344..ee7ca33123b1 100644
--- a/drivers/gpu/drm/i915/display/intel_display.c
+++ b/drivers/gpu/drm/i915/display/intel_display.c
@@ -959,6 +959,9 @@ intel_get_crtc_new_encoder(const struct intel_atomic_state *state,
 		num_encoders++;
 	}
 
+	if (!encoder)
+		return NULL;
+
 	drm_WARN(encoder->base.dev, num_encoders != 1,
 		 "%d encoders for pipe %c\n",
 		 num_encoders, pipe_name(master_crtc->pipe));
@@ -6767,6 +6770,10 @@ int intel_atomic_check(struct drm_device *dev,
 		ret = intel_modeset_calc_cdclk(state);
 		if (ret)
 			return ret;
+
+		ret = intel_pmdemand_atomic_check(state);
+		if (ret)
+			goto fail;
 	}
 
 	ret = intel_atomic_check_crtcs(state);
@@ -7411,6 +7418,7 @@ static void intel_atomic_commit_tail(struct intel_atomic_state *state)
 	}
 
 	intel_sagv_pre_plane_update(state);
+	intel_pmdemand_pre_plane_update(state);
 
 	/* Complete the events for pipes that have now been disabled */
 	for_each_new_intel_crtc_in_state(state, crtc, new_crtc_state, i) {
@@ -7523,6 +7531,7 @@ static void intel_atomic_commit_tail(struct intel_atomic_state *state)
 		intel_verify_planes(state);
 
 	intel_sagv_post_plane_update(state);
+	intel_pmdemand_post_plane_update(state);
 
 	drm_atomic_helper_commit_hw_done(&state->base);
 
@@ -8250,6 +8259,7 @@ void intel_init_display_hooks(struct drm_i915_private *dev_priv)
 	intel_color_init_hooks(dev_priv);
 	intel_init_cdclk_hooks(dev_priv);
 	intel_audio_hooks_init(dev_priv);
+	intel_init_pmdemand(dev_priv);
 
 	intel_dpll_init_clock_hook(dev_priv);
 
@@ -8476,6 +8486,10 @@ int intel_modeset_init_noirq(struct drm_i915_private *i915)
 	if (ret)
 		goto cleanup_vga_client_pw_domain_dmc;
 
+	ret = intel_pmdemand_init(i915);
+	if (ret)
+		goto cleanup_vga_client_pw_domain_dmc;
+
 	init_llist_head(&i915->display.atomic_helper.free_list);
 	INIT_WORK(&i915->display.atomic_helper.free_work,
 		  intel_atomic_helper_free_state_worker);
diff --git a/drivers/gpu/drm/i915/display/intel_display_power.c b/drivers/gpu/drm/i915/display/intel_display_power.c
index 5e85572dc8e4..04c172b5c17b 100644
--- a/drivers/gpu/drm/i915/display/intel_display_power.c
+++ b/drivers/gpu/drm/i915/display/intel_display_power.c
@@ -19,6 +19,7 @@
 #include "intel_mchbar_regs.h"
 #include "intel_pch_refclk.h"
 #include "intel_pcode.h"
+#include "intel_pm.h"
 #include "intel_pps_regs.h"
 #include "intel_snps_phy.h"
 #include "skl_watermark.h"
@@ -1083,6 +1084,10 @@ static void gen9_dbuf_enable(struct drm_i915_private *dev_priv)
 	dev_priv->display.dbuf.enabled_slices =
 		intel_enabled_dbuf_slices_mask(dev_priv);
 
+	if (DISPLAY_VER(dev_priv) >= 14)
+		intel_program_dbuf_pmdemand(dev_priv, BIT(DBUF_S1) |
+					    dev_priv->display.dbuf.enabled_slices);
+
 	/*
 	 * Just power up at least 1 slice, we will
 	 * figure out later which slices we have and what we need.
@@ -1094,6 +1099,9 @@ static void gen9_dbuf_enable(struct drm_i915_private *dev_priv)
 static void gen9_dbuf_disable(struct drm_i915_private *dev_priv)
 {
 	gen9_dbuf_slices_update(dev_priv, 0);
+
+	if (DISPLAY_VER(dev_priv) >= 14)
+		intel_program_dbuf_pmdemand(dev_priv, 0);
 }
 
 static void gen12_dbuf_slices_config(struct drm_i915_private *dev_priv)
diff --git a/drivers/gpu/drm/i915/i915_drv.h b/drivers/gpu/drm/i915/i915_drv.h
index e771fdc3099c..2a73e726c6ed 100644
--- a/drivers/gpu/drm/i915/i915_drv.h
+++ b/drivers/gpu/drm/i915/i915_drv.h
@@ -250,6 +250,12 @@ struct drm_i915_private {
 	unsigned int hpll_freq;
 	unsigned int czclk_freq;
 
+	struct {
+		wait_queue_head_t waitqueue;
+		struct mutex lock;
+		struct intel_global_obj obj;
+	} pmdemand;
+
 	/**
 	 * wq - Driver workqueue for GEM.
 	 *
diff --git a/drivers/gpu/drm/i915/i915_irq.c b/drivers/gpu/drm/i915/i915_irq.c
index c0888cc88d04..636033bb9650 100644
--- a/drivers/gpu/drm/i915/i915_irq.c
+++ b/drivers/gpu/drm/i915/i915_irq.c
@@ -1913,6 +1913,11 @@ static u32 gen8_de_pipe_fault_mask(struct drm_i915_private *dev_priv)
 		return GEN8_DE_PIPE_IRQ_FAULT_ERRORS;
 }
 
+static void intel_pmdemand_irq_handler(struct drm_i915_private *dev_priv)
+{
+	wake_up_all(&dev_priv->pmdemand.waitqueue);
+}
+
 static void
 gen8_de_misc_irq_handler(struct drm_i915_private *dev_priv, u32 iir)
 {
@@ -1949,6 +1954,18 @@ gen8_de_misc_irq_handler(struct drm_i915_private *dev_priv, u32 iir)
 		}
 	}
 
+	if (iir & XELPDP_PMDEMAND_RSPTOUT_ERR) {
+		drm_dbg(&dev_priv->drm,
+			"Error waiting for Punit PM Demand Response\n");
+		intel_pmdemand_irq_handler(dev_priv);
+		found = true;
+	}
+
+	if (iir & XELPDP_PMDEMAND_RSP) {
+		intel_pmdemand_irq_handler(dev_priv);
+		found = true;
+	}
+
 	if (!found)
 		drm_err(&dev_priv->drm, "Unexpected DE Misc interrupt\n");
 }
@@ -3315,7 +3332,10 @@ static void gen8_de_irq_postinstall(struct drm_i915_private *dev_priv)
 	if (IS_GEMINILAKE(dev_priv) || IS_BROXTON(dev_priv))
 		de_port_masked |= BXT_DE_PORT_GMBUS;
 
-	if (DISPLAY_VER(dev_priv) >= 11) {
+	if (DISPLAY_VER(dev_priv) >= 14)
+		de_misc_masked |= XELPDP_PMDEMAND_RSPTOUT_ERR |
+				  XELPDP_PMDEMAND_RSP;
+	else if (DISPLAY_VER(dev_priv) >= 11) {
 		enum port port;
 
 		if (intel_bios_is_dsi_present(dev_priv, &port))
diff --git a/drivers/gpu/drm/i915/i915_reg.h b/drivers/gpu/drm/i915/i915_reg.h
index 8d26fa2765c1..7f8e750665ed 100644
--- a/drivers/gpu/drm/i915/i915_reg.h
+++ b/drivers/gpu/drm/i915/i915_reg.h
@@ -4783,8 +4783,10 @@
 #define GEN8_DE_MISC_IMR _MMIO(0x44464)
 #define GEN8_DE_MISC_IIR _MMIO(0x44468)
 #define GEN8_DE_MISC_IER _MMIO(0x4446c)
-#define  GEN8_DE_MISC_GSE		(1 << 27)
-#define  GEN8_DE_EDP_PSR		(1 << 19)
+#define  XELPDP_PMDEMAND_RSPTOUT_ERR	REG_BIT(27)
+#define  GEN8_DE_MISC_GSE		REG_BIT(27)
+#define  GEN8_DE_EDP_PSR		REG_BIT(19)
+#define  XELPDP_PMDEMAND_RSP		REG_BIT(3)
 
 #define GEN8_PCU_ISR _MMIO(0x444e0)
 #define GEN8_PCU_IMR _MMIO(0x444e4)
@@ -4847,6 +4849,33 @@
 #define  GEN11_HOTPLUG_CTL_SHORT_DETECT(hpd_pin)	(1 << (_HPD_PIN_TC(hpd_pin) * 4))
 #define  GEN11_HOTPLUG_CTL_NO_DETECT(hpd_pin)		(0 << (_HPD_PIN_TC(hpd_pin) * 4))
 
+#define XELPDP_INITIATE_PMDEMAND_REQUEST(dword)		_MMIO(0x45230 + 4 * (dword))
+#define  XELPDP_PMDEMAND_QCLK_GV_BW_MASK		REG_GENMASK(31, 16)
+#define  XELPDP_PMDEMAND_QCLK_GV_BW(x)			REG_FIELD_PREP(XELPDP_PMDEMAND_QCLK_GV_BW_MASK, x)
+#define  XELPDP_PMDEMAND_VOLTAGE_INDEX_MASK		REG_GENMASK(14, 12)
+#define  XELPDP_PMDEMAND_VOLTAGE_INDEX(x)		REG_FIELD_PREP(XELPDP_PMDEMAND_VOLTAGE_INDEX_MASK, x)
+#define  XELPDP_PMDEMAND_QCLK_GV_INDEX_MASK		REG_GENMASK(11, 8)
+#define  XELPDP_PMDEMAND_QCLK_GV_INDEX(x)		REG_FIELD_PREP(XELPDP_PMDEMAND_QCLK_GV_INDEX_MASK, x)
+#define  XELPDP_PMDEMAND_PIPES_MASK			REG_GENMASK(7, 6)
+#define  XELPDP_PMDEMAND_PIPES(x)			REG_FIELD_PREP(XELPDP_PMDEMAND_PIPES_MASK, x)
+#define  XELPDP_PMDEMAND_DBUFS_MASK			REG_GENMASK(5, 4)
+#define  XELPDP_PMDEMAND_DBUFS(x)			REG_FIELD_PREP(XELPDP_PMDEMAND_DBUFS_MASK, x)
+#define  XELPDP_PMDEMAND_PHYS_MASK			REG_GENMASK(2, 0)
+#define  XELPDP_PMDEMAND_PHYS(x)				REG_FIELD_PREP(XELPDP_PMDEMAND_PHYS_MASK, x)
+
+#define  XELPDP_PMDEMAND_REQ_ENABLE			REG_BIT(31)
+#define  XELPDP_PMDEMAND_CDCLK_FREQ_MASK		REG_GENMASK(30, 20)
+#define  XELPDP_PMDEMAND_CDCLK_FREQ(x)			REG_FIELD_PREP(XELPDP_PMDEMAND_CDCLK_FREQ_MASK, x)
+#define  XELPDP_PMDEMAND_DDICLK_FREQ_MASK		REG_GENMASK(18, 8)
+#define  XELPDP_PMDEMAND_DDICLK_FREQ(x)			REG_FIELD_PREP(XELPDP_PMDEMAND_DDICLK_FREQ_MASK, x)
+#define  XELPDP_PMDEMAND_SCALERS_MASK			REG_GENMASK(6, 4)
+#define  XELPDP_PMDEMAND_SCALERS(x)			REG_FIELD_PREP(XELPDP_PMDEMAND_SCALERS_MASK, x)
+#define  XELPDP_PMDEMAND_PLLS_MASK			REG_GENMASK(2, 0)
+#define  XELPDP_PMDEMAND_PLLS(x)			REG_FIELD_PREP(XELPDP_PMDEMAND_PLLS_MASK, x)
+
+#define GEN12_DCPR_STATUS_1				_MMIO(0x46440)
+#define  XELPDP_PMDEMAND_INFLIGHT_STATUS		REG_BIT(26)
+
 #define ILK_DISPLAY_CHICKEN2	_MMIO(0x42004)
 /* Required on all Ironlake and Sandybridge according to the B-Spec. */
 #define  ILK_ELPIN_409_SELECT	(1 << 25)
diff --git a/drivers/gpu/drm/i915/intel_pm.c b/drivers/gpu/drm/i915/intel_pm.c
index c45af0d981fd..877997e4141d 100644
--- a/drivers/gpu/drm/i915/intel_pm.c
+++ b/drivers/gpu/drm/i915/intel_pm.c
@@ -25,6 +25,10 @@
  *
  */
 
+#include <linux/bitops.h>
+
+#include "display/intel_bw.h"
+#include "display/intel_cdclk.h"
 #include "display/intel_de.h"
 #include "display/intel_display.h"
 #include "display/intel_display_trace.h"
@@ -40,6 +44,14 @@
 #include "intel_pm.h"
 #include "vlv_sideband.h"
 
+bool intel_is_c10phy(struct drm_i915_private *dev_priv, enum phy phy)
+{
+        if (IS_METEORLAKE(dev_priv) && (phy < PHY_C))
+                return true;
+
+        return false;
+}
+
 struct drm_i915_clock_gating_funcs {
 	void (*init_clock_gating)(struct drm_i915_private *i915);
 };
@@ -124,6 +136,287 @@ static void glk_init_clock_gating(struct drm_i915_private *dev_priv)
 		   PWM1_GATING_DIS | PWM2_GATING_DIS);
 }
 
+static struct intel_global_state *intel_pmdemand_duplicate_state(struct intel_global_obj *obj)
+{
+	struct intel_pmdemand_state *pmdmnd_state;
+
+	pmdmnd_state = kmemdup(obj->state, sizeof(*pmdmnd_state), GFP_KERNEL);
+	if (!pmdmnd_state)
+		return NULL;
+
+	return &pmdmnd_state->base;
+}
+
+static void intel_pmdemand_destroy_state(struct intel_global_obj *obj,
+					 struct intel_global_state *state)
+{
+	kfree(state);
+}
+
+static const struct intel_global_state_funcs intel_pmdemand_funcs = {
+	.atomic_duplicate_state = intel_pmdemand_duplicate_state,
+	.atomic_destroy_state = intel_pmdemand_destroy_state,
+};
+
+struct intel_pmdemand_state *
+intel_atomic_get_pmdemand_state(struct intel_atomic_state *state)
+{
+	struct drm_i915_private *dev_priv = to_i915(state->base.dev);
+	struct intel_global_state *pmdemand_state;
+
+	pmdemand_state = intel_atomic_get_global_obj_state(state, &dev_priv->pmdemand.obj);
+	if (IS_ERR(pmdemand_state))
+		return ERR_CAST(pmdemand_state);
+
+	return to_intel_pmdemand_state(pmdemand_state);
+}
+
+int intel_pmdemand_init(struct drm_i915_private *dev_priv)
+{
+	struct intel_pmdemand_state *pmdemand_state;
+
+	pmdemand_state = kzalloc(sizeof(*pmdemand_state), GFP_KERNEL);
+	if (!pmdemand_state)
+		return -ENOMEM;
+
+	intel_atomic_global_obj_init(dev_priv, &dev_priv->pmdemand.obj,
+				     &pmdemand_state->base, &intel_pmdemand_funcs);
+
+	return 0;
+}
+
+void intel_init_pmdemand(struct drm_i915_private *dev_priv)
+{
+	mutex_init(&dev_priv->pmdemand.lock);
+	init_waitqueue_head(&dev_priv->pmdemand.waitqueue);
+}
+
+int intel_pmdemand_atomic_check(struct intel_atomic_state *state)
+{
+	struct drm_i915_private *dev_priv = to_i915(state->base.dev);
+	struct intel_pmdemand_state *new_pmdemand_state = NULL;
+	struct intel_crtc_state *old_crtc_state, *new_crtc_state;
+	struct intel_crtc *crtc;
+	struct intel_encoder *encoder;
+	struct intel_bw_state *new_bw_state;
+	const struct intel_dbuf_state *new_dbuf_state;
+	const struct intel_cdclk_state *new_cdclk_state;
+	int port_clock = 0;
+	unsigned int data_rate;
+	enum phy phy;
+	int i, ret;
+
+	if (DISPLAY_VER(dev_priv) < 14)
+		return 0;
+
+	new_pmdemand_state = intel_atomic_get_pmdemand_state(state);
+	if (IS_ERR(new_pmdemand_state))
+		return PTR_ERR(new_pmdemand_state);
+
+	ret = intel_atomic_lock_global_state(&new_pmdemand_state->base);
+	if (ret)
+		return ret;
+
+	/* Punit figures out the voltage index based on bandwidth*/
+	new_bw_state = intel_atomic_get_bw_state(state);
+	if (IS_ERR(new_bw_state))
+		return PTR_ERR(new_bw_state);
+
+	/* firmware will calculate the qclck_gc_index, requirement is set to 0 */
+	new_pmdemand_state->qclk_gv_index = 0;
+
+	data_rate = intel_bw_data_rate(dev_priv, new_bw_state);
+	/* To MBs then to multiples of 100MBs */
+	data_rate = DIV_ROUND_UP(data_rate, 1000);
+	data_rate = DIV_ROUND_UP(data_rate, 100);
+	new_pmdemand_state->qclk_gv_bw = data_rate;
+
+	new_dbuf_state = intel_atomic_get_dbuf_state(state);
+	if (IS_ERR(new_dbuf_state))
+		return PTR_ERR(new_dbuf_state);
+
+	i = hweight8(new_dbuf_state->active_pipes);
+	new_pmdemand_state->active_pipes = min(i, 3);
+
+	new_cdclk_state = intel_atomic_get_cdclk_state(state);
+	if (IS_ERR(new_cdclk_state))
+		return PTR_ERR(new_cdclk_state);
+
+	new_pmdemand_state->voltage_index = new_cdclk_state->logical.voltage_level;
+	/* KHz to MHz */
+	new_pmdemand_state->cdclk_freq_mhz = DIV_ROUND_UP(new_cdclk_state->logical.cdclk, 1000);
+
+	new_pmdemand_state->active_phys_plls_mask = 0;
+
+	for_each_oldnew_intel_crtc_in_state(state, crtc, old_crtc_state, new_crtc_state, i) {
+		if (!new_crtc_state->hw.active)
+			continue;
+
+		encoder = intel_get_crtc_new_encoder(state, new_crtc_state);
+		if (!encoder)
+			continue;
+
+		phy = intel_port_to_phy(dev_priv, encoder->port);
+
+		if (intel_is_c10phy(dev_priv, phy))
+			new_pmdemand_state->active_phys_plls_mask |= BIT(phy);
+
+		port_clock = max(port_clock, new_crtc_state->port_clock);
+	}
+
+	/* To MHz */
+	new_pmdemand_state->ddiclk_freq_mhz = DIV_ROUND_UP(port_clock, 1000);
+
+	/*
+	 * Setting scalers to max as it can not be calculated during flips and
+	 * fastsets without taking global states locks.
+	 */
+	new_pmdemand_state->scalers = 7;
+
+	return 0;
+}
+
+static bool intel_pmdemand_check_prev_transaction(struct drm_i915_private *dev_priv)
+{
+	return !((intel_de_read(dev_priv, XELPDP_INITIATE_PMDEMAND_REQUEST(1)) & XELPDP_PMDEMAND_REQ_ENABLE) ||
+		(intel_de_read(dev_priv, GEN12_DCPR_STATUS_1) & XELPDP_PMDEMAND_INFLIGHT_STATUS));
+}
+
+static bool intel_pmdemand_req_complete(struct drm_i915_private *dev_priv)
+{
+	return !(intel_de_read(dev_priv, XELPDP_INITIATE_PMDEMAND_REQUEST(1)) & XELPDP_PMDEMAND_REQ_ENABLE);
+}
+
+static int intel_pmdemand_wait(struct drm_i915_private *dev_priv)
+{
+	DEFINE_WAIT(wait);
+	int ret;
+	const unsigned int timeout_ms = 10;
+
+	add_wait_queue(&dev_priv->pmdemand.waitqueue, &wait);
+
+	ret = wait_event_timeout(dev_priv->pmdemand.waitqueue,
+				 intel_pmdemand_req_complete(dev_priv),
+				 msecs_to_jiffies_timeout(timeout_ms));
+	if (ret < 0)
+		drm_err(&dev_priv->drm,
+			"timed out waiting for Punit PM Demand Response\n");
+
+	remove_wait_queue(&dev_priv->pmdemand.waitqueue, &wait);
+
+	return ret;
+}
+
+/* Required to be programmed during Display Init Sequences. */
+void intel_program_dbuf_pmdemand(struct drm_i915_private *dev_priv,
+				 u8 dbuf_slices)
+{
+	mutex_lock(&dev_priv->pmdemand.lock);
+	if (drm_WARN_ON(&dev_priv->drm,
+			!intel_pmdemand_check_prev_transaction(dev_priv)))
+		goto unlock;
+
+	intel_de_rmw(dev_priv, XELPDP_INITIATE_PMDEMAND_REQUEST(0),
+		     XELPDP_PMDEMAND_DBUFS_MASK,
+		     XELPDP_PMDEMAND_DBUFS(hweight32(dbuf_slices)));
+	intel_de_rmw(dev_priv, XELPDP_INITIATE_PMDEMAND_REQUEST(1), 0,
+		     XELPDP_PMDEMAND_REQ_ENABLE);
+
+	intel_pmdemand_wait(dev_priv);
+unlock:
+	mutex_unlock(&dev_priv->pmdemand.lock);
+}
+
+static void intel_program_pmdemand(struct drm_i915_private *dev_priv,
+				   const struct intel_pmdemand_state *new,
+				   const struct intel_pmdemand_state *old)
+{
+	u32 val, tmp;
+
+#define UPDATE_PMDEMAND_VAL(val, F, f) do {            \
+	val &= (~(XELPDP_PMDEMAND_##F##_MASK));         \
+	val |= (XELPDP_PMDEMAND_##F((u32)(old ? max(old->f, new->f) : new->f))); \
+} while (0)
+
+	mutex_lock(&dev_priv->pmdemand.lock);
+	if (drm_WARN_ON(&dev_priv->drm,
+			!intel_pmdemand_check_prev_transaction(dev_priv)))
+		goto unlock;
+
+	/*
+	 * TODO: Update programming PM Demand for
+	 * PHYS, PLLS, DDI_CLKFREQ, SCALARS
+	 */
+	val = intel_de_read(dev_priv, XELPDP_INITIATE_PMDEMAND_REQUEST(0));
+	UPDATE_PMDEMAND_VAL(val, QCLK_GV_INDEX, qclk_gv_index);
+	UPDATE_PMDEMAND_VAL(val, QCLK_GV_BW, qclk_gv_bw);
+	UPDATE_PMDEMAND_VAL(val, VOLTAGE_INDEX, voltage_index);
+	UPDATE_PMDEMAND_VAL(val, PIPES, active_pipes);
+	UPDATE_PMDEMAND_VAL(val, DBUFS, dbufs);
+	tmp = hweight32(new->active_phys_plls_mask);
+	if (old)
+		tmp = max(tmp, hweight32(old->active_phys_plls_mask));
+	val |= XELPDP_PMDEMAND_PHYS(tmp);
+
+	intel_de_write(dev_priv, XELPDP_INITIATE_PMDEMAND_REQUEST(0), val);
+
+	val = intel_de_read(dev_priv, XELPDP_INITIATE_PMDEMAND_REQUEST(1));
+	UPDATE_PMDEMAND_VAL(val, CDCLK_FREQ, cdclk_freq_mhz);
+	UPDATE_PMDEMAND_VAL(val, DDICLK_FREQ, ddiclk_freq_mhz);
+	UPDATE_PMDEMAND_VAL(val, SCALERS, scalers);
+	/*
+	 * Active_PLLs starts with 1 because of CDCLK PLL.
+	 * TODO: Missing to account genlock filter when it gets used.
+	 */
+	val |= XELPDP_PMDEMAND_PLLS(tmp + 1);
+
+	intel_de_write(dev_priv, XELPDP_INITIATE_PMDEMAND_REQUEST(1), val);
+
+#undef UPDATE_PM_DEMAND_VAL
+
+	intel_de_rmw(dev_priv, XELPDP_INITIATE_PMDEMAND_REQUEST(1), 0, XELPDP_PMDEMAND_REQ_ENABLE);
+
+	intel_pmdemand_wait(dev_priv);
+unlock:
+	mutex_unlock(&dev_priv->pmdemand.lock);
+}
+
+void intel_pmdemand_pre_plane_update(struct intel_atomic_state *state)
+{
+	struct drm_i915_private *dev_priv = to_i915(state->base.dev);
+	const struct intel_pmdemand_state *new_pmdmnd_state =
+		intel_atomic_get_new_pmdemand_state(state);
+	const struct intel_pmdemand_state *old_pmdmnd_state =
+		intel_atomic_get_old_pmdemand_state(state);
+
+	if (DISPLAY_VER(dev_priv) < 14)
+		return;
+
+	if (!new_pmdmnd_state ||
+	    memcmp(new_pmdmnd_state, old_pmdmnd_state, sizeof(*new_pmdmnd_state)) == 0)
+		return;
+
+	intel_program_pmdemand(dev_priv, new_pmdmnd_state, old_pmdmnd_state);
+}
+
+void intel_pmdemand_post_plane_update(struct intel_atomic_state *state)
+{
+	struct drm_i915_private *dev_priv = to_i915(state->base.dev);
+	const struct intel_pmdemand_state *new_pmdmnd_state =
+		intel_atomic_get_new_pmdemand_state(state);
+	const struct intel_pmdemand_state *old_pmdmnd_state =
+		intel_atomic_get_old_pmdemand_state(state);
+
+	if (DISPLAY_VER(dev_priv) < 14)
+		return;
+
+	if (!new_pmdmnd_state ||
+	    memcmp(new_pmdmnd_state, old_pmdmnd_state, sizeof(*new_pmdmnd_state)) == 0)
+		return;
+
+	intel_program_pmdemand(dev_priv, new_pmdmnd_state, NULL);
+}
+
 static void ibx_init_clock_gating(struct drm_i915_private *dev_priv)
 {
 	/*
diff --git a/drivers/gpu/drm/i915/intel_pm.h b/drivers/gpu/drm/i915/intel_pm.h
index f774bddcdca6..2663bec408c7 100644
--- a/drivers/gpu/drm/i915/intel_pm.h
+++ b/drivers/gpu/drm/i915/intel_pm.h
@@ -8,11 +8,46 @@
 
 #include <linux/types.h>
 
+#include "display/intel_global_state.h"
+
 struct drm_i915_private;
 struct intel_crtc_state;
 struct intel_plane_state;
 
 void intel_init_clock_gating(struct drm_i915_private *dev_priv);
+void intel_init_pmdemand(struct drm_i915_private *dev_priv);
 void intel_init_clock_gating_hooks(struct drm_i915_private *dev_priv);
 
+struct intel_pmdemand_state {
+	struct intel_global_state base;
+
+	u16 qclk_gv_bw;
+	u8 voltage_index;
+	u8 qclk_gv_index;
+	u8 active_pipes;
+	u8 dbufs;
+	u8 active_phys_plls_mask;
+	u16 cdclk_freq_mhz;
+	u16 ddiclk_freq_mhz;
+	u8 scalers;
+};
+
+int intel_pmdemand_init(struct drm_i915_private *dev_priv);
+
+struct intel_pmdemand_state *
+intel_atomic_get_pmdemand_state(struct intel_atomic_state *state);
+
+#define to_intel_pmdemand_state(x) container_of((x), struct intel_pmdemand_state, base)
+#define intel_atomic_get_old_pmdemand_state(state) \
+	to_intel_pmdemand_state(intel_atomic_get_old_global_obj_state(state, &to_i915(state->base.dev)->pmdemand.obj))
+#define intel_atomic_get_new_pmdemand_state(state) \
+	to_intel_pmdemand_state(intel_atomic_get_new_global_obj_state(state, &to_i915(state->base.dev)->pmdemand.obj))
+
+int intel_pmdemand_init(struct drm_i915_private *dev_priv);
+void intel_program_dbuf_pmdemand(struct drm_i915_private *dev_priv,
+				 u8 dbuf_slices);
+void intel_pmdemand_pre_plane_update(struct intel_atomic_state *state);
+void intel_pmdemand_post_plane_update(struct intel_atomic_state *state);
+int intel_pmdemand_atomic_check(struct intel_atomic_state *state);
+
 #endif /* __INTEL_PM_H__ */
-- 
2.34.1


^ permalink raw reply related	[flat|nested] 13+ messages in thread

* Re: [Intel-gfx] [PATCH] drm/i915/mtl: Add support for PM DEMAND
  2023-04-03  8:50 [Intel-gfx] [PATCH] drm/i915/mtl: Add support for PM DEMAND Mika Kahola
@ 2023-04-03  9:17 ` Jani Nikula
  2023-04-03 13:14   ` Kahola, Mika
  2023-04-03 10:55 ` kernel test robot
                   ` (5 subsequent siblings)
  6 siblings, 1 reply; 13+ messages in thread
From: Jani Nikula @ 2023-04-03  9:17 UTC (permalink / raw)
  To: Mika Kahola, intel-gfx; +Cc: Matt Roper, Lucas De Marchi

On Mon, 03 Apr 2023, Mika Kahola <mika.kahola@intel.com> wrote:
> Display14 introduces a new way to instruct the PUnit with
> power and bandwidth requirements of DE. Add the functionality
> to program the registers and handle waits using interrupts.
> The current wait time for timeouts is programmed for 10 msecs to
> factor in the worst case scenarios. Changes made to use REG_BIT
> for a register that we touched(GEN8_DE_MISC_IER _MMIO).
>
> v2:
>   - Removed repeated definition of dbuf, which has been moved to struct
>     intel_display. (Gustavo)
>   - s/dev_priv->dbuf/dev_priv->display.dbuf/ (Gustavo)
>
> Bspec: 66451, 64636, 64602, 64603
> Cc: Matt Atwood <matthew.s.atwood@intel.com>
> Cc: Matt Roper <matthew.d.roper@intel.com>
> Cc: Lucas De Marchi <lucas.demarchi@intel.com>
> Cc: Gustavo Sousa <gustavo.sousa@intel.com>
> Signed-off-by: José Roberto de Souza <jose.souza@intel.com>
> Signed-off-by: Radhakrishna Sripada <radhakrishna.sripada@intel.com>
> Signed-off-by: Mika Kahola <mika.kahola@intel.com>
> ---
>  drivers/gpu/drm/i915/display/intel_bw.c       |   4 +-
>  drivers/gpu/drm/i915/display/intel_bw.h       |   2 +
>  drivers/gpu/drm/i915/display/intel_display.c  |  14 +
>  .../drm/i915/display/intel_display_power.c    |   8 +
>  drivers/gpu/drm/i915/i915_drv.h               |   6 +
>  drivers/gpu/drm/i915/i915_irq.c               |  22 +-
>  drivers/gpu/drm/i915/i915_reg.h               |  33 +-
>  drivers/gpu/drm/i915/intel_pm.c               | 293 ++++++++++++++++++

This is the wrong place.

I've got reviewed patches to rename this to intel_clock_gating.c because
that's what it has left. Everything else has been moved out. They
would've been pushed already but there was a conflict so waited out a
bit.

Maybe a new display/intel_pmdemand.[ch]? This is only about display,
right?

>  drivers/gpu/drm/i915/intel_pm.h               |  35 +++
>  9 files changed, 412 insertions(+), 5 deletions(-)
>
> diff --git a/drivers/gpu/drm/i915/display/intel_bw.c b/drivers/gpu/drm/i915/display/intel_bw.c
> index 202321ffbe2a..87c20bf52123 100644
> --- a/drivers/gpu/drm/i915/display/intel_bw.c
> +++ b/drivers/gpu/drm/i915/display/intel_bw.c
> @@ -746,8 +746,8 @@ static unsigned int intel_bw_num_active_planes(struct drm_i915_private *dev_priv
>  	return num_active_planes;
>  }
>  
> -static unsigned int intel_bw_data_rate(struct drm_i915_private *dev_priv,
> -				       const struct intel_bw_state *bw_state)
> +unsigned int intel_bw_data_rate(struct drm_i915_private *dev_priv,
> +				const struct intel_bw_state *bw_state)
>  {
>  	unsigned int data_rate = 0;
>  	enum pipe pipe;
> diff --git a/drivers/gpu/drm/i915/display/intel_bw.h b/drivers/gpu/drm/i915/display/intel_bw.h
> index f20292143745..17fc0b61db04 100644
> --- a/drivers/gpu/drm/i915/display/intel_bw.h
> +++ b/drivers/gpu/drm/i915/display/intel_bw.h
> @@ -62,6 +62,8 @@ int intel_bw_init(struct drm_i915_private *dev_priv);
>  int intel_bw_atomic_check(struct intel_atomic_state *state);
>  void intel_bw_crtc_update(struct intel_bw_state *bw_state,
>  			  const struct intel_crtc_state *crtc_state);
> +unsigned int intel_bw_data_rate(struct drm_i915_private *dev_priv,
> +				const struct intel_bw_state *bw_state);
>  int icl_pcode_restrict_qgv_points(struct drm_i915_private *dev_priv,
>  				  u32 points_mask);
>  int intel_bw_calc_min_cdclk(struct intel_atomic_state *state,
> diff --git a/drivers/gpu/drm/i915/display/intel_display.c b/drivers/gpu/drm/i915/display/intel_display.c
> index b53a1d969344..ee7ca33123b1 100644
> --- a/drivers/gpu/drm/i915/display/intel_display.c
> +++ b/drivers/gpu/drm/i915/display/intel_display.c
> @@ -959,6 +959,9 @@ intel_get_crtc_new_encoder(const struct intel_atomic_state *state,
>  		num_encoders++;
>  	}
>  
> +	if (!encoder)
> +		return NULL;
> +

How's this related?

>  	drm_WARN(encoder->base.dev, num_encoders != 1,
>  		 "%d encoders for pipe %c\n",
>  		 num_encoders, pipe_name(master_crtc->pipe));
> @@ -6767,6 +6770,10 @@ int intel_atomic_check(struct drm_device *dev,
>  		ret = intel_modeset_calc_cdclk(state);
>  		if (ret)
>  			return ret;
> +
> +		ret = intel_pmdemand_atomic_check(state);
> +		if (ret)
> +			goto fail;
>  	}
>  
>  	ret = intel_atomic_check_crtcs(state);
> @@ -7411,6 +7418,7 @@ static void intel_atomic_commit_tail(struct intel_atomic_state *state)
>  	}
>  
>  	intel_sagv_pre_plane_update(state);
> +	intel_pmdemand_pre_plane_update(state);
>  
>  	/* Complete the events for pipes that have now been disabled */
>  	for_each_new_intel_crtc_in_state(state, crtc, new_crtc_state, i) {
> @@ -7523,6 +7531,7 @@ static void intel_atomic_commit_tail(struct intel_atomic_state *state)
>  		intel_verify_planes(state);
>  
>  	intel_sagv_post_plane_update(state);
> +	intel_pmdemand_post_plane_update(state);
>  
>  	drm_atomic_helper_commit_hw_done(&state->base);
>  
> @@ -8250,6 +8259,7 @@ void intel_init_display_hooks(struct drm_i915_private *dev_priv)
>  	intel_color_init_hooks(dev_priv);
>  	intel_init_cdclk_hooks(dev_priv);
>  	intel_audio_hooks_init(dev_priv);
> +	intel_init_pmdemand(dev_priv);

intel_init_pmdemand()...

>  
>  	intel_dpll_init_clock_hook(dev_priv);
>  
> @@ -8476,6 +8486,10 @@ int intel_modeset_init_noirq(struct drm_i915_private *i915)
>  	if (ret)
>  		goto cleanup_vga_client_pw_domain_dmc;
>  
> +	ret = intel_pmdemand_init(i915);

...and intel_pmdemand_init(). Please just no.

Also, name them all intel_pmdemand_*().

> +	if (ret)
> +		goto cleanup_vga_client_pw_domain_dmc;
> +
>  	init_llist_head(&i915->display.atomic_helper.free_list);
>  	INIT_WORK(&i915->display.atomic_helper.free_work,
>  		  intel_atomic_helper_free_state_worker);
> diff --git a/drivers/gpu/drm/i915/display/intel_display_power.c b/drivers/gpu/drm/i915/display/intel_display_power.c
> index 5e85572dc8e4..04c172b5c17b 100644
> --- a/drivers/gpu/drm/i915/display/intel_display_power.c
> +++ b/drivers/gpu/drm/i915/display/intel_display_power.c
> @@ -19,6 +19,7 @@
>  #include "intel_mchbar_regs.h"
>  #include "intel_pch_refclk.h"
>  #include "intel_pcode.h"
> +#include "intel_pm.h"
>  #include "intel_pps_regs.h"
>  #include "intel_snps_phy.h"
>  #include "skl_watermark.h"
> @@ -1083,6 +1084,10 @@ static void gen9_dbuf_enable(struct drm_i915_private *dev_priv)
>  	dev_priv->display.dbuf.enabled_slices =
>  		intel_enabled_dbuf_slices_mask(dev_priv);
>  
> +	if (DISPLAY_VER(dev_priv) >= 14)
> +		intel_program_dbuf_pmdemand(dev_priv, BIT(DBUF_S1) |
> +					    dev_priv->display.dbuf.enabled_slices);
> +
>  	/*
>  	 * Just power up at least 1 slice, we will
>  	 * figure out later which slices we have and what we need.
> @@ -1094,6 +1099,9 @@ static void gen9_dbuf_enable(struct drm_i915_private *dev_priv)
>  static void gen9_dbuf_disable(struct drm_i915_private *dev_priv)
>  {
>  	gen9_dbuf_slices_update(dev_priv, 0);
> +
> +	if (DISPLAY_VER(dev_priv) >= 14)
> +		intel_program_dbuf_pmdemand(dev_priv, 0);
>  }
>  
>  static void gen12_dbuf_slices_config(struct drm_i915_private *dev_priv)
> diff --git a/drivers/gpu/drm/i915/i915_drv.h b/drivers/gpu/drm/i915/i915_drv.h
> index e771fdc3099c..2a73e726c6ed 100644
> --- a/drivers/gpu/drm/i915/i915_drv.h
> +++ b/drivers/gpu/drm/i915/i915_drv.h
> @@ -250,6 +250,12 @@ struct drm_i915_private {
>  	unsigned int hpll_freq;
>  	unsigned int czclk_freq;
>  
> +	struct {
> +		wait_queue_head_t waitqueue;
> +		struct mutex lock;
> +		struct intel_global_obj obj;
> +	} pmdemand;
> +

Please don't add new display stuff to struct drm_i915_private. See
struct intel_display in display/intel_display_core.h.

>  	/**
>  	 * wq - Driver workqueue for GEM.
>  	 *
> diff --git a/drivers/gpu/drm/i915/i915_irq.c b/drivers/gpu/drm/i915/i915_irq.c
> index c0888cc88d04..636033bb9650 100644
> --- a/drivers/gpu/drm/i915/i915_irq.c
> +++ b/drivers/gpu/drm/i915/i915_irq.c
> @@ -1913,6 +1913,11 @@ static u32 gen8_de_pipe_fault_mask(struct drm_i915_private *dev_priv)
>  		return GEN8_DE_PIPE_IRQ_FAULT_ERRORS;
>  }
>  
> +static void intel_pmdemand_irq_handler(struct drm_i915_private *dev_priv)
> +{
> +	wake_up_all(&dev_priv->pmdemand.waitqueue);
> +}
> +
>  static void
>  gen8_de_misc_irq_handler(struct drm_i915_private *dev_priv, u32 iir)
>  {
> @@ -1949,6 +1954,18 @@ gen8_de_misc_irq_handler(struct drm_i915_private *dev_priv, u32 iir)
>  		}
>  	}
>  
> +	if (iir & XELPDP_PMDEMAND_RSPTOUT_ERR) {
> +		drm_dbg(&dev_priv->drm,
> +			"Error waiting for Punit PM Demand Response\n");
> +		intel_pmdemand_irq_handler(dev_priv);
> +		found = true;
> +	}
> +
> +	if (iir & XELPDP_PMDEMAND_RSP) {
> +		intel_pmdemand_irq_handler(dev_priv);
> +		found = true;
> +	}
> +
>  	if (!found)
>  		drm_err(&dev_priv->drm, "Unexpected DE Misc interrupt\n");
>  }
> @@ -3315,7 +3332,10 @@ static void gen8_de_irq_postinstall(struct drm_i915_private *dev_priv)
>  	if (IS_GEMINILAKE(dev_priv) || IS_BROXTON(dev_priv))
>  		de_port_masked |= BXT_DE_PORT_GMBUS;
>  
> -	if (DISPLAY_VER(dev_priv) >= 11) {
> +	if (DISPLAY_VER(dev_priv) >= 14)
> +		de_misc_masked |= XELPDP_PMDEMAND_RSPTOUT_ERR |
> +				  XELPDP_PMDEMAND_RSP;
> +	else if (DISPLAY_VER(dev_priv) >= 11) {
>  		enum port port;
>  
>  		if (intel_bios_is_dsi_present(dev_priv, &port))
> diff --git a/drivers/gpu/drm/i915/i915_reg.h b/drivers/gpu/drm/i915/i915_reg.h
> index 8d26fa2765c1..7f8e750665ed 100644
> --- a/drivers/gpu/drm/i915/i915_reg.h
> +++ b/drivers/gpu/drm/i915/i915_reg.h
> @@ -4783,8 +4783,10 @@
>  #define GEN8_DE_MISC_IMR _MMIO(0x44464)
>  #define GEN8_DE_MISC_IIR _MMIO(0x44468)
>  #define GEN8_DE_MISC_IER _MMIO(0x4446c)
> -#define  GEN8_DE_MISC_GSE		(1 << 27)
> -#define  GEN8_DE_EDP_PSR		(1 << 19)
> +#define  XELPDP_PMDEMAND_RSPTOUT_ERR	REG_BIT(27)
> +#define  GEN8_DE_MISC_GSE		REG_BIT(27)
> +#define  GEN8_DE_EDP_PSR		REG_BIT(19)
> +#define  XELPDP_PMDEMAND_RSP		REG_BIT(3)
>  
>  #define GEN8_PCU_ISR _MMIO(0x444e0)
>  #define GEN8_PCU_IMR _MMIO(0x444e4)
> @@ -4847,6 +4849,33 @@
>  #define  GEN11_HOTPLUG_CTL_SHORT_DETECT(hpd_pin)	(1 << (_HPD_PIN_TC(hpd_pin) * 4))
>  #define  GEN11_HOTPLUG_CTL_NO_DETECT(hpd_pin)		(0 << (_HPD_PIN_TC(hpd_pin) * 4))
>  
> +#define XELPDP_INITIATE_PMDEMAND_REQUEST(dword)		_MMIO(0x45230 + 4 * (dword))
> +#define  XELPDP_PMDEMAND_QCLK_GV_BW_MASK		REG_GENMASK(31, 16)
> +#define  XELPDP_PMDEMAND_QCLK_GV_BW(x)			REG_FIELD_PREP(XELPDP_PMDEMAND_QCLK_GV_BW_MASK, x)
> +#define  XELPDP_PMDEMAND_VOLTAGE_INDEX_MASK		REG_GENMASK(14, 12)
> +#define  XELPDP_PMDEMAND_VOLTAGE_INDEX(x)		REG_FIELD_PREP(XELPDP_PMDEMAND_VOLTAGE_INDEX_MASK, x)
> +#define  XELPDP_PMDEMAND_QCLK_GV_INDEX_MASK		REG_GENMASK(11, 8)
> +#define  XELPDP_PMDEMAND_QCLK_GV_INDEX(x)		REG_FIELD_PREP(XELPDP_PMDEMAND_QCLK_GV_INDEX_MASK, x)
> +#define  XELPDP_PMDEMAND_PIPES_MASK			REG_GENMASK(7, 6)
> +#define  XELPDP_PMDEMAND_PIPES(x)			REG_FIELD_PREP(XELPDP_PMDEMAND_PIPES_MASK, x)
> +#define  XELPDP_PMDEMAND_DBUFS_MASK			REG_GENMASK(5, 4)
> +#define  XELPDP_PMDEMAND_DBUFS(x)			REG_FIELD_PREP(XELPDP_PMDEMAND_DBUFS_MASK, x)
> +#define  XELPDP_PMDEMAND_PHYS_MASK			REG_GENMASK(2, 0)
> +#define  XELPDP_PMDEMAND_PHYS(x)				REG_FIELD_PREP(XELPDP_PMDEMAND_PHYS_MASK, x)
> +
> +#define  XELPDP_PMDEMAND_REQ_ENABLE			REG_BIT(31)
> +#define  XELPDP_PMDEMAND_CDCLK_FREQ_MASK		REG_GENMASK(30, 20)
> +#define  XELPDP_PMDEMAND_CDCLK_FREQ(x)			REG_FIELD_PREP(XELPDP_PMDEMAND_CDCLK_FREQ_MASK, x)
> +#define  XELPDP_PMDEMAND_DDICLK_FREQ_MASK		REG_GENMASK(18, 8)
> +#define  XELPDP_PMDEMAND_DDICLK_FREQ(x)			REG_FIELD_PREP(XELPDP_PMDEMAND_DDICLK_FREQ_MASK, x)
> +#define  XELPDP_PMDEMAND_SCALERS_MASK			REG_GENMASK(6, 4)
> +#define  XELPDP_PMDEMAND_SCALERS(x)			REG_FIELD_PREP(XELPDP_PMDEMAND_SCALERS_MASK, x)
> +#define  XELPDP_PMDEMAND_PLLS_MASK			REG_GENMASK(2, 0)
> +#define  XELPDP_PMDEMAND_PLLS(x)			REG_FIELD_PREP(XELPDP_PMDEMAND_PLLS_MASK, x)
> +
> +#define GEN12_DCPR_STATUS_1				_MMIO(0x46440)
> +#define  XELPDP_PMDEMAND_INFLIGHT_STATUS		REG_BIT(26)
> +
>  #define ILK_DISPLAY_CHICKEN2	_MMIO(0x42004)
>  /* Required on all Ironlake and Sandybridge according to the B-Spec. */
>  #define  ILK_ELPIN_409_SELECT	(1 << 25)
> diff --git a/drivers/gpu/drm/i915/intel_pm.c b/drivers/gpu/drm/i915/intel_pm.c
> index c45af0d981fd..877997e4141d 100644
> --- a/drivers/gpu/drm/i915/intel_pm.c
> +++ b/drivers/gpu/drm/i915/intel_pm.c
> @@ -25,6 +25,10 @@
>   *
>   */
>  
> +#include <linux/bitops.h>
> +
> +#include "display/intel_bw.h"
> +#include "display/intel_cdclk.h"
>  #include "display/intel_de.h"
>  #include "display/intel_display.h"
>  #include "display/intel_display_trace.h"
> @@ -40,6 +44,14 @@
>  #include "intel_pm.h"
>  #include "vlv_sideband.h"
>  
> +bool intel_is_c10phy(struct drm_i915_private *dev_priv, enum phy phy)
> +{
> +        if (IS_METEORLAKE(dev_priv) && (phy < PHY_C))
> +                return true;
> +
> +        return false;
> +}

This doesn't belong here or in intel_pmdemand.c. It's just not about pm
or pmdemand.

> +
>  struct drm_i915_clock_gating_funcs {
>  	void (*init_clock_gating)(struct drm_i915_private *i915);
>  };
> @@ -124,6 +136,287 @@ static void glk_init_clock_gating(struct drm_i915_private *dev_priv)
>  		   PWM1_GATING_DIS | PWM2_GATING_DIS);
>  }
>  
> +static struct intel_global_state *intel_pmdemand_duplicate_state(struct intel_global_obj *obj)
> +{
> +	struct intel_pmdemand_state *pmdmnd_state;
> +
> +	pmdmnd_state = kmemdup(obj->state, sizeof(*pmdmnd_state), GFP_KERNEL);
> +	if (!pmdmnd_state)
> +		return NULL;
> +
> +	return &pmdmnd_state->base;
> +}
> +
> +static void intel_pmdemand_destroy_state(struct intel_global_obj *obj,
> +					 struct intel_global_state *state)
> +{
> +	kfree(state);
> +}
> +
> +static const struct intel_global_state_funcs intel_pmdemand_funcs = {
> +	.atomic_duplicate_state = intel_pmdemand_duplicate_state,
> +	.atomic_destroy_state = intel_pmdemand_destroy_state,
> +};
> +
> +struct intel_pmdemand_state *
> +intel_atomic_get_pmdemand_state(struct intel_atomic_state *state)
> +{
> +	struct drm_i915_private *dev_priv = to_i915(state->base.dev);
> +	struct intel_global_state *pmdemand_state;
> +
> +	pmdemand_state = intel_atomic_get_global_obj_state(state, &dev_priv->pmdemand.obj);
> +	if (IS_ERR(pmdemand_state))
> +		return ERR_CAST(pmdemand_state);
> +
> +	return to_intel_pmdemand_state(pmdemand_state);
> +}
> +
> +int intel_pmdemand_init(struct drm_i915_private *dev_priv)
> +{
> +	struct intel_pmdemand_state *pmdemand_state;
> +
> +	pmdemand_state = kzalloc(sizeof(*pmdemand_state), GFP_KERNEL);
> +	if (!pmdemand_state)
> +		return -ENOMEM;
> +
> +	intel_atomic_global_obj_init(dev_priv, &dev_priv->pmdemand.obj,
> +				     &pmdemand_state->base, &intel_pmdemand_funcs);
> +
> +	return 0;
> +}
> +
> +void intel_init_pmdemand(struct drm_i915_private *dev_priv)
> +{
> +	mutex_init(&dev_priv->pmdemand.lock);
> +	init_waitqueue_head(&dev_priv->pmdemand.waitqueue);
> +}
> +
> +int intel_pmdemand_atomic_check(struct intel_atomic_state *state)
> +{
> +	struct drm_i915_private *dev_priv = to_i915(state->base.dev);
> +	struct intel_pmdemand_state *new_pmdemand_state = NULL;
> +	struct intel_crtc_state *old_crtc_state, *new_crtc_state;
> +	struct intel_crtc *crtc;
> +	struct intel_encoder *encoder;
> +	struct intel_bw_state *new_bw_state;
> +	const struct intel_dbuf_state *new_dbuf_state;
> +	const struct intel_cdclk_state *new_cdclk_state;
> +	int port_clock = 0;
> +	unsigned int data_rate;
> +	enum phy phy;
> +	int i, ret;
> +
> +	if (DISPLAY_VER(dev_priv) < 14)
> +		return 0;
> +
> +	new_pmdemand_state = intel_atomic_get_pmdemand_state(state);
> +	if (IS_ERR(new_pmdemand_state))
> +		return PTR_ERR(new_pmdemand_state);
> +
> +	ret = intel_atomic_lock_global_state(&new_pmdemand_state->base);
> +	if (ret)
> +		return ret;
> +
> +	/* Punit figures out the voltage index based on bandwidth*/
> +	new_bw_state = intel_atomic_get_bw_state(state);
> +	if (IS_ERR(new_bw_state))
> +		return PTR_ERR(new_bw_state);
> +
> +	/* firmware will calculate the qclck_gc_index, requirement is set to 0 */
> +	new_pmdemand_state->qclk_gv_index = 0;
> +
> +	data_rate = intel_bw_data_rate(dev_priv, new_bw_state);
> +	/* To MBs then to multiples of 100MBs */
> +	data_rate = DIV_ROUND_UP(data_rate, 1000);
> +	data_rate = DIV_ROUND_UP(data_rate, 100);
> +	new_pmdemand_state->qclk_gv_bw = data_rate;
> +
> +	new_dbuf_state = intel_atomic_get_dbuf_state(state);
> +	if (IS_ERR(new_dbuf_state))
> +		return PTR_ERR(new_dbuf_state);
> +
> +	i = hweight8(new_dbuf_state->active_pipes);
> +	new_pmdemand_state->active_pipes = min(i, 3);
> +
> +	new_cdclk_state = intel_atomic_get_cdclk_state(state);
> +	if (IS_ERR(new_cdclk_state))
> +		return PTR_ERR(new_cdclk_state);
> +
> +	new_pmdemand_state->voltage_index = new_cdclk_state->logical.voltage_level;
> +	/* KHz to MHz */
> +	new_pmdemand_state->cdclk_freq_mhz = DIV_ROUND_UP(new_cdclk_state->logical.cdclk, 1000);
> +
> +	new_pmdemand_state->active_phys_plls_mask = 0;
> +
> +	for_each_oldnew_intel_crtc_in_state(state, crtc, old_crtc_state, new_crtc_state, i) {
> +		if (!new_crtc_state->hw.active)
> +			continue;
> +
> +		encoder = intel_get_crtc_new_encoder(state, new_crtc_state);
> +		if (!encoder)
> +			continue;
> +
> +		phy = intel_port_to_phy(dev_priv, encoder->port);
> +
> +		if (intel_is_c10phy(dev_priv, phy))
> +			new_pmdemand_state->active_phys_plls_mask |= BIT(phy);
> +
> +		port_clock = max(port_clock, new_crtc_state->port_clock);
> +	}
> +
> +	/* To MHz */
> +	new_pmdemand_state->ddiclk_freq_mhz = DIV_ROUND_UP(port_clock, 1000);
> +
> +	/*
> +	 * Setting scalers to max as it can not be calculated during flips and
> +	 * fastsets without taking global states locks.
> +	 */
> +	new_pmdemand_state->scalers = 7;
> +
> +	return 0;
> +}
> +
> +static bool intel_pmdemand_check_prev_transaction(struct drm_i915_private *dev_priv)
> +{
> +	return !((intel_de_read(dev_priv, XELPDP_INITIATE_PMDEMAND_REQUEST(1)) & XELPDP_PMDEMAND_REQ_ENABLE) ||
> +		(intel_de_read(dev_priv, GEN12_DCPR_STATUS_1) & XELPDP_PMDEMAND_INFLIGHT_STATUS));
> +}
> +
> +static bool intel_pmdemand_req_complete(struct drm_i915_private *dev_priv)
> +{
> +	return !(intel_de_read(dev_priv, XELPDP_INITIATE_PMDEMAND_REQUEST(1)) & XELPDP_PMDEMAND_REQ_ENABLE);
> +}
> +
> +static int intel_pmdemand_wait(struct drm_i915_private *dev_priv)
> +{
> +	DEFINE_WAIT(wait);
> +	int ret;
> +	const unsigned int timeout_ms = 10;
> +
> +	add_wait_queue(&dev_priv->pmdemand.waitqueue, &wait);
> +
> +	ret = wait_event_timeout(dev_priv->pmdemand.waitqueue,
> +				 intel_pmdemand_req_complete(dev_priv),
> +				 msecs_to_jiffies_timeout(timeout_ms));
> +	if (ret < 0)
> +		drm_err(&dev_priv->drm,
> +			"timed out waiting for Punit PM Demand Response\n");
> +
> +	remove_wait_queue(&dev_priv->pmdemand.waitqueue, &wait);
> +
> +	return ret;
> +}
> +
> +/* Required to be programmed during Display Init Sequences. */
> +void intel_program_dbuf_pmdemand(struct drm_i915_private *dev_priv,
> +				 u8 dbuf_slices)
> +{
> +	mutex_lock(&dev_priv->pmdemand.lock);
> +	if (drm_WARN_ON(&dev_priv->drm,
> +			!intel_pmdemand_check_prev_transaction(dev_priv)))
> +		goto unlock;
> +
> +	intel_de_rmw(dev_priv, XELPDP_INITIATE_PMDEMAND_REQUEST(0),
> +		     XELPDP_PMDEMAND_DBUFS_MASK,
> +		     XELPDP_PMDEMAND_DBUFS(hweight32(dbuf_slices)));
> +	intel_de_rmw(dev_priv, XELPDP_INITIATE_PMDEMAND_REQUEST(1), 0,
> +		     XELPDP_PMDEMAND_REQ_ENABLE);
> +
> +	intel_pmdemand_wait(dev_priv);
> +unlock:
> +	mutex_unlock(&dev_priv->pmdemand.lock);
> +}
> +
> +static void intel_program_pmdemand(struct drm_i915_private *dev_priv,
> +				   const struct intel_pmdemand_state *new,
> +				   const struct intel_pmdemand_state *old)
> +{
> +	u32 val, tmp;
> +
> +#define UPDATE_PMDEMAND_VAL(val, F, f) do {            \
> +	val &= (~(XELPDP_PMDEMAND_##F##_MASK));         \
> +	val |= (XELPDP_PMDEMAND_##F((u32)(old ? max(old->f, new->f) : new->f))); \
> +} while (0)

I'm not convinced this makes the code easier to follow.

> +
> +	mutex_lock(&dev_priv->pmdemand.lock);
> +	if (drm_WARN_ON(&dev_priv->drm,
> +			!intel_pmdemand_check_prev_transaction(dev_priv)))
> +		goto unlock;
> +
> +	/*
> +	 * TODO: Update programming PM Demand for
> +	 * PHYS, PLLS, DDI_CLKFREQ, SCALARS
> +	 */
> +	val = intel_de_read(dev_priv, XELPDP_INITIATE_PMDEMAND_REQUEST(0));
> +	UPDATE_PMDEMAND_VAL(val, QCLK_GV_INDEX, qclk_gv_index);
> +	UPDATE_PMDEMAND_VAL(val, QCLK_GV_BW, qclk_gv_bw);
> +	UPDATE_PMDEMAND_VAL(val, VOLTAGE_INDEX, voltage_index);
> +	UPDATE_PMDEMAND_VAL(val, PIPES, active_pipes);
> +	UPDATE_PMDEMAND_VAL(val, DBUFS, dbufs);
> +	tmp = hweight32(new->active_phys_plls_mask);
> +	if (old)
> +		tmp = max(tmp, hweight32(old->active_phys_plls_mask));
> +	val |= XELPDP_PMDEMAND_PHYS(tmp);
> +
> +	intel_de_write(dev_priv, XELPDP_INITIATE_PMDEMAND_REQUEST(0), val);
> +
> +	val = intel_de_read(dev_priv, XELPDP_INITIATE_PMDEMAND_REQUEST(1));
> +	UPDATE_PMDEMAND_VAL(val, CDCLK_FREQ, cdclk_freq_mhz);
> +	UPDATE_PMDEMAND_VAL(val, DDICLK_FREQ, ddiclk_freq_mhz);
> +	UPDATE_PMDEMAND_VAL(val, SCALERS, scalers);
> +	/*
> +	 * Active_PLLs starts with 1 because of CDCLK PLL.
> +	 * TODO: Missing to account genlock filter when it gets used.
> +	 */
> +	val |= XELPDP_PMDEMAND_PLLS(tmp + 1);
> +
> +	intel_de_write(dev_priv, XELPDP_INITIATE_PMDEMAND_REQUEST(1), val);
> +
> +#undef UPDATE_PM_DEMAND_VAL
> +
> +	intel_de_rmw(dev_priv, XELPDP_INITIATE_PMDEMAND_REQUEST(1), 0, XELPDP_PMDEMAND_REQ_ENABLE);
> +
> +	intel_pmdemand_wait(dev_priv);
> +unlock:
> +	mutex_unlock(&dev_priv->pmdemand.lock);
> +}
> +
> +void intel_pmdemand_pre_plane_update(struct intel_atomic_state *state)
> +{
> +	struct drm_i915_private *dev_priv = to_i915(state->base.dev);
> +	const struct intel_pmdemand_state *new_pmdmnd_state =
> +		intel_atomic_get_new_pmdemand_state(state);
> +	const struct intel_pmdemand_state *old_pmdmnd_state =
> +		intel_atomic_get_old_pmdemand_state(state);
> +
> +	if (DISPLAY_VER(dev_priv) < 14)
> +		return;
> +
> +	if (!new_pmdmnd_state ||
> +	    memcmp(new_pmdmnd_state, old_pmdmnd_state, sizeof(*new_pmdmnd_state)) == 0)
> +		return;
> +
> +	intel_program_pmdemand(dev_priv, new_pmdmnd_state, old_pmdmnd_state);
> +}
> +
> +void intel_pmdemand_post_plane_update(struct intel_atomic_state *state)
> +{
> +	struct drm_i915_private *dev_priv = to_i915(state->base.dev);
> +	const struct intel_pmdemand_state *new_pmdmnd_state =
> +		intel_atomic_get_new_pmdemand_state(state);
> +	const struct intel_pmdemand_state *old_pmdmnd_state =
> +		intel_atomic_get_old_pmdemand_state(state);
> +
> +	if (DISPLAY_VER(dev_priv) < 14)
> +		return;
> +
> +	if (!new_pmdmnd_state ||
> +	    memcmp(new_pmdmnd_state, old_pmdmnd_state, sizeof(*new_pmdmnd_state)) == 0)
> +		return;
> +
> +	intel_program_pmdemand(dev_priv, new_pmdmnd_state, NULL);
> +}
> +
>  static void ibx_init_clock_gating(struct drm_i915_private *dev_priv)
>  {
>  	/*
> diff --git a/drivers/gpu/drm/i915/intel_pm.h b/drivers/gpu/drm/i915/intel_pm.h
> index f774bddcdca6..2663bec408c7 100644
> --- a/drivers/gpu/drm/i915/intel_pm.h
> +++ b/drivers/gpu/drm/i915/intel_pm.h
> @@ -8,11 +8,46 @@
>  
>  #include <linux/types.h>
>  
> +#include "display/intel_global_state.h"
> +
>  struct drm_i915_private;
>  struct intel_crtc_state;
>  struct intel_plane_state;
>  
>  void intel_init_clock_gating(struct drm_i915_private *dev_priv);
> +void intel_init_pmdemand(struct drm_i915_private *dev_priv);
>  void intel_init_clock_gating_hooks(struct drm_i915_private *dev_priv);
>  
> +struct intel_pmdemand_state {
> +	struct intel_global_state base;
> +
> +	u16 qclk_gv_bw;
> +	u8 voltage_index;
> +	u8 qclk_gv_index;
> +	u8 active_pipes;
> +	u8 dbufs;
> +	u8 active_phys_plls_mask;
> +	u16 cdclk_freq_mhz;
> +	u16 ddiclk_freq_mhz;
> +	u8 scalers;
> +};

Could this actually be private to intel_pmdemand.c?

> +
> +int intel_pmdemand_init(struct drm_i915_private *dev_priv);
> +
> +struct intel_pmdemand_state *
> +intel_atomic_get_pmdemand_state(struct intel_atomic_state *state);
> +
> +#define to_intel_pmdemand_state(x) container_of((x), struct intel_pmdemand_state, base)
> +#define intel_atomic_get_old_pmdemand_state(state) \
> +	to_intel_pmdemand_state(intel_atomic_get_old_global_obj_state(state, &to_i915(state->base.dev)->pmdemand.obj))
> +#define intel_atomic_get_new_pmdemand_state(state) \
> +	to_intel_pmdemand_state(intel_atomic_get_new_global_obj_state(state, &to_i915(state->base.dev)->pmdemand.obj))

Please just make these proper functions and hide the details. I've been
meaning to do that elsewhere too. This shouldn't have to include
intel_global_state.h.

> +
> +int intel_pmdemand_init(struct drm_i915_private *dev_priv);
> +void intel_program_dbuf_pmdemand(struct drm_i915_private *dev_priv,
> +				 u8 dbuf_slices);

intel_pmdemand_* naming please, if these will be put in
intel_pmdemand.[ch].

> +void intel_pmdemand_pre_plane_update(struct intel_atomic_state *state);
> +void intel_pmdemand_post_plane_update(struct intel_atomic_state *state);
> +int intel_pmdemand_atomic_check(struct intel_atomic_state *state);
> +
>  #endif /* __INTEL_PM_H__ */

-- 
Jani Nikula, Intel Open Source Graphics Center

^ permalink raw reply	[flat|nested] 13+ messages in thread

* Re: [Intel-gfx] [PATCH] drm/i915/mtl: Add support for PM DEMAND
  2023-04-03  8:50 [Intel-gfx] [PATCH] drm/i915/mtl: Add support for PM DEMAND Mika Kahola
  2023-04-03  9:17 ` Jani Nikula
@ 2023-04-03 10:55 ` kernel test robot
  2023-04-03 13:49 ` kernel test robot
                   ` (4 subsequent siblings)
  6 siblings, 0 replies; 13+ messages in thread
From: kernel test robot @ 2023-04-03 10:55 UTC (permalink / raw)
  To: Mika Kahola; +Cc: oe-kbuild-all

Hi Mika,

Thank you for the patch! Yet something to improve:

[auto build test ERROR on drm-tip/drm-tip]

url:    https://github.com/intel-lab-lkp/linux/commits/Mika-Kahola/drm-i915-mtl-Add-support-for-PM-DEMAND/20230403-165720
base:   git://anongit.freedesktop.org/drm/drm-tip drm-tip
patch link:    https://lore.kernel.org/r/20230403085043.2219092-1-mika.kahola%40intel.com
patch subject: [Intel-gfx] [PATCH] drm/i915/mtl: Add support for PM DEMAND
config: x86_64-allyesconfig (https://download.01.org/0day-ci/archive/20230403/202304031821.7mf2eSpM-lkp@intel.com/config)
compiler: gcc-11 (Debian 11.3.0-8) 11.3.0
reproduce (this is a W=1 build):
        # https://github.com/intel-lab-lkp/linux/commit/4be7899ed410c745e6af3dbc42d17ee129ba5fd5
        git remote add linux-review https://github.com/intel-lab-lkp/linux
        git fetch --no-tags linux-review Mika-Kahola/drm-i915-mtl-Add-support-for-PM-DEMAND/20230403-165720
        git checkout 4be7899ed410c745e6af3dbc42d17ee129ba5fd5
        # save the config file
        mkdir build_dir && cp config build_dir/.config
        make W=1 O=build_dir ARCH=x86_64 olddefconfig
        make W=1 O=build_dir ARCH=x86_64 SHELL=/bin/bash drivers/gpu/

If you fix the issue, kindly add following tag where applicable
| Reported-by: kernel test robot <lkp@intel.com>
| Link: https://lore.kernel.org/oe-kbuild-all/202304031821.7mf2eSpM-lkp@intel.com/

All errors (new ones prefixed by >>):

>> drivers/gpu/drm/i915/intel_pm.c:47:6: error: no previous prototype for 'intel_is_c10phy' [-Werror=missing-prototypes]
      47 | bool intel_is_c10phy(struct drm_i915_private *dev_priv, enum phy phy)
         |      ^~~~~~~~~~~~~~~
   cc1: all warnings being treated as errors


vim +/intel_is_c10phy +47 drivers/gpu/drm/i915/intel_pm.c

    46	
  > 47	bool intel_is_c10phy(struct drm_i915_private *dev_priv, enum phy phy)
    48	{
    49	        if (IS_METEORLAKE(dev_priv) && (phy < PHY_C))
    50	                return true;
    51	
    52	        return false;
    53	}
    54	

-- 
0-DAY CI Kernel Test Service
https://github.com/intel/lkp-tests

^ permalink raw reply	[flat|nested] 13+ messages in thread

* Re: [Intel-gfx] [PATCH] drm/i915/mtl: Add support for PM DEMAND
  2023-04-03  9:17 ` Jani Nikula
@ 2023-04-03 13:14   ` Kahola, Mika
  0 siblings, 0 replies; 13+ messages in thread
From: Kahola, Mika @ 2023-04-03 13:14 UTC (permalink / raw)
  To: Jani Nikula, intel-gfx; +Cc: Roper, Matthew D, De Marchi, Lucas

> -----Original Message-----
> From: Jani Nikula <jani.nikula@linux.intel.com>
> Sent: Monday, April 3, 2023 12:17 PM
> To: Kahola, Mika <mika.kahola@intel.com>; intel-gfx@lists.freedesktop.org
> Cc: De Marchi, Lucas <lucas.demarchi@intel.com>; Roper, Matthew D
> <matthew.d.roper@intel.com>
> Subject: Re: [Intel-gfx] [PATCH] drm/i915/mtl: Add support for PM DEMAND
> 
> On Mon, 03 Apr 2023, Mika Kahola <mika.kahola@intel.com> wrote:
> > Display14 introduces a new way to instruct the PUnit with power and
> > bandwidth requirements of DE. Add the functionality to program the
> > registers and handle waits using interrupts.
> > The current wait time for timeouts is programmed for 10 msecs to
> > factor in the worst case scenarios. Changes made to use REG_BIT for a
> > register that we touched(GEN8_DE_MISC_IER _MMIO).
> >
> > v2:
> >   - Removed repeated definition of dbuf, which has been moved to struct
> >     intel_display. (Gustavo)
> >   - s/dev_priv->dbuf/dev_priv->display.dbuf/ (Gustavo)
> >
> > Bspec: 66451, 64636, 64602, 64603
> > Cc: Matt Atwood <matthew.s.atwood@intel.com>
> > Cc: Matt Roper <matthew.d.roper@intel.com>
> > Cc: Lucas De Marchi <lucas.demarchi@intel.com>
> > Cc: Gustavo Sousa <gustavo.sousa@intel.com>
> > Signed-off-by: José Roberto de Souza <jose.souza@intel.com>
> > Signed-off-by: Radhakrishna Sripada <radhakrishna.sripada@intel.com>
> > Signed-off-by: Mika Kahola <mika.kahola@intel.com>
> > ---
> >  drivers/gpu/drm/i915/display/intel_bw.c       |   4 +-
> >  drivers/gpu/drm/i915/display/intel_bw.h       |   2 +
> >  drivers/gpu/drm/i915/display/intel_display.c  |  14 +
> >  .../drm/i915/display/intel_display_power.c    |   8 +
> >  drivers/gpu/drm/i915/i915_drv.h               |   6 +
> >  drivers/gpu/drm/i915/i915_irq.c               |  22 +-
> >  drivers/gpu/drm/i915/i915_reg.h               |  33 +-
> >  drivers/gpu/drm/i915/intel_pm.c               | 293 ++++++++++++++++++
> 
> This is the wrong place.
> 
> I've got reviewed patches to rename this to intel_clock_gating.c because that's
> what it has left. Everything else has been moved out. They would've been
> pushed already but there was a conflict so waited out a bit.
> 
> Maybe a new display/intel_pmdemand.[ch]? This is only about display, right?

Ok. This is about display. I look into if we need to create a new file for this.

> 
> >  drivers/gpu/drm/i915/intel_pm.h               |  35 +++
> >  9 files changed, 412 insertions(+), 5 deletions(-)
> >
> > diff --git a/drivers/gpu/drm/i915/display/intel_bw.c
> > b/drivers/gpu/drm/i915/display/intel_bw.c
> > index 202321ffbe2a..87c20bf52123 100644
> > --- a/drivers/gpu/drm/i915/display/intel_bw.c
> > +++ b/drivers/gpu/drm/i915/display/intel_bw.c
> > @@ -746,8 +746,8 @@ static unsigned int intel_bw_num_active_planes(struct
> drm_i915_private *dev_priv
> >  	return num_active_planes;
> >  }
> >
> > -static unsigned int intel_bw_data_rate(struct drm_i915_private *dev_priv,
> > -				       const struct intel_bw_state *bw_state)
> > +unsigned int intel_bw_data_rate(struct drm_i915_private *dev_priv,
> > +				const struct intel_bw_state *bw_state)
> >  {
> >  	unsigned int data_rate = 0;
> >  	enum pipe pipe;
> > diff --git a/drivers/gpu/drm/i915/display/intel_bw.h
> > b/drivers/gpu/drm/i915/display/intel_bw.h
> > index f20292143745..17fc0b61db04 100644
> > --- a/drivers/gpu/drm/i915/display/intel_bw.h
> > +++ b/drivers/gpu/drm/i915/display/intel_bw.h
> > @@ -62,6 +62,8 @@ int intel_bw_init(struct drm_i915_private
> > *dev_priv);  int intel_bw_atomic_check(struct intel_atomic_state
> > *state);  void intel_bw_crtc_update(struct intel_bw_state *bw_state,
> >  			  const struct intel_crtc_state *crtc_state);
> > +unsigned int intel_bw_data_rate(struct drm_i915_private *dev_priv,
> > +				const struct intel_bw_state *bw_state);
> >  int icl_pcode_restrict_qgv_points(struct drm_i915_private *dev_priv,
> >  				  u32 points_mask);
> >  int intel_bw_calc_min_cdclk(struct intel_atomic_state *state, diff
> > --git a/drivers/gpu/drm/i915/display/intel_display.c
> > b/drivers/gpu/drm/i915/display/intel_display.c
> > index b53a1d969344..ee7ca33123b1 100644
> > --- a/drivers/gpu/drm/i915/display/intel_display.c
> > +++ b/drivers/gpu/drm/i915/display/intel_display.c
> > @@ -959,6 +959,9 @@ intel_get_crtc_new_encoder(const struct
> intel_atomic_state *state,
> >  		num_encoders++;
> >  	}
> >
> > +	if (!encoder)
> > +		return NULL;
> > +
> 
> How's this related?
> 
> >  	drm_WARN(encoder->base.dev, num_encoders != 1,
> >  		 "%d encoders for pipe %c\n",
> >  		 num_encoders, pipe_name(master_crtc->pipe)); @@ -6767,6
> +6770,10
> > @@ int intel_atomic_check(struct drm_device *dev,
> >  		ret = intel_modeset_calc_cdclk(state);
> >  		if (ret)
> >  			return ret;
> > +
> > +		ret = intel_pmdemand_atomic_check(state);
> > +		if (ret)
> > +			goto fail;
> >  	}
> >
> >  	ret = intel_atomic_check_crtcs(state); @@ -7411,6 +7418,7 @@ static
> > void intel_atomic_commit_tail(struct intel_atomic_state *state)
> >  	}
> >
> >  	intel_sagv_pre_plane_update(state);
> > +	intel_pmdemand_pre_plane_update(state);
> >
> >  	/* Complete the events for pipes that have now been disabled */
> >  	for_each_new_intel_crtc_in_state(state, crtc, new_crtc_state, i) {
> > @@ -7523,6 +7531,7 @@ static void intel_atomic_commit_tail(struct
> intel_atomic_state *state)
> >  		intel_verify_planes(state);
> >
> >  	intel_sagv_post_plane_update(state);
> > +	intel_pmdemand_post_plane_update(state);
> >
> >  	drm_atomic_helper_commit_hw_done(&state->base);
> >
> > @@ -8250,6 +8259,7 @@ void intel_init_display_hooks(struct
> drm_i915_private *dev_priv)
> >  	intel_color_init_hooks(dev_priv);
> >  	intel_init_cdclk_hooks(dev_priv);
> >  	intel_audio_hooks_init(dev_priv);
> > +	intel_init_pmdemand(dev_priv);
> 
> intel_init_pmdemand()...
> 
> >
> >  	intel_dpll_init_clock_hook(dev_priv);
> >
> > @@ -8476,6 +8486,10 @@ int intel_modeset_init_noirq(struct
> drm_i915_private *i915)
> >  	if (ret)
> >  		goto cleanup_vga_client_pw_domain_dmc;
> >
> > +	ret = intel_pmdemand_init(i915);
> 
> ...and intel_pmdemand_init(). Please just no.

Right. Not really working well.

> ,
> Also, name them all intel_pmdemand_*().
> 
> > +	if (ret)
> > +		goto cleanup_vga_client_pw_domain_dmc;
> > +
> >  	init_llist_head(&i915->display.atomic_helper.free_list);
> >  	INIT_WORK(&i915->display.atomic_helper.free_work,
> >  		  intel_atomic_helper_free_state_worker);
> > diff --git a/drivers/gpu/drm/i915/display/intel_display_power.c
> > b/drivers/gpu/drm/i915/display/intel_display_power.c
> > index 5e85572dc8e4..04c172b5c17b 100644
> > --- a/drivers/gpu/drm/i915/display/intel_display_power.c
> > +++ b/drivers/gpu/drm/i915/display/intel_display_power.c
> > @@ -19,6 +19,7 @@
> >  #include "intel_mchbar_regs.h"
> >  #include "intel_pch_refclk.h"
> >  #include "intel_pcode.h"
> > +#include "intel_pm.h"
> >  #include "intel_pps_regs.h"
> >  #include "intel_snps_phy.h"
> >  #include "skl_watermark.h"
> > @@ -1083,6 +1084,10 @@ static void gen9_dbuf_enable(struct
> drm_i915_private *dev_priv)
> >  	dev_priv->display.dbuf.enabled_slices =
> >  		intel_enabled_dbuf_slices_mask(dev_priv);
> >
> > +	if (DISPLAY_VER(dev_priv) >= 14)
> > +		intel_program_dbuf_pmdemand(dev_priv, BIT(DBUF_S1) |
> > +					    dev_priv-
> >display.dbuf.enabled_slices);
> > +
> >  	/*
> >  	 * Just power up at least 1 slice, we will
> >  	 * figure out later which slices we have and what we need.
> > @@ -1094,6 +1099,9 @@ static void gen9_dbuf_enable(struct
> > drm_i915_private *dev_priv)  static void gen9_dbuf_disable(struct
> > drm_i915_private *dev_priv)  {
> >  	gen9_dbuf_slices_update(dev_priv, 0);
> > +
> > +	if (DISPLAY_VER(dev_priv) >= 14)
> > +		intel_program_dbuf_pmdemand(dev_priv, 0);
> >  }
> >
> >  static void gen12_dbuf_slices_config(struct drm_i915_private
> > *dev_priv) diff --git a/drivers/gpu/drm/i915/i915_drv.h
> > b/drivers/gpu/drm/i915/i915_drv.h index e771fdc3099c..2a73e726c6ed
> > 100644
> > --- a/drivers/gpu/drm/i915/i915_drv.h
> > +++ b/drivers/gpu/drm/i915/i915_drv.h
> > @@ -250,6 +250,12 @@ struct drm_i915_private {
> >  	unsigned int hpll_freq;
> >  	unsigned int czclk_freq;
> >
> > +	struct {
> > +		wait_queue_head_t waitqueue;
> > +		struct mutex lock;
> > +		struct intel_global_obj obj;
> > +	} pmdemand;
> > +
> 
> Please don't add new display stuff to struct drm_i915_private. See struct
> intel_display in display/intel_display_core.h.
Ok. I'll have a look at that

> 
> >  	/**
> >  	 * wq - Driver workqueue for GEM.
> >  	 *
> > diff --git a/drivers/gpu/drm/i915/i915_irq.c
> > b/drivers/gpu/drm/i915/i915_irq.c index c0888cc88d04..636033bb9650
> > 100644
> > --- a/drivers/gpu/drm/i915/i915_irq.c
> > +++ b/drivers/gpu/drm/i915/i915_irq.c
> > @@ -1913,6 +1913,11 @@ static u32 gen8_de_pipe_fault_mask(struct
> drm_i915_private *dev_priv)
> >  		return GEN8_DE_PIPE_IRQ_FAULT_ERRORS;  }
> >
> > +static void intel_pmdemand_irq_handler(struct drm_i915_private
> > +*dev_priv) {
> > +	wake_up_all(&dev_priv->pmdemand.waitqueue);
> > +}
> > +
> >  static void
> >  gen8_de_misc_irq_handler(struct drm_i915_private *dev_priv, u32 iir)
> > { @@ -1949,6 +1954,18 @@ gen8_de_misc_irq_handler(struct
> > drm_i915_private *dev_priv, u32 iir)
> >  		}
> >  	}
> >
> > +	if (iir & XELPDP_PMDEMAND_RSPTOUT_ERR) {
> > +		drm_dbg(&dev_priv->drm,
> > +			"Error waiting for Punit PM Demand Response\n");
> > +		intel_pmdemand_irq_handler(dev_priv);
> > +		found = true;
> > +	}
> > +
> > +	if (iir & XELPDP_PMDEMAND_RSP) {
> > +		intel_pmdemand_irq_handler(dev_priv);
> > +		found = true;
> > +	}
> > +
> >  	if (!found)
> >  		drm_err(&dev_priv->drm, "Unexpected DE Misc interrupt\n");  }
> @@
> > -3315,7 +3332,10 @@ static void gen8_de_irq_postinstall(struct
> drm_i915_private *dev_priv)
> >  	if (IS_GEMINILAKE(dev_priv) || IS_BROXTON(dev_priv))
> >  		de_port_masked |= BXT_DE_PORT_GMBUS;
> >
> > -	if (DISPLAY_VER(dev_priv) >= 11) {
> > +	if (DISPLAY_VER(dev_priv) >= 14)
> > +		de_misc_masked |= XELPDP_PMDEMAND_RSPTOUT_ERR |
> > +				  XELPDP_PMDEMAND_RSP;
> > +	else if (DISPLAY_VER(dev_priv) >= 11) {
> >  		enum port port;
> >
> >  		if (intel_bios_is_dsi_present(dev_priv, &port)) diff --git
> > a/drivers/gpu/drm/i915/i915_reg.h b/drivers/gpu/drm/i915/i915_reg.h
> > index 8d26fa2765c1..7f8e750665ed 100644
> > --- a/drivers/gpu/drm/i915/i915_reg.h
> > +++ b/drivers/gpu/drm/i915/i915_reg.h
> > @@ -4783,8 +4783,10 @@
> >  #define GEN8_DE_MISC_IMR _MMIO(0x44464)  #define GEN8_DE_MISC_IIR
> > _MMIO(0x44468)  #define GEN8_DE_MISC_IER _MMIO(0x4446c)
> > -#define  GEN8_DE_MISC_GSE		(1 << 27)
> > -#define  GEN8_DE_EDP_PSR		(1 << 19)
> > +#define  XELPDP_PMDEMAND_RSPTOUT_ERR	REG_BIT(27)
> > +#define  GEN8_DE_MISC_GSE		REG_BIT(27)
> > +#define  GEN8_DE_EDP_PSR		REG_BIT(19)
> > +#define  XELPDP_PMDEMAND_RSP		REG_BIT(3)
> >
> >  #define GEN8_PCU_ISR _MMIO(0x444e0)
> >  #define GEN8_PCU_IMR _MMIO(0x444e4)
> > @@ -4847,6 +4849,33 @@
> >  #define  GEN11_HOTPLUG_CTL_SHORT_DETECT(hpd_pin)	(1 <<
> (_HPD_PIN_TC(hpd_pin) * 4))
> >  #define  GEN11_HOTPLUG_CTL_NO_DETECT(hpd_pin)		(0 <<
> (_HPD_PIN_TC(hpd_pin) * 4))
> >
> > +#define XELPDP_INITIATE_PMDEMAND_REQUEST(dword)
> 	_MMIO(0x45230 + 4 * (dword))
> > +#define  XELPDP_PMDEMAND_QCLK_GV_BW_MASK
> 	REG_GENMASK(31, 16)
> > +#define  XELPDP_PMDEMAND_QCLK_GV_BW(x)
> 	REG_FIELD_PREP(XELPDP_PMDEMAND_QCLK_GV_BW_MASK, x)
> > +#define  XELPDP_PMDEMAND_VOLTAGE_INDEX_MASK
> 	REG_GENMASK(14, 12)
> > +#define  XELPDP_PMDEMAND_VOLTAGE_INDEX(x)
> 	REG_FIELD_PREP(XELPDP_PMDEMAND_VOLTAGE_INDEX_MASK, x)
> > +#define  XELPDP_PMDEMAND_QCLK_GV_INDEX_MASK
> 	REG_GENMASK(11, 8)
> > +#define  XELPDP_PMDEMAND_QCLK_GV_INDEX(x)
> 	REG_FIELD_PREP(XELPDP_PMDEMAND_QCLK_GV_INDEX_MASK, x)
> > +#define  XELPDP_PMDEMAND_PIPES_MASK
> 	REG_GENMASK(7, 6)
> > +#define  XELPDP_PMDEMAND_PIPES(x)
> 	REG_FIELD_PREP(XELPDP_PMDEMAND_PIPES_MASK, x)
> > +#define  XELPDP_PMDEMAND_DBUFS_MASK
> 	REG_GENMASK(5, 4)
> > +#define  XELPDP_PMDEMAND_DBUFS(x)
> 	REG_FIELD_PREP(XELPDP_PMDEMAND_DBUFS_MASK, x)
> > +#define  XELPDP_PMDEMAND_PHYS_MASK
> 	REG_GENMASK(2, 0)
> > +#define  XELPDP_PMDEMAND_PHYS(x)
> 	REG_FIELD_PREP(XELPDP_PMDEMAND_PHYS_MASK, x)
> > +
> > +#define  XELPDP_PMDEMAND_REQ_ENABLE			REG_BIT(31)
> > +#define  XELPDP_PMDEMAND_CDCLK_FREQ_MASK
> 	REG_GENMASK(30, 20)
> > +#define  XELPDP_PMDEMAND_CDCLK_FREQ(x)
> 	REG_FIELD_PREP(XELPDP_PMDEMAND_CDCLK_FREQ_MASK, x)
> > +#define  XELPDP_PMDEMAND_DDICLK_FREQ_MASK
> 	REG_GENMASK(18, 8)
> > +#define  XELPDP_PMDEMAND_DDICLK_FREQ(x)
> 	REG_FIELD_PREP(XELPDP_PMDEMAND_DDICLK_FREQ_MASK, x)
> > +#define  XELPDP_PMDEMAND_SCALERS_MASK
> 	REG_GENMASK(6, 4)
> > +#define  XELPDP_PMDEMAND_SCALERS(x)
> 	REG_FIELD_PREP(XELPDP_PMDEMAND_SCALERS_MASK, x)
> > +#define  XELPDP_PMDEMAND_PLLS_MASK
> 	REG_GENMASK(2, 0)
> > +#define  XELPDP_PMDEMAND_PLLS(x)
> 	REG_FIELD_PREP(XELPDP_PMDEMAND_PLLS_MASK, x)
> > +
> > +#define GEN12_DCPR_STATUS_1
> 	_MMIO(0x46440)
> > +#define  XELPDP_PMDEMAND_INFLIGHT_STATUS		REG_BIT(26)
> > +
> >  #define ILK_DISPLAY_CHICKEN2	_MMIO(0x42004)
> >  /* Required on all Ironlake and Sandybridge according to the B-Spec. */
> >  #define  ILK_ELPIN_409_SELECT	(1 << 25)
> > diff --git a/drivers/gpu/drm/i915/intel_pm.c
> > b/drivers/gpu/drm/i915/intel_pm.c index c45af0d981fd..877997e4141d
> > 100644
> > --- a/drivers/gpu/drm/i915/intel_pm.c
> > +++ b/drivers/gpu/drm/i915/intel_pm.c
> > @@ -25,6 +25,10 @@
> >   *
> >   */
> >
> > +#include <linux/bitops.h>
> > +
> > +#include "display/intel_bw.h"
> > +#include "display/intel_cdclk.h"
> >  #include "display/intel_de.h"
> >  #include "display/intel_display.h"
> >  #include "display/intel_display_trace.h"
> > @@ -40,6 +44,14 @@
> >  #include "intel_pm.h"
> >  #include "vlv_sideband.h"
> >
> > +bool intel_is_c10phy(struct drm_i915_private *dev_priv, enum phy phy)
> > +{
> > +        if (IS_METEORLAKE(dev_priv) && (phy < PHY_C))
> > +                return true;
> > +
> > +        return false;
> > +}
> 
> This doesn't belong here or in intel_pmdemand.c. It's just not about pm or
> pmdemand.

It doesn't belong here. This was needed though as the C10/20 phy patches hasn't landed yet.

> 
> > +
> >  struct drm_i915_clock_gating_funcs {
> >  	void (*init_clock_gating)(struct drm_i915_private *i915);  }; @@
> > -124,6 +136,287 @@ static void glk_init_clock_gating(struct drm_i915_private
> *dev_priv)
> >  		   PWM1_GATING_DIS | PWM2_GATING_DIS);  }
> >
> > +static struct intel_global_state
> > +*intel_pmdemand_duplicate_state(struct intel_global_obj *obj) {
> > +	struct intel_pmdemand_state *pmdmnd_state;
> > +
> > +	pmdmnd_state = kmemdup(obj->state, sizeof(*pmdmnd_state),
> GFP_KERNEL);
> > +	if (!pmdmnd_state)
> > +		return NULL;
> > +
> > +	return &pmdmnd_state->base;
> > +}
> > +
> > +static void intel_pmdemand_destroy_state(struct intel_global_obj *obj,
> > +					 struct intel_global_state *state) {
> > +	kfree(state);
> > +}
> > +
> > +static const struct intel_global_state_funcs intel_pmdemand_funcs = {
> > +	.atomic_duplicate_state = intel_pmdemand_duplicate_state,
> > +	.atomic_destroy_state = intel_pmdemand_destroy_state, };
> > +
> > +struct intel_pmdemand_state *
> > +intel_atomic_get_pmdemand_state(struct intel_atomic_state *state) {
> > +	struct drm_i915_private *dev_priv = to_i915(state->base.dev);
> > +	struct intel_global_state *pmdemand_state;
> > +
> > +	pmdemand_state = intel_atomic_get_global_obj_state(state,
> &dev_priv->pmdemand.obj);
> > +	if (IS_ERR(pmdemand_state))
> > +		return ERR_CAST(pmdemand_state);
> > +
> > +	return to_intel_pmdemand_state(pmdemand_state);
> > +}
> > +
> > +int intel_pmdemand_init(struct drm_i915_private *dev_priv) {
> > +	struct intel_pmdemand_state *pmdemand_state;
> > +
> > +	pmdemand_state = kzalloc(sizeof(*pmdemand_state), GFP_KERNEL);
> > +	if (!pmdemand_state)
> > +		return -ENOMEM;
> > +
> > +	intel_atomic_global_obj_init(dev_priv, &dev_priv->pmdemand.obj,
> > +				     &pmdemand_state->base,
> &intel_pmdemand_funcs);
> > +
> > +	return 0;
> > +}
> > +
> > +void intel_init_pmdemand(struct drm_i915_private *dev_priv) {
> > +	mutex_init(&dev_priv->pmdemand.lock);
> > +	init_waitqueue_head(&dev_priv->pmdemand.waitqueue);
> > +}
> > +
> > +int intel_pmdemand_atomic_check(struct intel_atomic_state *state) {
> > +	struct drm_i915_private *dev_priv = to_i915(state->base.dev);
> > +	struct intel_pmdemand_state *new_pmdemand_state = NULL;
> > +	struct intel_crtc_state *old_crtc_state, *new_crtc_state;
> > +	struct intel_crtc *crtc;
> > +	struct intel_encoder *encoder;
> > +	struct intel_bw_state *new_bw_state;
> > +	const struct intel_dbuf_state *new_dbuf_state;
> > +	const struct intel_cdclk_state *new_cdclk_state;
> > +	int port_clock = 0;
> > +	unsigned int data_rate;
> > +	enum phy phy;
> > +	int i, ret;
> > +
> > +	if (DISPLAY_VER(dev_priv) < 14)
> > +		return 0;
> > +
> > +	new_pmdemand_state = intel_atomic_get_pmdemand_state(state);
> > +	if (IS_ERR(new_pmdemand_state))
> > +		return PTR_ERR(new_pmdemand_state);
> > +
> > +	ret = intel_atomic_lock_global_state(&new_pmdemand_state->base);
> > +	if (ret)
> > +		return ret;
> > +
> > +	/* Punit figures out the voltage index based on bandwidth*/
> > +	new_bw_state = intel_atomic_get_bw_state(state);
> > +	if (IS_ERR(new_bw_state))
> > +		return PTR_ERR(new_bw_state);
> > +
> > +	/* firmware will calculate the qclck_gc_index, requirement is set to 0 */
> > +	new_pmdemand_state->qclk_gv_index = 0;
> > +
> > +	data_rate = intel_bw_data_rate(dev_priv, new_bw_state);
> > +	/* To MBs then to multiples of 100MBs */
> > +	data_rate = DIV_ROUND_UP(data_rate, 1000);
> > +	data_rate = DIV_ROUND_UP(data_rate, 100);
> > +	new_pmdemand_state->qclk_gv_bw = data_rate;
> > +
> > +	new_dbuf_state = intel_atomic_get_dbuf_state(state);
> > +	if (IS_ERR(new_dbuf_state))
> > +		return PTR_ERR(new_dbuf_state);
> > +
> > +	i = hweight8(new_dbuf_state->active_pipes);
> > +	new_pmdemand_state->active_pipes = min(i, 3);
> > +
> > +	new_cdclk_state = intel_atomic_get_cdclk_state(state);
> > +	if (IS_ERR(new_cdclk_state))
> > +		return PTR_ERR(new_cdclk_state);
> > +
> > +	new_pmdemand_state->voltage_index = new_cdclk_state-
> >logical.voltage_level;
> > +	/* KHz to MHz */
> > +	new_pmdemand_state->cdclk_freq_mhz =
> > +DIV_ROUND_UP(new_cdclk_state->logical.cdclk, 1000);
> > +
> > +	new_pmdemand_state->active_phys_plls_mask = 0;
> > +
> > +	for_each_oldnew_intel_crtc_in_state(state, crtc, old_crtc_state,
> new_crtc_state, i) {
> > +		if (!new_crtc_state->hw.active)
> > +			continue;
> > +
> > +		encoder = intel_get_crtc_new_encoder(state, new_crtc_state);
> > +		if (!encoder)
> > +			continue;
> > +
> > +		phy = intel_port_to_phy(dev_priv, encoder->port);
> > +
> > +		if (intel_is_c10phy(dev_priv, phy))
> > +			new_pmdemand_state->active_phys_plls_mask |=
> BIT(phy);
> > +
> > +		port_clock = max(port_clock, new_crtc_state->port_clock);
> > +	}
> > +
> > +	/* To MHz */
> > +	new_pmdemand_state->ddiclk_freq_mhz =
> DIV_ROUND_UP(port_clock,
> > +1000);
> > +
> > +	/*
> > +	 * Setting scalers to max as it can not be calculated during flips and
> > +	 * fastsets without taking global states locks.
> > +	 */
> > +	new_pmdemand_state->scalers = 7;
> > +
> > +	return 0;
> > +}
> > +
> > +static bool intel_pmdemand_check_prev_transaction(struct
> > +drm_i915_private *dev_priv) {
> > +	return !((intel_de_read(dev_priv,
> XELPDP_INITIATE_PMDEMAND_REQUEST(1)) &
> XELPDP_PMDEMAND_REQ_ENABLE) ||
> > +		(intel_de_read(dev_priv, GEN12_DCPR_STATUS_1) &
> > +XELPDP_PMDEMAND_INFLIGHT_STATUS));
> > +}
> > +
> > +static bool intel_pmdemand_req_complete(struct drm_i915_private
> > +*dev_priv) {
> > +	return !(intel_de_read(dev_priv,
> > +XELPDP_INITIATE_PMDEMAND_REQUEST(1)) &
> XELPDP_PMDEMAND_REQ_ENABLE); }
> > +
> > +static int intel_pmdemand_wait(struct drm_i915_private *dev_priv) {
> > +	DEFINE_WAIT(wait);
> > +	int ret;
> > +	const unsigned int timeout_ms = 10;
> > +
> > +	add_wait_queue(&dev_priv->pmdemand.waitqueue, &wait);
> > +
> > +	ret = wait_event_timeout(dev_priv->pmdemand.waitqueue,
> > +				 intel_pmdemand_req_complete(dev_priv),
> > +				 msecs_to_jiffies_timeout(timeout_ms));
> > +	if (ret < 0)
> > +		drm_err(&dev_priv->drm,
> > +			"timed out waiting for Punit PM Demand Response\n");
> > +
> > +	remove_wait_queue(&dev_priv->pmdemand.waitqueue, &wait);
> > +
> > +	return ret;
> > +}
> > +
> > +/* Required to be programmed during Display Init Sequences. */ void
> > +intel_program_dbuf_pmdemand(struct drm_i915_private *dev_priv,
> > +				 u8 dbuf_slices)
> > +{
> > +	mutex_lock(&dev_priv->pmdemand.lock);
> > +	if (drm_WARN_ON(&dev_priv->drm,
> > +			!intel_pmdemand_check_prev_transaction(dev_priv)))
> > +		goto unlock;
> > +
> > +	intel_de_rmw(dev_priv, XELPDP_INITIATE_PMDEMAND_REQUEST(0),
> > +		     XELPDP_PMDEMAND_DBUFS_MASK,
> > +		     XELPDP_PMDEMAND_DBUFS(hweight32(dbuf_slices)));
> > +	intel_de_rmw(dev_priv, XELPDP_INITIATE_PMDEMAND_REQUEST(1), 0,
> > +		     XELPDP_PMDEMAND_REQ_ENABLE);
> > +
> > +	intel_pmdemand_wait(dev_priv);
> > +unlock:
> > +	mutex_unlock(&dev_priv->pmdemand.lock);
> > +}
> > +
> > +static void intel_program_pmdemand(struct drm_i915_private *dev_priv,
> > +				   const struct intel_pmdemand_state *new,
> > +				   const struct intel_pmdemand_state *old) {
> > +	u32 val, tmp;
> > +
> > +#define UPDATE_PMDEMAND_VAL(val, F, f) do {            \
> > +	val &= (~(XELPDP_PMDEMAND_##F##_MASK));         \
> > +	val |= (XELPDP_PMDEMAND_##F((u32)(old ? max(old->f, new->f) :
> > +new->f))); \ } while (0)
> 
> I'm not convinced this makes the code easier to follow.
> 
> > +
> > +	mutex_lock(&dev_priv->pmdemand.lock);
> > +	if (drm_WARN_ON(&dev_priv->drm,
> > +			!intel_pmdemand_check_prev_transaction(dev_priv)))
> > +		goto unlock;
> > +
> > +	/*
> > +	 * TODO: Update programming PM Demand for
> > +	 * PHYS, PLLS, DDI_CLKFREQ, SCALARS
> > +	 */
> > +	val = intel_de_read(dev_priv,
> XELPDP_INITIATE_PMDEMAND_REQUEST(0));
> > +	UPDATE_PMDEMAND_VAL(val, QCLK_GV_INDEX, qclk_gv_index);
> > +	UPDATE_PMDEMAND_VAL(val, QCLK_GV_BW, qclk_gv_bw);
> > +	UPDATE_PMDEMAND_VAL(val, VOLTAGE_INDEX, voltage_index);
> > +	UPDATE_PMDEMAND_VAL(val, PIPES, active_pipes);
> > +	UPDATE_PMDEMAND_VAL(val, DBUFS, dbufs);
> > +	tmp = hweight32(new->active_phys_plls_mask);
> > +	if (old)
> > +		tmp = max(tmp, hweight32(old->active_phys_plls_mask));
> > +	val |= XELPDP_PMDEMAND_PHYS(tmp);
> > +
> > +	intel_de_write(dev_priv, XELPDP_INITIATE_PMDEMAND_REQUEST(0),
> val);
> > +
> > +	val = intel_de_read(dev_priv,
> XELPDP_INITIATE_PMDEMAND_REQUEST(1));
> > +	UPDATE_PMDEMAND_VAL(val, CDCLK_FREQ, cdclk_freq_mhz);
> > +	UPDATE_PMDEMAND_VAL(val, DDICLK_FREQ, ddiclk_freq_mhz);
> > +	UPDATE_PMDEMAND_VAL(val, SCALERS, scalers);
> > +	/*
> > +	 * Active_PLLs starts with 1 because of CDCLK PLL.
> > +	 * TODO: Missing to account genlock filter when it gets used.
> > +	 */
> > +	val |= XELPDP_PMDEMAND_PLLS(tmp + 1);
> > +
> > +	intel_de_write(dev_priv, XELPDP_INITIATE_PMDEMAND_REQUEST(1),
> val);
> > +
> > +#undef UPDATE_PM_DEMAND_VAL
> > +
> > +	intel_de_rmw(dev_priv, XELPDP_INITIATE_PMDEMAND_REQUEST(1), 0,
> > +XELPDP_PMDEMAND_REQ_ENABLE);
> > +
> > +	intel_pmdemand_wait(dev_priv);
> > +unlock:
> > +	mutex_unlock(&dev_priv->pmdemand.lock);
> > +}
> > +
> > +void intel_pmdemand_pre_plane_update(struct intel_atomic_state
> > +*state) {
> > +	struct drm_i915_private *dev_priv = to_i915(state->base.dev);
> > +	const struct intel_pmdemand_state *new_pmdmnd_state =
> > +		intel_atomic_get_new_pmdemand_state(state);
> > +	const struct intel_pmdemand_state *old_pmdmnd_state =
> > +		intel_atomic_get_old_pmdemand_state(state);
> > +
> > +	if (DISPLAY_VER(dev_priv) < 14)
> > +		return;
> > +
> > +	if (!new_pmdmnd_state ||
> > +	    memcmp(new_pmdmnd_state, old_pmdmnd_state,
> sizeof(*new_pmdmnd_state)) == 0)
> > +		return;
> > +
> > +	intel_program_pmdemand(dev_priv, new_pmdmnd_state,
> > +old_pmdmnd_state); }
> > +
> > +void intel_pmdemand_post_plane_update(struct intel_atomic_state
> > +*state) {
> > +	struct drm_i915_private *dev_priv = to_i915(state->base.dev);
> > +	const struct intel_pmdemand_state *new_pmdmnd_state =
> > +		intel_atomic_get_new_pmdemand_state(state);
> > +	const struct intel_pmdemand_state *old_pmdmnd_state =
> > +		intel_atomic_get_old_pmdemand_state(state);
> > +
> > +	if (DISPLAY_VER(dev_priv) < 14)
> > +		return;
> > +
> > +	if (!new_pmdmnd_state ||
> > +	    memcmp(new_pmdmnd_state, old_pmdmnd_state,
> sizeof(*new_pmdmnd_state)) == 0)
> > +		return;
> > +
> > +	intel_program_pmdemand(dev_priv, new_pmdmnd_state, NULL); }
> > +
> >  static void ibx_init_clock_gating(struct drm_i915_private *dev_priv)
> > {
> >  	/*
> > diff --git a/drivers/gpu/drm/i915/intel_pm.h
> > b/drivers/gpu/drm/i915/intel_pm.h index f774bddcdca6..2663bec408c7
> > 100644
> > --- a/drivers/gpu/drm/i915/intel_pm.h
> > +++ b/drivers/gpu/drm/i915/intel_pm.h
> > @@ -8,11 +8,46 @@
> >
> >  #include <linux/types.h>
> >
> > +#include "display/intel_global_state.h"
> > +
> >  struct drm_i915_private;
> >  struct intel_crtc_state;
> >  struct intel_plane_state;
> >
,> >  void intel_init_clock_gating(struct drm_i915_private *dev_priv);
> > +void intel_init_pmdemand(struct drm_i915_private *dev_priv);
> >  void intel_init_clock_gating_hooks(struct drm_i915_private
> > *dev_priv);
> >
> > +struct intel_pmdemand_state {
> > +	struct intel_global_state base;
> > +
> > +	u16 qclk_gv_bw;
> > +	u8 voltage_index;
> > +	u8 qclk_gv_index;
> > +	u8 active_pipes;
> > +	u8 dbufs;
> > +	u8 active_phys_plls_mask;
> > +	u16 cdclk_freq_mhz;
> > +	u16 ddiclk_freq_mhz;
> > +	u8 scalers;
> > +};
> 
> Could this actually be private to intel_pmdemand.c?

It probably could. I have to double check this

> 
> > +
> > +int intel_pmdemand_init(struct drm_i915_private *dev_priv);
> > +
> > +struct intel_pmdemand_state *
> > +intel_atomic_get_pmdemand_state(struct intel_atomic_state *state);
> > +
> > +#define to_intel_pmdemand_state(x) container_of((x), struct
> > +intel_pmdemand_state, base) #define
> intel_atomic_get_old_pmdemand_state(state) \
> > +
> 	to_intel_pmdemand_state(intel_atomic_get_old_global_obj_state(stat
> e,
> > +&to_i915(state->base.dev)->pmdemand.obj))
> > +#define intel_atomic_get_new_pmdemand_state(state) \
> > +
> 	to_intel_pmdemand_state(intel_atomic_get_new_global_obj_state(sta
> te,
> > +&to_i915(state->base.dev)->pmdemand.obj))
> 
> Please just make these proper functions and hide the details. I've been meaning
> to do that elsewhere too. This shouldn't have to include intel_global_state.h.

Ok. This needs to be rewritten.

Thanks for review and comments.

-Mika-

> 
> > +
> > +int intel_pmdemand_init(struct drm_i915_private *dev_priv); void
> > +intel_program_dbuf_pmdemand(struct drm_i915_private *dev_priv,
> > +				 u8 dbuf_slices);
> 
> intel_pmdemand_* naming please, if these will be put in intel_pmdemand.[ch].
> 
> > +void intel_pmdemand_pre_plane_update(struct intel_atomic_state
> > +*state); void intel_pmdemand_post_plane_update(struct
> > +intel_atomic_state *state); int intel_pmdemand_atomic_check(struct
> > +intel_atomic_state *state);
> > +
> >  #endif /* __INTEL_PM_H__ */
> 
> --
> Jani Nikula, Intel Open Source Graphics Center

^ permalink raw reply	[flat|nested] 13+ messages in thread

* Re: [Intel-gfx] [PATCH] drm/i915/mtl: Add support for PM DEMAND
  2023-04-03  8:50 [Intel-gfx] [PATCH] drm/i915/mtl: Add support for PM DEMAND Mika Kahola
  2023-04-03  9:17 ` Jani Nikula
  2023-04-03 10:55 ` kernel test robot
@ 2023-04-03 13:49 ` kernel test robot
  2023-04-03 17:33 ` kernel test robot
                   ` (3 subsequent siblings)
  6 siblings, 0 replies; 13+ messages in thread
From: kernel test robot @ 2023-04-03 13:49 UTC (permalink / raw)
  To: Mika Kahola; +Cc: oe-kbuild-all

Hi Mika,

Thank you for the patch! Perhaps something to improve:

[auto build test WARNING on drm-tip/drm-tip]

url:    https://github.com/intel-lab-lkp/linux/commits/Mika-Kahola/drm-i915-mtl-Add-support-for-PM-DEMAND/20230403-165720
base:   git://anongit.freedesktop.org/drm/drm-tip drm-tip
patch link:    https://lore.kernel.org/r/20230403085043.2219092-1-mika.kahola%40intel.com
patch subject: [Intel-gfx] [PATCH] drm/i915/mtl: Add support for PM DEMAND
config: i386-randconfig-a016-20230403 (https://download.01.org/0day-ci/archive/20230403/202304032107.aoVUtLmT-lkp@intel.com/config)
compiler: gcc-11 (Debian 11.3.0-8) 11.3.0
reproduce (this is a W=1 build):
        # https://github.com/intel-lab-lkp/linux/commit/4be7899ed410c745e6af3dbc42d17ee129ba5fd5
        git remote add linux-review https://github.com/intel-lab-lkp/linux
        git fetch --no-tags linux-review Mika-Kahola/drm-i915-mtl-Add-support-for-PM-DEMAND/20230403-165720
        git checkout 4be7899ed410c745e6af3dbc42d17ee129ba5fd5
        # save the config file
        mkdir build_dir && cp config build_dir/.config
        make W=1 O=build_dir ARCH=i386 olddefconfig
        make W=1 O=build_dir ARCH=i386 SHELL=/bin/bash drivers/gpu/drm/i915/

If you fix the issue, kindly add following tag where applicable
| Reported-by: kernel test robot <lkp@intel.com>
| Link: https://lore.kernel.org/oe-kbuild-all/202304032107.aoVUtLmT-lkp@intel.com/

All warnings (new ones prefixed by >>):

>> drivers/gpu/drm/i915/intel_pm.c:47:6: warning: no previous prototype for 'intel_is_c10phy' [-Wmissing-prototypes]
      47 | bool intel_is_c10phy(struct drm_i915_private *dev_priv, enum phy phy)
         |      ^~~~~~~~~~~~~~~


vim +/intel_is_c10phy +47 drivers/gpu/drm/i915/intel_pm.c

    46	
  > 47	bool intel_is_c10phy(struct drm_i915_private *dev_priv, enum phy phy)
    48	{
    49	        if (IS_METEORLAKE(dev_priv) && (phy < PHY_C))
    50	                return true;
    51	
    52	        return false;
    53	}
    54	

-- 
0-DAY CI Kernel Test Service
https://github.com/intel/lkp-tests

^ permalink raw reply	[flat|nested] 13+ messages in thread

* Re: [Intel-gfx] [PATCH] drm/i915/mtl: Add support for PM DEMAND
  2023-04-03  8:50 [Intel-gfx] [PATCH] drm/i915/mtl: Add support for PM DEMAND Mika Kahola
                   ` (2 preceding siblings ...)
  2023-04-03 13:49 ` kernel test robot
@ 2023-04-03 17:33 ` kernel test robot
  2023-04-03 17:33 ` kernel test robot
                   ` (2 subsequent siblings)
  6 siblings, 0 replies; 13+ messages in thread
From: kernel test robot @ 2023-04-03 17:33 UTC (permalink / raw)
  To: Mika Kahola; +Cc: llvm, oe-kbuild-all

Hi Mika,

kernel test robot noticed the following build errors:

[auto build test ERROR on drm-tip/drm-tip]

url:    https://github.com/intel-lab-lkp/linux/commits/Mika-Kahola/drm-i915-mtl-Add-support-for-PM-DEMAND/20230403-165720
base:   git://anongit.freedesktop.org/drm/drm-tip drm-tip
patch link:    https://lore.kernel.org/r/20230403085043.2219092-1-mika.kahola%40intel.com
patch subject: [Intel-gfx] [PATCH] drm/i915/mtl: Add support for PM DEMAND
config: x86_64-randconfig-r031-20230403 (https://download.01.org/0day-ci/archive/20230404/202304040133.G6vbHTdV-lkp@intel.com/config)
compiler: clang version 14.0.6 (https://github.com/llvm/llvm-project f28c006a5895fc0e329fe15fead81e37457cb1d1)
reproduce (this is a W=1 build):
        wget https://raw.githubusercontent.com/intel/lkp-tests/master/sbin/make.cross -O ~/bin/make.cross
        chmod +x ~/bin/make.cross
        # https://github.com/intel-lab-lkp/linux/commit/4be7899ed410c745e6af3dbc42d17ee129ba5fd5
        git remote add linux-review https://github.com/intel-lab-lkp/linux
        git fetch --no-tags linux-review Mika-Kahola/drm-i915-mtl-Add-support-for-PM-DEMAND/20230403-165720
        git checkout 4be7899ed410c745e6af3dbc42d17ee129ba5fd5
        # save the config file
        mkdir build_dir && cp config build_dir/.config
        COMPILER_INSTALL_PATH=$HOME/0day COMPILER=clang make.cross W=1 O=build_dir ARCH=x86_64 olddefconfig
        COMPILER_INSTALL_PATH=$HOME/0day COMPILER=clang make.cross W=1 O=build_dir ARCH=x86_64 SHELL=/bin/bash drivers/gpu/drm/i915/

If you fix the issue, kindly add following tag where applicable
| Reported-by: kernel test robot <lkp@intel.com>
| Link: https://lore.kernel.org/oe-kbuild-all/202304040133.G6vbHTdV-lkp@intel.com/

All errors (new ones prefixed by >>):

>> drivers/gpu/drm/i915/intel_pm.c:47:6: error: no previous prototype for function 'intel_is_c10phy' [-Werror,-Wmissing-prototypes]
   bool intel_is_c10phy(struct drm_i915_private *dev_priv, enum phy phy)
        ^
   drivers/gpu/drm/i915/intel_pm.c:47:1: note: declare 'static' if the function is not intended to be used outside of this translation unit
   bool intel_is_c10phy(struct drm_i915_private *dev_priv, enum phy phy)
   ^
   static 
   1 error generated.


vim +/intel_is_c10phy +47 drivers/gpu/drm/i915/intel_pm.c

    46	
  > 47	bool intel_is_c10phy(struct drm_i915_private *dev_priv, enum phy phy)
    48	{
    49	        if (IS_METEORLAKE(dev_priv) && (phy < PHY_C))
    50	                return true;
    51	
    52	        return false;
    53	}
    54	

-- 
0-DAY CI Kernel Test Service
https://github.com/intel/lkp-tests

^ permalink raw reply	[flat|nested] 13+ messages in thread

* Re: [Intel-gfx] [PATCH] drm/i915/mtl: Add support for PM DEMAND
  2023-04-03  8:50 [Intel-gfx] [PATCH] drm/i915/mtl: Add support for PM DEMAND Mika Kahola
                   ` (3 preceding siblings ...)
  2023-04-03 17:33 ` kernel test robot
@ 2023-04-03 17:33 ` kernel test robot
  2023-04-03 19:07 ` [Intel-gfx] ✗ Fi.CI.BUILD: failure for " Patchwork
  2023-04-11 22:47 ` [Intel-gfx] [PATCH] " Gustavo Sousa
  6 siblings, 0 replies; 13+ messages in thread
From: kernel test robot @ 2023-04-03 17:33 UTC (permalink / raw)
  To: Mika Kahola; +Cc: llvm, oe-kbuild-all

Hi Mika,

kernel test robot noticed the following build warnings:

[auto build test WARNING on drm-tip/drm-tip]

url:    https://github.com/intel-lab-lkp/linux/commits/Mika-Kahola/drm-i915-mtl-Add-support-for-PM-DEMAND/20230403-165720
base:   git://anongit.freedesktop.org/drm/drm-tip drm-tip
patch link:    https://lore.kernel.org/r/20230403085043.2219092-1-mika.kahola%40intel.com
patch subject: [Intel-gfx] [PATCH] drm/i915/mtl: Add support for PM DEMAND
config: i386-randconfig-a002-20230403 (https://download.01.org/0day-ci/archive/20230404/202304040120.VkYG8WG8-lkp@intel.com/config)
compiler: clang version 14.0.6 (https://github.com/llvm/llvm-project f28c006a5895fc0e329fe15fead81e37457cb1d1)
reproduce (this is a W=1 build):
        wget https://raw.githubusercontent.com/intel/lkp-tests/master/sbin/make.cross -O ~/bin/make.cross
        chmod +x ~/bin/make.cross
        # https://github.com/intel-lab-lkp/linux/commit/4be7899ed410c745e6af3dbc42d17ee129ba5fd5
        git remote add linux-review https://github.com/intel-lab-lkp/linux
        git fetch --no-tags linux-review Mika-Kahola/drm-i915-mtl-Add-support-for-PM-DEMAND/20230403-165720
        git checkout 4be7899ed410c745e6af3dbc42d17ee129ba5fd5
        # save the config file
        mkdir build_dir && cp config build_dir/.config
        COMPILER_INSTALL_PATH=$HOME/0day COMPILER=clang make.cross W=1 O=build_dir ARCH=i386 olddefconfig
        COMPILER_INSTALL_PATH=$HOME/0day COMPILER=clang make.cross W=1 O=build_dir ARCH=i386 SHELL=/bin/bash drivers/gpu/drm/i915/

If you fix the issue, kindly add following tag where applicable
| Reported-by: kernel test robot <lkp@intel.com>
| Link: https://lore.kernel.org/oe-kbuild-all/202304040120.VkYG8WG8-lkp@intel.com/

All warnings (new ones prefixed by >>):

>> drivers/gpu/drm/i915/intel_pm.c:47:6: warning: no previous prototype for function 'intel_is_c10phy' [-Wmissing-prototypes]
   bool intel_is_c10phy(struct drm_i915_private *dev_priv, enum phy phy)
        ^
   drivers/gpu/drm/i915/intel_pm.c:47:1: note: declare 'static' if the function is not intended to be used outside of this translation unit
   bool intel_is_c10phy(struct drm_i915_private *dev_priv, enum phy phy)
   ^
   static 
   1 warning generated.


vim +/intel_is_c10phy +47 drivers/gpu/drm/i915/intel_pm.c

    46	
  > 47	bool intel_is_c10phy(struct drm_i915_private *dev_priv, enum phy phy)
    48	{
    49	        if (IS_METEORLAKE(dev_priv) && (phy < PHY_C))
    50	                return true;
    51	
    52	        return false;
    53	}
    54	

-- 
0-DAY CI Kernel Test Service
https://github.com/intel/lkp-tests

^ permalink raw reply	[flat|nested] 13+ messages in thread

* [Intel-gfx] ✗ Fi.CI.BUILD: failure for drm/i915/mtl: Add support for PM DEMAND
  2023-04-03  8:50 [Intel-gfx] [PATCH] drm/i915/mtl: Add support for PM DEMAND Mika Kahola
                   ` (4 preceding siblings ...)
  2023-04-03 17:33 ` kernel test robot
@ 2023-04-03 19:07 ` Patchwork
  2023-04-11 22:47 ` [Intel-gfx] [PATCH] " Gustavo Sousa
  6 siblings, 0 replies; 13+ messages in thread
From: Patchwork @ 2023-04-03 19:07 UTC (permalink / raw)
  To: Kahola, Mika; +Cc: intel-gfx

== Series Details ==

Series: drm/i915/mtl: Add support for PM DEMAND
URL   : https://patchwork.freedesktop.org/series/116012/
State : failure

== Summary ==

Error: make failed
  CALL    scripts/checksyscalls.sh
  DESCEND objtool
  INSTALL libsubcmd_headers
  CC [M]  drivers/gpu/drm/i915/intel_pm.o
drivers/gpu/drm/i915/intel_pm.c:47:6: error: no previous prototype for ‘intel_is_c10phy’ [-Werror=missing-prototypes]
   47 | bool intel_is_c10phy(struct drm_i915_private *dev_priv, enum phy phy)
      |      ^~~~~~~~~~~~~~~
cc1: all warnings being treated as errors
make[5]: *** [scripts/Makefile.build:252: drivers/gpu/drm/i915/intel_pm.o] Error 1
make[4]: *** [scripts/Makefile.build:494: drivers/gpu/drm/i915] Error 2
make[3]: *** [scripts/Makefile.build:494: drivers/gpu/drm] Error 2
make[2]: *** [scripts/Makefile.build:494: drivers/gpu] Error 2
make[1]: *** [scripts/Makefile.build:494: drivers] Error 2
make: *** [Makefile:2025: .] Error 2
Build failed, no error log produced



^ permalink raw reply	[flat|nested] 13+ messages in thread

* Re: [Intel-gfx] [PATCH] drm/i915/mtl: Add support for PM DEMAND
  2023-04-03  8:50 [Intel-gfx] [PATCH] drm/i915/mtl: Add support for PM DEMAND Mika Kahola
                   ` (5 preceding siblings ...)
  2023-04-03 19:07 ` [Intel-gfx] ✗ Fi.CI.BUILD: failure for " Patchwork
@ 2023-04-11 22:47 ` Gustavo Sousa
  2023-04-12  9:33   ` Jani Nikula
  6 siblings, 1 reply; 13+ messages in thread
From: Gustavo Sousa @ 2023-04-11 22:47 UTC (permalink / raw)
  To: Mika Kahola, intel-gfx; +Cc: Lucas De Marchi, Matt Roper

Quoting Mika Kahola (2023-04-03 05:50:43)
> Display14 introduces a new way to instruct the PUnit with
> power and bandwidth requirements of DE. Add the functionality
> to program the registers and handle waits using interrupts.
> The current wait time for timeouts is programmed for 10 msecs to
> factor in the worst case scenarios. Changes made to use REG_BIT
> for a register that we touched(GEN8_DE_MISC_IER _MMIO).
> 
> v2:
>   - Removed repeated definition of dbuf, which has been moved to struct
>     intel_display. (Gustavo)
>   - s/dev_priv->dbuf/dev_priv->display.dbuf/ (Gustavo)
> 
> Bspec: 66451, 64636, 64602, 64603
> Cc: Matt Atwood <matthew.s.atwood@intel.com>
> Cc: Matt Roper <matthew.d.roper@intel.com>
> Cc: Lucas De Marchi <lucas.demarchi@intel.com>
> Cc: Gustavo Sousa <gustavo.sousa@intel.com>
> Signed-off-by: José Roberto de Souza <jose.souza@intel.com>
> Signed-off-by: Radhakrishna Sripada <radhakrishna.sripada@intel.com>
> Signed-off-by: Mika Kahola <mika.kahola@intel.com>
> ---
>  drivers/gpu/drm/i915/display/intel_bw.c       |   4 +-
>  drivers/gpu/drm/i915/display/intel_bw.h       |   2 +
>  drivers/gpu/drm/i915/display/intel_display.c  |  14 +
>  .../drm/i915/display/intel_display_power.c    |   8 +
>  drivers/gpu/drm/i915/i915_drv.h               |   6 +
>  drivers/gpu/drm/i915/i915_irq.c               |  22 +-
>  drivers/gpu/drm/i915/i915_reg.h               |  33 +-
>  drivers/gpu/drm/i915/intel_pm.c               | 293 ++++++++++++++++++
>  drivers/gpu/drm/i915/intel_pm.h               |  35 +++
>  9 files changed, 412 insertions(+), 5 deletions(-)
> 
> diff --git a/drivers/gpu/drm/i915/display/intel_bw.c b/drivers/gpu/drm/i915/display/intel_bw.c
> index 202321ffbe2a..87c20bf52123 100644
> --- a/drivers/gpu/drm/i915/display/intel_bw.c
> +++ b/drivers/gpu/drm/i915/display/intel_bw.c
> @@ -746,8 +746,8 @@ static unsigned int intel_bw_num_active_planes(struct drm_i915_private *dev_priv
>         return num_active_planes;
>  }
>  
> -static unsigned int intel_bw_data_rate(struct drm_i915_private *dev_priv,
> -                                 const struct intel_bw_state *bw_state)
> +unsigned int intel_bw_data_rate(struct drm_i915_private *dev_priv,
> +                          const struct intel_bw_state *bw_state)
>  {
>         unsigned int data_rate = 0;
>         enum pipe pipe;
> diff --git a/drivers/gpu/drm/i915/display/intel_bw.h b/drivers/gpu/drm/i915/display/intel_bw.h
> index f20292143745..17fc0b61db04 100644
> --- a/drivers/gpu/drm/i915/display/intel_bw.h
> +++ b/drivers/gpu/drm/i915/display/intel_bw.h
> @@ -62,6 +62,8 @@ int intel_bw_init(struct drm_i915_private *dev_priv);
>  int intel_bw_atomic_check(struct intel_atomic_state *state);
>  void intel_bw_crtc_update(struct intel_bw_state *bw_state,
>                           const struct intel_crtc_state *crtc_state);
> +unsigned int intel_bw_data_rate(struct drm_i915_private *dev_priv,
> +                          const struct intel_bw_state *bw_state);
>  int icl_pcode_restrict_qgv_points(struct drm_i915_private *dev_priv,
>                                   u32 points_mask);
>  int intel_bw_calc_min_cdclk(struct intel_atomic_state *state,
> diff --git a/drivers/gpu/drm/i915/display/intel_display.c b/drivers/gpu/drm/i915/display/intel_display.c
> index b53a1d969344..ee7ca33123b1 100644
> --- a/drivers/gpu/drm/i915/display/intel_display.c
> +++ b/drivers/gpu/drm/i915/display/intel_display.c
> @@ -959,6 +959,9 @@ intel_get_crtc_new_encoder(const struct intel_atomic_state *state,
>                 num_encoders++;
>         }
>  
> +  if (!encoder)
> +          return NULL;
> +

I believe callers of this function expect a warning to be issued if no encoder
(or more than one) was found for the crtc. With this we are changing that
behavior.

>         drm_WARN(encoder->base.dev, num_encoders != 1,
>                  "%d encoders for pipe %c\n",
>                  num_encoders, pipe_name(master_crtc->pipe));
> @@ -6767,6 +6770,10 @@ int intel_atomic_check(struct drm_device *dev,
>                 ret = intel_modeset_calc_cdclk(state);
>                 if (ret)
>                         return ret;
> +
> +          ret = intel_pmdemand_atomic_check(state);
> +          if (ret)
> +                  goto fail;
>         }
>  
>         ret = intel_atomic_check_crtcs(state);
> @@ -7411,6 +7418,7 @@ static void intel_atomic_commit_tail(struct intel_atomic_state *state)
>         }
>  
>         intel_sagv_pre_plane_update(state);
> +  intel_pmdemand_pre_plane_update(state);
>  
>         /* Complete the events for pipes that have now been disabled */
>         for_each_new_intel_crtc_in_state(state, crtc, new_crtc_state, i) {
> @@ -7523,6 +7531,7 @@ static void intel_atomic_commit_tail(struct intel_atomic_state *state)
>                 intel_verify_planes(state);
>  
>         intel_sagv_post_plane_update(state);
> +  intel_pmdemand_post_plane_update(state);
>  
>         drm_atomic_helper_commit_hw_done(&state->base);
>  
> @@ -8250,6 +8259,7 @@ void intel_init_display_hooks(struct drm_i915_private *dev_priv)
>         intel_color_init_hooks(dev_priv);
>         intel_init_cdclk_hooks(dev_priv);
>         intel_audio_hooks_init(dev_priv);
> +  intel_init_pmdemand(dev_priv);

I think intel_init_display_hooks() is meant to call functions setting up
function pointers, right? That would not be the case for intel_init_pmdemand().

I think we could rename intel_init_pmdemand() to
intel_pmdemand_init_early() and call it inside i915_driver_early_probe().

>  
>         intel_dpll_init_clock_hook(dev_priv);
>  
> @@ -8476,6 +8486,10 @@ int intel_modeset_init_noirq(struct drm_i915_private *i915)
>         if (ret)
>                 goto cleanup_vga_client_pw_domain_dmc;
>  
> +  ret = intel_pmdemand_init(i915);
> +  if (ret)
> +          goto cleanup_vga_client_pw_domain_dmc;
> +
>         init_llist_head(&i915->display.atomic_helper.free_list);
>         INIT_WORK(&i915->display.atomic_helper.free_work,
>                   intel_atomic_helper_free_state_worker);
> diff --git a/drivers/gpu/drm/i915/display/intel_display_power.c b/drivers/gpu/drm/i915/display/intel_display_power.c
> index 5e85572dc8e4..04c172b5c17b 100644
> --- a/drivers/gpu/drm/i915/display/intel_display_power.c
> +++ b/drivers/gpu/drm/i915/display/intel_display_power.c
> @@ -19,6 +19,7 @@
>  #include "intel_mchbar_regs.h"
>  #include "intel_pch_refclk.h"
>  #include "intel_pcode.h"
> +#include "intel_pm.h"
>  #include "intel_pps_regs.h"
>  #include "intel_snps_phy.h"
>  #include "skl_watermark.h"
> @@ -1083,6 +1084,10 @@ static void gen9_dbuf_enable(struct drm_i915_private *dev_priv)
>         dev_priv->display.dbuf.enabled_slices =
>                 intel_enabled_dbuf_slices_mask(dev_priv);
>  
> +  if (DISPLAY_VER(dev_priv) >= 14)
> +          intel_program_dbuf_pmdemand(dev_priv, BIT(DBUF_S1) |
> +                                      dev_priv->display.dbuf.enabled_slices);
> +
>         /*
>          * Just power up at least 1 slice, we will
>          * figure out later which slices we have and what we need.
> @@ -1094,6 +1099,9 @@ static void gen9_dbuf_enable(struct drm_i915_private *dev_priv)
>  static void gen9_dbuf_disable(struct drm_i915_private *dev_priv)
>  {
>         gen9_dbuf_slices_update(dev_priv, 0);
> +
> +  if (DISPLAY_VER(dev_priv) >= 14)
> +          intel_program_dbuf_pmdemand(dev_priv, 0);
>  }
>  
>  static void gen12_dbuf_slices_config(struct drm_i915_private *dev_priv)
> diff --git a/drivers/gpu/drm/i915/i915_drv.h b/drivers/gpu/drm/i915/i915_drv.h
> index e771fdc3099c..2a73e726c6ed 100644
> --- a/drivers/gpu/drm/i915/i915_drv.h
> +++ b/drivers/gpu/drm/i915/i915_drv.h
> @@ -250,6 +250,12 @@ struct drm_i915_private {
>         unsigned int hpll_freq;
>         unsigned int czclk_freq;
>  
> +  struct {
> +          wait_queue_head_t waitqueue;
> +          struct mutex lock;
> +          struct intel_global_obj obj;
> +  } pmdemand;
> +
>         /**
>          * wq - Driver workqueue for GEM.
>          *
> diff --git a/drivers/gpu/drm/i915/i915_irq.c b/drivers/gpu/drm/i915/i915_irq.c
> index c0888cc88d04..636033bb9650 100644
> --- a/drivers/gpu/drm/i915/i915_irq.c
> +++ b/drivers/gpu/drm/i915/i915_irq.c
> @@ -1913,6 +1913,11 @@ static u32 gen8_de_pipe_fault_mask(struct drm_i915_private *dev_priv)
>                 return GEN8_DE_PIPE_IRQ_FAULT_ERRORS;
>  }
>  
> +static void intel_pmdemand_irq_handler(struct drm_i915_private *dev_priv)
> +{
> +  wake_up_all(&dev_priv->pmdemand.waitqueue);
> +}
> +
>  static void
>  gen8_de_misc_irq_handler(struct drm_i915_private *dev_priv, u32 iir)
>  {
> @@ -1949,6 +1954,18 @@ gen8_de_misc_irq_handler(struct drm_i915_private *dev_priv, u32 iir)
>                 }
>         }
>  
> +  if (iir & XELPDP_PMDEMAND_RSPTOUT_ERR) {
> +          drm_dbg(&dev_priv->drm,
> +                  "Error waiting for Punit PM Demand Response\n");
> +          intel_pmdemand_irq_handler(dev_priv);
> +          found = true;
> +  }
> +
> +  if (iir & XELPDP_PMDEMAND_RSP) {
> +          intel_pmdemand_irq_handler(dev_priv);
> +          found = true;
> +  }
> +

Two comments here:

  1. Shouldn't we also make sure that DISPLAY_VER(dev_priv) >= 14 before
     checking those bits?

  2. Intuitively, I would agree that XELPDP_PMDEMAND_RSPTOUT_ERR and
     XELPDP_PMDEMAND_RSP should not happen at the same time, but to be safe, I
     would replace the above two ifs above with something like below:

      if (iir & (XELPDP_PMDEMAND_RSP | XELPDP_PMDEMAND_RSPTOUT_ERR)) {
              if (irr & XELPDP_PMDEMAND_RSPTOUT_ERR)
                      drm_dbg(&dev_priv->drm,
                              "Error waiting for Punit PM Demand Response\n");
              intel_pmdemand_irq_handler(dev_priv);
              found = true;
      }

>         if (!found)
>                 drm_err(&dev_priv->drm, "Unexpected DE Misc interrupt\n");
>  }
> @@ -3315,7 +3332,10 @@ static void gen8_de_irq_postinstall(struct drm_i915_private *dev_priv)
>         if (IS_GEMINILAKE(dev_priv) || IS_BROXTON(dev_priv))
>                 de_port_masked |= BXT_DE_PORT_GMBUS;
>  
> -  if (DISPLAY_VER(dev_priv) >= 11) {
> +  if (DISPLAY_VER(dev_priv) >= 14)
> +          de_misc_masked |= XELPDP_PMDEMAND_RSPTOUT_ERR |
> +                            XELPDP_PMDEMAND_RSP;

Although the sequence for PM Demand in the BSpec does not mention it, there is
also a PM_DMD_msg_error bit in the interrupt register. I wonder if we should
handle it as well.

> +  else if (DISPLAY_VER(dev_priv) >= 11) {
>                 enum port port;
>  
>                 if (intel_bios_is_dsi_present(dev_priv, &port))
> diff --git a/drivers/gpu/drm/i915/i915_reg.h b/drivers/gpu/drm/i915/i915_reg.h
> index 8d26fa2765c1..7f8e750665ed 100644
> --- a/drivers/gpu/drm/i915/i915_reg.h
> +++ b/drivers/gpu/drm/i915/i915_reg.h
> @@ -4783,8 +4783,10 @@
>  #define GEN8_DE_MISC_IMR _MMIO(0x44464)
>  #define GEN8_DE_MISC_IIR _MMIO(0x44468)
>  #define GEN8_DE_MISC_IER _MMIO(0x4446c)
> -#define  GEN8_DE_MISC_GSE         (1 << 27)
> -#define  GEN8_DE_EDP_PSR          (1 << 19)
> +#define  XELPDP_PMDEMAND_RSPTOUT_ERR      REG_BIT(27)
> +#define  GEN8_DE_MISC_GSE         REG_BIT(27)
> +#define  GEN8_DE_EDP_PSR          REG_BIT(19)
> +#define  XELPDP_PMDEMAND_RSP              REG_BIT(3)
>  
>  #define GEN8_PCU_ISR _MMIO(0x444e0)
>  #define GEN8_PCU_IMR _MMIO(0x444e4)
> @@ -4847,6 +4849,33 @@
>  #define  GEN11_HOTPLUG_CTL_SHORT_DETECT(hpd_pin)       (1 << (_HPD_PIN_TC(hpd_pin) * 4))
>  #define  GEN11_HOTPLUG_CTL_NO_DETECT(hpd_pin)          (0 << (_HPD_PIN_TC(hpd_pin) * 4))
>  
> +#define XELPDP_INITIATE_PMDEMAND_REQUEST(dword)           _MMIO(0x45230 + 4 * (dword))
> +#define  XELPDP_PMDEMAND_QCLK_GV_BW_MASK          REG_GENMASK(31, 16)
> +#define  XELPDP_PMDEMAND_QCLK_GV_BW(x)                    REG_FIELD_PREP(XELPDP_PMDEMAND_QCLK_GV_BW_MASK, x)
> +#define  XELPDP_PMDEMAND_VOLTAGE_INDEX_MASK               REG_GENMASK(14, 12)
> +#define  XELPDP_PMDEMAND_VOLTAGE_INDEX(x)         REG_FIELD_PREP(XELPDP_PMDEMAND_VOLTAGE_INDEX_MASK, x)
> +#define  XELPDP_PMDEMAND_QCLK_GV_INDEX_MASK               REG_GENMASK(11, 8)
> +#define  XELPDP_PMDEMAND_QCLK_GV_INDEX(x)         REG_FIELD_PREP(XELPDP_PMDEMAND_QCLK_GV_INDEX_MASK, x)
> +#define  XELPDP_PMDEMAND_PIPES_MASK                       REG_GENMASK(7, 6)
> +#define  XELPDP_PMDEMAND_PIPES(x)                 REG_FIELD_PREP(XELPDP_PMDEMAND_PIPES_MASK, x)
> +#define  XELPDP_PMDEMAND_DBUFS_MASK                       REG_GENMASK(5, 4)
> +#define  XELPDP_PMDEMAND_DBUFS(x)                 REG_FIELD_PREP(XELPDP_PMDEMAND_DBUFS_MASK, x)
> +#define  XELPDP_PMDEMAND_PHYS_MASK                        REG_GENMASK(2, 0)
> +#define  XELPDP_PMDEMAND_PHYS(x)                          REG_FIELD_PREP(XELPDP_PMDEMAND_PHYS_MASK, x)
> +
> +#define  XELPDP_PMDEMAND_REQ_ENABLE                       REG_BIT(31)
> +#define  XELPDP_PMDEMAND_CDCLK_FREQ_MASK          REG_GENMASK(30, 20)
> +#define  XELPDP_PMDEMAND_CDCLK_FREQ(x)                    REG_FIELD_PREP(XELPDP_PMDEMAND_CDCLK_FREQ_MASK, x)
> +#define  XELPDP_PMDEMAND_DDICLK_FREQ_MASK         REG_GENMASK(18, 8)
> +#define  XELPDP_PMDEMAND_DDICLK_FREQ(x)                   REG_FIELD_PREP(XELPDP_PMDEMAND_DDICLK_FREQ_MASK, x)
> +#define  XELPDP_PMDEMAND_SCALERS_MASK                     REG_GENMASK(6, 4)
> +#define  XELPDP_PMDEMAND_SCALERS(x)                       REG_FIELD_PREP(XELPDP_PMDEMAND_SCALERS_MASK, x)
> +#define  XELPDP_PMDEMAND_PLLS_MASK                        REG_GENMASK(2, 0)
> +#define  XELPDP_PMDEMAND_PLLS(x)                  REG_FIELD_PREP(XELPDP_PMDEMAND_PLLS_MASK, x)
> +
> +#define GEN12_DCPR_STATUS_1                               _MMIO(0x46440)
> +#define  XELPDP_PMDEMAND_INFLIGHT_STATUS          REG_BIT(26)
> +
>  #define ILK_DISPLAY_CHICKEN2   _MMIO(0x42004)
>  /* Required on all Ironlake and Sandybridge according to the B-Spec. */
>  #define  ILK_ELPIN_409_SELECT  (1 << 25)
> diff --git a/drivers/gpu/drm/i915/intel_pm.c b/drivers/gpu/drm/i915/intel_pm.c
> index c45af0d981fd..877997e4141d 100644
> --- a/drivers/gpu/drm/i915/intel_pm.c
> +++ b/drivers/gpu/drm/i915/intel_pm.c
> @@ -25,6 +25,10 @@
>   *
>   */
>  
> +#include <linux/bitops.h>
> +
> +#include "display/intel_bw.h"
> +#include "display/intel_cdclk.h"
>  #include "display/intel_de.h"
>  #include "display/intel_display.h"
>  #include "display/intel_display_trace.h"
> @@ -40,6 +44,14 @@
>  #include "intel_pm.h"
>  #include "vlv_sideband.h"
>  
> +bool intel_is_c10phy(struct drm_i915_private *dev_priv, enum phy phy)
> +{
> +        if (IS_METEORLAKE(dev_priv) && (phy < PHY_C))
> +                return true;
> +
> +        return false;
> +}
> +
>  struct drm_i915_clock_gating_funcs {
>         void (*init_clock_gating)(struct drm_i915_private *i915);
>  };
> @@ -124,6 +136,287 @@ static void glk_init_clock_gating(struct drm_i915_private *dev_priv)
>                    PWM1_GATING_DIS | PWM2_GATING_DIS);
>  }
>  
> +static struct intel_global_state *intel_pmdemand_duplicate_state(struct intel_global_obj *obj)
> +{
> +  struct intel_pmdemand_state *pmdmnd_state;
> +
> +  pmdmnd_state = kmemdup(obj->state, sizeof(*pmdmnd_state), GFP_KERNEL);
> +  if (!pmdmnd_state)
> +          return NULL;
> +
> +  return &pmdmnd_state->base;
> +}
> +
> +static void intel_pmdemand_destroy_state(struct intel_global_obj *obj,
> +                                   struct intel_global_state *state)
> +{
> +  kfree(state);
> +}
> +
> +static const struct intel_global_state_funcs intel_pmdemand_funcs = {
> +  .atomic_duplicate_state = intel_pmdemand_duplicate_state,
> +  .atomic_destroy_state = intel_pmdemand_destroy_state,
> +};
> +
> +struct intel_pmdemand_state *
> +intel_atomic_get_pmdemand_state(struct intel_atomic_state *state)
> +{
> +  struct drm_i915_private *dev_priv = to_i915(state->base.dev);
> +  struct intel_global_state *pmdemand_state;
> +
> +  pmdemand_state = intel_atomic_get_global_obj_state(state, &dev_priv->pmdemand.obj);
> +  if (IS_ERR(pmdemand_state))
> +          return ERR_CAST(pmdemand_state);
> +
> +  return to_intel_pmdemand_state(pmdemand_state);
> +}
> +
> +int intel_pmdemand_init(struct drm_i915_private *dev_priv)

As general recomendation for the whole patch, we should name pointers to our
private struct i915 instead of dev_priv, specially for new code.

> +{
> +  struct intel_pmdemand_state *pmdemand_state;
> +
> +  pmdemand_state = kzalloc(sizeof(*pmdemand_state), GFP_KERNEL);
> +  if (!pmdemand_state)
> +          return -ENOMEM;
> +
> +  intel_atomic_global_obj_init(dev_priv, &dev_priv->pmdemand.obj,
> +                               &pmdemand_state->base, &intel_pmdemand_funcs);
> +
> +  return 0;
> +}
> +
> +void intel_init_pmdemand(struct drm_i915_private *dev_priv)
> +{
> +  mutex_init(&dev_priv->pmdemand.lock);
> +  init_waitqueue_head(&dev_priv->pmdemand.waitqueue);
> +}
> +
> +int intel_pmdemand_atomic_check(struct intel_atomic_state *state)
> +{
> +  struct drm_i915_private *dev_priv = to_i915(state->base.dev);
> +  struct intel_pmdemand_state *new_pmdemand_state = NULL;

Looks like this initialization is unnecessary.

> +  struct intel_crtc_state *old_crtc_state, *new_crtc_state;
> +  struct intel_crtc *crtc;
> +  struct intel_encoder *encoder;
> +  struct intel_bw_state *new_bw_state;
> +  const struct intel_dbuf_state *new_dbuf_state;
> +  const struct intel_cdclk_state *new_cdclk_state;
> +  int port_clock = 0;
> +  unsigned int data_rate;
> +  enum phy phy;
> +  int i, ret;
> +
> +  if (DISPLAY_VER(dev_priv) < 14)
> +          return 0;
> +
> +  new_pmdemand_state = intel_atomic_get_pmdemand_state(state);
> +  if (IS_ERR(new_pmdemand_state))
> +          return PTR_ERR(new_pmdemand_state);
> +
> +  ret = intel_atomic_lock_global_state(&new_pmdemand_state->base);

I was looking at the other usages of intel_atomic_lock_global_state() and it
seems we do that only when we change the state of our global object. Should we
really be calling it this early for PM Demand?

> +  if (ret)
> +          return ret;
> +
> +  /* Punit figures out the voltage index based on bandwidth*/
> +  new_bw_state = intel_atomic_get_bw_state(state);
> +  if (IS_ERR(new_bw_state))
> +          return PTR_ERR(new_bw_state);
> +
> +  /* firmware will calculate the qclck_gc_index, requirement is set to 0 */
> +  new_pmdemand_state->qclk_gv_index = 0;
> +
> +  data_rate = intel_bw_data_rate(dev_priv, new_bw_state);
> +  /* To MBs then to multiples of 100MBs */
> +  data_rate = DIV_ROUND_UP(data_rate, 1000);
> +  data_rate = DIV_ROUND_UP(data_rate, 100);
> +  new_pmdemand_state->qclk_gv_bw = data_rate;
> +
> +  new_dbuf_state = intel_atomic_get_dbuf_state(state);
> +  if (IS_ERR(new_dbuf_state))
> +          return PTR_ERR(new_dbuf_state);

Looks like calculation of the mask of active pipes has many users now: PM
Demand, CDCLOCK and watermark related code. Maybe we could refactor the code in
a future patch so that we have a single source for this value?

> +
> +  i = hweight8(new_dbuf_state->active_pipes);
> +  new_pmdemand_state->active_pipes = min(i, 3);
> +
> +  new_cdclk_state = intel_atomic_get_cdclk_state(state);
> +  if (IS_ERR(new_cdclk_state))
> +          return PTR_ERR(new_cdclk_state);
> +
> +  new_pmdemand_state->voltage_index = new_cdclk_state->logical.voltage_level;
> +  /* KHz to MHz */
> +  new_pmdemand_state->cdclk_freq_mhz = DIV_ROUND_UP(new_cdclk_state->logical.cdclk, 1000);
> +
> +  new_pmdemand_state->active_phys_plls_mask = 0;
> +
> +  for_each_oldnew_intel_crtc_in_state(state, crtc, old_crtc_state, new_crtc_state, i) {
> +          if (!new_crtc_state->hw.active)
> +                  continue;

Unless I have misunderstood how for_each_oldnew_intel_crtc_in_state() works, I
think there is an issue with this loop: we are potentially ignoring CRTCs not
being modified by the atomic update. This could get us the wrong values for
ddiclk_freq_mhz and active_phys_plls_mask.

While active_phys_plls_mask could be handled like active_pipes (i.e. using the
old value as initial and cearing/setting bits using the new states), I don't
think the same is true for ddiclk_freq_mhz.

Since ddiclk_freq_mhz needs to be the maximum port clock value, I'm afraid we
can't escape having to check all active crtcs, meaning that we should probably
iterate with for_each_intel_crtc() and use intel_atomic_get_crtc_state() so we
ensure we get the state for each crtc.

> +
> +          encoder = intel_get_crtc_new_encoder(state, new_crtc_state);
> +          if (!encoder)
> +                  continue;
> +
> +          phy = intel_port_to_phy(dev_priv, encoder->port);
> +
> +          if (intel_is_c10phy(dev_priv, phy))
> +                  new_pmdemand_state->active_phys_plls_mask |= BIT(phy);

Since both C10 and PM Demand patches are currently in-flight, to make patch flow
"synchronization" easier, maybe we should send a separate patch doing
C10-specific stuff for PM Demand after both C10 and PM Demand series are
applied?

> +
> +          port_clock = max(port_clock, new_crtc_state->port_clock);
> +  }
> +
> +  /* To MHz */
> +  new_pmdemand_state->ddiclk_freq_mhz = DIV_ROUND_UP(port_clock, 1000);
> +
> +  /*
> +   * Setting scalers to max as it can not be calculated during flips and
> +   * fastsets without taking global states locks.
> +   */
> +  new_pmdemand_state->scalers = 7;
> +
> +  return 0;
> +}
> +
> +static bool intel_pmdemand_check_prev_transaction(struct drm_i915_private *dev_priv)
> +{
> +  return !((intel_de_read(dev_priv, XELPDP_INITIATE_PMDEMAND_REQUEST(1)) & XELPDP_PMDEMAND_REQ_ENABLE) ||
> +          (intel_de_read(dev_priv, GEN12_DCPR_STATUS_1) & XELPDP_PMDEMAND_INFLIGHT_STATUS));
> +}
> +
> +static bool intel_pmdemand_req_complete(struct drm_i915_private *dev_priv)
> +{
> +  return !(intel_de_read(dev_priv, XELPDP_INITIATE_PMDEMAND_REQUEST(1)) & XELPDP_PMDEMAND_REQ_ENABLE);
> +}
> +
> +static int intel_pmdemand_wait(struct drm_i915_private *dev_priv)
> +{
> +  DEFINE_WAIT(wait);
> +  int ret;
> +  const unsigned int timeout_ms = 10;
> +
> +  add_wait_queue(&dev_priv->pmdemand.waitqueue, &wait);

Looking at how wait_event_timeout() is implemented, I think calling
add_wait_queue() and remove_wait_queue() is unnecessary. In fact,
wait_event_timeout() creates its own entry and adds it to the queue (and removes
it afterwards).

> +
> +  ret = wait_event_timeout(dev_priv->pmdemand.waitqueue,
> +                           intel_pmdemand_req_complete(dev_priv),
> +                           msecs_to_jiffies_timeout(timeout_ms));
> +  if (ret < 0)

Looking at the documentation of wait_event_timeout(), the returned value should
never be negative. I think the correct check here should be (ret == 0), which
indicates a timeout and intel_pmdemand_req_complete(dev_priv) still evaluating
false.

> +          drm_err(&dev_priv->drm,
> +                  "timed out waiting for Punit PM Demand Response\n");
> +
> +  remove_wait_queue(&dev_priv->pmdemand.waitqueue, &wait);
> +
> +  return ret;
> +}
> +
> +/* Required to be programmed during Display Init Sequences. */
> +void intel_program_dbuf_pmdemand(struct drm_i915_private *dev_priv,
> +                           u8 dbuf_slices)
> +{
> +  mutex_lock(&dev_priv->pmdemand.lock);
> +  if (drm_WARN_ON(&dev_priv->drm,
> +                  !intel_pmdemand_check_prev_transaction(dev_priv)))
> +          goto unlock;
> +
> +  intel_de_rmw(dev_priv, XELPDP_INITIATE_PMDEMAND_REQUEST(0),
> +               XELPDP_PMDEMAND_DBUFS_MASK,
> +               XELPDP_PMDEMAND_DBUFS(hweight32(dbuf_slices)));
> +  intel_de_rmw(dev_priv, XELPDP_INITIATE_PMDEMAND_REQUEST(1), 0,
> +               XELPDP_PMDEMAND_REQ_ENABLE);
> +
> +  intel_pmdemand_wait(dev_priv);
> +unlock:
> +  mutex_unlock(&dev_priv->pmdemand.lock);
> +}
> +
> +static void intel_program_pmdemand(struct drm_i915_private *dev_priv,
> +                             const struct intel_pmdemand_state *new,
> +                             const struct intel_pmdemand_state *old)

Looking at how this is implemented and called, I understand that calling this
with old != NULL means the update is for "increased values" and, with old as
NULL, means the update is for "decreased values". Nitpick: I would leave a
comment just for clarity.

> +{
> +  u32 val, tmp;
> +
> +#define UPDATE_PMDEMAND_VAL(val, F, f) do {            \
> +  val &= (~(XELPDP_PMDEMAND_##F##_MASK));         \
> +  val |= (XELPDP_PMDEMAND_##F((u32)(old ? max(old->f, new->f) : new->f))); \
> +} while (0)
> +
> +  mutex_lock(&dev_priv->pmdemand.lock);
> +  if (drm_WARN_ON(&dev_priv->drm,
> +                  !intel_pmdemand_check_prev_transaction(dev_priv)))

Shouldn't we actually wait and timeout here? If so, we could probably do that
inside intel_pmdemand_check_prev_transaction() and rename it to
intel_pmdemand_wait_prev_transaction().

> +          goto unlock;
> +
> +  /*
> +   * TODO: Update programming PM Demand for
> +   * PHYS, PLLS, DDI_CLKFREQ, SCALARS
> +   */
> +  val = intel_de_read(dev_priv, XELPDP_INITIATE_PMDEMAND_REQUEST(0));
> +  UPDATE_PMDEMAND_VAL(val, QCLK_GV_INDEX, qclk_gv_index);
> +  UPDATE_PMDEMAND_VAL(val, QCLK_GV_BW, qclk_gv_bw);

I couldn't find instructions in the BSpec regarding SAGV for "increased values"
and "decreased values" (differently from other sequences like Voltage Switching,
where there are separate PM Demand steps for increased and decreased values).

Am I missing it? Or should we instead just use the new value here
unconditionally?

> +  UPDATE_PMDEMAND_VAL(val, VOLTAGE_INDEX, voltage_index);
> +  UPDATE_PMDEMAND_VAL(val, PIPES, active_pipes);
> +  UPDATE_PMDEMAND_VAL(val, DBUFS, dbufs);
> +  tmp = hweight32(new->active_phys_plls_mask);
> +  if (old)
> +          tmp = max(tmp, hweight32(old->active_phys_plls_mask));
> +  val |= XELPDP_PMDEMAND_PHYS(tmp);
> +
> +  intel_de_write(dev_priv, XELPDP_INITIATE_PMDEMAND_REQUEST(0), val);
> +
> +  val = intel_de_read(dev_priv, XELPDP_INITIATE_PMDEMAND_REQUEST(1));
> +  UPDATE_PMDEMAND_VAL(val, CDCLK_FREQ, cdclk_freq_mhz);
> +  UPDATE_PMDEMAND_VAL(val, DDICLK_FREQ, ddiclk_freq_mhz);
> +  UPDATE_PMDEMAND_VAL(val, SCALERS, scalers);
> +  /*
> +   * Active_PLLs starts with 1 because of CDCLK PLL.
> +   * TODO: Missing to account genlock filter when it gets used.
> +   */
> +  val |= XELPDP_PMDEMAND_PLLS(tmp + 1);
> +
> +  intel_de_write(dev_priv, XELPDP_INITIATE_PMDEMAND_REQUEST(1), val);
> +
> +#undef UPDATE_PM_DEMAND_VAL
> +
> +  intel_de_rmw(dev_priv, XELPDP_INITIATE_PMDEMAND_REQUEST(1), 0, XELPDP_PMDEMAND_REQ_ENABLE);
> +
> +  intel_pmdemand_wait(dev_priv);
> +unlock:
> +  mutex_unlock(&dev_priv->pmdemand.lock);
> +}
> +
> +void intel_pmdemand_pre_plane_update(struct intel_atomic_state *state)
> +{
> +  struct drm_i915_private *dev_priv = to_i915(state->base.dev);
> +  const struct intel_pmdemand_state *new_pmdmnd_state =
> +          intel_atomic_get_new_pmdemand_state(state);
> +  const struct intel_pmdemand_state *old_pmdmnd_state =
> +          intel_atomic_get_old_pmdemand_state(state);
> +
> +  if (DISPLAY_VER(dev_priv) < 14)
> +          return;
> +
> +  if (!new_pmdmnd_state ||
> +      memcmp(new_pmdmnd_state, old_pmdmnd_state, sizeof(*new_pmdmnd_state)) == 0)

We are comparing the whole structure here, including fields specific to struct
intel_global_state (which are modified when the state is duplicated). As such, I
thinkg this comparison has potential to yield false positives (i.e. making us
think that the state has changed while it has not).

We should have a function intel_pmdemand_state_changed() that compares only data
specific to PM Demand. The implementation could be done by either (i) comparing
member by member or (ii) combining offsetof() with sizeof() to get the correct
slice of memory to compare with memcmp(). I would go with (ii).

> +          return;
> +
> +  intel_program_pmdemand(dev_priv, new_pmdmnd_state, old_pmdmnd_state);
> +}
> +
> +void intel_pmdemand_post_plane_update(struct intel_atomic_state *state)
> +{
> +  struct drm_i915_private *dev_priv = to_i915(state->base.dev);
> +  const struct intel_pmdemand_state *new_pmdmnd_state =
> +          intel_atomic_get_new_pmdemand_state(state);
> +  const struct intel_pmdemand_state *old_pmdmnd_state =
> +          intel_atomic_get_old_pmdemand_state(state);
> +
> +  if (DISPLAY_VER(dev_priv) < 14)
> +          return;
> +
> +  if (!new_pmdmnd_state ||
> +      memcmp(new_pmdmnd_state, old_pmdmnd_state, sizeof(*new_pmdmnd_state)) == 0)
> +          return;
> +
> +  intel_program_pmdemand(dev_priv, new_pmdmnd_state, NULL);
> +}
> +
>  static void ibx_init_clock_gating(struct drm_i915_private *dev_priv)
>  {
>         /*
> diff --git a/drivers/gpu/drm/i915/intel_pm.h b/drivers/gpu/drm/i915/intel_pm.h
> index f774bddcdca6..2663bec408c7 100644
> --- a/drivers/gpu/drm/i915/intel_pm.h
> +++ b/drivers/gpu/drm/i915/intel_pm.h
> @@ -8,11 +8,46 @@
>  
>  #include <linux/types.h>
>  
> +#include "display/intel_global_state.h"
> +
>  struct drm_i915_private;
>  struct intel_crtc_state;
>  struct intel_plane_state;
>  
>  void intel_init_clock_gating(struct drm_i915_private *dev_priv);
> +void intel_init_pmdemand(struct drm_i915_private *dev_priv);
>  void intel_init_clock_gating_hooks(struct drm_i915_private *dev_priv);
>  
> +struct intel_pmdemand_state {
> +  struct intel_global_state base;
> +
> +  u16 qclk_gv_bw;
> +  u8 voltage_index;
> +  u8 qclk_gv_index;
> +  u8 active_pipes;
> +  u8 dbufs;
> +  u8 active_phys_plls_mask;
> +  u16 cdclk_freq_mhz;
> +  u16 ddiclk_freq_mhz;
> +  u8 scalers;
> +};
> +
> +int intel_pmdemand_init(struct drm_i915_private *dev_priv);
> +
> +struct intel_pmdemand_state *
> +intel_atomic_get_pmdemand_state(struct intel_atomic_state *state);
> +
> +#define to_intel_pmdemand_state(x) container_of((x), struct intel_pmdemand_state, base)
> +#define intel_atomic_get_old_pmdemand_state(state) \
> +  to_intel_pmdemand_state(intel_atomic_get_old_global_obj_state(state, &to_i915(state->base.dev)->pmdemand.obj))
> +#define intel_atomic_get_new_pmdemand_state(state) \
> +  to_intel_pmdemand_state(intel_atomic_get_new_global_obj_state(state, &to_i915(state->base.dev)->pmdemand.obj))
> +
> +int intel_pmdemand_init(struct drm_i915_private *dev_priv);
> +void intel_program_dbuf_pmdemand(struct drm_i915_private *dev_priv,
> +                           u8 dbuf_slices);
> +void intel_pmdemand_pre_plane_update(struct intel_atomic_state *state);
> +void intel_pmdemand_post_plane_update(struct intel_atomic_state *state);
> +int intel_pmdemand_atomic_check(struct intel_atomic_state *state);
> +
>  #endif /* __INTEL_PM_H__ */
> -- 
> 2.34.1
>

^ permalink raw reply	[flat|nested] 13+ messages in thread

* Re: [Intel-gfx] [PATCH] drm/i915/mtl: Add support for PM DEMAND
  2023-04-11 22:47 ` [Intel-gfx] [PATCH] " Gustavo Sousa
@ 2023-04-12  9:33   ` Jani Nikula
  2023-04-12 12:26     ` Gustavo Sousa
  0 siblings, 1 reply; 13+ messages in thread
From: Jani Nikula @ 2023-04-12  9:33 UTC (permalink / raw)
  To: Gustavo Sousa, Mika Kahola, intel-gfx; +Cc: Matt Roper, Lucas De Marchi

On Tue, 11 Apr 2023, Gustavo Sousa <gustavo.sousa@intel.com> wrote:
> Quoting Mika Kahola (2023-04-03 05:50:43)
>> @@ -8250,6 +8259,7 @@ void intel_init_display_hooks(struct drm_i915_private *dev_priv)
>>         intel_color_init_hooks(dev_priv);
>>         intel_init_cdclk_hooks(dev_priv);
>>         intel_audio_hooks_init(dev_priv);
>> +  intel_init_pmdemand(dev_priv);
>
> I think intel_init_display_hooks() is meant to call functions setting up
> function pointers, right? That would not be the case for intel_init_pmdemand().
>
> I think we could rename intel_init_pmdemand() to
> intel_pmdemand_init_early() and call it inside i915_driver_early_probe().

Please let's not add new direct calls to display from top level driver
code. See also [1].


BR,
Jani.


[1] https://lore.kernel.org/r/87r0t11g19.fsf@intel.com


-- 
Jani Nikula, Intel Open Source Graphics Center

^ permalink raw reply	[flat|nested] 13+ messages in thread

* Re: [Intel-gfx] [PATCH] drm/i915/mtl: Add support for PM DEMAND
  2023-04-12  9:33   ` Jani Nikula
@ 2023-04-12 12:26     ` Gustavo Sousa
  2023-04-12 13:34       ` Jani Nikula
  0 siblings, 1 reply; 13+ messages in thread
From: Gustavo Sousa @ 2023-04-12 12:26 UTC (permalink / raw)
  To: Jani Nikula, Mika Kahola, intel-gfx; +Cc: Matt Roper, Lucas De Marchi

Quoting Jani Nikula (2023-04-12 06:33:54)
> On Tue, 11 Apr 2023, Gustavo Sousa <gustavo.sousa@intel.com> wrote:
> > Quoting Mika Kahola (2023-04-03 05:50:43)
> >> @@ -8250,6 +8259,7 @@ void intel_init_display_hooks(struct drm_i915_private *dev_priv)
> >>         intel_color_init_hooks(dev_priv);
> >>         intel_init_cdclk_hooks(dev_priv);
> >>         intel_audio_hooks_init(dev_priv);
> >> +  intel_init_pmdemand(dev_priv);
> >
> > I think intel_init_display_hooks() is meant to call functions setting up
> > function pointers, right? That would not be the case for intel_init_pmdemand().
> >
> > I think we could rename intel_init_pmdemand() to
> > intel_pmdemand_init_early() and call it inside i915_driver_early_probe().
> 
> Please let's not add new direct calls to display from top level driver
> code. See also [1].

Okay. What would be the suggested place to do this SW-only initialization?

Should we just merge the two init functions into one named intel_pmdemand_init()
and call the new function under intel_modeset_init_noirq()?

--
Gustavo Sousa

^ permalink raw reply	[flat|nested] 13+ messages in thread

* Re: [Intel-gfx] [PATCH] drm/i915/mtl: Add support for PM DEMAND
  2023-04-12 12:26     ` Gustavo Sousa
@ 2023-04-12 13:34       ` Jani Nikula
  2023-04-13  9:50         ` Jani Nikula
  0 siblings, 1 reply; 13+ messages in thread
From: Jani Nikula @ 2023-04-12 13:34 UTC (permalink / raw)
  To: Gustavo Sousa, Mika Kahola, intel-gfx; +Cc: Matt Roper, Lucas De Marchi

On Wed, 12 Apr 2023, Gustavo Sousa <gustavo.sousa@intel.com> wrote:
> Quoting Jani Nikula (2023-04-12 06:33:54)
>> On Tue, 11 Apr 2023, Gustavo Sousa <gustavo.sousa@intel.com> wrote:
>> > Quoting Mika Kahola (2023-04-03 05:50:43)
>> >> @@ -8250,6 +8259,7 @@ void intel_init_display_hooks(struct drm_i915_private *dev_priv)
>> >>         intel_color_init_hooks(dev_priv);
>> >>         intel_init_cdclk_hooks(dev_priv);
>> >>         intel_audio_hooks_init(dev_priv);
>> >> +  intel_init_pmdemand(dev_priv);
>> >
>> > I think intel_init_display_hooks() is meant to call functions setting up
>> > function pointers, right? That would not be the case for intel_init_pmdemand().
>> >
>> > I think we could rename intel_init_pmdemand() to
>> > intel_pmdemand_init_early() and call it inside i915_driver_early_probe().
>> 
>> Please let's not add new direct calls to display from top level driver
>> code. See also [1].
>
> Okay. What would be the suggested place to do this SW-only initialization?
>
> Should we just merge the two init functions into one named intel_pmdemand_init()
> and call the new function under intel_modeset_init_noirq()?

Or add a new function intel_display_early_probe() or somesuch, which
will call the early pmdemand init as well as intel_init_display_hooks()
that is currently called from i915_driver_early_probe().

Bottom line, there should only be one high level call from
i915_driver_early_probe().

There are similar needs for other things [1].

BR,
Jani.


[1] https://lore.kernel.org/r/20230411195918.hdxyir5w7dp2qx55@ldmartin-desk2.lan


>
> --
> Gustavo Sousa

-- 
Jani Nikula, Intel Open Source Graphics Center

^ permalink raw reply	[flat|nested] 13+ messages in thread

* Re: [Intel-gfx] [PATCH] drm/i915/mtl: Add support for PM DEMAND
  2023-04-12 13:34       ` Jani Nikula
@ 2023-04-13  9:50         ` Jani Nikula
  0 siblings, 0 replies; 13+ messages in thread
From: Jani Nikula @ 2023-04-13  9:50 UTC (permalink / raw)
  To: Gustavo Sousa, Mika Kahola, intel-gfx; +Cc: Lucas De Marchi, Matt Roper

On Wed, 12 Apr 2023, Jani Nikula <jani.nikula@linux.intel.com> wrote:
> On Wed, 12 Apr 2023, Gustavo Sousa <gustavo.sousa@intel.com> wrote:
>> Quoting Jani Nikula (2023-04-12 06:33:54)
>>> On Tue, 11 Apr 2023, Gustavo Sousa <gustavo.sousa@intel.com> wrote:
>>> > Quoting Mika Kahola (2023-04-03 05:50:43)
>>> >> @@ -8250,6 +8259,7 @@ void intel_init_display_hooks(struct drm_i915_private *dev_priv)
>>> >>         intel_color_init_hooks(dev_priv);
>>> >>         intel_init_cdclk_hooks(dev_priv);
>>> >>         intel_audio_hooks_init(dev_priv);
>>> >> +  intel_init_pmdemand(dev_priv);
>>> >
>>> > I think intel_init_display_hooks() is meant to call functions setting up
>>> > function pointers, right? That would not be the case for intel_init_pmdemand().
>>> >
>>> > I think we could rename intel_init_pmdemand() to
>>> > intel_pmdemand_init_early() and call it inside i915_driver_early_probe().
>>> 
>>> Please let's not add new direct calls to display from top level driver
>>> code. See also [1].
>>
>> Okay. What would be the suggested place to do this SW-only initialization?
>>
>> Should we just merge the two init functions into one named intel_pmdemand_init()
>> and call the new function under intel_modeset_init_noirq()?
>
> Or add a new function intel_display_early_probe() or somesuch, which
> will call the early pmdemand init as well as intel_init_display_hooks()
> that is currently called from i915_driver_early_probe().
>
> Bottom line, there should only be one high level call from
> i915_driver_early_probe().
>
> There are similar needs for other things [1].
>
> BR,
> Jani.
>
>
> [1] https://lore.kernel.org/r/20230411195918.hdxyir5w7dp2qx55@ldmartin-desk2.lan

All of this is cleaned up in
https://patchwork.freedesktop.org/series/116431/

BR,
Jani.


>
>
>>
>> --
>> Gustavo Sousa

-- 
Jani Nikula, Intel Open Source Graphics Center

^ permalink raw reply	[flat|nested] 13+ messages in thread

end of thread, other threads:[~2023-04-13  9:50 UTC | newest]

Thread overview: 13+ messages (download: mbox.gz / follow: Atom feed)
-- links below jump to the message on this page --
2023-04-03  8:50 [Intel-gfx] [PATCH] drm/i915/mtl: Add support for PM DEMAND Mika Kahola
2023-04-03  9:17 ` Jani Nikula
2023-04-03 13:14   ` Kahola, Mika
2023-04-03 10:55 ` kernel test robot
2023-04-03 13:49 ` kernel test robot
2023-04-03 17:33 ` kernel test robot
2023-04-03 17:33 ` kernel test robot
2023-04-03 19:07 ` [Intel-gfx] ✗ Fi.CI.BUILD: failure for " Patchwork
2023-04-11 22:47 ` [Intel-gfx] [PATCH] " Gustavo Sousa
2023-04-12  9:33   ` Jani Nikula
2023-04-12 12:26     ` Gustavo Sousa
2023-04-12 13:34       ` Jani Nikula
2023-04-13  9:50         ` Jani Nikula

This is an external index of several public inboxes,
see mirroring instructions on how to clone and mirror
all data and code used by this external index.