All of lore.kernel.org
 help / color / mirror / Atom feed
* [PATCH] stm32mp: psci: Implement PSCI system suspend and DRAM SSR
@ 2022-02-02 11:52 Marek Vasut
  2022-02-10 19:20 ` Patrick DELAUNAY
  0 siblings, 1 reply; 3+ messages in thread
From: Marek Vasut @ 2022-02-02 11:52 UTC (permalink / raw)
  To: u-boot; +Cc: Marek Vasut, Patrick Delaunay, Patrice Chotard

Implement PSCI system suspend and placement of DRAM into SSR while the
CPUs are in suspend. This saves non-trivial amount of power in suspend,
on 2x W632GU6NB-15 ~710mW.

Signed-off-by: Marek Vasut <marex@denx.de>
Cc: Patrick Delaunay <patrick.delaunay@foss.st.com>
Cc: Patrice Chotard <patrice.chotard@foss.st.com>
---
 arch/arm/mach-stm32mp/include/mach/stm32.h |   3 +
 arch/arm/mach-stm32mp/psci.c               | 481 +++++++++++++++++++++
 2 files changed, 484 insertions(+)

diff --git a/arch/arm/mach-stm32mp/include/mach/stm32.h b/arch/arm/mach-stm32mp/include/mach/stm32.h
index c11a9903f20..47e88fc3dcd 100644
--- a/arch/arm/mach-stm32mp/include/mach/stm32.h
+++ b/arch/arm/mach-stm32mp/include/mach/stm32.h
@@ -16,8 +16,11 @@
  */
 #define STM32_RCC_BASE			0x50000000
 #define STM32_PWR_BASE			0x50001000
+#define STM32_SYSCFG_BASE		0x50020000
 #define STM32_DBGMCU_BASE		0x50081000
 #define STM32_FMC2_BASE			0x58002000
+#define STM32_DDRCTRL_BASE		0x5A003000
+#define STM32_DDRPHYC_BASE		0x5A004000
 #define STM32_TZC_BASE			0x5C006000
 #define STM32_ETZPC_BASE		0x5C007000
 #define STM32_STGEN_BASE		0x5C008000
diff --git a/arch/arm/mach-stm32mp/psci.c b/arch/arm/mach-stm32mp/psci.c
index 155aa79cd5e..7be34054f6b 100644
--- a/arch/arm/mach-stm32mp/psci.c
+++ b/arch/arm/mach-stm32mp/psci.c
@@ -11,8 +11,141 @@
 #include <asm/io.h>
 #include <asm/psci.h>
 #include <asm/secure.h>
+#include <hang.h>
 #include <linux/bitops.h>
 
+/* PWR */
+#define PWR_CR3					0x0c
+#define PWR_MPUCR				0x10
+
+#define PWR_CR3_DDRRETEN			BIT(12)
+#define PWR_CR3_DDRSREN				BIT(10)
+
+#define PWR_MPUCR_PDDS				BIT(0)
+#define PWR_MPUCR_CSTDBYDIS			BIT(3)
+#define PWR_MPUCR_CSSF				BIT(9)
+
+/* RCC */
+#define RCC_DDRITFCR				0xd8
+
+#define RCC_DDRITFCR_DDRC1EN			BIT(0)
+#define RCC_DDRITFCR_DDRC1LPEN			BIT(1)
+#define RCC_DDRITFCR_DDRC2EN			BIT(2)
+#define RCC_DDRITFCR_DDRC2LPEN			BIT(3)
+#define RCC_DDRITFCR_DDRPHYCEN			BIT(4)
+#define RCC_DDRITFCR_DDRPHYCLPEN		BIT(5)
+#define RCC_DDRITFCR_DDRCAPBEN			BIT(6)
+#define RCC_DDRITFCR_DDRCAPBLPEN		BIT(7)
+#define RCC_DDRITFCR_AXIDCGEN			BIT(8)
+#define RCC_DDRITFCR_DDRPHYCAPBEN		BIT(9)
+#define RCC_DDRITFCR_DDRPHYCAPBLPEN		BIT(10)
+#define RCC_DDRITFCR_DDRCKMOD_MASK		(0x7 << 20)
+#define RCC_DDRITFCR_GSKPCTRL			BIT(24)
+
+#define RCC_MP_SREQSETR				0x104
+#define RCC_MP_SREQCLRR				0x108
+
+#define RCC_MP_CIER				0x414
+#define RCC_MP_CIFR				0x418
+#define RCC_MP_CIFR_WKUPF			BIT(20)
+
+/* SYSCFG */
+#define SYSCFG_CMPCR				0x20
+#define SYSCFG_CMPCR_MPUEN			BIT(0)
+#define SYSCFG_CMPCR_SW_CTRL			BIT(2)
+#define SYSCFG_CMPENSETR			0x24
+#define SYSCFG_CMPENCLRR			0x28
+
+/* DDR Controller registers offsets */
+#define DDRCTRL_STAT				0x004
+#define DDRCTRL_PWRCTL				0x030
+#define DDRCTRL_PWRTMG				0x034
+#define DDRCTRL_HWLPCTL				0x038
+#define DDRCTRL_DFIMISC				0x1B0
+#define DDRCTRL_SWCTL				0x320
+#define DDRCTRL_SWSTAT				0x324
+#define DDRCTRL_PSTAT				0x3FC
+#define DDRCTRL_PCTRL_0				0x490
+#define DDRCTRL_PCTRL_1				0x540
+
+/* DDR Controller Register fields */
+#define DDRCTRL_STAT_OPERATING_MODE_MASK	0x7
+#define DDRCTRL_STAT_OPERATING_MODE_NORMAL	0x1
+#define DDRCTRL_STAT_OPERATING_MODE_SR		0x3
+#define DDRCTRL_STAT_SELFREF_TYPE_MASK		(0x3 << 4)
+#define DDRCTRL_STAT_SELFREF_TYPE_ASR		(0x3 << 4)
+#define DDRCTRL_STAT_SELFREF_TYPE_SR		(0x2 << 4)
+
+#define DDRCTRL_PWRCTL_SELFREF_EN		BIT(0)
+#define DDRCTRL_PWRCTL_EN_DFI_DRAM_CLK_DISABLE	BIT(3)
+#define DDRCTRL_PWRCTL_SELFREF_SW		BIT(5)
+
+#define DDRCTRL_PWRTMG_SELFREF_TO_X32_MASK	(0xff << 16)
+#define DDRCTRL_PWRTMG_SELFREF_TO_X32_0		BIT(16)
+
+#define DDRCTRL_HWLPCTL_HW_LP_EN		BIT(0)
+
+#define DDRCTRL_DFIMISC_DFI_INIT_COMPLETE_EN	BIT(0)
+
+#define DDRCTRL_SWCTL_SW_DONE			BIT(0)
+
+#define DDRCTRL_SWSTAT_SW_DONE_ACK		BIT(0)
+
+#define DDRCTRL_PSTAT_RD_PORT_BUSY_0		BIT(0)
+#define DDRCTRL_PSTAT_RD_PORT_BUSY_1		BIT(1)
+#define DDRCTRL_PSTAT_WR_PORT_BUSY_0		BIT(16)
+#define DDRCTRL_PSTAT_WR_PORT_BUSY_1		BIT(17)
+
+#define DDRCTRL_PCTRL_N_PORT_EN			BIT(0)
+
+/* DDR PHY registers offsets */
+#define DDRPHYC_PIR				0x004
+#define DDRPHYC_PGSR				0x00C
+#define DDRPHYC_ACDLLCR				0x014
+#define DDRPHYC_ACIOCR				0x024
+#define DDRPHYC_DXCCR				0x028
+#define DDRPHYC_DSGCR				0x02C
+#define DDRPHYC_ZQ0CR0				0x180
+#define DDRPHYC_DX0DLLCR			0x1CC
+#define DDRPHYC_DX1DLLCR			0x20C
+#define DDRPHYC_DX2DLLCR			0x24C
+#define DDRPHYC_DX3DLLCR			0x28C
+
+/* DDR PHY Register fields */
+#define DDRPHYC_PIR_INIT			BIT(0)
+#define DDRPHYC_PIR_DLLSRST			BIT(1)
+#define DDRPHYC_PIR_DLLLOCK			BIT(2)
+#define DDRPHYC_PIR_ITMSRST			BIT(4)
+
+#define DDRPHYC_PGSR_IDONE			BIT(0)
+
+#define DDRPHYC_ACDLLCR_DLLSRST			BIT(30)
+#define DDRPHYC_ACDLLCR_DLLDIS			BIT(31)
+
+#define DDRPHYC_ACIOCR_ACOE			BIT(1)
+#define DDRPHYC_ACIOCR_ACPDD			BIT(3)
+#define DDRPHYC_ACIOCR_ACPDR			BIT(4)
+#define DDRPHYC_ACIOCR_CKPDD_MASK		(0x7 << 8)
+#define DDRPHYC_ACIOCR_CKPDD_0			BIT(8)
+#define DDRPHYC_ACIOCR_CKPDR_MASK		(0x7 << 11)
+#define DDRPHYC_ACIOCR_CKPDR_0			BIT(11)
+#define DDRPHYC_ACIOCR_CSPDD_MASK		(0x7 << 18)
+#define DDRPHYC_ACIOCR_CSPDD_0			BIT(18)
+
+#define DDRPHYC_DXCCR_DXPDD			BIT(2)
+#define DDRPHYC_DXCCR_DXPDR			BIT(3)
+
+#define DDRPHYC_DSGCR_CKEPDD_MASK		(0xf << 16)
+#define DDRPHYC_DSGCR_CKEPDD_0			BIT(16)
+#define DDRPHYC_DSGCR_ODTPDD_MASK		(0xf << 20)
+#define DDRPHYC_DSGCR_ODTPDD_0			BIT(20)
+#define DDRPHYC_DSGCR_NL2PD			BIT(24)
+#define DDRPHYC_DSGCR_CKOE			BIT(28)
+
+#define DDRPHYC_ZQ0CRN_ZQPD			BIT(31)
+
+#define DDRPHYC_DXNDLLCR_DLLDIS			BIT(31)
+
 #define BOOT_API_A7_CORE0_MAGIC_NUMBER	0xCA7FACE0
 #define BOOT_API_A7_CORE1_MAGIC_NUMBER	0xCA7FACE1
 
@@ -98,6 +231,7 @@ s32 __secure psci_features(u32 function_id, u32 psci_fid)
 	case ARM_PSCI_0_2_FN_MIGRATE_INFO_TYPE:
 	case ARM_PSCI_0_2_FN_SYSTEM_OFF:
 	case ARM_PSCI_0_2_FN_SYSTEM_RESET:
+	case ARM_PSCI_1_0_FN_SYSTEM_SUSPEND:
 		return 0x0;
 	}
 	return ARM_PSCI_RET_NI;
@@ -222,3 +356,350 @@ void __secure psci_system_off(void)
 	while (1)
 		wfi();
 }
+
+static void __secure secure_udelay(unsigned int delay)
+{
+	/* This counts instructions, at 800 MHz, 1us = 800 instructions */
+	asm volatile(
+		"1:	subs	%0, #1\n"
+		"	bne	1b\n"
+	::"r"(delay * 800 / 2));
+}
+
+static int __secure secure_waitbits(u32 reg, u32 mask, u32 val)
+{
+	/* ~500 us worth of 6-opcode long cycles at 800 MHz */
+	unsigned int loopcount = 500;
+	u32 tmp;
+
+	while (loopcount--) {
+		tmp = readl(reg);
+		tmp &= mask;
+		if ((tmp & val) == val)
+			return 0;
+	}
+
+	return -ETIMEDOUT;
+}
+
+static void __secure ddr_sr_mode_ssr(void)
+{
+	setbits_le32(STM32_RCC_BASE + RCC_DDRITFCR,
+		     RCC_DDRITFCR_DDRC1LPEN | RCC_DDRITFCR_DDRC1EN |
+		     RCC_DDRITFCR_DDRC2LPEN | RCC_DDRITFCR_DDRC2EN |
+		     RCC_DDRITFCR_DDRCAPBLPEN | RCC_DDRITFCR_DDRPHYCAPBLPEN |
+		     RCC_DDRITFCR_DDRCAPBEN | RCC_DDRITFCR_DDRPHYCAPBEN |
+		     RCC_DDRITFCR_DDRPHYCEN);
+
+	clrbits_le32(STM32_RCC_BASE + RCC_DDRITFCR,
+		     RCC_DDRITFCR_AXIDCGEN | RCC_DDRITFCR_DDRCKMOD_MASK);
+
+	/* Disable HW LP interface of uMCTL2 */
+	clrbits_le32(STM32_DDRCTRL_BASE + DDRCTRL_HWLPCTL,
+		     DDRCTRL_HWLPCTL_HW_LP_EN);
+
+	/* Configure Automatic LP modes of uMCTL2 */
+	clrsetbits_le32(STM32_DDRCTRL_BASE + DDRCTRL_PWRTMG,
+			DDRCTRL_PWRTMG_SELFREF_TO_X32_MASK,
+			DDRCTRL_PWRTMG_SELFREF_TO_X32_0);
+
+	/*
+	 * Disable Clock disable with LP modes
+	 * (used in RUN mode for LPDDR2 with specific timing).
+	 */
+	clrbits_le32(STM32_DDRCTRL_BASE + DDRCTRL_PWRCTL,
+		     DDRCTRL_PWRCTL_EN_DFI_DRAM_CLK_DISABLE);
+
+	/* Disable automatic Self-Refresh mode */
+	clrbits_le32(STM32_DDRCTRL_BASE + DDRCTRL_PWRCTL,
+		     DDRCTRL_PWRCTL_SELFREF_EN);
+}
+
+static int __secure ddr_sw_self_refresh_in(void)
+{
+	int ret;
+
+	clrbits_le32(STM32_RCC_BASE + RCC_DDRITFCR, RCC_DDRITFCR_AXIDCGEN);
+
+	/* Blocks AXI ports from taking anymore transactions */
+	clrbits_le32(STM32_DDRCTRL_BASE + DDRCTRL_PCTRL_0,
+		     DDRCTRL_PCTRL_N_PORT_EN);
+	clrbits_le32(STM32_DDRCTRL_BASE + DDRCTRL_PCTRL_1,
+		     DDRCTRL_PCTRL_N_PORT_EN);
+
+	/*
+	 * Waits unit all AXI ports are idle
+	 * Poll PSTAT.rd_port_busy_n = 0
+	 * Poll PSTAT.wr_port_busy_n = 0
+	 */
+	ret = secure_waitbits(STM32_DDRCTRL_BASE + DDRCTRL_PSTAT,
+			      DDRCTRL_PSTAT_RD_PORT_BUSY_0 |
+			      DDRCTRL_PSTAT_RD_PORT_BUSY_1 |
+			      DDRCTRL_PSTAT_WR_PORT_BUSY_0 |
+			      DDRCTRL_PSTAT_WR_PORT_BUSY_1, 0);
+	if (ret)
+		goto pstat_failed;
+
+	/* SW Self-Refresh entry */
+	setbits_le32(STM32_DDRCTRL_BASE + DDRCTRL_PWRCTL, DDRCTRL_PWRCTL_SELFREF_SW);
+
+	/*
+	 * Wait operating mode change in self-refresh mode
+	 * with STAT.operating_mode[1:0]==11.
+	 * Ensure transition to self-refresh was due to software
+	 * by checking also that STAT.selfref_type[1:0]=2.
+	 */
+	ret = secure_waitbits(STM32_DDRCTRL_BASE + DDRCTRL_STAT,
+			      DDRCTRL_STAT_OPERATING_MODE_MASK |
+			      DDRCTRL_STAT_SELFREF_TYPE_MASK,
+			      DDRCTRL_STAT_OPERATING_MODE_SR |
+			      DDRCTRL_STAT_SELFREF_TYPE_SR);
+	if (ret)
+		goto selfref_sw_failed;
+
+	/* IOs powering down (PUBL registers) */
+	setbits_le32(STM32_DDRPHYC_BASE + DDRPHYC_ACIOCR, DDRPHYC_ACIOCR_ACPDD);
+	setbits_le32(STM32_DDRPHYC_BASE + DDRPHYC_ACIOCR, DDRPHYC_ACIOCR_ACPDR);
+
+	clrsetbits_le32(STM32_DDRPHYC_BASE + DDRPHYC_ACIOCR,
+			DDRPHYC_ACIOCR_CKPDD_MASK,
+			DDRPHYC_ACIOCR_CKPDD_0);
+
+	clrsetbits_le32(STM32_DDRPHYC_BASE + DDRPHYC_ACIOCR,
+			DDRPHYC_ACIOCR_CKPDR_MASK,
+			DDRPHYC_ACIOCR_CKPDR_0);
+
+	clrsetbits_le32(STM32_DDRPHYC_BASE + DDRPHYC_ACIOCR,
+			DDRPHYC_ACIOCR_CSPDD_MASK,
+			DDRPHYC_ACIOCR_CSPDD_0);
+
+	/* Disable command/address output driver */
+	clrbits_le32(STM32_DDRPHYC_BASE + DDRPHYC_ACIOCR, DDRPHYC_ACIOCR_ACOE);
+
+	setbits_le32(STM32_DDRPHYC_BASE + DDRPHYC_DXCCR, DDRPHYC_DXCCR_DXPDD);
+
+	setbits_le32(STM32_DDRPHYC_BASE + DDRPHYC_DXCCR, DDRPHYC_DXCCR_DXPDR);
+
+	clrsetbits_le32(STM32_DDRPHYC_BASE + DDRPHYC_DSGCR,
+			DDRPHYC_DSGCR_ODTPDD_MASK,
+			DDRPHYC_DSGCR_ODTPDD_0);
+
+	setbits_le32(STM32_DDRPHYC_BASE + DDRPHYC_DSGCR, DDRPHYC_DSGCR_NL2PD);
+
+	clrsetbits_le32(STM32_DDRPHYC_BASE + DDRPHYC_DSGCR,
+			DDRPHYC_DSGCR_CKEPDD_MASK,
+			DDRPHYC_DSGCR_CKEPDD_0);
+
+	/* Disable PZQ cell (PUBL register) */
+	setbits_le32(STM32_DDRPHYC_BASE + DDRPHYC_ZQ0CR0, DDRPHYC_ZQ0CRN_ZQPD);
+
+	/* Set latch */
+	clrbits_le32(STM32_DDRPHYC_BASE + DDRPHYC_DSGCR, DDRPHYC_DSGCR_CKOE);
+
+	/* Additional delay to avoid early latch */
+	secure_udelay(10);
+
+	/* Activate sw retention in PWRCTRL */
+	setbits_le32(STM32_PWR_BASE + PWR_CR3, PWR_CR3_DDRRETEN);
+
+	/* Switch controller clocks (uMCTL2/PUBL) to DLL ref clock */
+	setbits_le32(STM32_RCC_BASE + RCC_DDRITFCR, RCC_DDRITFCR_GSKPCTRL);
+
+	/* Disable all DLLs: GLITCH window */
+	setbits_le32(STM32_DDRPHYC_BASE + DDRPHYC_ACDLLCR, DDRPHYC_ACDLLCR_DLLDIS);
+
+	setbits_le32(STM32_DDRPHYC_BASE + DDRPHYC_DX0DLLCR, DDRPHYC_DXNDLLCR_DLLDIS);
+
+	setbits_le32(STM32_DDRPHYC_BASE + DDRPHYC_DX1DLLCR, DDRPHYC_DXNDLLCR_DLLDIS);
+
+	setbits_le32(STM32_DDRPHYC_BASE + DDRPHYC_DX2DLLCR, DDRPHYC_DXNDLLCR_DLLDIS);
+
+	setbits_le32(STM32_DDRPHYC_BASE + DDRPHYC_DX3DLLCR, DDRPHYC_DXNDLLCR_DLLDIS);
+
+	/* Switch controller clocks (uMCTL2/PUBL) to DLL output clock */
+	clrbits_le32(STM32_RCC_BASE + RCC_DDRITFCR, RCC_DDRITFCR_GSKPCTRL);
+
+	/* Deactivate all DDR clocks */
+	clrbits_le32(STM32_RCC_BASE + RCC_DDRITFCR,
+		     RCC_DDRITFCR_DDRC1EN | RCC_DDRITFCR_DDRC2EN |
+		     RCC_DDRITFCR_DDRCAPBEN | RCC_DDRITFCR_DDRPHYCAPBEN);
+
+	return 0;
+
+selfref_sw_failed:
+	/* This bit should be cleared to restore DDR in its previous state */
+	clrbits_le32(STM32_DDRCTRL_BASE + DDRCTRL_PWRCTL,
+		     DDRCTRL_PWRCTL_SELFREF_SW);
+
+pstat_failed:
+	setbits_le32(STM32_DDRCTRL_BASE + DDRCTRL_PCTRL_0,
+		     DDRCTRL_PCTRL_N_PORT_EN);
+	setbits_le32(STM32_DDRCTRL_BASE + DDRCTRL_PCTRL_1,
+		     DDRCTRL_PCTRL_N_PORT_EN);
+
+	return -EINVAL;
+};
+
+static void __secure ddr_sw_self_refresh_exit(void)
+{
+	int ret;
+
+	/* Enable all clocks */
+	setbits_le32(STM32_RCC_BASE + RCC_DDRITFCR,
+		     RCC_DDRITFCR_DDRC1EN | RCC_DDRITFCR_DDRC2EN |
+		     RCC_DDRITFCR_DDRPHYCEN | RCC_DDRITFCR_DDRPHYCAPBEN |
+		     RCC_DDRITFCR_DDRCAPBEN);
+
+	/* Handshake */
+	clrbits_le32(STM32_DDRCTRL_BASE + DDRCTRL_SWCTL, DDRCTRL_SWCTL_SW_DONE);
+
+	/* Mask dfi_init_complete_en */
+	clrbits_le32(STM32_DDRCTRL_BASE + DDRCTRL_DFIMISC,
+		     DDRCTRL_DFIMISC_DFI_INIT_COMPLETE_EN);
+
+	/* Ack */
+	setbits_le32(STM32_DDRCTRL_BASE + DDRCTRL_SWCTL, DDRCTRL_SWCTL_SW_DONE);
+	ret = secure_waitbits(STM32_DDRCTRL_BASE + DDRCTRL_SWSTAT,
+			      DDRCTRL_SWSTAT_SW_DONE_ACK,
+			      DDRCTRL_SWSTAT_SW_DONE_ACK);
+	if (ret)
+		hang();
+
+	/* Switch controller clocks (uMCTL2/PUBL) to DLL ref clock */
+	setbits_le32(STM32_RCC_BASE + RCC_DDRITFCR, RCC_DDRITFCR_GSKPCTRL);
+
+	/* Enable all DLLs: GLITCH window */
+	clrbits_le32(STM32_DDRPHYC_BASE + DDRPHYC_ACDLLCR,
+		     DDRPHYC_ACDLLCR_DLLDIS);
+
+	clrbits_le32(STM32_DDRPHYC_BASE + DDRPHYC_DX0DLLCR, DDRPHYC_DXNDLLCR_DLLDIS);
+
+	clrbits_le32(STM32_DDRPHYC_BASE + DDRPHYC_DX1DLLCR, DDRPHYC_DXNDLLCR_DLLDIS);
+
+	clrbits_le32(STM32_DDRPHYC_BASE + DDRPHYC_DX2DLLCR, DDRPHYC_DXNDLLCR_DLLDIS);
+
+	clrbits_le32(STM32_DDRPHYC_BASE + DDRPHYC_DX3DLLCR, DDRPHYC_DXNDLLCR_DLLDIS);
+
+	/* Additional delay to avoid early DLL clock switch */
+	secure_udelay(50);
+
+	/* Switch controller clocks (uMCTL2/PUBL) to DLL ref clock */
+	clrbits_le32(STM32_RCC_BASE + RCC_DDRITFCR, RCC_DDRITFCR_GSKPCTRL);
+
+	clrbits_le32(STM32_DDRPHYC_BASE + DDRPHYC_ACDLLCR, DDRPHYC_ACDLLCR_DLLSRST);
+
+	secure_udelay(10);
+
+	setbits_le32(STM32_DDRPHYC_BASE + DDRPHYC_ACDLLCR, DDRPHYC_ACDLLCR_DLLSRST);
+
+	/* PHY partial init: (DLL lock and ITM reset) */
+	writel(DDRPHYC_PIR_DLLSRST | DDRPHYC_PIR_DLLLOCK |
+	       DDRPHYC_PIR_ITMSRST | DDRPHYC_PIR_INIT,
+	       STM32_DDRPHYC_BASE + DDRPHYC_PIR);
+
+	/* Need to wait at least 10 clock cycles before accessing PGSR */
+	secure_udelay(1);
+
+	/* Pool end of init */
+	ret = secure_waitbits(STM32_DDRPHYC_BASE + DDRPHYC_PGSR,
+			      DDRPHYC_PGSR_IDONE, DDRPHYC_PGSR_IDONE);
+	if (ret)
+		hang();
+
+	/* Handshake */
+	clrbits_le32(STM32_DDRCTRL_BASE + DDRCTRL_SWCTL, DDRCTRL_SWCTL_SW_DONE);
+
+	/* Unmask dfi_init_complete_en to uMCTL2 */
+	setbits_le32(STM32_DDRCTRL_BASE + DDRCTRL_DFIMISC, DDRCTRL_DFIMISC_DFI_INIT_COMPLETE_EN);
+
+	/* Ack */
+	setbits_le32(STM32_DDRCTRL_BASE + DDRCTRL_SWCTL, DDRCTRL_SWCTL_SW_DONE);
+	ret = secure_waitbits(STM32_DDRCTRL_BASE + DDRCTRL_SWSTAT,
+			      DDRCTRL_SWSTAT_SW_DONE_ACK,
+			      DDRCTRL_SWSTAT_SW_DONE_ACK);
+	if (ret)
+		hang();
+
+	/* Deactivate sw retention in PWR */
+	clrbits_le32(STM32_PWR_BASE + PWR_CR3, PWR_CR3_DDRRETEN);
+
+	/* Enable PZQ cell (PUBL register) */
+	clrbits_le32(STM32_DDRPHYC_BASE + DDRPHYC_ZQ0CR0, DDRPHYC_ZQ0CRN_ZQPD);
+
+	/* Enable pad drivers */
+	clrbits_le32(STM32_DDRPHYC_BASE + DDRPHYC_ACIOCR, DDRPHYC_ACIOCR_ACPDD);
+
+	/* Enable command/address output driver */
+	setbits_le32(STM32_DDRPHYC_BASE + DDRPHYC_ACIOCR, DDRPHYC_ACIOCR_ACOE);
+
+	clrbits_le32(STM32_DDRPHYC_BASE + DDRPHYC_ACIOCR, DDRPHYC_ACIOCR_CKPDD_MASK);
+
+	clrbits_le32(STM32_DDRPHYC_BASE + DDRPHYC_ACIOCR, DDRPHYC_ACIOCR_CSPDD_MASK);
+
+	clrbits_le32(STM32_DDRPHYC_BASE + DDRPHYC_DXCCR, DDRPHYC_DXCCR_DXPDD);
+
+	clrbits_le32(STM32_DDRPHYC_BASE + DDRPHYC_DXCCR, DDRPHYC_DXCCR_DXPDR);
+
+	/* Release latch */
+	setbits_le32(STM32_DDRPHYC_BASE + DDRPHYC_DSGCR, DDRPHYC_DSGCR_CKOE);
+
+	clrbits_le32(STM32_DDRPHYC_BASE + DDRPHYC_DSGCR, DDRPHYC_DSGCR_ODTPDD_MASK);
+
+	clrbits_le32(STM32_DDRPHYC_BASE + DDRPHYC_DSGCR, DDRPHYC_DSGCR_NL2PD);
+
+	clrbits_le32(STM32_DDRPHYC_BASE + DDRPHYC_DSGCR, DDRPHYC_DSGCR_CKEPDD_MASK);
+
+	/* Remove selfrefresh */
+	clrbits_le32(STM32_DDRCTRL_BASE + DDRCTRL_PWRCTL, DDRCTRL_PWRCTL_SELFREF_SW);
+
+	/* Wait operating_mode == normal */
+	ret = secure_waitbits(STM32_DDRCTRL_BASE + DDRCTRL_STAT,
+			      DDRCTRL_STAT_OPERATING_MODE_MASK,
+			      DDRCTRL_STAT_OPERATING_MODE_NORMAL);
+	if (ret)
+		hang();
+
+	/* AXI ports are no longer blocked from taking transactions */
+	setbits_le32(STM32_DDRCTRL_BASE + DDRCTRL_PCTRL_0, DDRCTRL_PCTRL_N_PORT_EN);
+	setbits_le32(STM32_DDRCTRL_BASE + DDRCTRL_PCTRL_1, DDRCTRL_PCTRL_N_PORT_EN);
+
+	setbits_le32(STM32_RCC_BASE + RCC_DDRITFCR, RCC_DDRITFCR_AXIDCGEN);
+}
+
+void __secure psci_system_suspend(u32 __always_unused function_id,
+				  u32 ep, u32 context_id)
+{
+	u32 reg;
+
+	/* Place current APSRC/ANSRC into RAPSRC/RANSRC */
+	reg = readl(STM32_SYSCFG_BASE + SYSCFG_CMPCR);
+	reg >>= 8;
+	reg &= 0xff << 16;
+	reg |= SYSCFG_CMPCR_SW_CTRL;
+	writel(reg, STM32_SYSCFG_BASE + SYSCFG_CMPCR);
+	writel(SYSCFG_CMPCR_MPUEN, STM32_SYSCFG_BASE + SYSCFG_CMPENCLRR);
+
+	writel(RCC_MP_CIFR_WKUPF, STM32_RCC_BASE + RCC_MP_CIFR);
+	setbits_le32(STM32_RCC_BASE + RCC_MP_CIER, RCC_MP_CIFR_WKUPF);
+
+	setbits_le32(STM32_PWR_BASE + PWR_MPUCR,
+		     PWR_MPUCR_CSSF | PWR_MPUCR_CSTDBYDIS | PWR_MPUCR_PDDS);
+
+	psci_v7_flush_dcache_all();
+	ddr_sr_mode_ssr();
+	ddr_sw_self_refresh_in();
+	setbits_le32(STM32_PWR_BASE + PWR_CR3, PWR_CR3_DDRSREN);
+	writel(0x3, STM32_RCC_BASE + RCC_MP_SREQSETR);
+
+	/* Zzz, enter stop mode */
+	asm volatile(
+		"wfi\n"
+		"isb\n"
+		"dsb\n");
+
+	writel(0x3, STM32_RCC_BASE + RCC_MP_SREQCLRR);
+	ddr_sw_self_refresh_exit();
+
+	writel(SYSCFG_CMPCR_MPUEN, STM32_SYSCFG_BASE + SYSCFG_CMPENSETR);
+	clrbits_le32(STM32_SYSCFG_BASE + SYSCFG_CMPCR, SYSCFG_CMPCR_SW_CTRL);
+}
-- 
2.34.1


^ permalink raw reply related	[flat|nested] 3+ messages in thread

* Re: [PATCH] stm32mp: psci: Implement PSCI system suspend and DRAM SSR
  2022-02-02 11:52 [PATCH] stm32mp: psci: Implement PSCI system suspend and DRAM SSR Marek Vasut
@ 2022-02-10 19:20 ` Patrick DELAUNAY
  2022-02-21 20:02   ` Marek Vasut
  0 siblings, 1 reply; 3+ messages in thread
From: Patrick DELAUNAY @ 2022-02-10 19:20 UTC (permalink / raw)
  To: Marek Vasut, u-boot; +Cc: Patrice Chotard

Hi,

On 2/2/22 12:52, Marek Vasut wrote:
> Implement PSCI system suspend and placement of DRAM into SSR while the
> CPUs are in suspend. This saves non-trivial amount of power in suspend,
> on 2x W632GU6NB-15 ~710mW.
>
> Signed-off-by: Marek Vasut <marex@denx.de>
> Cc: Patrick Delaunay <patrick.delaunay@foss.st.com>
> Cc: Patrice Chotard <patrice.chotard@foss.st.com>
> ---
>   arch/arm/mach-stm32mp/include/mach/stm32.h |   3 +
>   arch/arm/mach-stm32mp/psci.c               | 481 +++++++++++++++++++++
>   2 files changed, 484 insertions(+)
>
> diff --git a/arch/arm/mach-stm32mp/include/mach/stm32.h b/arch/arm/mach-stm32mp/include/mach/stm32.h
> index c11a9903f20..47e88fc3dcd 100644
> --- a/arch/arm/mach-stm32mp/include/mach/stm32.h
> +++ b/arch/arm/mach-stm32mp/include/mach/stm32.h
> @@ -16,8 +16,11 @@
>    */
>   #define STM32_RCC_BASE			0x50000000
>   #define STM32_PWR_BASE			0x50001000
> +#define STM32_SYSCFG_BASE		0x50020000
>   #define STM32_DBGMCU_BASE		0x50081000
>   #define STM32_FMC2_BASE			0x58002000
> +#define STM32_DDRCTRL_BASE		0x5A003000
> +#define STM32_DDRPHYC_BASE		0x5A004000
>   #define STM32_TZC_BASE			0x5C006000
>   #define STM32_ETZPC_BASE		0x5C007000
>   #define STM32_STGEN_BASE		0x5C008000
> diff --git a/arch/arm/mach-stm32mp/psci.c b/arch/arm/mach-stm32mp/psci.c
> index 155aa79cd5e..7be34054f6b 100644
> --- a/arch/arm/mach-stm32mp/psci.c
> +++ b/arch/arm/mach-stm32mp/psci.c
> @@ -11,8 +11,141 @@
>   #include <asm/io.h>
>   #include <asm/psci.h>
>   #include <asm/secure.h>
> +#include <hang.h>
>   #include <linux/bitops.h>
>   
> +/* PWR */
> +#define PWR_CR3					0x0c
s/0c/0C/
> +#define PWR_MPUCR				0x10
> +
> +#define PWR_CR3_DDRRETEN			BIT(12)
> +#define PWR_CR3_DDRSREN				BIT(10)

bit order

+#define PWR_CR3_DDRSREN				BIT(10)
+#define PWR_CR3_DDRRETEN			BIT(12)


> +
> +#define PWR_MPUCR_PDDS				BIT(0)
> +#define PWR_MPUCR_CSTDBYDIS			BIT(3)
> +#define PWR_MPUCR_CSSF				BIT(9)
> +
> +/* RCC */
> +#define RCC_DDRITFCR				0xd8
s/d8/D8/
> +
> +#define RCC_DDRITFCR_DDRC1EN			BIT(0)
> +#define RCC_DDRITFCR_DDRC1LPEN			BIT(1)
> +#define RCC_DDRITFCR_DDRC2EN			BIT(2)
> +#define RCC_DDRITFCR_DDRC2LPEN			BIT(3)
> +#define RCC_DDRITFCR_DDRPHYCEN			BIT(4)
> +#define RCC_DDRITFCR_DDRPHYCLPEN		BIT(5)
> +#define RCC_DDRITFCR_DDRCAPBEN			BIT(6)
> +#define RCC_DDRITFCR_DDRCAPBLPEN		BIT(7)
> +#define RCC_DDRITFCR_AXIDCGEN			BIT(8)
> +#define RCC_DDRITFCR_DDRPHYCAPBEN		BIT(9)
> +#define RCC_DDRITFCR_DDRPHYCAPBLPEN		BIT(10)
> +#define RCC_DDRITFCR_DDRCKMOD_MASK		(0x7 << 20)
GENMASK(22, 20)
> +#define RCC_DDRITFCR_GSKPCTRL			BIT(24)
> +
> +#define RCC_MP_SREQSETR				0x104
> +#define RCC_MP_SREQCLRR				0x108
> +
> +#define RCC_MP_CIER				0x414
> +#define RCC_MP_CIFR				0x418
> +#define RCC_MP_CIFR_WKUPF			BIT(20)
> +
> +/* SYSCFG */
> +#define SYSCFG_CMPCR				0x20
> +#define SYSCFG_CMPCR_MPUEN			BIT(0)

'MPUEN' bit is not in SYSCFG_CMPCR register but in CMPENSETR/CLRR


+#define SYSCFG_CMPENSETR_MPU_EN            BIT(0)

> +#define SYSCFG_CMPCR_SW_CTRL			BIT(2)
> +#define SYSCFG_CMPENSETR			0x24
> +#define SYSCFG_CMPENCLRR			0x28
> +
> +/* DDR Controller registers offsets */
> +#define DDRCTRL_STAT				0x004
> +#define DDRCTRL_PWRCTL				0x030
> +#define DDRCTRL_PWRTMG				0x034
> +#define DDRCTRL_HWLPCTL				0x038
> +#define DDRCTRL_DFIMISC				0x1B0
> +#define DDRCTRL_SWCTL				0x320
> +#define DDRCTRL_SWSTAT				0x324
> +#define DDRCTRL_PSTAT				0x3FC
> +#define DDRCTRL_PCTRL_0				0x490
> +#define DDRCTRL_PCTRL_1				0x540
> +
> +/* DDR Controller Register fields */
> +#define DDRCTRL_STAT_OPERATING_MODE_MASK	0x7
GENMASK(2, 0)
> +#define DDRCTRL_STAT_OPERATING_MODE_NORMAL	0x1
> +#define DDRCTRL_STAT_OPERATING_MODE_SR		0x3
> +#define DDRCTRL_STAT_SELFREF_TYPE_MASK		(0x3 << 4)
GENMASK(5, 4)
> +#define DDRCTRL_STAT_SELFREF_TYPE_ASR		(0x3 << 4)
> +#define DDRCTRL_STAT_SELFREF_TYPE_SR		(0x2 << 4)
> +
> +#define DDRCTRL_PWRCTL_SELFREF_EN		BIT(0)
> +#define DDRCTRL_PWRCTL_EN_DFI_DRAM_CLK_DISABLE	BIT(3)
> +#define DDRCTRL_PWRCTL_SELFREF_SW		BIT(5)
> +
> +#define DDRCTRL_PWRTMG_SELFREF_TO_X32_MASK	(0xff << 16)
GENMASK(23, 16)
> +#define DDRCTRL_PWRTMG_SELFREF_TO_X32_0		BIT(16)
> +
> +#define DDRCTRL_HWLPCTL_HW_LP_EN		BIT(0)
> +
> +#define DDRCTRL_DFIMISC_DFI_INIT_COMPLETE_EN	BIT(0)
> +
> +#define DDRCTRL_SWCTL_SW_DONE			BIT(0)
> +
> +#define DDRCTRL_SWSTAT_SW_DONE_ACK		BIT(0)
> +
> +#define DDRCTRL_PSTAT_RD_PORT_BUSY_0		BIT(0)
> +#define DDRCTRL_PSTAT_RD_PORT_BUSY_1		BIT(1)
> +#define DDRCTRL_PSTAT_WR_PORT_BUSY_0		BIT(16)
> +#define DDRCTRL_PSTAT_WR_PORT_BUSY_1		BIT(17)
> +
> +#define DDRCTRL_PCTRL_N_PORT_EN			BIT(0)
> +
> +/* DDR PHY registers offsets */
> +#define DDRPHYC_PIR				0x004
> +#define DDRPHYC_PGSR				0x00C
> +#define DDRPHYC_ACDLLCR				0x014
> +#define DDRPHYC_ACIOCR				0x024
> +#define DDRPHYC_DXCCR				0x028
> +#define DDRPHYC_DSGCR				0x02C
> +#define DDRPHYC_ZQ0CR0				0x180
> +#define DDRPHYC_DX0DLLCR			0x1CC
> +#define DDRPHYC_DX1DLLCR			0x20C
> +#define DDRPHYC_DX2DLLCR			0x24C
> +#define DDRPHYC_DX3DLLCR			0x28C
> +
> +/* DDR PHY Register fields */
> +#define DDRPHYC_PIR_INIT			BIT(0)
> +#define DDRPHYC_PIR_DLLSRST			BIT(1)
> +#define DDRPHYC_PIR_DLLLOCK			BIT(2)
> +#define DDRPHYC_PIR_ITMSRST			BIT(4)
> +
> +#define DDRPHYC_PGSR_IDONE			BIT(0)
> +
> +#define DDRPHYC_ACDLLCR_DLLSRST			BIT(30)
> +#define DDRPHYC_ACDLLCR_DLLDIS			BIT(31)
> +
> +#define DDRPHYC_ACIOCR_ACOE			BIT(1)
> +#define DDRPHYC_ACIOCR_ACPDD			BIT(3)
> +#define DDRPHYC_ACIOCR_ACPDR			BIT(4)
> +#define DDRPHYC_ACIOCR_CKPDD_MASK		(0x7 << 8)
GENMASK(10, 8)
> +#define DDRPHYC_ACIOCR_CKPDD_0			BIT(8)
> +#define DDRPHYC_ACIOCR_CKPDR_MASK		(0x7 << 11)
GENMASK(13, 11)
> +#define DDRPHYC_ACIOCR_CKPDR_0			BIT(11)
> +#define DDRPHYC_ACIOCR_CSPDD_MASK		(0x7 << 18)
GENMASK(21, 18
> +#define DDRPHYC_ACIOCR_CSPDD_0			BIT(18)
> +
> +#define DDRPHYC_DXCCR_DXPDD			BIT(2)
> +#define DDRPHYC_DXCCR_DXPDR			BIT(3)
> +
> +#define DDRPHYC_DSGCR_CKEPDD_MASK		(0xf << 16)
GENMASK(19, 16)
> +#define DDRPHYC_DSGCR_CKEPDD_0			BIT(16)
> +#define DDRPHYC_DSGCR_ODTPDD_MASK		(0xf << 20)
GENMASK(23, 20)
> +#define DDRPHYC_DSGCR_ODTPDD_0			BIT(20)
> +#define DDRPHYC_DSGCR_NL2PD			BIT(24)
> +#define DDRPHYC_DSGCR_CKOE			BIT(28)
> +
> +#define DDRPHYC_ZQ0CRN_ZQPD			BIT(31)
> +
> +#define DDRPHYC_DXNDLLCR_DLLDIS			BIT(31)
> +
>   #define BOOT_API_A7_CORE0_MAGIC_NUMBER	0xCA7FACE0
>   #define BOOT_API_A7_CORE1_MAGIC_NUMBER	0xCA7FACE1
>   
> @@ -98,6 +231,7 @@ s32 __secure psci_features(u32 function_id, u32 psci_fid)
>   	case ARM_PSCI_0_2_FN_MIGRATE_INFO_TYPE:
>   	case ARM_PSCI_0_2_FN_SYSTEM_OFF:
>   	case ARM_PSCI_0_2_FN_SYSTEM_RESET:
> +	case ARM_PSCI_1_0_FN_SYSTEM_SUSPEND:
>   		return 0x0;
>   	}
>   	return ARM_PSCI_RET_NI;
> @@ -222,3 +356,350 @@ void __secure psci_system_off(void)
>   	while (1)
>   		wfi();
>   }
> +
> +static void __secure secure_udelay(unsigned int delay)
> +{
> +	/* This counts instructions, at 800 MHz, 1us = 800 instructions */
> +	asm volatile(
> +		"1:	subs	%0, #1\n"
> +		"	bne	1b\n"
> +	::"r"(delay * 800 / 2));
> +}

STM32MP15 frequency can be 800 or 650 MHz

CP15 Generic timer is more precise => STM32MP U-Boot use it

- arch/arm/cpu/armv7/arch_timer.c => read_cntfrq() / get_ticks()

- lib/time.c => __udelay use the previous fucntion

I think you can use it here from (as arch/arm/mach-imx/mx7/psci-mx7.c)

#define time_after(&,b)	((long)((b) - (a)) < 0))


static void __secure secure_udelay(unsigned int delay)

{

     u32 freq;
     u64 start, end, now;


     asm volatile("mrc p15, 0, %0, c14, c0, 0" : "=r" (freq));
     asm volatile("mrrc p15, 0, %Q0, %R0, c14" : "=r" (start));

     end = start + delay * (freq / 1000000);

     do {
         asm volatile("mrrc p15, 0, %Q0, %R0, c14" : "=r" (now));
         if (time_after(now, end))
             break;
     } while (1);
}




> +
> +static int __secure secure_waitbits(u32 reg, u32 mask, u32 val)
> +{
> +	/* ~500 us worth of 6-opcode long cycles at 800 MHz */
> +	unsigned int loopcount = 500;
> +	u32 tmp;
> +
> +	while (loopcount--) {
> +		tmp = readl(reg);
> +		tmp &= mask;
> +		if ((tmp & val) == val)
> +			return 0;
> +	}
> +
> +	return -ETIMEDOUT;
> +}

same here :

static u64 __secure secure_timer_get_us(void)

{

     u32 freq;
     u64 time;


     asm volatile("mrrc p15, 0, %Q0, %R0, c14" : "=r" (time));
     asm volatile("mrc p15, 0, %0, c14, c0, 0" : "=r" (freq));

     return time / (freq / 1000000);
}

static int __secure secure_waitbits(u32 reg, u32 mask, u32 val)
{
	u64 end = secure_timer_get_us() + 500;
	u32 tmp;

	do {
		tmp = readl(reg);
		tmp &= mask;
		if ((tmp & val) == val)
			return 0;
	} while (time_after(secure_timer_get_us(), end))

	return -ETIMEDOUT;
}

> +static void __secure ddr_sr_mode_ssr(void)
> +{
> +	setbits_le32(STM32_RCC_BASE + RCC_DDRITFCR,
> +		     RCC_DDRITFCR_DDRC1LPEN | RCC_DDRITFCR_DDRC1EN |
> +		     RCC_DDRITFCR_DDRC2LPEN | RCC_DDRITFCR_DDRC2EN |
> +		     RCC_DDRITFCR_DDRCAPBLPEN | RCC_DDRITFCR_DDRPHYCAPBLPEN |
> +		     RCC_DDRITFCR_DDRCAPBEN | RCC_DDRITFCR_DDRPHYCAPBEN |
> +		     RCC_DDRITFCR_DDRPHYCEN);
> +
> +	clrbits_le32(STM32_RCC_BASE + RCC_DDRITFCR,
> +		     RCC_DDRITFCR_AXIDCGEN | RCC_DDRITFCR_DDRCKMOD_MASK);
> +
> +	/* Disable HW LP interface of uMCTL2 */
> +	clrbits_le32(STM32_DDRCTRL_BASE + DDRCTRL_HWLPCTL,
> +		     DDRCTRL_HWLPCTL_HW_LP_EN);
> +
> +	/* Configure Automatic LP modes of uMCTL2 */
> +	clrsetbits_le32(STM32_DDRCTRL_BASE + DDRCTRL_PWRTMG,
> +			DDRCTRL_PWRTMG_SELFREF_TO_X32_MASK,
> +			DDRCTRL_PWRTMG_SELFREF_TO_X32_0);
> +
> +	/*
> +	 * Disable Clock disable with LP modes
> +	 * (used in RUN mode for LPDDR2 with specific timing).
> +	 */
> +	clrbits_le32(STM32_DDRCTRL_BASE + DDRCTRL_PWRCTL,
> +		     DDRCTRL_PWRCTL_EN_DFI_DRAM_CLK_DISABLE);
> +
> +	/* Disable automatic Self-Refresh mode */
> +	clrbits_le32(STM32_DDRCTRL_BASE + DDRCTRL_PWRCTL,
> +		     DDRCTRL_PWRCTL_SELFREF_EN);
> +}
> +
> +static int __secure ddr_sw_self_refresh_in(void)
> +{
> +	int ret;
> +
> +	clrbits_le32(STM32_RCC_BASE + RCC_DDRITFCR, RCC_DDRITFCR_AXIDCGEN);
> +
> +	/* Blocks AXI ports from taking anymore transactions */
> +	clrbits_le32(STM32_DDRCTRL_BASE + DDRCTRL_PCTRL_0,
> +		     DDRCTRL_PCTRL_N_PORT_EN);
> +	clrbits_le32(STM32_DDRCTRL_BASE + DDRCTRL_PCTRL_1,
> +		     DDRCTRL_PCTRL_N_PORT_EN);
> +
> +	/*
> +	 * Waits unit all AXI ports are idle
> +	 * Poll PSTAT.rd_port_busy_n = 0
> +	 * Poll PSTAT.wr_port_busy_n = 0
> +	 */
> +	ret = secure_waitbits(STM32_DDRCTRL_BASE + DDRCTRL_PSTAT,
> +			      DDRCTRL_PSTAT_RD_PORT_BUSY_0 |
> +			      DDRCTRL_PSTAT_RD_PORT_BUSY_1 |
> +			      DDRCTRL_PSTAT_WR_PORT_BUSY_0 |
> +			      DDRCTRL_PSTAT_WR_PORT_BUSY_1, 0);
> +	if (ret)
> +		goto pstat_failed;
> +
> +	/* SW Self-Refresh entry */
> +	setbits_le32(STM32_DDRCTRL_BASE + DDRCTRL_PWRCTL, DDRCTRL_PWRCTL_SELFREF_SW);
> +
> +	/*
> +	 * Wait operating mode change in self-refresh mode
> +	 * with STAT.operating_mode[1:0]==11.
> +	 * Ensure transition to self-refresh was due to software
> +	 * by checking also that STAT.selfref_type[1:0]=2.
> +	 */
> +	ret = secure_waitbits(STM32_DDRCTRL_BASE + DDRCTRL_STAT,
> +			      DDRCTRL_STAT_OPERATING_MODE_MASK |
> +			      DDRCTRL_STAT_SELFREF_TYPE_MASK,
> +			      DDRCTRL_STAT_OPERATING_MODE_SR |
> +			      DDRCTRL_STAT_SELFREF_TYPE_SR);
> +	if (ret)
> +		goto selfref_sw_failed;
> +
> +	/* IOs powering down (PUBL registers) */
> +	setbits_le32(STM32_DDRPHYC_BASE + DDRPHYC_ACIOCR, DDRPHYC_ACIOCR_ACPDD);
> +	setbits_le32(STM32_DDRPHYC_BASE + DDRPHYC_ACIOCR, DDRPHYC_ACIOCR_ACPDR);
> +
> +	clrsetbits_le32(STM32_DDRPHYC_BASE + DDRPHYC_ACIOCR,
> +			DDRPHYC_ACIOCR_CKPDD_MASK,
> +			DDRPHYC_ACIOCR_CKPDD_0);
> +
> +	clrsetbits_le32(STM32_DDRPHYC_BASE + DDRPHYC_ACIOCR,
> +			DDRPHYC_ACIOCR_CKPDR_MASK,
> +			DDRPHYC_ACIOCR_CKPDR_0);
> +
> +	clrsetbits_le32(STM32_DDRPHYC_BASE + DDRPHYC_ACIOCR,
> +			DDRPHYC_ACIOCR_CSPDD_MASK,
> +			DDRPHYC_ACIOCR_CSPDD_0);
> +
> +	/* Disable command/address output driver */
> +	clrbits_le32(STM32_DDRPHYC_BASE + DDRPHYC_ACIOCR, DDRPHYC_ACIOCR_ACOE);
> +
> +	setbits_le32(STM32_DDRPHYC_BASE + DDRPHYC_DXCCR, DDRPHYC_DXCCR_DXPDD);
> +
> +	setbits_le32(STM32_DDRPHYC_BASE + DDRPHYC_DXCCR, DDRPHYC_DXCCR_DXPDR);
> +
> +	clrsetbits_le32(STM32_DDRPHYC_BASE + DDRPHYC_DSGCR,
> +			DDRPHYC_DSGCR_ODTPDD_MASK,
> +			DDRPHYC_DSGCR_ODTPDD_0);
> +
> +	setbits_le32(STM32_DDRPHYC_BASE + DDRPHYC_DSGCR, DDRPHYC_DSGCR_NL2PD);
> +
> +	clrsetbits_le32(STM32_DDRPHYC_BASE + DDRPHYC_DSGCR,
> +			DDRPHYC_DSGCR_CKEPDD_MASK,
> +			DDRPHYC_DSGCR_CKEPDD_0);
> +
> +	/* Disable PZQ cell (PUBL register) */
> +	setbits_le32(STM32_DDRPHYC_BASE + DDRPHYC_ZQ0CR0, DDRPHYC_ZQ0CRN_ZQPD);
> +
> +	/* Set latch */
> +	clrbits_le32(STM32_DDRPHYC_BASE + DDRPHYC_DSGCR, DDRPHYC_DSGCR_CKOE);
> +
> +	/* Additional delay to avoid early latch */
> +	secure_udelay(10);
> +
> +	/* Activate sw retention in PWRCTRL */
> +	setbits_le32(STM32_PWR_BASE + PWR_CR3, PWR_CR3_DDRRETEN);
> +
> +	/* Switch controller clocks (uMCTL2/PUBL) to DLL ref clock */
> +	setbits_le32(STM32_RCC_BASE + RCC_DDRITFCR, RCC_DDRITFCR_GSKPCTRL);
> +
> +	/* Disable all DLLs: GLITCH window */
> +	setbits_le32(STM32_DDRPHYC_BASE + DDRPHYC_ACDLLCR, DDRPHYC_ACDLLCR_DLLDIS);
> +
> +	setbits_le32(STM32_DDRPHYC_BASE + DDRPHYC_DX0DLLCR, DDRPHYC_DXNDLLCR_DLLDIS);
> +
> +	setbits_le32(STM32_DDRPHYC_BASE + DDRPHYC_DX1DLLCR, DDRPHYC_DXNDLLCR_DLLDIS);
> +
> +	setbits_le32(STM32_DDRPHYC_BASE + DDRPHYC_DX2DLLCR, DDRPHYC_DXNDLLCR_DLLDIS);
> +
> +	setbits_le32(STM32_DDRPHYC_BASE + DDRPHYC_DX3DLLCR, DDRPHYC_DXNDLLCR_DLLDIS);
> +
> +	/* Switch controller clocks (uMCTL2/PUBL) to DLL output clock */
> +	clrbits_le32(STM32_RCC_BASE + RCC_DDRITFCR, RCC_DDRITFCR_GSKPCTRL);
> +
> +	/* Deactivate all DDR clocks */
> +	clrbits_le32(STM32_RCC_BASE + RCC_DDRITFCR,
> +		     RCC_DDRITFCR_DDRC1EN | RCC_DDRITFCR_DDRC2EN |
> +		     RCC_DDRITFCR_DDRCAPBEN | RCC_DDRITFCR_DDRPHYCAPBEN);
> +
> +	return 0;
> +
> +selfref_sw_failed:
> +	/* This bit should be cleared to restore DDR in its previous state */
> +	clrbits_le32(STM32_DDRCTRL_BASE + DDRCTRL_PWRCTL,
> +		     DDRCTRL_PWRCTL_SELFREF_SW);
> +
> +pstat_failed:
> +	setbits_le32(STM32_DDRCTRL_BASE + DDRCTRL_PCTRL_0,
> +		     DDRCTRL_PCTRL_N_PORT_EN);
> +	setbits_le32(STM32_DDRCTRL_BASE + DDRCTRL_PCTRL_1,
> +		     DDRCTRL_PCTRL_N_PORT_EN);
> +
> +	return -EINVAL;
> +};
> +
> +static void __secure ddr_sw_self_refresh_exit(void)
> +{
> +	int ret;
> +
> +	/* Enable all clocks */
> +	setbits_le32(STM32_RCC_BASE + RCC_DDRITFCR,
> +		     RCC_DDRITFCR_DDRC1EN | RCC_DDRITFCR_DDRC2EN |
> +		     RCC_DDRITFCR_DDRPHYCEN | RCC_DDRITFCR_DDRPHYCAPBEN |
> +		     RCC_DDRITFCR_DDRCAPBEN);
> +
> +	/* Handshake */
> +	clrbits_le32(STM32_DDRCTRL_BASE + DDRCTRL_SWCTL, DDRCTRL_SWCTL_SW_DONE);
> +
> +	/* Mask dfi_init_complete_en */
> +	clrbits_le32(STM32_DDRCTRL_BASE + DDRCTRL_DFIMISC,
> +		     DDRCTRL_DFIMISC_DFI_INIT_COMPLETE_EN);
> +
> +	/* Ack */
> +	setbits_le32(STM32_DDRCTRL_BASE + DDRCTRL_SWCTL, DDRCTRL_SWCTL_SW_DONE);
> +	ret = secure_waitbits(STM32_DDRCTRL_BASE + DDRCTRL_SWSTAT,
> +			      DDRCTRL_SWSTAT_SW_DONE_ACK,
> +			      DDRCTRL_SWSTAT_SW_DONE_ACK);
> +	if (ret)
> +		hang();
> +
> +	/* Switch controller clocks (uMCTL2/PUBL) to DLL ref clock */
> +	setbits_le32(STM32_RCC_BASE + RCC_DDRITFCR, RCC_DDRITFCR_GSKPCTRL);
> +
> +	/* Enable all DLLs: GLITCH window */
> +	clrbits_le32(STM32_DDRPHYC_BASE + DDRPHYC_ACDLLCR,
> +		     DDRPHYC_ACDLLCR_DLLDIS);
> +
> +	clrbits_le32(STM32_DDRPHYC_BASE + DDRPHYC_DX0DLLCR, DDRPHYC_DXNDLLCR_DLLDIS);
> +
> +	clrbits_le32(STM32_DDRPHYC_BASE + DDRPHYC_DX1DLLCR, DDRPHYC_DXNDLLCR_DLLDIS);
> +
> +	clrbits_le32(STM32_DDRPHYC_BASE + DDRPHYC_DX2DLLCR, DDRPHYC_DXNDLLCR_DLLDIS);
> +
> +	clrbits_le32(STM32_DDRPHYC_BASE + DDRPHYC_DX3DLLCR, DDRPHYC_DXNDLLCR_DLLDIS);
> +
> +	/* Additional delay to avoid early DLL clock switch */
> +	secure_udelay(50);
> +
> +	/* Switch controller clocks (uMCTL2/PUBL) to DLL ref clock */
> +	clrbits_le32(STM32_RCC_BASE + RCC_DDRITFCR, RCC_DDRITFCR_GSKPCTRL);
> +
> +	clrbits_le32(STM32_DDRPHYC_BASE + DDRPHYC_ACDLLCR, DDRPHYC_ACDLLCR_DLLSRST);
> +
> +	secure_udelay(10);
> +
> +	setbits_le32(STM32_DDRPHYC_BASE + DDRPHYC_ACDLLCR, DDRPHYC_ACDLLCR_DLLSRST);
> +
> +	/* PHY partial init: (DLL lock and ITM reset) */
> +	writel(DDRPHYC_PIR_DLLSRST | DDRPHYC_PIR_DLLLOCK |
> +	       DDRPHYC_PIR_ITMSRST | DDRPHYC_PIR_INIT,
> +	       STM32_DDRPHYC_BASE + DDRPHYC_PIR);
> +
> +	/* Need to wait at least 10 clock cycles before accessing PGSR */
> +	secure_udelay(1);
> +
> +	/* Pool end of init */
> +	ret = secure_waitbits(STM32_DDRPHYC_BASE + DDRPHYC_PGSR,
> +			      DDRPHYC_PGSR_IDONE, DDRPHYC_PGSR_IDONE);
> +	if (ret)
> +		hang();
> +
> +	/* Handshake */
> +	clrbits_le32(STM32_DDRCTRL_BASE + DDRCTRL_SWCTL, DDRCTRL_SWCTL_SW_DONE);
> +
> +	/* Unmask dfi_init_complete_en to uMCTL2 */
> +	setbits_le32(STM32_DDRCTRL_BASE + DDRCTRL_DFIMISC, DDRCTRL_DFIMISC_DFI_INIT_COMPLETE_EN);
> +
> +	/* Ack */
> +	setbits_le32(STM32_DDRCTRL_BASE + DDRCTRL_SWCTL, DDRCTRL_SWCTL_SW_DONE);
> +	ret = secure_waitbits(STM32_DDRCTRL_BASE + DDRCTRL_SWSTAT,
> +			      DDRCTRL_SWSTAT_SW_DONE_ACK,
> +			      DDRCTRL_SWSTAT_SW_DONE_ACK);
> +	if (ret)
> +		hang();
> +
> +	/* Deactivate sw retention in PWR */
> +	clrbits_le32(STM32_PWR_BASE + PWR_CR3, PWR_CR3_DDRRETEN);
> +
> +	/* Enable PZQ cell (PUBL register) */
> +	clrbits_le32(STM32_DDRPHYC_BASE + DDRPHYC_ZQ0CR0, DDRPHYC_ZQ0CRN_ZQPD);
> +
> +	/* Enable pad drivers */
> +	clrbits_le32(STM32_DDRPHYC_BASE + DDRPHYC_ACIOCR, DDRPHYC_ACIOCR_ACPDD);
> +
> +	/* Enable command/address output driver */
> +	setbits_le32(STM32_DDRPHYC_BASE + DDRPHYC_ACIOCR, DDRPHYC_ACIOCR_ACOE);
> +
> +	clrbits_le32(STM32_DDRPHYC_BASE + DDRPHYC_ACIOCR, DDRPHYC_ACIOCR_CKPDD_MASK);
> +
> +	clrbits_le32(STM32_DDRPHYC_BASE + DDRPHYC_ACIOCR, DDRPHYC_ACIOCR_CSPDD_MASK);
> +
> +	clrbits_le32(STM32_DDRPHYC_BASE + DDRPHYC_DXCCR, DDRPHYC_DXCCR_DXPDD);
> +
> +	clrbits_le32(STM32_DDRPHYC_BASE + DDRPHYC_DXCCR, DDRPHYC_DXCCR_DXPDR);
> +
> +	/* Release latch */
> +	setbits_le32(STM32_DDRPHYC_BASE + DDRPHYC_DSGCR, DDRPHYC_DSGCR_CKOE);
> +
> +	clrbits_le32(STM32_DDRPHYC_BASE + DDRPHYC_DSGCR, DDRPHYC_DSGCR_ODTPDD_MASK);
> +
> +	clrbits_le32(STM32_DDRPHYC_BASE + DDRPHYC_DSGCR, DDRPHYC_DSGCR_NL2PD);
> +
> +	clrbits_le32(STM32_DDRPHYC_BASE + DDRPHYC_DSGCR, DDRPHYC_DSGCR_CKEPDD_MASK);
> +
> +	/* Remove selfrefresh */
> +	clrbits_le32(STM32_DDRCTRL_BASE + DDRCTRL_PWRCTL, DDRCTRL_PWRCTL_SELFREF_SW);
> +
> +	/* Wait operating_mode == normal */
> +	ret = secure_waitbits(STM32_DDRCTRL_BASE + DDRCTRL_STAT,
> +			      DDRCTRL_STAT_OPERATING_MODE_MASK,
> +			      DDRCTRL_STAT_OPERATING_MODE_NORMAL);
> +	if (ret)
> +		hang();
> +
> +	/* AXI ports are no longer blocked from taking transactions */
> +	setbits_le32(STM32_DDRCTRL_BASE + DDRCTRL_PCTRL_0, DDRCTRL_PCTRL_N_PORT_EN);
> +	setbits_le32(STM32_DDRCTRL_BASE + DDRCTRL_PCTRL_1, DDRCTRL_PCTRL_N_PORT_EN);
> +
> +	setbits_le32(STM32_RCC_BASE + RCC_DDRITFCR, RCC_DDRITFCR_AXIDCGEN);
> +}
> +
> +void __secure psci_system_suspend(u32 __always_unused function_id,
> +				  u32 ep, u32 context_id)
> +{
> +	u32 reg;
> +
+ /* disable IO compensation */
> +	/* Place current APSRC/ANSRC into RAPSRC/RANSRC */
> +	reg = readl(STM32_SYSCFG_BASE + SYSCFG_CMPCR);
> +	reg >>= 8;
> +	reg &= 0xff << 16;
> +	reg |= SYSCFG_CMPCR_SW_CTRL;
> +	writel(reg, STM32_SYSCFG_BASE + SYSCFG_CMPCR);
> +	writel(SYSCFG_CMPCR_MPUEN, STM32_SYSCFG_BASE + SYSCFG_CMPENCLRR);

s/SYSCFG_CMPCR_MPUEN/SYSCFG_CMPENSETR_MPU_EN/


> +	writel(RCC_MP_CIFR_WKUPF, STM32_RCC_BASE + RCC_MP_CIFR);
> +	setbits_le32(STM32_RCC_BASE + RCC_MP_CIER, RCC_MP_CIFR_WKUPF);
> +
> +	setbits_le32(STM32_PWR_BASE + PWR_MPUCR,
> +		     PWR_MPUCR_CSSF | PWR_MPUCR_CSTDBYDIS | PWR_MPUCR_PDDS);
> +
> +	psci_v7_flush_dcache_all();
> +	ddr_sr_mode_ssr();

=> here SSR is forced in DDR self refresh entry,

       it was normal in TF-A which manage ASR and HSR mode are managed

       but that seens strange for SPL as only SSR mode is correclty 
managed (DDR_PWRCTL = 0x0)

       previous mode is not restored after in this code

       => I think the  ddr_sr_mode_ssr() can be done in DDR driver

     as it is done in TF-A driver = ./drivers/st/ddr/stm32mp1_ram.c


static int stm32mp1_ddr_setup(void)
{

.....


     /*
      * Initialization sequence has configured DDR registers with settings.
      * The Self Refresh (SR) mode corresponding to these settings has now
      * to be set.
      */
     ddr_set_sr_mode(ddr_read_sr_mode());

  .....

}

=> same can be done at the end of  DDr driver in SPL:

      drivers/ram/stm32mp1/stm32mp1_ddr.c::stm32mp1_ddr_init()


void stm32mp1_ddr_init(struct ddr_info *priv,
                const struct stm32mp1_ddr_config *config)
{

....
/* 12. set back registers in step 8 to the orginal values if desidered */
     stm32mp1_refresh_restore(priv->ctl, config->c_reg.rfshctl3,
                  config->c_reg.pwrctl);

+   /* Force the Self Refresh (SR) mode = SSR for SPL, HSR or ASR are 
not supported */

+   ddr_sr_mode_ssr();

     /* enable uMCTL2 AXI port 0 and 1 */
.....

}


Then the call of ddr_sr_mode_ssr() can be removed here.


see also ./drivers/clk/clk_stm32mp1.c::stm32mp1_clktree()

=> Software Self-Refresh mode (SSR) during DDR initilialization


> +	ddr_sw_self_refresh_in();
> +	setbits_le32(STM32_PWR_BASE + PWR_CR3, PWR_CR3_DDRSREN);
> +	writel(0x3, STM32_RCC_BASE + RCC_MP_SREQSETR);
> +
> +	/* Zzz, enter stop mode */
> +	asm volatile(
> +		"wfi\n"
> +		"isb\n"
> +		"dsb\n");

are you sure of the instruction order ?

     in TF-A, stm32_pwr_down_wfi_load() => the order is dsb / isb / wfi

and you can be replaced by ARM function = arch/arm/include/asm/system.h


     /*
      * Synchronize on memory accesses and instruction flow before the WFI
      * instruction.
      */
     dsb();
     isb();
     wfi();

> +
> +	writel(0x3, STM32_RCC_BASE + RCC_MP_SREQCLRR);
> +	ddr_sw_self_refresh_exit();
> +
> +	writel(SYSCFG_CMPCR_MPUEN, STM32_SYSCFG_BASE + SYSCFG_CMPENSETR);
> +	clrbits_le32(STM32_SYSCFG_BASE + SYSCFG_CMPCR, SYSCFG_CMPCR_SW_CTRL);
> +}


I also need to test this patch on ST boards...


regards

Patrick


^ permalink raw reply	[flat|nested] 3+ messages in thread

* Re: [PATCH] stm32mp: psci: Implement PSCI system suspend and DRAM SSR
  2022-02-10 19:20 ` Patrick DELAUNAY
@ 2022-02-21 20:02   ` Marek Vasut
  0 siblings, 0 replies; 3+ messages in thread
From: Marek Vasut @ 2022-02-21 20:02 UTC (permalink / raw)
  To: Patrick DELAUNAY, u-boot; +Cc: Patrice Chotard

On 2/10/22 20:20, Patrick DELAUNAY wrote:

[...]

>> +    writel(RCC_MP_CIFR_WKUPF, STM32_RCC_BASE + RCC_MP_CIFR);
>> +    setbits_le32(STM32_RCC_BASE + RCC_MP_CIER, RCC_MP_CIFR_WKUPF);
>> +
>> +    setbits_le32(STM32_PWR_BASE + PWR_MPUCR,
>> +             PWR_MPUCR_CSSF | PWR_MPUCR_CSTDBYDIS | PWR_MPUCR_PDDS);
>> +
>> +    psci_v7_flush_dcache_all();
>> +    ddr_sr_mode_ssr();
> 
> => here SSR is forced in DDR self refresh entry,
> 
>        it was normal in TF-A which manage ASR and HSR mode are managed
> 
>        but that seens strange for SPL as only SSR mode is correclty 
> managed (DDR_PWRCTL = 0x0)
> 
>        previous mode is not restored after in this code

The ASR should be restored if it was enabled before, indeed.

>        => I think the  ddr_sr_mode_ssr() can be done in DDR driver
> 
>      as it is done in TF-A driver = ./drivers/st/ddr/stm32mp1_ram.c

There is no trace of STM32MP1 ASR/SSR/HSR implementation in ATF :
$ git grep -i [ash]sr drivers/st/ddr/stm32mp1_ram.c
gives no results in
a1f02f4f3 ("Merge "docs(changelog): generate changelog" into integration")
or
8d9c1b3ca ("Merge changes from topic "st-format-signedness" into 
integration").

So back to U-Boot ...

The secure part has no access to DM structures, so no, it is better to 
keep all the bits and pieces of the PSCI in one place. It also makes the 
PSCI code self-contained and easy to understand, as it should be.

As for the various modes:
- ASR is Automatic SR, that's handled by the controller automatically
   even at runtime, and it is enabled in separate patch
   (ram: stm32mp1: Unconditionally enable ASR)
- SSR is Software SR, that's what's implemented here and that's where
   the system software puts the DRAM into SR
- HSR is Hardware SR, what exactly is this useful for ?

It seems ASR is recommended for runtime power saving and SSR for suspend 
power saving. So what is HSR for ?

> static int stm32mp1_ddr_setup(void)
> {
> 
> .....
> 
> 
>      /*
>       * Initialization sequence has configured DDR registers with settings.
>       * The Self Refresh (SR) mode corresponding to these settings has now
>       * to be set.
>       */
>      ddr_set_sr_mode(ddr_read_sr_mode());
> 
>   .....
> 
> }
> 
> => same can be done at the end of  DDr driver in SPL:
> 
>       drivers/ram/stm32mp1/stm32mp1_ddr.c::stm32mp1_ddr_init()
> 
> 
> void stm32mp1_ddr_init(struct ddr_info *priv,
>                 const struct stm32mp1_ddr_config *config)
> {
> 
> ....
> /* 12. set back registers in step 8 to the orginal values if desidered */
>      stm32mp1_refresh_restore(priv->ctl, config->c_reg.rfshctl3,
>                   config->c_reg.pwrctl);
> 
> +   /* Force the Self Refresh (SR) mode = SSR for SPL, HSR or ASR are 
> not supported */
> 
> +   ddr_sr_mode_ssr();
> 
>      /* enable uMCTL2 AXI port 0 and 1 */
> .....
> 
> }
> 
> 
> Then the call of ddr_sr_mode_ssr() can be removed here.
> 
> 
> see also ./drivers/clk/clk_stm32mp1.c::stm32mp1_clktree()
> 
> => Software Self-Refresh mode (SSR) during DDR initilialization

SSR does cut off DRAM access, ASR does not, I think you have those two 
confused, no ? You can enable ASR in the DDR driver (see ram: stm32mp1: 
Unconditionally enable ASR), but you must only enable/disable SSR on 
entry/exit from CStop, i.e. here in this PSCI callback.

>> +    ddr_sw_self_refresh_in();
>> +    setbits_le32(STM32_PWR_BASE + PWR_CR3, PWR_CR3_DDRSREN);
>> +    writel(0x3, STM32_RCC_BASE + RCC_MP_SREQSETR);
>> +
>> +    /* Zzz, enter stop mode */
>> +    asm volatile(
>> +        "wfi\n"
>> +        "isb\n"
>> +        "dsb\n");
> 
> are you sure of the instruction order ?
> 
>      in TF-A, stm32_pwr_down_wfi_load() => the order is dsb / isb / wfi
> 
> and you can be replaced by ARM function = arch/arm/include/asm/system.h

This function also does not exist in either source, sorry.

>      /*
>       * Synchronize on memory accesses and instruction flow before the WFI
>       * instruction.
>       */
>      dsb();
>      isb();
>      wfi();

I think it does make more sense to do ISB/DSB before the WFI, yes.

>> +
>> +    writel(0x3, STM32_RCC_BASE + RCC_MP_SREQCLRR);
>> +    ddr_sw_self_refresh_exit();
>> +
>> +    writel(SYSCFG_CMPCR_MPUEN, STM32_SYSCFG_BASE + SYSCFG_CMPENSETR);
>> +    clrbits_le32(STM32_SYSCFG_BASE + SYSCFG_CMPCR, 
>> SYSCFG_CMPCR_SW_CTRL);
>> +}
> 
> 
> I also need to test this patch on ST boards...

I will send V2 soon.

^ permalink raw reply	[flat|nested] 3+ messages in thread

end of thread, other threads:[~2022-02-21 20:02 UTC | newest]

Thread overview: 3+ messages (download: mbox.gz / follow: Atom feed)
-- links below jump to the message on this page --
2022-02-02 11:52 [PATCH] stm32mp: psci: Implement PSCI system suspend and DRAM SSR Marek Vasut
2022-02-10 19:20 ` Patrick DELAUNAY
2022-02-21 20:02   ` Marek Vasut

This is an external index of several public inboxes,
see mirroring instructions on how to clone and mirror
all data and code used by this external index.