[PATCH 2/7] arm: mach-k3: j721e: Enable QoS for DSS

Andrew Davis afd at ti.com
Wed May 22 17:44:15 CEST 2024


On 5/22/24 6:37 AM, Jayesh Choudhary wrote:
> Enable Quality of Service (QoS) blocks for Display SubSystem (DSS), by
> servicing the DSS - DDR traffic from the Real-Time (RT) queue. This is
> done by setting the DSS DMA orderID to greater than 7.
> ATYPE 3 is selected so that the traffic takes non-coherent path and does

So this is the part I'm not sure about, this change is not just a performance
adjustment, it can and does break things. The ORDERID setting is fine with me,
but changing ATYPE should be done in a separate patch so it can be debated on
its own.

> not have a conflict with coherent traffic from C7x (deep-learning
> applications).
> Before setting up the QoS, the ORDERID needs to be mapped to VBUSM sources
> using setup_navss_nb() function call that sets the threadmap for NBSS
> registers. (Section 10.2.10.1.2 "NB Parameters" in TRM[0])
> 
> Section 3.3.2 "Quality of Service (QoS)" in the TRM[0] provide more
> details.
> 
> [0]: https://www.ti.com/lit/zip/spruil1
> 
> Signed-off-by: Jayesh Choudhary <j-choudhary at ti.com>
> ---
>   arch/arm/mach-k3/j721e/j721e_init.c         |  28 +++++
>   arch/arm/mach-k3/r5/j721e/Makefile          |   1 +
>   arch/arm/mach-k3/r5/j721e/j721e_qos.h       |  96 +++++++++++++++
>   arch/arm/mach-k3/r5/j721e/j721e_qos_uboot.c | 125 ++++++++++++++++++++
>   4 files changed, 250 insertions(+)
>   create mode 100644 arch/arm/mach-k3/r5/j721e/j721e_qos.h
>   create mode 100644 arch/arm/mach-k3/r5/j721e/j721e_qos_uboot.c
> 
> diff --git a/arch/arm/mach-k3/j721e/j721e_init.c b/arch/arm/mach-k3/j721e/j721e_init.c
> index c2024f2500..e9ed8cb267 100644
> --- a/arch/arm/mach-k3/j721e/j721e_init.c
> +++ b/arch/arm/mach-k3/j721e/j721e_init.c
> @@ -23,6 +23,22 @@
>   #include "../sysfw-loader.h"
>   #include "../common.h"
>   
> +/* NAVSS North Bridge (NB) registers */
> +#define NAVSS0_NBSS_NB0_CFG_MMRS		0x03802000
> +#define NAVSS0_NBSS_NB1_CFG_MMRS		0x03803000
> +#define NAVSS0_NBSS_NB0_CFG_NB_THREADMAP	(NAVSS0_NBSS_NB0_CFG_MMRS + 0x10)
> +#define NAVSS0_NBSS_NB1_CFG_NB_THREADMAP	(NAVSS0_NBSS_NB1_CFG_MMRS + 0x10)
> +/*
> + * Thread Map for North Bridge Configuration
> + * Each bit is for each VBUSM source.
> + * Bit[0] maps orderID 0-7 to VBUSM.C thread number
> + * Bit[1] maps orderID 8-15 to VBUSM.C thread number
> + * When bit has value 0: VBUSM.C thread 0 (non-real time traffic)
> + * When bit has value 1: VBUSM.C thread 2 (real time traffic)
> + */
> +#define NB_THREADMAP_BIT0				BIT(0)
> +#define NB_THREADMAP_BIT1				BIT(1)
> +
>   #ifdef CONFIG_K3_LOAD_SYSFW
>   struct fwl_data cbass_hc_cfg0_fwls[] = {
>   #if defined(CONFIG_TARGET_J721E_R5_EVM)
> @@ -124,6 +140,13 @@ void k3_mmc_restart_clock(void)
>   }
>   #endif
>   
> +/* Setup North Bridge registers to map ORDERID 8-15 to RT traffic */
> +static void setup_navss_nb(void)
> +{
> +	writel(NB_THREADMAP_BIT1, (uintptr_t)NAVSS0_NBSS_NB0_CFG_NB_THREADMAP);
> +	writel(NB_THREADMAP_BIT1, (uintptr_t)NAVSS0_NBSS_NB1_CFG_NB_THREADMAP);
> +}
> +
>   /*
>    * This uninitialized global variable would normal end up in the .bss section,
>    * but the .bss is cleared between writing and reading this variable, so move
> @@ -288,6 +311,11 @@ void board_init_f(ulong dummy)
>   		panic("DRAM init failed: %d\n", ret);
>   #endif
>   	spl_enable_cache();
> +
> +	if (IS_ENABLED(CONFIG_CPU_V7R))
> +		setup_navss_nb();
> +
> +	setup_qos();
>   }
>   
>   u32 spl_mmc_boot_mode(struct mmc *mmc, const u32 boot_device)
> diff --git a/arch/arm/mach-k3/r5/j721e/Makefile b/arch/arm/mach-k3/r5/j721e/Makefile
> index 78325db402..07bfb0dd93 100644
> --- a/arch/arm/mach-k3/r5/j721e/Makefile
> +++ b/arch/arm/mach-k3/r5/j721e/Makefile
> @@ -3,3 +3,4 @@
>   # Copyright (C) 2020 Texas Instruments Incorporated - https://www.ti.com/
>   obj-y += clk-data.o
>   obj-y += dev-data.o
> +obj-y += j721e_qos_uboot.o
> diff --git a/arch/arm/mach-k3/r5/j721e/j721e_qos.h b/arch/arm/mach-k3/r5/j721e/j721e_qos.h
> new file mode 100644
> index 0000000000..9ec0b7c630
> --- /dev/null
> +++ b/arch/arm/mach-k3/r5/j721e/j721e_qos.h
> @@ -0,0 +1,96 @@
> +/* SPDX-License-Identifier: GPL-2.0+ */
> +/*
> + * Keystone3 Quality of service endpoint definitions
> + * Auto generated by K3 Resource Partitioning Tool
> + *
> + * Copyright (C) 2024 Texas Instruments Incorporated - https://www.ti.com/
> + */
> +
> +#define PULSAR_SL_MCU_0_MEMBDG_RMST0	0x45D10000
> +#define PULSAR_SL_MCU_0_MEMBDG_WMST0	0x45D10400
> +#define PULSAR_SL_MCU_0_CPU0_PMST	0x45D10800
> +#define PULSAR_SL_MCU_0_MEMBDG_RMST1	0x45D11000
> +#define PULSAR_SL_MCU_0_MEMBDG_WMST1	0x45D11400
> +#define PULSAR_SL_MCU_0_CPU1_PMST	0x45D11800
> +#define SA2_UL_MCU_0_CTXCACH_EXT_DMA	0x45D13000
> +#define ICSS_G_MAIN_0_PR1_EXT_VBUSM	0x45D80000
> +#define ICSS_G_MAIN_1_PR1_EXT_VBUSM	0x45D80400
> +#define K3_C66_COREPAC_MAIN_0_C66_MDMA	0x45D81000
> +#define K3_C66_COREPAC_MAIN_1_C66_MDMA	0x45D81400
> +#define EMMCSD4SS_MAIN_0_EMMCSDSS_RD	0x45D82000
> +#define EMMCSD4SS_MAIN_0_EMMCSDSS_WR	0x45D82400
> +#define EMMCSD4SS_MAIN_1_EMMCSDSS_RD	0x45D82800
> +#define EMMCSD4SS_MAIN_1_EMMCSDSS_WR	0x45D82C00
> +#define PULSAR_SL_MAIN_0_MEMBDG_RMST0	0x45D84000
> +#define PULSAR_SL_MAIN_0_MEMBDG_RMST1	0x45D84400
> +#define PULSAR_SL_MAIN_0_MEMBDG_WMST0	0x45D84800
> +#define PULSAR_SL_MAIN_0_MEMBDG_WMST1	0x45D84C00
> +#define PULSAR_SL_MAIN_1_MEMBDG_RMST0	0x45D85000
> +#define PULSAR_SL_MAIN_1_MEMBDG_RMST1	0x45D85400
> +#define PULSAR_SL_MAIN_1_MEMBDG_WMST0	0x45D85800
> +#define PULSAR_SL_MAIN_1_MEMBDG_WMST1	0x45D85C00
> +#define COMPUTE_CLUSTER_J7ES_TB_VDC_MAIN_0_GIC_MEM_RD_VBUSM	0x45D86000
> +#define COMPUTE_CLUSTER_J7ES_TB_VDC_MAIN_0_GIC_MEM_WR_VBUSM	0x45D86400
> +#define K3_C66_COREPAC_MAIN_0_C66_CFG	0x45D87000
> +#define K3_C66_COREPAC_MAIN_1_C66_CFG	0x45D87400
> +#define SA2_UL_MAIN_0_CTXCACH_EXT_DMA	0x45D88800
> +#define PULSAR_SL_MAIN_0_PBDG_RMST0	0x45D89800
> +#define PULSAR_SL_MAIN_0_PBDG_RMST1	0x45D89C00
> +#define PULSAR_SL_MAIN_0_PBDG_WMST0	0x45D8A000
> +#define PULSAR_SL_MAIN_0_PBDG_WMST1	0x45D8A400
> +#define PULSAR_SL_MAIN_1_PBDG_RMST0	0x45D8A800
> +#define PULSAR_SL_MAIN_1_PBDG_RMST1	0x45D8AC00
> +#define PULSAR_SL_MAIN_1_PBDG_WMST0	0x45D8B000
> +#define PULSAR_SL_MAIN_1_PBDG_WMST1	0x45D8B400
> +#define VPFE_MAIN_0_VBUSM_DMA	0x45D8C000
> +#define VPE_MAIN_0_VPDMA_MST0	0x45D8C400
> +#define VPE_MAIN_0_VPDMA_MST1	0x45D8C800
> +#define PCIE_G4X2_MAIN_0_PCIE_MST_RD_HP	0x45D90000
> +#define PCIE_G4X2_MAIN_0_PCIE_MST_RD_LP	0x45D90400
> +#define PCIE_G4X2_MAIN_0_PCIE_MST_WR_HP	0x45D90800
> +#define PCIE_G4X2_MAIN_0_PCIE_MST_WR_LP	0x45D90C00
> +#define PCIE_G4X2_MAIN_1_PCIE_MST_RD_HP	0x45D91000
> +#define PCIE_G4X2_MAIN_1_PCIE_MST_RD_LP	0x45D91400
> +#define PCIE_G4X2_MAIN_1_PCIE_MST_WR_HP	0x45D91800
> +#define PCIE_G4X2_MAIN_1_PCIE_MST_WR_LP	0x45D91C00
> +#define PCIE_G4X2_MAIN_2_PCIE_MST_RD_HP	0x45D92000
> +#define PCIE_G4X2_MAIN_2_PCIE_MST_RD_LP	0x45D92400
> +#define PCIE_G4X2_MAIN_2_PCIE_MST_WR_HP	0x45D92800
> +#define PCIE_G4X2_MAIN_2_PCIE_MST_WR_LP	0x45D92C00
> +#define PCIE_G4X2_MAIN_3_PCIE_MST_RD_HP	0x45D93000
> +#define PCIE_G4X2_MAIN_3_PCIE_MST_RD_LP	0x45D93400
> +#define PCIE_G4X2_MAIN_3_PCIE_MST_WR_HP	0x45D93800
> +#define PCIE_G4X2_MAIN_3_PCIE_MST_WR_LP	0x45D93C00
> +#define USB3P0SS_16FFC_MAIN_0_MSTR0	0x45D98000
> +#define USB3P0SS_16FFC_MAIN_0_MSTW0	0x45D98400
> +#define USB3P0SS_16FFC_MAIN_1_MSTR0	0x45D98800
> +#define USB3P0SS_16FFC_MAIN_1_MSTW0	0x45D98C00
> +#define USB3P0SS_16FFC_MAIN_2_MSTR0	0x45D99000
> +#define USB3P0SS_16FFC_MAIN_2_MSTW0	0x45D99400
> +#define MLBSS2P0_MAIN_0_MLBSS_DMA_VBUSP	0x45D99C00
> +#define EMMC8SS_16FFC_MAIN_0_EMMCSS_RD	0x45D9A000
> +#define EMMC8SS_16FFC_MAIN_0_EMMCSS_WR	0x45D9A400
> +#define UFSHCI2P1SS_16FFC_MAIN_0_UFSHCI_VBM_MST_RD	0x45D9B000
> +#define UFSHCI2P1SS_16FFC_MAIN_0_UFSHCI_VBM_MST_WR	0x45D9B400
> +#define UFSHCI2P1SS_16FFC_MAIN_1_UFSHCI_VBM_MST_RD	0x45D9B800
> +#define UFSHCI2P1SS_16FFC_MAIN_1_UFSHCI_VBM_MST_WR	0x45D9BC00
> +#define DEBUGSS_K3_WRAP_CV0_MAIN_0_VBUSMR	0x45DA0000
> +#define DEBUGSS_K3_WRAP_CV0_MAIN_0_VBUSMW	0x45DA0400
> +#define PULSAR_SL_MAIN_0_CPU0_PMST	0x45DA4000
> +#define PULSAR_SL_MAIN_0_CPU1_PMST	0x45DA4400
> +#define PULSAR_SL_MAIN_1_CPU0_PMST	0x45DA4800
> +#define PULSAR_SL_MAIN_1_CPU1_PMST	0x45DA4C00
> +#define DMPAC_TOP_MAIN_0_DATA_MST	0x45DC0000
> +#define K3_D5520MP2_MAIN_0_M_VBUSM_R	0x45DC0400
> +#define K3_D5520MP2_MAIN_0_M_VBUSM_W	0x45DC0800
> +#define K3_VXE384MP2_MAIN_0_M_VBUSM_R	0x45DC0C00
> +#define K3_VXE384MP2_MAIN_0_M_VBUSM_W	0x45DC1000
> +#define VPAC_TOP_MAIN_0_DATA_MST_0	0x45DC1400
> +#define VPAC_TOP_MAIN_0_DATA_MST_1	0x45DC1800
> +#define VPAC_TOP_MAIN_0_LDC0_M_MST	0x45DC1C00
> +#define K3_DSS_MAIN_0_DSS_INST0_VBUSM_DMA	0x45DC2000
> +#define K3_DSS_MAIN_0_DSS_INST0_VBUSM_FBDC	0x45DC2400
> +#define J7_LASCAR_GPU_WRAP_MAIN_0_M0_VBUSM_R_ASYNC	0x45DC5000
> +#define J7_LASCAR_GPU_WRAP_MAIN_0_M0_VBUSM_W_ASYNC	0x45DC5800
> +#define J7_LASCAR_GPU_WRAP_MAIN_0_M1_VBUSM_R_ASYNC	0x45DC6000
> +#define J7_LASCAR_GPU_WRAP_MAIN_0_M1_VBUSM_W_ASYNC	0x45DC6800
> diff --git a/arch/arm/mach-k3/r5/j721e/j721e_qos_uboot.c b/arch/arm/mach-k3/r5/j721e/j721e_qos_uboot.c
> new file mode 100644
> index 0000000000..c829057200
> --- /dev/null
> +++ b/arch/arm/mach-k3/r5/j721e/j721e_qos_uboot.c
> @@ -0,0 +1,125 @@
> +// SPDX-License-Identifier: GPL-2.0+
> +/*
> + * j721e Quality of Service (QoS) Configuration Data
> + * Auto generated from K3 Resource Partitioning tool
> + */
> +
> +#include <asm/arch/k3-qos.h>
> +#include "j721e_qos.h"
> +
> +struct k3_qos_data qos_data[] = {
> +	/* DSS_PIPE_VID1 - 2 endpoints, 2 channels */
> +	{
> +		.reg = K3_DSS_MAIN_0_DSS_INST0_VBUSM_DMA + 0x100 + 0x4 * 0,

0x100 being the instance, and 0x4 * x being the specific device register right?
That could be encoded in a macro (the "Resource Partitioning tool" would
be updated to generate that too).

Andrew

> +		.val = ATYPE_3 | ORDERID_15,
> +	},
> +	{
> +		.reg = K3_DSS_MAIN_0_DSS_INST0_VBUSM_DMA + 0x100 + 0x4 * 1,
> +		.val = ATYPE_3 | ORDERID_15,
> +	},
> +	{
> +		.reg = K3_DSS_MAIN_0_DSS_INST0_VBUSM_FBDC + 0x100 + 0x4 * 0,
> +		.val = ATYPE_3 | ORDERID_15,
> +	},
> +	{
> +		.reg = K3_DSS_MAIN_0_DSS_INST0_VBUSM_FBDC + 0x100 + 0x4 * 1,
> +		.val = ATYPE_3 | ORDERID_15,
> +	},
> +
> +	/* DSS_PIPE_VIDL1 - 2 endpoints, 2 channels */
> +	{
> +		.reg = K3_DSS_MAIN_0_DSS_INST0_VBUSM_DMA + 0x100 + 0x4 * 2,
> +		.val = ATYPE_3 | ORDERID_15,
> +	},
> +	{
> +		.reg = K3_DSS_MAIN_0_DSS_INST0_VBUSM_DMA + 0x100 + 0x4 * 3,
> +		.val = ATYPE_3 | ORDERID_15,
> +	},
> +	{
> +		.reg = K3_DSS_MAIN_0_DSS_INST0_VBUSM_FBDC + 0x100 + 0x4 * 2,
> +		.val = ATYPE_3 | ORDERID_15,
> +	},
> +	{
> +		.reg = K3_DSS_MAIN_0_DSS_INST0_VBUSM_FBDC + 0x100 + 0x4 * 3,
> +		.val = ATYPE_3 | ORDERID_15,
> +	},
> +
> +	/* DSS_PIPE_VID2 - 2 endpoints, 2 channels */
> +	{
> +		.reg = K3_DSS_MAIN_0_DSS_INST0_VBUSM_DMA + 0x100 + 0x4 * 4,
> +		.val = ATYPE_3 | ORDERID_15,
> +	},
> +	{
> +		.reg = K3_DSS_MAIN_0_DSS_INST0_VBUSM_DMA + 0x100 + 0x4 * 5,
> +		.val = ATYPE_3 | ORDERID_15,
> +	},
> +	{
> +		.reg = K3_DSS_MAIN_0_DSS_INST0_VBUSM_FBDC + 0x100 + 0x4 * 4,
> +		.val = ATYPE_3 | ORDERID_15,
> +	},
> +	{
> +		.reg = K3_DSS_MAIN_0_DSS_INST0_VBUSM_FBDC + 0x100 + 0x4 * 5,
> +		.val = ATYPE_3 | ORDERID_15,
> +	},
> +
> +	/* DSS_PIPE_VIDL2 - 2 endpoints, 2 channels */
> +	{
> +		.reg = K3_DSS_MAIN_0_DSS_INST0_VBUSM_DMA + 0x100 + 0x4 * 6,
> +		.val = ATYPE_3 | ORDERID_15,
> +	},
> +	{
> +		.reg = K3_DSS_MAIN_0_DSS_INST0_VBUSM_DMA + 0x100 + 0x4 * 7,
> +		.val = ATYPE_3 | ORDERID_15,
> +	},
> +	{
> +		.reg = K3_DSS_MAIN_0_DSS_INST0_VBUSM_FBDC + 0x100 + 0x4 * 6,
> +		.val = ATYPE_3 | ORDERID_15,
> +	},
> +	{
> +		.reg = K3_DSS_MAIN_0_DSS_INST0_VBUSM_FBDC + 0x100 + 0x4 * 7,
> +		.val = ATYPE_3 | ORDERID_15,
> +	},
> +
> +	/* Following registers set 1:1 mapping for orderID MAP1/MAP2
> +	 * remap registers. orderID x is remapped to orderID x again
> +	 * This is to ensure orderID from MAP register is unchanged
> +	 */
> +
> +	/* K3_DSS_MAIN_0_DSS_INST0_VBUSM_DMA - 2 groups */
> +	{
> +		.reg = K3_DSS_MAIN_0_DSS_INST0_VBUSM_DMA + 0,
> +		.val = 0x76543210,
> +	},
> +	{
> +		.reg = K3_DSS_MAIN_0_DSS_INST0_VBUSM_DMA + 4,
> +		.val = 0xfedcba98,
> +	},
> +	{
> +		.reg = K3_DSS_MAIN_0_DSS_INST0_VBUSM_DMA + 8,
> +		.val = 0x76543210,
> +	},
> +	{
> +		.reg = K3_DSS_MAIN_0_DSS_INST0_VBUSM_DMA + 12,
> +		.val = 0xfedcba98,
> +	},
> +
> +	/* K3_DSS_MAIN_0_DSS_INST0_VBUSM_FBDC - 2 groups */
> +	{
> +		.reg = K3_DSS_MAIN_0_DSS_INST0_VBUSM_FBDC + 0,
> +		.val = 0x76543210,
> +	},
> +	{
> +		.reg = K3_DSS_MAIN_0_DSS_INST0_VBUSM_FBDC + 4,
> +		.val = 0xfedcba98,
> +	},
> +	{
> +		.reg = K3_DSS_MAIN_0_DSS_INST0_VBUSM_FBDC + 8,
> +		.val = 0x76543210,
> +	},
> +	{
> +		.reg = K3_DSS_MAIN_0_DSS_INST0_VBUSM_FBDC + 12,
> +		.val = 0xfedcba98,
> +	},
> +};
> +
> +u32 qos_count = ARRAY_SIZE(qos_data);


More information about the U-Boot mailing list