arm-trusted-firmware/lib/cpus/aarch64/denver.S

/*
 * Copyright (c) 2015-2016, ARM Limited and Contributors. All rights reserved.
 *
 * SPDX-License-Identifier: BSD-3-Clause
 */

#include <arch.h>
#include <asm_macros.S>
#include <assert_macros.S>
#include <denver.h>
#include <cpu_macros.S>
#include <plat_macros.S>

	.global	denver_disable_dco

	/* ---------------------------------------------
	 * Disable debug interfaces
	 * ---------------------------------------------
	 */
func denver_disable_ext_debug
	mov	x0, #1
	msr	osdlr_el1, x0
	isb
	dsb	sy
	ret
endfunc denver_disable_ext_debug

	/* ----------------------------------------------------
	 * Enable dynamic code optimizer (DCO)
	 * ----------------------------------------------------
	 */
func denver_enable_dco
	mrs	x0, mpidr_el1
	and	x0, x0, #0xF
	mov	x1, #1
	lsl	x1, x1, x0
	msr	s3_0_c15_c0_2, x1
	ret
endfunc denver_enable_dco

	/* ----------------------------------------------------
	 * Disable dynamic code optimizer (DCO)
	 * ----------------------------------------------------
	 */
func denver_disable_dco

	/* turn off background work */
	mrs	x0, mpidr_el1
	and	x0, x0, #0xF
	mov	x1, #1
	lsl	x1, x1, x0
	lsl	x2, x1, #16
	msr	s3_0_c15_c0_2, x2
	isb

	/* wait till the background work turns off */
1:	mrs	x2, s3_0_c15_c0_2
	lsr	x2, x2, #32
	and	w2, w2, 0xFFFF
	and	x2, x2, x1
	cbnz	x2, 1b

	ret
endfunc denver_disable_dco

	/* -------------------------------------------------
	 * The CPU Ops reset function for Denver.
	 * -------------------------------------------------
	 */
func denver_reset_func

	mov	x19, x30

	/* ----------------------------------------------------
	 * Enable dynamic code optimizer (DCO)
	 * ----------------------------------------------------
	 */
	bl	denver_enable_dco

	ret	x19
endfunc denver_reset_func

	/* ----------------------------------------------------
	 * The CPU Ops core power down function for Denver.
	 * ----------------------------------------------------
	 */
func denver_core_pwr_dwn

	mov	x19, x30

	/* ---------------------------------------------
	 * Force the debug interfaces to be quiescent
	 * ---------------------------------------------
	 */
	bl	denver_disable_ext_debug

	ret	x19
endfunc denver_core_pwr_dwn

	/* -------------------------------------------------------
	 * The CPU Ops cluster power down function for Denver.
	 * -------------------------------------------------------
	 */
func denver_cluster_pwr_dwn
	ret
endfunc denver_cluster_pwr_dwn

	/* ---------------------------------------------
	 * This function provides Denver specific
	 * register information for crash reporting.
	 * It needs to return with x6 pointing to
	 * a list of register names in ascii and
	 * x8 - x15 having values of registers to be
	 * reported.
	 * ---------------------------------------------
	 */
.section .rodata.denver_regs, "aS"
denver_regs:  /* The ascii list of register names to be reported */
	.asciz	"actlr_el1", ""

func denver_cpu_reg_dump
	adr	x6, denver_regs
	mrs	x8, ACTLR_EL1
	ret
endfunc denver_cpu_reg_dump

declare_cpu_ops denver, DENVER_MIDR_PN0, \
	denver_reset_func, \
	denver_core_pwr_dwn, \
	denver_cluster_pwr_dwn

declare_cpu_ops denver, DENVER_MIDR_PN1, \
	denver_reset_func, \
	denver_core_pwr_dwn, \
	denver_cluster_pwr_dwn

declare_cpu_ops denver, DENVER_MIDR_PN2, \
	denver_reset_func, \
	denver_core_pwr_dwn, \
	denver_cluster_pwr_dwn

declare_cpu_ops denver, DENVER_MIDR_PN3, \
	denver_reset_func, \
	denver_core_pwr_dwn, \
	denver_cluster_pwr_dwn

declare_cpu_ops denver, DENVER_MIDR_PN4, \
	denver_reset_func, \
	denver_core_pwr_dwn, \
	denver_cluster_pwr_dwn
Add "Project Denver" CPU support Denver is NVIDIA's own custom-designed, 64-bit, dual-core CPU which is fully ARMv8 architecture compatible. Each of the two Denver cores implements a 7-way superscalar microarchitecture (up to 7 concurrent micro-ops can be executed per clock), and includes a 128KB 4-way L1 instruction cache, a 64KB 4-way L1 data cache, and a 2MB 16-way L2 cache, which services both cores. Denver implements an innovative process called Dynamic Code Optimization, which optimizes frequently used software routines at runtime into dense, highly tuned microcode-equivalent routines. These are stored in a dedicated, 128MB main-memory-based optimization cache. After being read into the instruction cache, the optimized micro-ops are executed, re-fetched and executed from the instruction cache as long as needed and capacity allows. Effectively, this reduces the need to re-optimize the software routines. Instead of using hardware to extract the instruction-level parallelism (ILP) inherent in the code, Denver extracts the ILP once via software techniques, and then executes those routines repeatedly, thus amortizing the cost of ILP extraction over the many execution instances. Denver also features new low latency power-state transitions, in addition to extensive power-gating and dynamic voltage and clock scaling based on workloads. Signed-off-by: Varun Wadekar <vwadekar@nvidia.com> 2015-07-14 12:41:20 +01:00			`/*`
cpus: denver: disable DCO operations from platform code This patch moves the code to disable DCO operations out from common CPU files. This allows the platform code to call thsi API as and when required. There are certain CPU power down states which require the DCO to be kept ON and platforms can decide selectively now. Change-Id: Icb946fe2545a7d8c5903c420d1ee169c4921a2d1 Signed-off-by: Varun Wadekar <vwadekar@nvidia.com> 2016-02-22 19:09:41 +00:00			`* Copyright (c) 2015-2016, ARM Limited and Contributors. All rights reserved.`
Add "Project Denver" CPU support Denver is NVIDIA's own custom-designed, 64-bit, dual-core CPU which is fully ARMv8 architecture compatible. Each of the two Denver cores implements a 7-way superscalar microarchitecture (up to 7 concurrent micro-ops can be executed per clock), and includes a 128KB 4-way L1 instruction cache, a 64KB 4-way L1 data cache, and a 2MB 16-way L2 cache, which services both cores. Denver implements an innovative process called Dynamic Code Optimization, which optimizes frequently used software routines at runtime into dense, highly tuned microcode-equivalent routines. These are stored in a dedicated, 128MB main-memory-based optimization cache. After being read into the instruction cache, the optimized micro-ops are executed, re-fetched and executed from the instruction cache as long as needed and capacity allows. Effectively, this reduces the need to re-optimize the software routines. Instead of using hardware to extract the instruction-level parallelism (ILP) inherent in the code, Denver extracts the ILP once via software techniques, and then executes those routines repeatedly, thus amortizing the cost of ILP extraction over the many execution instances. Denver also features new low latency power-state transitions, in addition to extensive power-gating and dynamic voltage and clock scaling based on workloads. Signed-off-by: Varun Wadekar <vwadekar@nvidia.com> 2015-07-14 12:41:20 +01:00			`*`
Use SPDX license identifiers To make software license auditing simpler, use SPDX[0] license identifiers instead of duplicating the license text in every file. NOTE: Files that have been imported by FreeBSD have not been modified. [0]: https://spdx.org/ Change-Id: I80a00e1f641b8cc075ca5a95b10607ed9ed8761a Signed-off-by: dp-arm <dimitris.papastamos@arm.com> 2017-05-03 09:38:09 +01:00			`* SPDX-License-Identifier: BSD-3-Clause`
Add "Project Denver" CPU support Denver is NVIDIA's own custom-designed, 64-bit, dual-core CPU which is fully ARMv8 architecture compatible. Each of the two Denver cores implements a 7-way superscalar microarchitecture (up to 7 concurrent micro-ops can be executed per clock), and includes a 128KB 4-way L1 instruction cache, a 64KB 4-way L1 data cache, and a 2MB 16-way L2 cache, which services both cores. Denver implements an innovative process called Dynamic Code Optimization, which optimizes frequently used software routines at runtime into dense, highly tuned microcode-equivalent routines. These are stored in a dedicated, 128MB main-memory-based optimization cache. After being read into the instruction cache, the optimized micro-ops are executed, re-fetched and executed from the instruction cache as long as needed and capacity allows. Effectively, this reduces the need to re-optimize the software routines. Instead of using hardware to extract the instruction-level parallelism (ILP) inherent in the code, Denver extracts the ILP once via software techniques, and then executes those routines repeatedly, thus amortizing the cost of ILP extraction over the many execution instances. Denver also features new low latency power-state transitions, in addition to extensive power-gating and dynamic voltage and clock scaling based on workloads. Signed-off-by: Varun Wadekar <vwadekar@nvidia.com> 2015-07-14 12:41:20 +01:00			`*/`

			`#include <arch.h>`
			`#include <asm_macros.S>`
			`#include <assert_macros.S>`
			`#include <denver.h>`
			`#include <cpu_macros.S>`
			`#include <plat_macros.S>`

cpus: denver: disable DCO operations from platform code This patch moves the code to disable DCO operations out from common CPU files. This allows the platform code to call thsi API as and when required. There are certain CPU power down states which require the DCO to be kept ON and platforms can decide selectively now. Change-Id: Icb946fe2545a7d8c5903c420d1ee169c4921a2d1 Signed-off-by: Varun Wadekar <vwadekar@nvidia.com> 2016-02-22 19:09:41 +00:00			`.global denver_disable_dco`

Add "Project Denver" CPU support Denver is NVIDIA's own custom-designed, 64-bit, dual-core CPU which is fully ARMv8 architecture compatible. Each of the two Denver cores implements a 7-way superscalar microarchitecture (up to 7 concurrent micro-ops can be executed per clock), and includes a 128KB 4-way L1 instruction cache, a 64KB 4-way L1 data cache, and a 2MB 16-way L2 cache, which services both cores. Denver implements an innovative process called Dynamic Code Optimization, which optimizes frequently used software routines at runtime into dense, highly tuned microcode-equivalent routines. These are stored in a dedicated, 128MB main-memory-based optimization cache. After being read into the instruction cache, the optimized micro-ops are executed, re-fetched and executed from the instruction cache as long as needed and capacity allows. Effectively, this reduces the need to re-optimize the software routines. Instead of using hardware to extract the instruction-level parallelism (ILP) inherent in the code, Denver extracts the ILP once via software techniques, and then executes those routines repeatedly, thus amortizing the cost of ILP extraction over the many execution instances. Denver also features new low latency power-state transitions, in addition to extensive power-gating and dynamic voltage and clock scaling based on workloads. Signed-off-by: Varun Wadekar <vwadekar@nvidia.com> 2015-07-14 12:41:20 +01:00			`/* ---------------------------------------------`
			`* Disable debug interfaces`
			`* ---------------------------------------------`
			`*/`
			`func denver_disable_ext_debug`
			`mov x0, #1`
			`msr osdlr_el1, x0`
			`isb`
			`dsb sy`
			`ret`
			`endfunc denver_disable_ext_debug`

			`/* ----------------------------------------------------`
			`* Enable dynamic code optimizer (DCO)`
			`* ----------------------------------------------------`
			`*/`
			`func denver_enable_dco`
			`mrs x0, mpidr_el1`
			`and x0, x0, #0xF`
			`mov x1, #1`
			`lsl x1, x1, x0`
			`msr s3_0_c15_c0_2, x1`
			`ret`
			`endfunc denver_enable_dco`

			`/* ----------------------------------------------------`
			`* Disable dynamic code optimizer (DCO)`
			`* ----------------------------------------------------`
			`*/`
			`func denver_disable_dco`

			`/* turn off background work */`
			`mrs x0, mpidr_el1`
			`and x0, x0, #0xF`
			`mov x1, #1`
			`lsl x1, x1, x0`
			`lsl x2, x1, #16`
			`msr s3_0_c15_c0_2, x2`
			`isb`

			`/* wait till the background work turns off */`
			`1: mrs x2, s3_0_c15_c0_2`
			`lsr x2, x2, #32`
			`and w2, w2, 0xFFFF`
			`and x2, x2, x1`
			`cbnz x2, 1b`

			`ret`
			`endfunc denver_disable_dco`

			`/* -------------------------------------------------`
			`* The CPU Ops reset function for Denver.`
			`* -------------------------------------------------`
			`*/`
			`func denver_reset_func`

			`mov x19, x30`

			`/* ----------------------------------------------------`
			`* Enable dynamic code optimizer (DCO)`
			`* ----------------------------------------------------`
			`*/`
			`bl denver_enable_dco`

			`ret x19`
			`endfunc denver_reset_func`

			`/* ----------------------------------------------------`
			`* The CPU Ops core power down function for Denver.`
			`* ----------------------------------------------------`
			`*/`
			`func denver_core_pwr_dwn`

			`mov x19, x30`

			`/* ---------------------------------------------`
			`* Force the debug interfaces to be quiescent`
			`* ---------------------------------------------`
			`*/`
			`bl denver_disable_ext_debug`

			`ret x19`
			`endfunc denver_core_pwr_dwn`

			`/* -------------------------------------------------------`
			`* The CPU Ops cluster power down function for Denver.`
			`* -------------------------------------------------------`
			`*/`
			`func denver_cluster_pwr_dwn`
			`ret`
			`endfunc denver_cluster_pwr_dwn`

			`/* ---------------------------------------------`
			`* This function provides Denver specific`
			`* register information for crash reporting.`
			`* It needs to return with x6 pointing to`
			`* a list of register names in ascii and`
			`* x8 - x15 having values of registers to be`
			`* reported.`
			`* ---------------------------------------------`
			`*/`
			`.section .rodata.denver_regs, "aS"`
			`denver_regs: /* The ascii list of register names to be reported */`
			`.asciz "actlr_el1", ""`

			`func denver_cpu_reg_dump`
			`adr x6, denver_regs`
			`mrs x8, ACTLR_EL1`
			`ret`
			`endfunc denver_cpu_reg_dump`

cpus: Add support for all Denver variants This patch adds support for all variants of the Denver CPUs. The variants export their cpu_ops to allow all Denver platforms to run the Trusted Firmware stack. Change-Id: I1488813ddfd506ffe363d8a32cda1b575e437035 Signed-off-by: Varun Wadekar <vwadekar@nvidia.com> 2015-09-03 12:45:06 +01:00			`declare_cpu_ops denver, DENVER_MIDR_PN0, \`
			`denver_reset_func, \`
			`denver_core_pwr_dwn, \`
			`denver_cluster_pwr_dwn`

			`declare_cpu_ops denver, DENVER_MIDR_PN1, \`
			`denver_reset_func, \`
			`denver_core_pwr_dwn, \`
			`denver_cluster_pwr_dwn`

			`declare_cpu_ops denver, DENVER_MIDR_PN2, \`
			`denver_reset_func, \`
			`denver_core_pwr_dwn, \`
			`denver_cluster_pwr_dwn`

			`declare_cpu_ops denver, DENVER_MIDR_PN3, \`
			`denver_reset_func, \`
			`denver_core_pwr_dwn, \`
			`denver_cluster_pwr_dwn`

			`declare_cpu_ops denver, DENVER_MIDR_PN4, \`
Add provision to extend CPU operations at more levels Various CPU drivers in ARM Trusted Firmware register functions to handle power-down operations. At present, separate functions are registered to power down individual cores and clusters. This scheme operates on the basis of core and cluster, and doesn't cater for extending the hierarchy for power-down operations. For example, future CPUs might support multiple threads which might need powering down individually. This patch therefore reworks the CPU operations framework to allow for registering power down handlers on specific level basis. Henceforth: - Generic code invokes CPU power down operations by the level required. - CPU drivers explicitly mention CPU_NO_RESET_FUNC when the CPU has no reset function. - CPU drivers register power down handlers as a list: a mandatory handler for level 0, and optional handlers for higher levels. All existing CPU drivers are adapted to the new CPU operations framework without needing any functional changes within. Also update firmware design guide. Change-Id: I1826842d37a9e60a9e85fdcee7b4b8f6bc1ad043 Signed-off-by: Jeenu Viswambharan <jeenu.viswambharan@arm.com> 2016-11-18 12:58:28 +00:00			`denver_reset_func, \`
			`denver_core_pwr_dwn, \`
			`denver_cluster_pwr_dwn`