| // SPDX-License-Identifier: GPL-2.0+ |
| /* |
| * Copyright 2014-2015 Freescale Semiconductor, Inc. |
| */ |
| |
| #include <common.h> |
| #include <clock_legacy.h> |
| #include <cpu_func.h> |
| #include <image.h> |
| #include <log.h> |
| #include <asm/cache.h> |
| #include <asm/global_data.h> |
| #include <asm/io.h> |
| #include <asm/ptrace.h> |
| #include <asm/system.h> |
| #include <asm/arch/mp.h> |
| #include <asm/arch/soc.h> |
| #include <linux/compat.h> |
| #include <linux/delay.h> |
| #include <linux/psci.h> |
| #include <malloc.h> |
| #include "cpu.h" |
| #include <asm/arch-fsl-layerscape/soc.h> |
| |
| DECLARE_GLOBAL_DATA_PTR; |
| |
| void *get_spin_tbl_addr(void) |
| { |
| /* the spin table is at the beginning */ |
| return secondary_boot_code_start; |
| } |
| |
| void update_os_arch_secondary_cores(uint8_t os_arch) |
| { |
| u64 *table = get_spin_tbl_addr(); |
| int i; |
| |
| for (i = 1; i < CONFIG_MAX_CPUS; i++) { |
| if (os_arch == IH_ARCH_DEFAULT) |
| table[i * WORDS_PER_SPIN_TABLE_ENTRY + |
| SPIN_TABLE_ELEM_ARCH_COMP_IDX] = OS_ARCH_SAME; |
| else |
| table[i * WORDS_PER_SPIN_TABLE_ENTRY + |
| SPIN_TABLE_ELEM_ARCH_COMP_IDX] = OS_ARCH_DIFF; |
| } |
| } |
| |
| #ifdef CONFIG_FSL_LSCH3 |
| static void wake_secondary_core_n(int cluster, int core, int cluster_cores) |
| { |
| struct ccsr_gur __iomem *gur = (void *)(CONFIG_SYS_FSL_GUTS_ADDR); |
| struct ccsr_reset __iomem *rst = (void *)(CONFIG_SYS_FSL_RST_ADDR); |
| u32 mpidr = 0; |
| |
| mpidr = ((cluster << 8) | core); |
| /* |
| * mpidr_el1 register value of core which needs to be released |
| * is written to scratchrw[6] register |
| */ |
| gur_out32(&gur->scratchrw[6], mpidr); |
| asm volatile("dsb st" : : : "memory"); |
| rst->brrl |= 1 << ((cluster * cluster_cores) + core); |
| asm volatile("dsb st" : : : "memory"); |
| /* |
| * scratchrw[6] register value is polled |
| * when the value becomes zero, this means that this core is up |
| * and running, next core can be released now |
| */ |
| while (gur_in32(&gur->scratchrw[6]) != 0) |
| ; |
| } |
| #endif |
| |
| int fsl_layerscape_wake_seconday_cores(void) |
| { |
| struct ccsr_gur __iomem *gur = (void *)(CONFIG_SYS_FSL_GUTS_ADDR); |
| #ifdef CONFIG_FSL_LSCH3 |
| struct ccsr_reset __iomem *rst = (void *)(CONFIG_SYS_FSL_RST_ADDR); |
| u32 svr, ver, cluster, type; |
| int j = 0, cluster_cores = 0; |
| #elif defined(CONFIG_FSL_LSCH2) |
| struct ccsr_scfg __iomem *scfg = (void *)(CONFIG_SYS_FSL_SCFG_ADDR); |
| #endif |
| u32 cores, cpu_up_mask = 1; |
| int i, timeout = 10; |
| u64 *table; |
| #ifdef CONFIG_EFI_LOADER |
| void *reloc_addr; |
| #endif |
| |
| #ifdef COUNTER_FREQUENCY_REAL |
| /* update for secondary cores */ |
| __real_cntfrq = COUNTER_FREQUENCY_REAL; |
| flush_dcache_range((unsigned long)&__real_cntfrq, |
| (unsigned long)&__real_cntfrq + 8); |
| #endif |
| |
| #ifdef CONFIG_EFI_LOADER |
| /* |
| * EFI will reserve 64kb for its runtime services. This will probably |
| * overlap with our spin table code, which is why we have to relocate |
| * it. |
| * Keep this after the __real_cntfrq update, so we have it when we |
| * copy the complete section here. |
| */ |
| reloc_addr = memalign(PAGE_SIZE, |
| round_up(secondary_boot_code_size, PAGE_SIZE)); |
| if (reloc_addr) { |
| debug("Relocating spin table from %p to %p (size %lx)\n", |
| secondary_boot_code_start, reloc_addr, |
| secondary_boot_code_size); |
| memcpy(reloc_addr, secondary_boot_code_start, |
| secondary_boot_code_size); |
| flush_dcache_range((unsigned long)reloc_addr, |
| (unsigned long)reloc_addr + |
| secondary_boot_code_size); |
| |
| /* set new entry point for secondary cores */ |
| secondary_boot_addr += reloc_addr - |
| secondary_boot_code_start; |
| flush_dcache_range((unsigned long)&secondary_boot_addr, |
| (unsigned long)&secondary_boot_addr + 8); |
| |
| /* this will be used to reserve the memory */ |
| secondary_boot_code_start = reloc_addr; |
| } |
| #endif |
| |
| cores = cpu_mask(); |
| /* Clear spin table so that secondary processors |
| * observe the correct value after waking up from wfe. |
| */ |
| table = get_spin_tbl_addr(); |
| memset(table, 0, CONFIG_MAX_CPUS*SPIN_TABLE_ELEM_SIZE); |
| flush_dcache_range((unsigned long)table, |
| (unsigned long)table + |
| (CONFIG_MAX_CPUS*SPIN_TABLE_ELEM_SIZE)); |
| |
| debug("Waking secondary cores to start from %lx\n", gd->relocaddr); |
| |
| #ifdef CONFIG_FSL_LSCH3 |
| gur_out32(&gur->bootlocptrh, (u32)(gd->relocaddr >> 32)); |
| gur_out32(&gur->bootlocptrl, (u32)gd->relocaddr); |
| |
| svr = gur_in32(&gur->svr); |
| ver = SVR_SOC_VER(svr); |
| if (ver == SVR_LS2080A || ver == SVR_LS2085A) { |
| gur_out32(&gur->scratchrw[6], 1); |
| asm volatile("dsb st" : : : "memory"); |
| rst->brrl = cores; |
| asm volatile("dsb st" : : : "memory"); |
| } else { |
| /* |
| * Release the cores out of reset one-at-a-time to avoid |
| * power spikes |
| */ |
| i = 0; |
| cluster = in_le32(&gur->tp_cluster[i].lower); |
| for (j = 0; j < TP_INIT_PER_CLUSTER; j++) { |
| type = initiator_type(cluster, j); |
| if (type && |
| TP_ITYP_TYPE(type) == TP_ITYP_TYPE_ARM) |
| cluster_cores++; |
| } |
| |
| do { |
| cluster = in_le32(&gur->tp_cluster[i].lower); |
| for (j = 0; j < TP_INIT_PER_CLUSTER; j++) { |
| type = initiator_type(cluster, j); |
| if (type && |
| TP_ITYP_TYPE(type) == TP_ITYP_TYPE_ARM) |
| wake_secondary_core_n(i, j, |
| cluster_cores); |
| } |
| i++; |
| } while ((cluster & TP_CLUSTER_EOC) != TP_CLUSTER_EOC); |
| } |
| #elif defined(CONFIG_FSL_LSCH2) |
| scfg_out32(&scfg->scratchrw[0], (u32)(gd->relocaddr >> 32)); |
| scfg_out32(&scfg->scratchrw[1], (u32)gd->relocaddr); |
| asm volatile("dsb st" : : : "memory"); |
| gur_out32(&gur->brrl, cores); |
| asm volatile("dsb st" : : : "memory"); |
| |
| /* Bootup online cores */ |
| scfg_out32(&scfg->corebcr, cores); |
| #endif |
| /* This is needed as a precautionary measure. |
| * If some code before this has accidentally released the secondary |
| * cores then the pre-bootloader code will trap them in a "wfe" unless |
| * the scratchrw[6] is set. In this case we need a sev here to get these |
| * cores moving again. |
| */ |
| asm volatile("sev"); |
| |
| while (timeout--) { |
| flush_dcache_range((unsigned long)table, (unsigned long)table + |
| CONFIG_MAX_CPUS * 64); |
| for (i = 1; i < CONFIG_MAX_CPUS; i++) { |
| if (table[i * WORDS_PER_SPIN_TABLE_ENTRY + |
| SPIN_TABLE_ELEM_STATUS_IDX]) |
| cpu_up_mask |= 1 << i; |
| } |
| if (hweight32(cpu_up_mask) == hweight32(cores)) |
| break; |
| udelay(10); |
| } |
| if (timeout <= 0) { |
| printf("CPU: Failed to bring up some cores (mask 0x%x)\n", |
| cores ^ cpu_up_mask); |
| return 1; |
| } |
| printf("CPU: %d cores online\n", hweight32(cores)); |
| |
| return 0; |
| } |
| |
| int is_core_valid(unsigned int core) |
| { |
| return !!((1 << core) & cpu_mask()); |
| } |
| |
| static int is_pos_valid(unsigned int pos) |
| { |
| return !!((1 << pos) & cpu_pos_mask()); |
| } |
| |
| int is_core_online(u64 cpu_id) |
| { |
| u64 *table = get_spin_tbl_addr(); |
| int pos = id_to_core(cpu_id); |
| table += pos * WORDS_PER_SPIN_TABLE_ENTRY; |
| return table[SPIN_TABLE_ELEM_STATUS_IDX] == 1; |
| } |
| |
| int cpu_reset(u32 nr) |
| { |
| puts("Feature is not implemented.\n"); |
| |
| return 0; |
| } |
| |
| int cpu_disable(u32 nr) |
| { |
| puts("Feature is not implemented.\n"); |
| |
| return 0; |
| } |
| |
| static int core_to_pos(int nr) |
| { |
| u32 cores = cpu_pos_mask(); |
| int i, count = 0; |
| |
| if (nr == 0) { |
| return 0; |
| } else if (nr >= hweight32(cores)) { |
| puts("Not a valid core number.\n"); |
| return -1; |
| } |
| |
| for (i = 1; i < 32; i++) { |
| if (is_pos_valid(i)) { |
| count++; |
| if (count == nr) |
| break; |
| } |
| } |
| |
| if (count != nr) |
| return -1; |
| |
| return i; |
| } |
| |
| int cpu_status(u32 nr) |
| { |
| u64 *table = get_spin_tbl_addr(); |
| int pos; |
| |
| if (nr == 0) { |
| printf("table base @ 0x%p\n", table); |
| } else { |
| pos = core_to_pos(nr); |
| if (pos < 0) |
| return -1; |
| table += pos * WORDS_PER_SPIN_TABLE_ENTRY; |
| printf("table @ 0x%p\n", table); |
| printf(" addr - 0x%016llx\n", |
| table[SPIN_TABLE_ELEM_ENTRY_ADDR_IDX]); |
| printf(" status - 0x%016llx\n", |
| table[SPIN_TABLE_ELEM_STATUS_IDX]); |
| printf(" lpid - 0x%016llx\n", |
| table[SPIN_TABLE_ELEM_LPID_IDX]); |
| } |
| |
| return 0; |
| } |
| |
| int cpu_release(u32 nr, int argc, char *const argv[]) |
| { |
| u64 boot_addr; |
| u64 *table = get_spin_tbl_addr(); |
| int pos; |
| int ret; |
| |
| boot_addr = simple_strtoull(argv[0], NULL, 16); |
| |
| if (check_psci()) { |
| /* SPIN Table is used */ |
| pos = core_to_pos(nr); |
| if (pos <= 0) |
| return -1; |
| |
| table += pos * WORDS_PER_SPIN_TABLE_ENTRY; |
| table[SPIN_TABLE_ELEM_ENTRY_ADDR_IDX] = boot_addr; |
| flush_dcache_range((unsigned long)table, |
| (unsigned long)table + SPIN_TABLE_ELEM_SIZE); |
| asm volatile("dsb st"); |
| |
| /* |
| * The secondary CPUs polling the spin-table above for a non-zero |
| * value. To save power "wfe" is called. Thus call "sev" here to |
| * wake the CPUs and let them check the spin-table again (see |
| * slave_cpu loop in lowlevel.S) |
| */ |
| asm volatile("sev"); |
| } else { |
| /* Use PSCI to kick the core */ |
| printf("begin to kick cpu core #%d to address %llx\n", |
| nr, boot_addr); |
| ret = invoke_psci_fn(PSCI_0_2_FN64_CPU_ON, nr, boot_addr, 0); |
| if (ret) |
| return -1; |
| } |
| |
| return 0; |
| } |