arch/arm/mach-vexpress/dcscb.c

   1 /*
   2  * arch/arm/mach-vexpress/dcscb.c - Dual Cluster System Configuration Block
   3  *
   4  * Created by:  Nicolas Pitre, May 2012
   5  * Copyright:   (C) 2012-2013  Linaro Limited
   6  *
   7  * This program is free software; you can redistribute it and/or modify
   8  * it under the terms of the GNU General Public License version 2 as
   9  * published by the Free Software Foundation.
  10  */
  11
  12 #include <linux/init.h>
  13 #include <linux/kernel.h>
  14 #include <linux/io.h>
  15 #include <linux/spinlock.h>
  16 #include <linux/errno.h>
  17 #include <linux/of_address.h>
  18 #include <linux/vexpress.h>
  19 #include <linux/arm-cci.h>
  20
  21 #include <asm/mcpm.h>
  22 #include <asm/proc-fns.h>
  23 #include <asm/cacheflush.h>
  24 #include <asm/cputype.h>
  25 #include <asm/cp15.h>
  26
  27
  28 #define RST_HOLD0       0x0
  29 #define RST_HOLD1       0x4
  30 #define SYS_SWRESET     0x8
  31 #define RST_STAT0       0xc
  32 #define RST_STAT1       0x10
  33 #define EAG_CFG_R       0x20
  34 #define EAG_CFG_W       0x24
  35 #define KFC_CFG_R       0x28
  36 #define KFC_CFG_W       0x2c
  37 #define DCS_CFG_R       0x30
  38
  39 /*
  40  * We can't use regular spinlocks. In the switcher case, it is possible
  41  * for an outbound CPU to call power_down() while its inbound counterpart
  42  * is already live using the same logical CPU number which trips lockdep
  43  * debugging.
  44  */
  45 static arch_spinlock_t dcscb_lock = __ARCH_SPIN_LOCK_UNLOCKED;
  46
  47 static void __iomem *dcscb_base;
  48 static int dcscb_use_count[4][2];
  49 static int dcscb_allcpus_mask[2];
  50
  51 static int dcscb_power_up(unsigned int cpu, unsigned int cluster)
  52 {
  53         unsigned int rst_hold, cpumask = (1 << cpu);
  54         unsigned int all_mask = dcscb_allcpus_mask[cluster];
  55
  56         pr_debug("%s: cpu %u cluster %u\n", __func__, cpu, cluster);
  57         if (cpu >= 4 || cluster >= 2)
  58                 return -EINVAL;
  59
  60         /*
  61          * Since this is called with IRQs enabled, and no arch_spin_lock_irq
  62          * variant exists, we need to disable IRQs manually here.
  63          */
  64         local_irq_disable();
  65         arch_spin_lock(&dcscb_lock);
  66
  67         dcscb_use_count[cpu][cluster]++;
  68         if (dcscb_use_count[cpu][cluster] == 1) {
  69                 rst_hold = readl_relaxed(dcscb_base + RST_HOLD0 + cluster * 4);
  70                 if (rst_hold & (1 << 8)) {
  71                         /* remove cluster reset and add individual CPU's reset */
  72                         rst_hold &= ~(1 << 8);
  73                         rst_hold |= all_mask;
  74                 }
  75                 rst_hold &= ~(cpumask | (cpumask << 4));
  76                 writel_relaxed(rst_hold, dcscb_base + RST_HOLD0 + cluster * 4);
  77         } else if (dcscb_use_count[cpu][cluster] != 2) {
  78                 /*
  79                  * The only possible values are:
  80                  * 0 = CPU down
  81                  * 1 = CPU (still) up
  82                  * 2 = CPU requested to be up before it had a chance
  83                  *     to actually make itself down.
  84                  * Any other value is a bug.
  85                  */
  86                 BUG();
  87         }
  88
  89         arch_spin_unlock(&dcscb_lock);
  90         local_irq_enable();
  91
  92         return 0;
  93 }
  94
  95 static void dcscb_power_down(void)
  96 {
  97         unsigned int mpidr, cpu, cluster, rst_hold, cpumask, all_mask;
  98         bool last_man = false, skip_wfi = false;
  99
 100         mpidr = read_cpuid_mpidr();
 101         cpu = MPIDR_AFFINITY_LEVEL(mpidr, 0);
 102         cluster = MPIDR_AFFINITY_LEVEL(mpidr, 1);
 103         cpumask = (1 << cpu);
 104         all_mask = dcscb_allcpus_mask[cluster];
 105
 106         pr_debug("%s: cpu %u cluster %u\n", __func__, cpu, cluster);
 107         BUG_ON(cpu >= 4 || cluster >= 2);
 108
 109         __mcpm_cpu_going_down(cpu, cluster);
 110
 111         arch_spin_lock(&dcscb_lock);
 112         BUG_ON(__mcpm_cluster_state(cluster) != CLUSTER_UP);
 113         dcscb_use_count[cpu][cluster]--;
 114         if (dcscb_use_count[cpu][cluster] == 0) {
 115                 rst_hold = readl_relaxed(dcscb_base + RST_HOLD0 + cluster * 4);
 116                 rst_hold |= cpumask;
 117                 if (((rst_hold | (rst_hold >> 4)) & all_mask) == all_mask) {
 118                         rst_hold |= (1 << 8);
 119                         last_man = true;
 120                 }
 121                 writel_relaxed(rst_hold, dcscb_base + RST_HOLD0 + cluster * 4);
 122         } else if (dcscb_use_count[cpu][cluster] == 1) {
 123                 /*
 124                  * A power_up request went ahead of us.
 125                  * Even if we do not want to shut this CPU down,
 126                  * the caller expects a certain state as if the WFI
 127                  * was aborted.  So let's continue with cache cleaning.
 128                  */
 129                 skip_wfi = true;
 130         } else
 131                 BUG();
 132
 133         if (last_man && __mcpm_outbound_enter_critical(cpu, cluster)) {
 134                 arch_spin_unlock(&dcscb_lock);
 135
 136                 /*
 137                  * Flush all cache levels for this cluster.
 138                  *
 139                  * To do so we do:
 140                  * - Clear the SCTLR.C bit to prevent further cache allocations
 141                  * - Flush the whole cache
 142                  * - Clear the ACTLR "SMP" bit to disable local coherency
 143                  *
 144                  * Let's do it in the safest possible way i.e. with
 145                  * no memory access within the following sequence
 146                  * including to the stack.
 147                  */
 148                 asm volatile(
 149                 "mrc    p15, 0, r0, c1, c0, 0   @ get CR \n\t"
 150                 "bic    r0, r0, #"__stringify(CR_C)" \n\t"
 151                 "mcr    p15, 0, r0, c1, c0, 0   @ set CR \n\t"
 152                 "isb    \n\t"
 153                 "bl     v7_flush_dcache_all \n\t"
 154                 "clrex  \n\t"
 155                 "mrc    p15, 0, r0, c1, c0, 1   @ get AUXCR \n\t"
 156                 "bic    r0, r0, #(1 << 6)       @ disable local coherency \n\t"
 157                 "mcr    p15, 0, r0, c1, c0, 1   @ set AUXCR \n\t"
 158                 "isb    \n\t"
 159                 "dsb    "
 160                 : : : "r0","r1","r2","r3","r4","r5","r6","r7",
 161                       "r9","r10","r11","lr","memory");
 162
 163                 /*
 164                  * This is a harmless no-op.  On platforms with a real
 165                  * outer cache this might either be needed or not,
 166                  * depending on where the outer cache sits.
 167                  */
 168                 outer_flush_all();
 169
 170                 /*
 171                  * Disable cluster-level coherency by masking
 172                  * incoming snoops and DVM messages:
 173                  */
 174                 cci_disable_port_by_cpu(mpidr);
 175
 176                 __mcpm_outbound_leave_critical(cluster, CLUSTER_DOWN);
 177         } else {
 178                 arch_spin_unlock(&dcscb_lock);
 179
 180                 /*
 181                  * Flush the local CPU cache.
 182                  * Let's do it in the safest possible way as above.
 183                  */
 184                 asm volatile(
 185                 "mrc    p15, 0, r0, c1, c0, 0   @ get CR \n\t"
 186                 "bic    r0, r0, #"__stringify(CR_C)" \n\t"
 187                 "mcr    p15, 0, r0, c1, c0, 0   @ set CR \n\t"
 188                 "isb    \n\t"
 189                 "bl     v7_flush_dcache_louis \n\t"
 190                 "clrex  \n\t"
 191                 "mrc    p15, 0, r0, c1, c0, 1   @ get AUXCR \n\t"
 192                 "bic    r0, r0, #(1 << 6)       @ disable local coherency \n\t"
 193                 "mcr    p15, 0, r0, c1, c0, 1   @ set AUXCR \n\t"
 194                 "isb    \n\t"
 195                 "dsb    "
 196                 : : : "r0","r1","r2","r3","r4","r5","r6","r7",
 197                       "r9","r10","r11","lr","memory");
 198         }
 199
 200         __mcpm_cpu_down(cpu, cluster);
 201
 202         /* Now we are prepared for power-down, do it: */
 203         dsb();
 204         if (!skip_wfi)
 205                 wfi();
 206
 207         /* Not dead at this point?  Let our caller cope. */
 208 }
 209
 210 static const struct mcpm_platform_ops dcscb_power_ops = {
 211         .power_up       = dcscb_power_up,
 212         .power_down     = dcscb_power_down,
 213 };
 214
 215 static void __init dcscb_usage_count_init(void)
 216 {
 217         unsigned int mpidr, cpu, cluster;
 218
 219         mpidr = read_cpuid_mpidr();
 220         cpu = MPIDR_AFFINITY_LEVEL(mpidr, 0);
 221         cluster = MPIDR_AFFINITY_LEVEL(mpidr, 1);
 222
 223         pr_debug("%s: cpu %u cluster %u\n", __func__, cpu, cluster);
 224         BUG_ON(cpu >= 4 || cluster >= 2);
 225         dcscb_use_count[cpu][cluster] = 1;
 226 }
 227
 228 extern void dcscb_power_up_setup(unsigned int affinity_level);
 229
 230 static int __init dcscb_init(void)
 231 {
 232         struct device_node *node;
 233         unsigned int cfg;
 234         int ret;
 235
 236         if (!cci_probed())
 237                 return -ENODEV;
 238
 239         node = of_find_compatible_node(NULL, NULL, "arm,rtsm,dcscb");
 240         if (!node)
 241                 return -ENODEV;
 242         dcscb_base = of_iomap(node, 0);
 243         if (!dcscb_base)
 244                 return -EADDRNOTAVAIL;
 245         cfg = readl_relaxed(dcscb_base + DCS_CFG_R);
 246         dcscb_allcpus_mask[0] = (1 << (((cfg >> 16) >> (0 << 2)) & 0xf)) - 1;
 247         dcscb_allcpus_mask[1] = (1 << (((cfg >> 16) >> (1 << 2)) & 0xf)) - 1;
 248         dcscb_usage_count_init();
 249
 250         ret = mcpm_platform_register(&dcscb_power_ops);
 251         if (!ret)
 252                 ret = mcpm_sync_init(dcscb_power_up_setup);
 253         if (ret) {
 254                 iounmap(dcscb_base);
 255                 return ret;
 256         }
 257
 258         pr_info("VExpress DCSCB support installed\n");
 259
 260         /*
 261          * Future entries into the kernel can now go
 262          * through the cluster entry vectors.
 263          */
 264         vexpress_flags_set(virt_to_phys(mcpm_entry_point));
 265
 266         return 0;
 267 }
 268
 269 early_initcall(dcscb_init);