On Fri, May 09 2014 at 3:05:22 pm BST, Christoffer Dall <christoffer.dall@xxxxxxxxxx> wrote: > On Wed, Apr 16, 2014 at 02:39:34PM +0100, Marc Zyngier wrote: >> The Generic Interrupt Controller (version 3) offers services that are >> similar to GICv2, with a number of additional features: >> - Affinity routing based on the CPU MPIDR (ARE) >> - System register for the CPU interfaces (SRE) >> - Support for more that 8 CPUs >> - Locality-specific Peripheral Interrupts (LPIs) >> - Interrupt Translation Services (ITS) >> >> This patch adds preliminary support for GICv3 with ARE and SRE, >> non-secure mode only. It relies on higher exception levels to grant ARE >> and SRE access. >> >> Support for LPI and ITS will be added at a later time. >> >> Cc: Thomas Gleixner <tglx@xxxxxxxxxxxxx> >> Reviewed-by: Zi Shen Lim <zlim@xxxxxxxxxxxx> >> Acked-by: Catalin Marinas <catalin.marinas@xxxxxxx> >> Signed-off-by: Marc Zyngier <marc.zyngier@xxxxxxx> >> --- >> arch/arm64/Kconfig | 1 + >> arch/arm64/kernel/head.S | 18 + >> arch/arm64/kernel/hyp-stub.S | 1 + >> drivers/irqchip/Kconfig | 5 + >> drivers/irqchip/Makefile | 1 + >> drivers/irqchip/irq-gic-v3.c | 681 +++++++++++++++++++++++++++++++++++++ >> include/linux/irqchip/arm-gic-v3.h | 188 ++++++++++ >> 7 files changed, 895 insertions(+) >> create mode 100644 drivers/irqchip/irq-gic-v3.c >> create mode 100644 include/linux/irqchip/arm-gic-v3.h >> >> diff --git a/arch/arm64/Kconfig b/arch/arm64/Kconfig >> index 27bbcfc..5bd0dfe 100644 >> --- a/arch/arm64/Kconfig >> +++ b/arch/arm64/Kconfig >> @@ -9,6 +9,7 @@ config ARM64 >> select ARM_AMBA >> select ARM_ARCH_TIMER >> select ARM_GIC >> + select ARM_GIC_V3 >> select BUILDTIME_EXTABLE_SORT >> select CLONE_BACKWARDS >> select COMMON_CLK >> diff --git a/arch/arm64/kernel/head.S b/arch/arm64/kernel/head.S >> index 0b281ff..7c56e93 100644 >> --- a/arch/arm64/kernel/head.S >> +++ b/arch/arm64/kernel/head.S >> @@ -22,6 +22,7 @@ >> >> #include <linux/linkage.h> >> #include <linux/init.h> >> +#include <linux/irqchip/arm-gic-v3.h> >> >> #include <asm/assembler.h> >> #include <asm/ptrace.h> >> @@ -183,6 +184,23 @@ CPU_LE( bic x0, x0, #(3 << 24) ) // Clear the EE and E0E bits for EL1 >> msr cnthctl_el2, x0 >> msr cntvoff_el2, xzr // Clear virtual offset >> >> +#ifdef CONFIG_ARM_GIC_V3 >> + /* GICv3 system register access */ >> + mrs x0, id_aa64pfr0_el1 >> + ubfx x0, x0, #24, #4 >> + cmp x0, #1 >> + b.ne 3f >> + >> + mrs x0, ICC_SRE_EL2 >> + orr x0, x0, #1 // Set ICC_SRE_EL2.SRE==1 >> + orr x0, x0, #(1 << 3) // Set ICC_SRE_EL2.Enable==1 >> + msr ICC_SRE_EL2, x0 >> + isb // Make sure SRE is now 1 >> + msr ICH_HCR_EL2, xzr // Reset ICC_HCR_EL2 to defaults >> + >> +3: >> +#endif >> + >> /* Populate ID registers. */ >> mrs x0, midr_el1 >> mrs x1, mpidr_el1 >> diff --git a/arch/arm64/kernel/hyp-stub.S b/arch/arm64/kernel/hyp-stub.S >> index 0959611..a272f33 100644 >> --- a/arch/arm64/kernel/hyp-stub.S >> +++ b/arch/arm64/kernel/hyp-stub.S >> @@ -19,6 +19,7 @@ >> >> #include <linux/init.h> >> #include <linux/linkage.h> >> +#include <linux/irqchip/arm-gic-v3.h> >> >> #include <asm/assembler.h> >> #include <asm/ptrace.h> >> diff --git a/drivers/irqchip/Kconfig b/drivers/irqchip/Kconfig >> index 61ffdca..5b55c46 100644 >> --- a/drivers/irqchip/Kconfig >> +++ b/drivers/irqchip/Kconfig >> @@ -10,6 +10,11 @@ config ARM_GIC >> config GIC_NON_BANKED >> bool >> >> +config ARM_GIC_V3 >> + bool >> + select IRQ_DOMAIN >> + select MULTI_IRQ_HANDLER >> + >> config ARM_NVIC >> bool >> select IRQ_DOMAIN >> diff --git a/drivers/irqchip/Makefile b/drivers/irqchip/Makefile >> index 22e616c..4adfda8 100644 >> --- a/drivers/irqchip/Makefile >> +++ b/drivers/irqchip/Makefile >> @@ -14,6 +14,7 @@ obj-$(CONFIG_ORION_IRQCHIP) += irq-orion.o >> obj-$(CONFIG_ARCH_SUNXI) += irq-sun4i.o >> obj-$(CONFIG_ARCH_SPEAR3XX) += spear-shirq.o >> obj-$(CONFIG_ARM_GIC) += irq-gic.o irq-gic-common.o >> +obj-$(CONFIG_ARM_GIC_V3) += irq-gic-v3.o irq-gic-common.o >> obj-$(CONFIG_ARM_NVIC) += irq-nvic.o >> obj-$(CONFIG_ARM_VIC) += irq-vic.o >> obj-$(CONFIG_IMGPDC_IRQ) += irq-imgpdc.o >> diff --git a/drivers/irqchip/irq-gic-v3.c b/drivers/irqchip/irq-gic-v3.c >> new file mode 100644 >> index 0000000..b4c8140 >> --- /dev/null >> +++ b/drivers/irqchip/irq-gic-v3.c >> @@ -0,0 +1,681 @@ >> +/* >> + * Copyright (C) 2013, 2014 ARM Limited, All Rights Reserved. >> + * Author: Marc Zyngier <marc.zyngier@xxxxxxx> >> + * >> + * This program is free software; you can redistribute it and/or modify >> + * it under the terms of the GNU General Public License version 2 as >> + * published by the Free Software Foundation. >> + * >> + * This program is distributed in the hope that it will be useful, >> + * but WITHOUT ANY WARRANTY; without even the implied warranty of >> + * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the >> + * GNU General Public License for more details. >> + * >> + * You should have received a copy of the GNU General Public License >> + * along with this program. If not, see <http://www.gnu.org/licenses/>. >> + */ >> + >> +#include <linux/cpu.h> >> +#include <linux/delay.h> >> +#include <linux/interrupt.h> >> +#include <linux/of.h> >> +#include <linux/of_address.h> >> +#include <linux/of_irq.h> >> +#include <linux/percpu.h> >> +#include <linux/slab.h> >> + >> +#include <linux/irqchip/arm-gic-v3.h> >> + >> +#include <asm/cputype.h> >> +#include <asm/exception.h> >> +#include <asm/smp_plat.h> >> + >> +#include "irq-gic-common.h" >> +#include "irqchip.h" >> + >> +struct gic_chip_data { >> + void __iomem *dist_base; >> + void __iomem **redist_base; >> + void __percpu __iomem **rdist; >> + struct irq_domain *domain; >> + u64 redist_stride; >> + u32 redist_regions; >> + unsigned int irq_nr; >> +}; >> + >> +static struct gic_chip_data gic_data __read_mostly; >> + >> +#define gic_data_rdist() (this_cpu_ptr(gic_data.rdist)) >> +#define gic_data_rdist_rd_base() (*gic_data_rdist()) >> +#define gic_data_rdist_sgi_base() (gic_data_rdist_rd_base() + SZ_64K) >> + >> +#define DEFAULT_PMR_VALUE 0xf0 >> + >> +static inline unsigned int gic_irq(struct irq_data *d) >> +{ >> + return d->hwirq; >> +} >> + >> +static inline int gic_irq_in_rdist(struct irq_data *d) >> +{ >> + return gic_irq(d) < 32; >> +} >> + >> +static inline void __iomem *gic_dist_base(struct irq_data *d) >> +{ >> + if (gic_irq_in_rdist(d)) /* SGI+PPI -> SGI_base for this CPU */ >> + return gic_data_rdist_sgi_base(); >> + >> + if (d->hwirq <= 1023) /* SPI -> dist_base */ >> + return gic_data.dist_base; >> + >> + if (d->hwirq >= 8192) >> + BUG(); /* LPI Detected!!! */ >> + >> + return NULL; >> +} >> + >> +static void gic_do_wait_for_rwp(void __iomem *base) >> +{ >> + u32 count = 1000000; /* 1s! */ >> + >> + while (readl_relaxed(base + GICD_CTLR) & GICD_CTLR_RWP) { >> + count--; >> + if (!count) { >> + pr_err_ratelimited("RWP timeout, gone fishing\n"); >> + return; >> + } >> + cpu_relax(); >> + udelay(1); >> + }; >> +} >> + >> +/* Wait for completion of a distributor change */ >> +static void gic_dist_wait_for_rwp(void) >> +{ >> + gic_do_wait_for_rwp(gic_data.dist_base); >> +} >> + >> +/* Wait for completion of a redistributor change */ >> +static void gic_redist_wait_for_rwp(void) >> +{ >> + gic_do_wait_for_rwp(gic_data_rdist_rd_base()); >> +} >> + >> +/* Low level accessors */ >> +static u64 gic_read_iar(void) >> +{ >> + u64 irqstat; >> + >> + asm volatile("mrs %0, " __stringify(ICC_IAR1_EL1) : "=r" (irqstat)); >> + return irqstat; >> +} >> + >> +static void gic_write_pmr(u64 val) >> +{ >> + asm volatile("msr " __stringify(ICC_PMR_EL1) ", %0" : : "r" (val)); >> +} >> + >> +static void gic_write_ctlr(u64 val) >> +{ >> + asm volatile("msr " __stringify(ICC_CTLR_EL1) ", %0" : : "r" (val)); >> + isb(); >> +} >> + >> +static void gic_write_grpen1(u64 val) >> +{ >> + asm volatile("msr " __stringify(ICC_GRPEN1_EL1) ", %0" : : "r" (val)); >> + isb(); >> +} >> + >> +static void gic_write_sgi1r(u64 val) >> +{ >> + asm volatile("msr " __stringify(ICC_SGI1R_EL1) ", %0" : : "r" (val)); >> +} >> + >> +static void gic_enable_sre(void) >> +{ >> + u64 val; >> + >> + asm volatile("mrs %0, " __stringify(ICC_SRE_EL1) : "=r" (val)); >> + val |= GICC_SRE_EL1_SRE; >> + asm volatile("msr " __stringify(ICC_SRE_EL1) ", %0" : : "r" (val)); >> + isb(); >> + >> + /* >> + * Need to check that the SRE bit has actually been set. If >> + * not, it means that SRE is disabled at EL2. We're going to >> + * die painfully, and there is nothing we can do about it. >> + * >> + * Kindly inform the luser. >> + */ >> + asm volatile("mrs %0, " __stringify(ICC_SRE_EL1) : "=r" (val)); >> + if (!(val & GICC_SRE_EL1_SRE)) >> + pr_err("GIC: unable to set SRE (disabled at EL2), panic ahead\n"); >> +} >> + >> +static void gic_enable_redist(void) >> +{ >> + void __iomem *rbase; >> + u32 count = 1000000; /* 1s! */ >> + u32 val; >> + >> + rbase = gic_data_rdist_rd_base(); >> + >> + /* Wake up this CPU redistributor */ >> + val = readl_relaxed(rbase + GICR_WAKER); >> + val &= ~GICR_WAKER_ProcessorSleep; >> + writel_relaxed(val, rbase + GICR_WAKER); >> + >> + while (readl_relaxed(rbase + GICR_WAKER) & GICR_WAKER_ChildrenAsleep) { >> + count--; >> + if (!count) { >> + pr_err_ratelimited("redist didn't wake up...\n"); >> + return; >> + } >> + cpu_relax(); >> + udelay(1); >> + }; >> +} >> + >> +/* >> + * Routines to acknowledge, disable and enable interrupts >> + */ >> +static void gic_poke_irq(struct irq_data *d, u32 offset) >> +{ >> + u32 mask = 1 << (gic_irq(d) % 32); >> + void (*rwp_wait)(void); >> + void __iomem *base; >> + >> + if (gic_irq_in_rdist(d)) { >> + base = gic_data_rdist_sgi_base(); >> + rwp_wait = gic_redist_wait_for_rwp; >> + } else { >> + base = gic_data.dist_base; >> + rwp_wait = gic_dist_wait_for_rwp; >> + } >> + >> + writel_relaxed(mask, base + offset + (gic_irq(d) / 32) * 4); >> + rwp_wait(); >> +} >> + >> +static int gic_peek_irq(struct irq_data *d, u32 offset) >> +{ >> + u32 mask = 1 << (gic_irq(d) % 32); >> + void __iomem *base; >> + >> + if (gic_irq_in_rdist(d)) >> + base = gic_data_rdist_sgi_base(); >> + else >> + base = gic_data.dist_base; >> + >> + return !!(readl_relaxed(base + offset + (gic_irq(d) / 32) * 4) & mask); >> +} >> + >> +static void gic_mask_irq(struct irq_data *d) >> +{ >> + gic_poke_irq(d, GICD_ICENABLER); >> +} >> + >> +static void gic_unmask_irq(struct irq_data *d) >> +{ >> + gic_poke_irq(d, GICD_ISENABLER); >> +} >> + >> +static void gic_eoi_irq(struct irq_data *d) >> +{ >> + gic_write_eoir(gic_irq(d)); >> +} >> + >> +static int gic_set_type(struct irq_data *d, unsigned int type) >> +{ >> + unsigned int irq = gic_irq(d); >> + void (*rwp_wait)(void); >> + void __iomem *base; >> + >> + if (gic_irq_in_rdist(d)) { >> + base = gic_data_rdist_sgi_base(); >> + rwp_wait = gic_redist_wait_for_rwp; >> + } else { >> + base = gic_data.dist_base; >> + rwp_wait = gic_dist_wait_for_rwp; >> + } >> + >> + /* Interrupt configuration for SGIs can't be changed */ >> + if (irq < 16) >> + return -EINVAL; >> + >> + if (type != IRQ_TYPE_LEVEL_HIGH && type != IRQ_TYPE_EDGE_RISING) >> + return -EINVAL; >> + >> + gic_configure_irq(irq, type, base, rwp_wait); > > I'm noticing here that we're only waiting for the write to config/enable > if the IRQ was already enabled in gic_configure_irq, but gic_unmask_irq > just enables the IRQ without waiting for operation to complete. > > So I'm wondering if there isn't a disconnect between configuring a > disabled IRQ and immediately unmasking it, versus configuring an enabled > IRQ? That's a good point. gic_configure_irq() should wait for rwp unconditionnally in the epilogue. >> + >> + return 0; >> +} >> + >> +static u64 gic_mpidr_to_affinity(u64 mpidr) >> +{ >> + u64 aff; >> + >> + aff = (MPIDR_AFFINITY_LEVEL(mpidr, 3) << 32 | >> + MPIDR_AFFINITY_LEVEL(mpidr, 2) << 16 | >> + MPIDR_AFFINITY_LEVEL(mpidr, 1) << 8 | >> + MPIDR_AFFINITY_LEVEL(mpidr, 0)) & ~GICD_IROUTER_SPI_MODE_ANY; >> + >> + return aff; >> +} >> + >> +static asmlinkage void __exception_irq_entry gic_handle_irq(struct pt_regs *regs) >> +{ >> + u64 irqnr; >> + >> + do { >> + irqnr = gic_read_iar(); >> + >> + if (likely(irqnr > 15 && irqnr < 1021)) { >> + irqnr = irq_find_mapping(gic_data.domain, irqnr); >> + handle_IRQ(irqnr, regs); >> + continue; >> + } >> + if (irqnr < 16) { >> + gic_write_eoir(irqnr); >> +#ifdef CONFIG_SMP >> + handle_IPI(irqnr, regs); >> +#else >> + WARN_ONCE(true, "Unexpected SGI received!\n"); >> +#endif >> + continue; >> + } >> + } while (irqnr != 0x3ff); >> +} >> + >> +static void __init gic_dist_init(void) >> +{ >> + unsigned int i; >> + u64 affinity; >> + void __iomem *base = gic_data.dist_base; >> + >> + /* Disable the distributor */ >> + writel_relaxed(0, base + GICD_CTLR); >> + >> + gic_dist_config(base, gic_data.irq_nr, gic_dist_wait_for_rwp); >> + >> + /* Enable distributor with ARE, Group1 */ >> + writel_relaxed(GICD_CTLR_ARE_NS | GICD_CTLR_ENABLE_G1A | GICD_CTLR_ENABLE_G1, >> + base + GICD_CTLR); >> + >> + /* >> + * Set all global interrupts to the boot CPU only. ARE must be >> + * enabled. >> + */ >> + affinity = gic_mpidr_to_affinity(cpu_logical_map(smp_processor_id())); >> + for (i = 32; i < gic_data.irq_nr; i++) >> + writeq_relaxed(affinity, base + GICD_IROUTER + i * 8); >> +} >> + >> +static int gic_populate_rdist(void) >> +{ >> + u64 mpidr = cpu_logical_map(smp_processor_id()); >> + u64 typer; >> + u32 aff; >> + int i; >> + >> + /* Convery affinity to a 32bit value... */ > > s/Convery/Convert/ > > while you're at it, you could go the extra mile and specify "that can be > matched to GICR_TYPER bits [63:32]". If you really wanted to. Sure. >> + aff = (MPIDR_AFFINITY_LEVEL(mpidr, 3) << 24 | >> + MPIDR_AFFINITY_LEVEL(mpidr, 2) << 16 | >> + MPIDR_AFFINITY_LEVEL(mpidr, 1) << 8 | >> + MPIDR_AFFINITY_LEVEL(mpidr, 0)); >> + >> + for (i = 0; i < gic_data.redist_regions; i++) { >> + void __iomem *ptr = gic_data.redist_base[i]; >> + u32 reg; >> + >> + reg = readl_relaxed(ptr + GICR_PIDR2) & GIC_PIDR2_ARCH_MASK; >> + if (reg != 0x30 && reg != 0x40) { /* We're in trouble... */ >> + pr_warn("No redistributor present @%p\n", ptr); >> + break; >> + } >> + >> + do { >> + typer = readq_relaxed(ptr + GICR_TYPER); >> + if ((typer >> 32) == aff) { >> + gic_data_rdist_rd_base() = ptr; >> + pr_info("CPU%d: found redistributor %llx @%p\n", >> + smp_processor_id(), >> + (unsigned long long)mpidr, ptr); >> + return 0; >> + } >> + >> + if (gic_data.redist_stride) { >> + ptr += gic_data.redist_stride; >> + } else { >> + ptr += SZ_64K * 2; /* Skip RD_base + SGI_base */ >> + if (typer & GICR_TYPER_VLPIS) >> + ptr += SZ_64K * 2; /* Skip VLPI_base + reserved page */ >> + } >> + } while (!(typer & GICR_TYPER_LAST)); >> + } >> + >> + /* We couldn't even deal with ourselves... */ >> + WARN(true, "CPU%d: mpidr %llx has no re-distributor!\n", >> + smp_processor_id(), (unsigned long long)mpidr); >> + return -ENODEV; >> +} >> + >> +static void gic_cpu_init(void) >> +{ >> + void __iomem *rbase; >> + >> + /* Register ourselves with the rest of the world */ >> + if (gic_populate_rdist()) >> + return; >> + >> + gic_enable_redist(); >> + >> + rbase = gic_data_rdist_sgi_base(); >> + >> + gic_cpu_config(rbase, gic_redist_wait_for_rwp); >> + >> + /* Enable system registers */ >> + gic_enable_sre(); >> + >> + /* Set priority mask register */ >> + gic_write_pmr(DEFAULT_PMR_VALUE); >> + >> + /* EOI deactivates interrupt too (mode 0) */ >> + gic_write_ctlr(GICC_CTLR_EL1_EOImode_drop_dir); >> + >> + /* ... and let's hit the road... */ >> + gic_write_grpen1(1); >> +} >> + >> +#ifdef CONFIG_SMP >> +static int gic_secondary_init(struct notifier_block *nfb, >> + unsigned long action, void *hcpu) >> +{ >> + if (action == CPU_STARTING || action == CPU_STARTING_FROZEN) >> + gic_cpu_init(); >> + return NOTIFY_OK; >> +} >> + >> +/* >> + * Notifier for enabling the GIC CPU interface. Set an arbitrarily high >> + * priority because the GIC needs to be up before the ARM generic timers. >> + */ >> +static struct notifier_block gic_cpu_notifier = { >> + .notifier_call = gic_secondary_init, >> + .priority = 100, >> +}; >> + >> +static u16 gic_compute_target_list(int *base_cpu, const struct cpumask *mask, >> + u64 cluster_id) >> +{ >> + int cpu = *base_cpu; >> + u64 mpidr = cpu_logical_map(cpu); >> + u16 tlist = 0; >> + >> + while (cpu < nr_cpu_ids) { >> + /* >> + * If we ever get a cluster of more than 16 CPUs, just >> + * scream and skip that CPU. >> + */ >> + if (WARN_ON((mpidr & 0xff) >= 16)) >> + goto out; >> + >> + tlist |= 1 << (mpidr & 0xf); >> + >> + cpu = cpumask_next(cpu, mask); >> + if (cpu == nr_cpu_ids) >> + goto out; >> + >> + mpidr = cpu_logical_map(cpu); >> + >> + if (cluster_id != (mpidr & ~0xffUL)) { >> + cpu--; >> + goto out; >> + } >> + } >> +out: >> + *base_cpu = cpu; >> + return tlist; >> +} >> + >> +static void gic_send_sgi(u64 cluster_id, u16 tlist, unsigned int irq) >> +{ >> + u64 val; >> + >> + val = (MPIDR_AFFINITY_LEVEL(cluster_id, 3) << 48 | >> + MPIDR_AFFINITY_LEVEL(cluster_id, 2) << 32 | >> + irq << 24 | >> + MPIDR_AFFINITY_LEVEL(cluster_id, 1) << 16 | >> + tlist); >> + >> + pr_debug("CPU%d: ICC_SGI1R_EL1 %llx\n", smp_processor_id(), val); >> + gic_write_sgi1r(val); >> +} >> + >> +static void gic_raise_softirq(const struct cpumask *mask, unsigned int irq) >> +{ >> + int cpu; >> + >> + if (WARN_ON(irq >= 16)) >> + return; >> + >> + /* >> + * Ensure that stores to Normal memory are visible to the >> + * other CPUs before issuing the IPI. >> + */ >> + smp_wmb(); >> + >> + for_each_cpu_mask(cpu, *mask) { >> + u64 cluster_id = cpu_logical_map(cpu) & ~0xffUL; >> + u16 tlist; >> + >> + tlist = gic_compute_target_list(&cpu, mask, cluster_id); >> + gic_send_sgi(cluster_id, tlist, irq); >> + } >> + >> + /* Force the above writes to ICC_SGI1R_EL1 to be executed */ >> + isb(); >> +} >> + >> +static void gic_smp_init(void) >> +{ >> + set_smp_cross_call(gic_raise_softirq); >> + register_cpu_notifier(&gic_cpu_notifier); >> +} >> + >> +static int gic_set_affinity(struct irq_data *d, const struct cpumask *mask_val, >> + bool force) >> +{ >> + unsigned int cpu = cpumask_any_and(mask_val, cpu_online_mask); >> + void __iomem *reg; >> + int enabled; >> + u64 val; >> + >> + if (gic_irq_in_rdist(d)) >> + return -EINVAL; >> + >> + /* If interrupt was enabled, disable it first */ >> + enabled = gic_peek_irq(d, GICD_ISENABLER); >> + if (enabled) >> + gic_mask_irq(d); >> + >> + reg = gic_dist_base(d) + GICD_IROUTER + (gic_irq(d) * 8); >> + val = gic_mpidr_to_affinity(cpu_logical_map(cpu)); >> + >> + writeq_relaxed(val, reg); >> + >> + /* >> + * If the interrupt was enabled, enabled it again. Otherwise, >> + * just wait for the distributor to have digested our changes. >> + */ >> + if (enabled) >> + gic_unmask_irq(d); >> + else >> + gic_dist_wait_for_rwp(); > > If we don't need to wait for RWP when enabling the interrupt, why do we > need to wait if we're not going to enable it (presumably nothing ever > takes effect until someone later enables the interrupt, in which case > the effect would be the same? no?)? We do wait on the unmask path too (see gic_poke_irq). >> + >> + return IRQ_SET_MASK_OK; >> +} >> +#else >> +#define gic_set_affinity NULL >> +#define gic_smp_init() do { } while(0) >> +#endif >> + >> +static struct irq_chip gic_chip = { >> + .name = "GICv3", >> + .irq_mask = gic_mask_irq, >> + .irq_unmask = gic_unmask_irq, >> + .irq_eoi = gic_eoi_irq, >> + .irq_set_type = gic_set_type, >> + .irq_set_affinity = gic_set_affinity, >> +}; >> + >> +static int gic_irq_domain_map(struct irq_domain *d, unsigned int irq, >> + irq_hw_number_t hw) >> +{ >> + /* SGIs are private to the core kernel */ >> + if (hw < 16) >> + return -EPERM; >> + /* PPIs */ >> + if (hw < 32) { >> + irq_set_percpu_devid(irq); >> + irq_set_chip_and_handler(irq, &gic_chip, >> + handle_percpu_devid_irq); >> + set_irq_flags(irq, IRQF_VALID | IRQF_NOAUTOEN); >> + } >> + /* SPIs */ >> + if (hw >= 32 && hw < gic_data.irq_nr) { >> + irq_set_chip_and_handler(irq, &gic_chip, >> + handle_fasteoi_irq); >> + set_irq_flags(irq, IRQF_VALID | IRQF_PROBE); >> + } >> + irq_set_chip_data(irq, d->host_data); >> + return 0; >> +} >> + >> +static int gic_irq_domain_xlate(struct irq_domain *d, >> + struct device_node *controller, >> + const u32 *intspec, unsigned int intsize, >> + unsigned long *out_hwirq, unsigned int *out_type) >> +{ >> + if (d->of_node != controller) >> + return -EINVAL; >> + if (intsize < 3) >> + return -EINVAL; >> + >> + switch(intspec[0]) { >> + case 0: /* SPI */ >> + *out_hwirq = intspec[1] + 32; >> + break; >> + case 1: /* PPI */ >> + *out_hwirq = intspec[1] + 16; >> + break; >> + default: >> + return -EINVAL; >> + } >> + >> + *out_type = intspec[2] & IRQ_TYPE_SENSE_MASK; >> + return 0; >> +} >> + >> +static const struct irq_domain_ops gic_irq_domain_ops = { >> + .map = gic_irq_domain_map, >> + .xlate = gic_irq_domain_xlate, >> +}; >> + >> +static int __init gic_of_init(struct device_node *node, struct device_node *parent) >> +{ >> + void __iomem *dist_base; >> + void __iomem **redist_base; >> + u64 redist_stride; >> + u32 redist_regions; >> + u32 reg; >> + int gic_irqs; >> + int err; >> + int i; >> + >> + dist_base = of_iomap(node, 0); >> + if (!dist_base) { >> + pr_err("%s: unable to map gic dist registers\n", >> + node->full_name); >> + return -ENXIO; >> + } >> + >> + reg = readl_relaxed(dist_base + GICD_PIDR2) & GIC_PIDR2_ARCH_MASK; >> + if (reg != 0x30 && reg != 0x40) { >> + pr_err("%s: no distributor detected, giving up\n", >> + node->full_name); >> + err = -ENODEV; >> + goto out_unmap_dist; >> + } >> + >> + if (of_property_read_u32(node, "#redistributor-regions", &redist_regions)) >> + redist_regions = 1; >> + >> + redist_base = kzalloc(sizeof(*redist_base) * redist_regions, GFP_KERNEL); >> + if (!redist_base) { >> + err = -ENOMEM; >> + goto out_unmap_dist; >> + } >> + >> + for (i = 0; i < redist_regions; i++) { >> + redist_base[i] = of_iomap(node, 1 + i); >> + if (!redist_base[i]) { >> + pr_err("%s: couldn't map region %d\n", >> + node->full_name, i); >> + err = -ENODEV; >> + goto out_unmap_rdist; >> + } >> + } >> + >> + if (of_property_read_u64(node, "redistributor-stride", &redist_stride)) >> + redist_stride = 0; >> + >> + gic_data.dist_base = dist_base; >> + gic_data.redist_base = redist_base; >> + gic_data.redist_regions = redist_regions; >> + gic_data.redist_stride = redist_stride; >> + >> + /* >> + * Find out how many interrupts are supported. >> + * The GIC only supports up to 1020 interrupt sources (SGI+PPI+SPI) >> + */ >> + gic_irqs = readl_relaxed(gic_data.dist_base + GICD_TYPER) & 0x1f; >> + gic_irqs = (gic_irqs + 1) * 32; >> + if (gic_irqs > 1020) >> + gic_irqs = 1020; >> + gic_data.irq_nr = gic_irqs; >> + >> + gic_data.domain = irq_domain_add_tree(node, &gic_irq_domain_ops, >> + &gic_data); >> + gic_data.rdist = alloc_percpu(typeof(*gic_data.rdist)); >> + >> + if (WARN_ON(!gic_data.domain) || WARN_ON(!gic_data.rdist)) { >> + err = -ENOMEM; >> + goto out_free; >> + } >> + >> + set_handle_irq(gic_handle_irq); >> + >> + gic_smp_init(); >> + gic_dist_init(); >> + gic_cpu_init(); >> + >> + return 0; >> + >> +out_free: >> + if (gic_data.domain) >> + irq_domain_remove(gic_data.domain); >> + free_percpu(gic_data.rdist); >> +out_unmap_rdist: >> + for (i = 0; i < redist_regions; i++) >> + if (redist_base[i]) >> + iounmap(redist_base[i]); >> + kfree(redist_base); >> +out_unmap_dist: >> + iounmap(dist_base); >> + return err; >> +} >> + >> +IRQCHIP_DECLARE(gic_v3, "arm,gic-v3", gic_of_init); >> diff --git a/include/linux/irqchip/arm-gic-v3.h b/include/linux/irqchip/arm-gic-v3.h >> new file mode 100644 >> index 0000000..16c8b05 >> --- /dev/null >> +++ b/include/linux/irqchip/arm-gic-v3.h >> @@ -0,0 +1,188 @@ >> +/* >> + * Copyright (C) 2013, 2014 ARM Limited, All Rights Reserved. >> + * Author: Marc Zyngier <marc.zyngier@xxxxxxx> >> + * >> + * >> + * This program is free software; you can redistribute it and/or modify >> + * it under the terms of the GNU General Public License version 2 as >> + * published by the Free Software Foundation. >> + * >> + * This program is distributed in the hope that it will be useful, >> + * but WITHOUT ANY WARRANTY; without even the implied warranty of >> + * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the >> + * GNU General Public License for more details. >> + * >> + * You should have received a copy of the GNU General Public License >> + * along with this program. If not, see <http://www.gnu.org/licenses/>. >> + */ >> +#ifndef __LINUX_IRQCHIP_ARM_GIC_V3_H >> +#define __LINUX_IRQCHIP_ARM_GIC_V3_H >> + >> +/* >> + * Distributor registers. We assume we're running non-secure, with ARE >> + * being set. Secure-only and non-ARE registers are not described. >> + */ >> +#define GICD_CTLR 0x0000 >> +#define GICD_TYPER 0x0004 >> +#define GICD_IIDR 0x0008 >> +#define GICD_STATUSR 0x0010 >> +#define GICD_SETSPI_NSR 0x0040 >> +#define GICD_CLRSPI_NSR 0x0048 >> +#define GICD_SETSPI_SR 0x0050 >> +#define GICD_CLRSPI_SR 0x0058 >> +#define GICD_SEIR 0x0068 >> +#define GICD_ISENABLER 0x0100 >> +#define GICD_ICENABLER 0x0180 >> +#define GICD_ISPENDR 0x0200 >> +#define GICD_ICPENDR 0x0280 >> +#define GICD_ISACTIVER 0x0300 >> +#define GICD_ICACTIVER 0x0380 >> +#define GICD_IPRIORITYR 0x0400 >> +#define GICD_ICFGR 0x0C00 >> +#define GICD_IROUTER 0x6000 >> +#define GICD_PIDR2 0xFFE8 >> + >> +#define GICD_CTLR_RWP (1U << 31) >> +#define GICD_CTLR_ARE_NS (1U << 4) >> +#define GICD_CTLR_ENABLE_G1A (1U << 1) >> +#define GICD_CTLR_ENABLE_G1 (1U << 0) >> + >> +#define GICD_IROUTER_SPI_MODE_ONE (0U << 31) >> +#define GICD_IROUTER_SPI_MODE_ANY (1U << 31) >> + >> +#define GIC_PIDR2_ARCH_MASK 0xf0 >> + >> +/* >> + * Re-Distributor registers, offsets from RD_base >> + */ >> +#define GICR_CTLR GICD_CTLR >> +#define GICR_IIDR 0x0004 >> +#define GICR_TYPER 0x0008 >> +#define GICR_STATUSR GICD_STATUSR >> +#define GICR_WAKER 0x0014 >> +#define GICR_SETLPIR 0x0040 >> +#define GICR_CLRLPIR 0x0048 >> +#define GICR_SEIR GICD_SEIR >> +#define GICR_PROPBASER 0x0070 >> +#define GICR_PENDBASER 0x0078 >> +#define GICR_INVLPIR 0x00A0 >> +#define GICR_INVALLR 0x00B0 >> +#define GICR_SYNCR 0x00C0 >> +#define GICR_MOVLPIR 0x0100 >> +#define GICR_MOVALLR 0x0110 >> +#define GICR_PIDR2 GICD_PIDR2 >> + >> +#define GICR_WAKER_ProcessorSleep (1U << 1) >> +#define GICR_WAKER_ChildrenAsleep (1U << 2) >> + >> +/* >> + * Re-Distributor registers, offsets from SGI_base >> + */ >> +#define GICR_ISENABLER0 GICD_ISENABLER >> +#define GICR_ICENABLER0 GICD_ICENABLER >> +#define GICR_ISPENDR0 GICD_ISPENDR >> +#define GICR_ICPENDR0 GICD_ICPENDR >> +#define GICR_ISACTIVER0 GICD_ISACTIVER >> +#define GICR_ICACTIVER0 GICD_ICACTIVER >> +#define GICR_IPRIORITYR0 GICD_IPRIORITYR >> +#define GICR_ICFGR0 GICD_ICFGR >> + >> +#define GICR_TYPER_VLPIS (1U << 1) >> +#define GICR_TYPER_LAST (1U << 4) >> + >> +/* >> + * CPU interface registers >> + */ >> +#define GICC_CTLR_EL1_EOImode_drop_dir (0U << 1) >> +#define GICC_CTLR_EL1_EOImode_drop (1U << 1) >> +#define GICC_SRE_EL1_SRE (1U << 0) >> + >> +/* >> + * Hypervisor interface registers (SRE only) >> + */ >> +#define GICH_LR_VIRTUAL_ID_MASK ((1UL << 32) - 1) >> + >> +#define GICH_LR_EOI (1UL << 41) >> +#define GICH_LR_GROUP (1UL << 60) >> +#define GICH_LR_STATE (3UL << 62) >> +#define GICH_LR_PENDING_BIT (1UL << 62) >> +#define GICH_LR_ACTIVE_BIT (1UL << 63) >> + >> +#define GICH_MISR_EOI (1 << 0) >> +#define GICH_MISR_U (1 << 1) >> + >> +#define GICH_HCR_EN (1 << 0) >> +#define GICH_HCR_UIE (1 << 1) >> + >> +#define GICH_VMCR_CTLR_SHIFT 0 >> +#define GICH_VMCR_CTLR_MASK (0x21f << GICH_VMCR_CTLR_SHIFT) >> +#define GICH_VMCR_BPR1_SHIFT 18 >> +#define GICH_VMCR_BPR1_MASK (7 << GICH_VMCR_BPR1_SHIFT) >> +#define GICH_VMCR_BPR0_SHIFT 21 >> +#define GICH_VMCR_BPR0_MASK (7 << GICH_VMCR_BPR0_SHIFT) >> +#define GICH_VMCR_PMR_SHIFT 24 >> +#define GICH_VMCR_PMR_MASK (0xffUL << GICH_VMCR_PMR_SHIFT) >> + >> +#define ICC_EOIR1_EL1 S3_0_C12_C12_1 >> +#define ICC_IAR1_EL1 S3_0_C12_C12_0 >> +#define ICC_SGI1R_EL1 S3_0_C12_C11_5 >> +#define ICC_PMR_EL1 S3_0_C4_C6_0 >> +#define ICC_CTLR_EL1 S3_0_C12_C12_4 >> +#define ICC_SRE_EL1 S3_0_C12_C12_5 >> +#define ICC_GRPEN1_EL1 S3_0_C12_C12_7 >> + >> +#define ICC_SRE_EL2 S3_4_C12_C9_5 >> + >> +#define ICH_VSEIR_EL2 S3_4_C12_C9_4 >> +#define ICH_HCR_EL2 S3_4_C12_C11_0 >> +#define ICH_VTR_EL2 S3_4_C12_C11_1 >> +#define ICH_MISR_EL2 S3_4_C12_C11_2 >> +#define ICH_EISR_EL2 S3_4_C12_C11_3 >> +#define ICH_ELSR_EL2 S3_4_C12_C11_5 >> +#define ICH_VMCR_EL2 S3_4_C12_C11_7 >> + >> +#define __LR0_EL2(x) S3_4_C12_C12_ ## x >> +#define __LR8_EL2(x) S3_4_C12_C13_ ## x >> + >> +#define ICH_LR0_EL2 __LR0_EL2(0) >> +#define ICH_LR1_EL2 __LR0_EL2(1) >> +#define ICH_LR2_EL2 __LR0_EL2(2) >> +#define ICH_LR3_EL2 __LR0_EL2(3) >> +#define ICH_LR4_EL2 __LR0_EL2(4) >> +#define ICH_LR5_EL2 __LR0_EL2(5) >> +#define ICH_LR6_EL2 __LR0_EL2(6) >> +#define ICH_LR7_EL2 __LR0_EL2(7) >> +#define ICH_LR8_EL2 __LR8_EL2(0) >> +#define ICH_LR9_EL2 __LR8_EL2(1) >> +#define ICH_LR10_EL2 __LR8_EL2(2) >> +#define ICH_LR11_EL2 __LR8_EL2(3) >> +#define ICH_LR12_EL2 __LR8_EL2(4) >> +#define ICH_LR13_EL2 __LR8_EL2(5) >> +#define ICH_LR14_EL2 __LR8_EL2(6) >> +#define ICH_LR15_EL2 __LR8_EL2(7) >> + >> +#define __AP0Rx_EL2(x) S3_4_C12_C8_ ## x >> +#define ICH_AP0R0_EL2 __AP0Rx_EL2(0) >> +#define ICH_AP0R1_EL2 __AP0Rx_EL2(1) >> +#define ICH_AP0R2_EL2 __AP0Rx_EL2(2) >> +#define ICH_AP0R3_EL2 __AP0Rx_EL2(3) >> + >> +#define __AP1Rx_EL2(x) S3_4_C12_C9_ ## x >> +#define ICH_AP1R0_EL2 __AP1Rx_EL2(0) >> +#define ICH_AP1R1_EL2 __AP1Rx_EL2(1) >> +#define ICH_AP1R2_EL2 __AP1Rx_EL2(2) >> +#define ICH_AP1R3_EL2 __AP1Rx_EL2(3) >> + >> +#ifndef __ASSEMBLY__ >> + >> +#include <linux/stringify.h> >> + >> +static inline void gic_write_eoir(u64 irq) >> +{ >> + asm volatile("msr " __stringify(ICC_EOIR1_EL1) ", %0" : : "r" (irq)); >> + isb(); >> +} >> + >> +#endif >> + >> +#endif >> -- >> 1.8.3.4 >> > > I noticed that you removed all the dist_lock locks here. I assume there > was some rationale behind this, and given you can share that explanation > with me and address the other tiny issues: The purpose of the lock was to avoid races between mask/unmask and set_type (both of which use the enable registers). But given that these registers can operate on a single bit (set/clear operations), and that the kernel won't try to do both at the same time, it is safe to get rid of the whole locking. > Reviewed-by: Christoffer Dall <christoffer.dall@xxxxxxxxxx> Thanks, M. -- Jazz is not dead. It just smells funny. _______________________________________________ kvmarm mailing list kvmarm@xxxxxxxxxxxxxxxxxxxxx https://lists.cs.columbia.edu/mailman/listinfo/kvmarm