2011-04-04 11:46:58 +08:00
|
|
|
/*
|
|
|
|
* Copyright 2011 IBM Corporation.
|
|
|
|
*
|
|
|
|
* This program is free software; you can redistribute it and/or
|
|
|
|
* modify it under the terms of the GNU General Public License
|
|
|
|
* as published by the Free Software Foundation; either version
|
|
|
|
* 2 of the License, or (at your option) any later version.
|
|
|
|
*
|
|
|
|
*/
|
|
|
|
#include <linux/types.h>
|
|
|
|
#include <linux/threads.h>
|
|
|
|
#include <linux/kernel.h>
|
|
|
|
#include <linux/irq.h>
|
|
|
|
#include <linux/debugfs.h>
|
|
|
|
#include <linux/smp.h>
|
|
|
|
#include <linux/interrupt.h>
|
|
|
|
#include <linux/seq_file.h>
|
|
|
|
#include <linux/init.h>
|
|
|
|
#include <linux/cpu.h>
|
|
|
|
#include <linux/of.h>
|
|
|
|
#include <linux/slab.h>
|
|
|
|
#include <linux/spinlock.h>
|
|
|
|
|
|
|
|
#include <asm/prom.h>
|
|
|
|
#include <asm/io.h>
|
|
|
|
#include <asm/smp.h>
|
|
|
|
#include <asm/machdep.h>
|
|
|
|
#include <asm/irq.h>
|
|
|
|
#include <asm/errno.h>
|
|
|
|
#include <asm/rtas.h>
|
|
|
|
#include <asm/xics.h>
|
|
|
|
#include <asm/firmware.h>
|
|
|
|
|
|
|
|
/* Globals common to all ICP/ICS implementations */
|
|
|
|
const struct icp_ops *icp_ops;
|
|
|
|
|
|
|
|
unsigned int xics_default_server = 0xff;
|
|
|
|
unsigned int xics_default_distrib_server = 0;
|
|
|
|
unsigned int xics_interrupt_server_size = 8;
|
|
|
|
|
|
|
|
DEFINE_PER_CPU(struct xics_cppr, xics_cppr);
|
|
|
|
|
2012-02-15 05:06:50 +08:00
|
|
|
struct irq_domain *xics_host;
|
2011-04-04 11:46:58 +08:00
|
|
|
|
|
|
|
static LIST_HEAD(ics_list);
|
|
|
|
|
|
|
|
void xics_update_irq_servers(void)
|
|
|
|
{
|
|
|
|
int i, j;
|
|
|
|
struct device_node *np;
|
|
|
|
u32 ilen;
|
|
|
|
const u32 *ireg;
|
|
|
|
u32 hcpuid;
|
|
|
|
|
|
|
|
/* Find the server numbers for the boot cpu. */
|
|
|
|
np = of_get_cpu_node(boot_cpuid, NULL);
|
|
|
|
BUG_ON(!np);
|
|
|
|
|
|
|
|
hcpuid = get_hard_smp_processor_id(boot_cpuid);
|
2011-03-04 15:25:55 +08:00
|
|
|
xics_default_server = xics_default_distrib_server = hcpuid;
|
|
|
|
|
|
|
|
pr_devel("xics: xics_default_server = 0x%x\n", xics_default_server);
|
2011-04-04 11:46:58 +08:00
|
|
|
|
|
|
|
ireg = of_get_property(np, "ibm,ppc-interrupt-gserver#s", &ilen);
|
|
|
|
if (!ireg) {
|
|
|
|
of_node_put(np);
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
|
|
|
i = ilen / sizeof(int);
|
|
|
|
|
|
|
|
/* Global interrupt distribution server is specified in the last
|
|
|
|
* entry of "ibm,ppc-interrupt-gserver#s" property. Get the last
|
|
|
|
* entry fom this property for current boot cpu id and use it as
|
|
|
|
* default distribution server
|
|
|
|
*/
|
|
|
|
for (j = 0; j < i; j += 2) {
|
|
|
|
if (ireg[j] == hcpuid) {
|
|
|
|
xics_default_distrib_server = ireg[j+1];
|
2011-03-04 15:25:55 +08:00
|
|
|
break;
|
2011-04-04 11:46:58 +08:00
|
|
|
}
|
|
|
|
}
|
2011-03-04 15:25:55 +08:00
|
|
|
pr_devel("xics: xics_default_distrib_server = 0x%x\n",
|
|
|
|
xics_default_distrib_server);
|
2011-04-04 11:46:58 +08:00
|
|
|
of_node_put(np);
|
|
|
|
}
|
|
|
|
|
|
|
|
/* GIQ stuff, currently only supported on RTAS setups, will have
|
|
|
|
* to be sorted properly for bare metal
|
|
|
|
*/
|
|
|
|
void xics_set_cpu_giq(unsigned int gserver, unsigned int join)
|
|
|
|
{
|
|
|
|
#ifdef CONFIG_PPC_RTAS
|
|
|
|
int index;
|
|
|
|
int status;
|
|
|
|
|
|
|
|
if (!rtas_indicator_present(GLOBAL_INTERRUPT_QUEUE, NULL))
|
|
|
|
return;
|
|
|
|
|
|
|
|
index = (1UL << xics_interrupt_server_size) - 1 - gserver;
|
|
|
|
|
|
|
|
status = rtas_set_indicator_fast(GLOBAL_INTERRUPT_QUEUE, index, join);
|
|
|
|
|
|
|
|
WARN(status < 0, "set-indicator(%d, %d, %u) returned %d\n",
|
|
|
|
GLOBAL_INTERRUPT_QUEUE, index, join, status);
|
|
|
|
#endif
|
|
|
|
}
|
|
|
|
|
|
|
|
void xics_setup_cpu(void)
|
|
|
|
{
|
|
|
|
icp_ops->set_priority(LOWEST_PRIORITY);
|
|
|
|
|
|
|
|
xics_set_cpu_giq(xics_default_distrib_server, 1);
|
|
|
|
}
|
|
|
|
|
|
|
|
void xics_mask_unknown_vec(unsigned int vec)
|
|
|
|
{
|
|
|
|
struct ics *ics;
|
|
|
|
|
2011-03-04 15:25:55 +08:00
|
|
|
pr_err("Interrupt 0x%x (real) is invalid, disabling it.\n", vec);
|
2011-04-04 11:46:58 +08:00
|
|
|
|
|
|
|
list_for_each_entry(ics, &ics_list, link)
|
|
|
|
ics->mask_unknown(ics, vec);
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
#ifdef CONFIG_SMP
|
|
|
|
|
|
|
|
static void xics_request_ipi(void)
|
|
|
|
{
|
|
|
|
unsigned int ipi;
|
|
|
|
|
|
|
|
ipi = irq_create_mapping(xics_host, XICS_IPI);
|
|
|
|
BUG_ON(ipi == NO_IRQ);
|
|
|
|
|
|
|
|
/*
|
2011-10-22 07:56:27 +08:00
|
|
|
* IPIs are marked IRQF_PERCPU. The handler was set in map.
|
2011-04-04 11:46:58 +08:00
|
|
|
*/
|
|
|
|
BUG_ON(request_irq(ipi, icp_ops->ipi_action,
|
2011-10-05 10:30:50 +08:00
|
|
|
IRQF_PERCPU | IRQF_NO_THREAD, "IPI", NULL));
|
2011-04-04 11:46:58 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
int __init xics_smp_probe(void)
|
|
|
|
{
|
powerpc: Consolidate ipi message mux and demux
Consolidate the mux and demux of ipi messages into smp.c and call
a new smp_ops callback to actually trigger the ipi.
The powerpc architecture code is optimised for having 4 distinct
ipi triggers, which are mapped to 4 distinct messages (ipi many, ipi
single, scheduler ipi, and enter debugger). However, several interrupt
controllers only provide a single software triggered interrupt that
can be delivered to each cpu. To resolve this limitation, each smp_ops
implementation created a per-cpu variable that is manipulated with atomic
bitops. Since these lines will be contended they are optimialy marked as
shared_aligned and take a full cache line for each cpu. Distro kernels
may have 2 or 3 of these in their config, each taking per-cpu space
even though at most one will be in use.
This consolidation removes smp_message_recv and replaces the single call
actions cases with direct calls from the common message recognition loop.
The complicated debugger ipi case with its muxed crash handling code is
moved to debug_ipi_action which is now called from the demux code (instead
of the multi-message action calling smp_message_recv).
I put a call to reschedule_action to increase the likelyhood of correctly
merging the anticipated scheduler_ipi() hook coming from the scheduler
tree; that single required call can be inlined later.
The actual message decode is a copy of the old pseries xics code with its
memory barriers and cache line spacing, augmented with a per-cpu unsigned
long based on the book-e doorbell code. The optional data is set via a
callback from the implementation and is passed to the new cause-ipi hook
along with the logical cpu number. While currently only the doorbell
implemntation uses this data it should be almost zero cost to retrieve and
pass it -- it adds a single register load for the argument from the same
cache line to which we just completed a store and the register is dead
on return from the call. I extended the data element from unsigned int
to unsigned long in case some other code wanted to associate a pointer.
The doorbell check_self is replaced by a call to smp_muxed_ipi_resend,
conditioned on the CPU_DBELL feature. The ifdef guard could be relaxed
to CONFIG_SMP but I left it with BOOKE for now.
Also, the doorbell interrupt vector for book-e was not calling irq_enter
and irq_exit, which throws off cpu accounting and causes code to not
realize it is running in interrupt context. Add the missing calls.
Signed-off-by: Milton Miller <miltonm@bga.com>
Signed-off-by: Benjamin Herrenschmidt <benh@kernel.crashing.org>
2011-05-11 03:29:39 +08:00
|
|
|
/* Setup cause_ipi callback based on which ICP is used */
|
|
|
|
smp_ops->cause_ipi = icp_ops->cause_ipi;
|
2011-04-04 11:46:58 +08:00
|
|
|
|
|
|
|
/* Register all the IPIs */
|
|
|
|
xics_request_ipi();
|
|
|
|
|
|
|
|
return cpumask_weight(cpu_possible_mask);
|
|
|
|
}
|
|
|
|
|
|
|
|
#endif /* CONFIG_SMP */
|
|
|
|
|
|
|
|
void xics_teardown_cpu(void)
|
|
|
|
{
|
|
|
|
struct xics_cppr *os_cppr = &__get_cpu_var(xics_cppr);
|
|
|
|
|
|
|
|
/*
|
|
|
|
* we have to reset the cppr index to 0 because we're
|
|
|
|
* not going to return from the IPI
|
|
|
|
*/
|
|
|
|
os_cppr->index = 0;
|
|
|
|
icp_ops->set_priority(0);
|
|
|
|
icp_ops->teardown_cpu();
|
|
|
|
}
|
|
|
|
|
|
|
|
void xics_kexec_teardown_cpu(int secondary)
|
|
|
|
{
|
|
|
|
xics_teardown_cpu();
|
|
|
|
|
|
|
|
icp_ops->flush_ipi();
|
|
|
|
|
|
|
|
/*
|
|
|
|
* Some machines need to have at least one cpu in the GIQ,
|
|
|
|
* so leave the master cpu in the group.
|
|
|
|
*/
|
|
|
|
if (secondary)
|
|
|
|
xics_set_cpu_giq(xics_default_distrib_server, 0);
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
#ifdef CONFIG_HOTPLUG_CPU
|
|
|
|
|
|
|
|
/* Interrupts are disabled. */
|
|
|
|
void xics_migrate_irqs_away(void)
|
|
|
|
{
|
|
|
|
int cpu = smp_processor_id(), hw_cpu = hard_smp_processor_id();
|
|
|
|
unsigned int irq, virq;
|
|
|
|
|
|
|
|
/* If we used to be the default server, move to the new "boot_cpuid" */
|
|
|
|
if (hw_cpu == xics_default_server)
|
|
|
|
xics_update_irq_servers();
|
|
|
|
|
|
|
|
/* Reject any interrupt that was queued to us... */
|
|
|
|
icp_ops->set_priority(0);
|
|
|
|
|
|
|
|
/* Remove ourselves from the global interrupt queue */
|
|
|
|
xics_set_cpu_giq(xics_default_distrib_server, 0);
|
|
|
|
|
|
|
|
/* Allow IPIs again... */
|
|
|
|
icp_ops->set_priority(DEFAULT_PRIORITY);
|
|
|
|
|
|
|
|
for_each_irq(virq) {
|
|
|
|
struct irq_desc *desc;
|
|
|
|
struct irq_chip *chip;
|
|
|
|
long server;
|
|
|
|
unsigned long flags;
|
|
|
|
struct ics *ics;
|
|
|
|
|
|
|
|
/* We can't set affinity on ISA interrupts */
|
|
|
|
if (virq < NUM_ISA_INTERRUPTS)
|
|
|
|
continue;
|
|
|
|
desc = irq_to_desc(virq);
|
|
|
|
/* We only need to migrate enabled IRQS */
|
|
|
|
if (!desc || !desc->action)
|
|
|
|
continue;
|
2012-02-15 05:06:51 +08:00
|
|
|
if (desc->irq_data.domain != xics_host)
|
|
|
|
continue;
|
|
|
|
irq = desc->irq_data.hwirq;
|
|
|
|
/* We need to get IPIs still. */
|
|
|
|
if (irq == XICS_IPI || irq == XICS_IRQ_SPURIOUS)
|
|
|
|
continue;
|
2011-04-04 11:46:58 +08:00
|
|
|
chip = irq_desc_get_chip(desc);
|
|
|
|
if (!chip || !chip->irq_set_affinity)
|
|
|
|
continue;
|
|
|
|
|
|
|
|
raw_spin_lock_irqsave(&desc->lock, flags);
|
|
|
|
|
|
|
|
/* Locate interrupt server */
|
|
|
|
server = -1;
|
|
|
|
ics = irq_get_chip_data(virq);
|
|
|
|
if (ics)
|
|
|
|
server = ics->get_server(ics, irq);
|
|
|
|
if (server < 0) {
|
|
|
|
printk(KERN_ERR "%s: Can't find server for irq %d\n",
|
|
|
|
__func__, irq);
|
|
|
|
goto unlock;
|
|
|
|
}
|
|
|
|
|
|
|
|
/* We only support delivery to all cpus or to one cpu.
|
|
|
|
* The irq has to be migrated only in the single cpu
|
|
|
|
* case.
|
|
|
|
*/
|
|
|
|
if (server != hw_cpu)
|
|
|
|
goto unlock;
|
|
|
|
|
|
|
|
/* This is expected during cpu offline. */
|
|
|
|
if (cpu_online(cpu))
|
|
|
|
pr_warning("IRQ %u affinity broken off cpu %u\n",
|
|
|
|
virq, cpu);
|
|
|
|
|
|
|
|
/* Reset affinity to all cpus */
|
|
|
|
raw_spin_unlock_irqrestore(&desc->lock, flags);
|
|
|
|
irq_set_affinity(virq, cpu_all_mask);
|
|
|
|
continue;
|
|
|
|
unlock:
|
|
|
|
raw_spin_unlock_irqrestore(&desc->lock, flags);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
#endif /* CONFIG_HOTPLUG_CPU */
|
|
|
|
|
|
|
|
#ifdef CONFIG_SMP
|
|
|
|
/*
|
|
|
|
* For the moment we only implement delivery to all cpus or one cpu.
|
|
|
|
*
|
|
|
|
* If the requested affinity is cpu_all_mask, we set global affinity.
|
|
|
|
* If not we set it to the first cpu in the mask, even if multiple cpus
|
|
|
|
* are set. This is so things like irqbalance (which set core and package
|
|
|
|
* wide affinities) do the right thing.
|
2011-03-04 15:25:55 +08:00
|
|
|
*
|
|
|
|
* We need to fix this to implement support for the links
|
2011-04-04 11:46:58 +08:00
|
|
|
*/
|
|
|
|
int xics_get_irq_server(unsigned int virq, const struct cpumask *cpumask,
|
|
|
|
unsigned int strict_check)
|
|
|
|
{
|
|
|
|
|
|
|
|
if (!distribute_irqs)
|
|
|
|
return xics_default_server;
|
|
|
|
|
|
|
|
if (!cpumask_subset(cpu_possible_mask, cpumask)) {
|
|
|
|
int server = cpumask_first_and(cpu_online_mask, cpumask);
|
|
|
|
|
|
|
|
if (server < nr_cpu_ids)
|
|
|
|
return get_hard_smp_processor_id(server);
|
|
|
|
|
|
|
|
if (strict_check)
|
|
|
|
return -1;
|
|
|
|
}
|
|
|
|
|
|
|
|
/*
|
|
|
|
* Workaround issue with some versions of JS20 firmware that
|
|
|
|
* deliver interrupts to cpus which haven't been started. This
|
|
|
|
* happens when using the maxcpus= boot option.
|
|
|
|
*/
|
|
|
|
if (cpumask_equal(cpu_online_mask, cpu_present_mask))
|
|
|
|
return xics_default_distrib_server;
|
|
|
|
|
|
|
|
return xics_default_server;
|
|
|
|
}
|
|
|
|
#endif /* CONFIG_SMP */
|
|
|
|
|
2012-02-15 05:06:50 +08:00
|
|
|
static int xics_host_match(struct irq_domain *h, struct device_node *node)
|
2011-04-04 11:46:58 +08:00
|
|
|
{
|
2011-04-15 06:31:59 +08:00
|
|
|
struct ics *ics;
|
|
|
|
|
|
|
|
list_for_each_entry(ics, &ics_list, link)
|
|
|
|
if (ics->host_match(ics, node))
|
|
|
|
return 1;
|
|
|
|
|
|
|
|
return 0;
|
2011-04-04 11:46:58 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
/* Dummies */
|
|
|
|
static void xics_ipi_unmask(struct irq_data *d) { }
|
|
|
|
static void xics_ipi_mask(struct irq_data *d) { }
|
|
|
|
|
|
|
|
static struct irq_chip xics_ipi_chip = {
|
|
|
|
.name = "XICS",
|
|
|
|
.irq_eoi = NULL, /* Patched at init time */
|
|
|
|
.irq_mask = xics_ipi_mask,
|
|
|
|
.irq_unmask = xics_ipi_unmask,
|
|
|
|
};
|
|
|
|
|
2012-02-15 05:06:50 +08:00
|
|
|
static int xics_host_map(struct irq_domain *h, unsigned int virq,
|
2011-04-04 11:46:58 +08:00
|
|
|
irq_hw_number_t hw)
|
|
|
|
{
|
|
|
|
struct ics *ics;
|
|
|
|
|
|
|
|
pr_devel("xics: map virq %d, hwirq 0x%lx\n", virq, hw);
|
|
|
|
|
|
|
|
/* Insert the interrupt mapping into the radix tree for fast lookup */
|
|
|
|
irq_radix_revmap_insert(xics_host, virq, hw);
|
|
|
|
|
|
|
|
/* They aren't all level sensitive but we just don't really know */
|
|
|
|
irq_set_status_flags(virq, IRQ_LEVEL);
|
|
|
|
|
|
|
|
/* Don't call into ICS for IPIs */
|
|
|
|
if (hw == XICS_IPI) {
|
|
|
|
irq_set_chip_and_handler(virq, &xics_ipi_chip,
|
2011-05-11 03:29:49 +08:00
|
|
|
handle_percpu_irq);
|
2011-04-04 11:46:58 +08:00
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
/* Let the ICS setup the chip data */
|
|
|
|
list_for_each_entry(ics, &ics_list, link)
|
|
|
|
if (ics->map(ics, virq) == 0)
|
2011-05-11 03:29:49 +08:00
|
|
|
return 0;
|
|
|
|
|
|
|
|
return -EINVAL;
|
2011-04-04 11:46:58 +08:00
|
|
|
}
|
|
|
|
|
2012-02-15 05:06:50 +08:00
|
|
|
static int xics_host_xlate(struct irq_domain *h, struct device_node *ct,
|
2011-04-04 11:46:58 +08:00
|
|
|
const u32 *intspec, unsigned int intsize,
|
|
|
|
irq_hw_number_t *out_hwirq, unsigned int *out_flags)
|
|
|
|
|
|
|
|
{
|
|
|
|
/* Current xics implementation translates everything
|
|
|
|
* to level. It is not technically right for MSIs but this
|
|
|
|
* is irrelevant at this point. We might get smarter in the future
|
|
|
|
*/
|
|
|
|
*out_hwirq = intspec[0];
|
|
|
|
*out_flags = IRQ_TYPE_LEVEL_LOW;
|
|
|
|
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
2012-02-15 05:06:50 +08:00
|
|
|
static struct irq_domain_ops xics_host_ops = {
|
2011-04-04 11:46:58 +08:00
|
|
|
.match = xics_host_match,
|
|
|
|
.map = xics_host_map,
|
|
|
|
.xlate = xics_host_xlate,
|
|
|
|
};
|
|
|
|
|
|
|
|
static void __init xics_init_host(void)
|
|
|
|
{
|
2012-02-15 05:06:54 +08:00
|
|
|
xics_host = irq_domain_add_tree(NULL, &xics_host_ops, NULL);
|
2011-04-04 11:46:58 +08:00
|
|
|
BUG_ON(xics_host == NULL);
|
|
|
|
irq_set_default_host(xics_host);
|
|
|
|
}
|
|
|
|
|
|
|
|
void __init xics_register_ics(struct ics *ics)
|
|
|
|
{
|
|
|
|
list_add(&ics->link, &ics_list);
|
|
|
|
}
|
|
|
|
|
|
|
|
static void __init xics_get_server_size(void)
|
|
|
|
{
|
|
|
|
struct device_node *np;
|
|
|
|
const u32 *isize;
|
|
|
|
|
|
|
|
/* We fetch the interrupt server size from the first ICS node
|
|
|
|
* we find if any
|
|
|
|
*/
|
|
|
|
np = of_find_compatible_node(NULL, NULL, "ibm,ppc-xics");
|
|
|
|
if (!np)
|
|
|
|
return;
|
|
|
|
isize = of_get_property(np, "ibm,interrupt-server#-size", NULL);
|
|
|
|
if (!isize)
|
|
|
|
return;
|
|
|
|
xics_interrupt_server_size = *isize;
|
|
|
|
of_node_put(np);
|
|
|
|
}
|
|
|
|
|
|
|
|
void __init xics_init(void)
|
|
|
|
{
|
|
|
|
int rc = -1;
|
|
|
|
|
|
|
|
/* Fist locate ICP */
|
|
|
|
if (firmware_has_feature(FW_FEATURE_LPAR))
|
|
|
|
rc = icp_hv_init();
|
|
|
|
if (rc < 0)
|
|
|
|
rc = icp_native_init();
|
|
|
|
if (rc < 0) {
|
|
|
|
pr_warning("XICS: Cannot find a Presentation Controller !\n");
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
|
|
|
/* Copy get_irq callback over to ppc_md */
|
|
|
|
ppc_md.get_irq = icp_ops->get_irq;
|
|
|
|
|
|
|
|
/* Patch up IPI chip EOI */
|
|
|
|
xics_ipi_chip.irq_eoi = icp_ops->eoi;
|
|
|
|
|
|
|
|
/* Now locate ICS */
|
|
|
|
rc = ics_rtas_init();
|
2011-09-20 01:45:02 +08:00
|
|
|
if (rc < 0)
|
|
|
|
rc = ics_opal_init();
|
2011-04-04 11:46:58 +08:00
|
|
|
if (rc < 0)
|
|
|
|
pr_warning("XICS: Cannot find a Source Controller !\n");
|
|
|
|
|
|
|
|
/* Initialize common bits */
|
|
|
|
xics_get_server_size();
|
|
|
|
xics_update_irq_servers();
|
|
|
|
xics_init_host();
|
|
|
|
xics_setup_cpu();
|
|
|
|
}
|