On Mon, 26 Jun 2017, Palmer Dabbelt wrote:
> +DEFINE_PER_CPU(struct riscv_irq_data, riscv_irq_data);
> +DEFINE_PER_CPU(atomic_long_t, riscv_early_sie);
> +
> +static void riscv_software_interrupt(void)
> +{
> +#ifdef CONFIG_SMP
> +     irqreturn_t ret;
> +
> +     ret = handle_ipi();
> +     if (ret != IRQ_NONE)
> +             return;
> +#endif
> +
> +     BUG();

Are you sure you want to crash the system just because a spurious interrupt
happened?

> +}
> +
> +asmlinkage void __irq_entry do_IRQ(unsigned int cause, struct pt_regs *regs)
> +{
> +     struct pt_regs *old_regs = set_irq_regs(regs);
> +     struct irq_domain *domain;
> +
> +     irq_enter();
> +
> +     /* There are three classes of interrupt: timer, software, and

Please use proper multiline comment formatting:

        /*
         * bla.....
         * foo.....
         */

> +      * external devices.  We dispatch between them here.  External
> +      * device interrupts use the generic IRQ mechanisms.
> +      */
> +     switch (cause) {
> +     case INTERRUPT_CAUSE_TIMER:
> +             riscv_timer_interrupt();
> +             break;
> +     case INTERRUPT_CAUSE_SOFTWARE:
> +             riscv_software_interrupt();
> +             break;
> +     default:
> +             domain = per_cpu(riscv_irq_data, smp_processor_id()).domain;
> +             generic_handle_irq(irq_find_mapping(domain, cause));
> +             break;
> +     }
> +
> +     irq_exit();
> +     set_irq_regs(old_regs);
> +}
> +
> +static int riscv_irqdomain_map(struct irq_domain *d, unsigned int irq,
> +                            irq_hw_number_t hwirq)
> +{
> +     struct riscv_irq_data *data = d->host_data;
> +
> +     irq_set_chip_and_handler(irq, &data->chip, handle_simple_irq);
> +     irq_set_chip_data(irq, data);
> +     irq_set_noprobe(irq);
> +
> +     return 0;
> +}
> +
> +static const struct irq_domain_ops riscv_irqdomain_ops = {
> +     .map    = riscv_irqdomain_map,
> +     .xlate  = irq_domain_xlate_onecell,
> +};
> +
> +static void riscv_irq_mask(struct irq_data *d)
> +{
> +     struct riscv_irq_data *data = irq_data_get_irq_chip_data(d);
> +
> +     BUG_ON(smp_processor_id() != data->hart);

Crashing the machine is the last resort if there is no chance to handle a
situation gracefully. Something like

        if (WARN_ON_ONCE(smp_processor_id() != data->hart))
                do_something_sensible();
        else
                .....

might at least keep the machine halfways functional for debugging.

> +     csr_clear(sie, 1 << (long)d->hwirq);
> +}
> +
> +static void riscv_irq_unmask(struct irq_data *d)
> +{
> +     struct riscv_irq_data *data = irq_data_get_irq_chip_data(d);
> +
> +     BUG_ON(smp_processor_id() != data->hart);
> +     csr_set(sie, 1 << (long)d->hwirq);
> +}
> +
> +static void riscv_irq_enable_helper(void *d)
> +{
> +     riscv_irq_unmask(d);
> +}
> +
> +static void riscv_irq_enable(struct irq_data *d)
> +{
> +     struct riscv_irq_data *data = irq_data_get_irq_chip_data(d);
> +
> +     /* There are two phases to setting up an interrupt: first we set a bit
> +      * in this bookkeeping structure, which is used by trap_init to
> +      * initialize SIE for each hart as it comes up.

And what exactly has this to do with irq_enable()? Why would you call that
for an interrupt which solely goes to a offline cpu?

> +static void riscv_irq_disable(struct irq_data *d)
> +{
> +     struct riscv_irq_data *data = irq_data_get_irq_chip_data(d);
> +
> +     /* This is the mirror of riscv_irq_enable. */
> +     atomic_long_and(~(1 << (long)d->hwirq),
> +                     &per_cpu(riscv_early_sie, data->hart));
> +     if (data->hart == smp_processor_id())
> +             riscv_irq_mask(d);
> +     else if (cpu_online(data->hart))
> +             smp_call_function_single(data->hart,
> +                                      riscv_irq_disable_helper,
> +                                      d,
> +                                      true);

Same question as above.

> +}
> +
> +static void riscv_irq_mask_noop(struct irq_data *d) { }
> +
> +static void riscv_irq_unmask_noop(struct irq_data *d) { }
> 
> +static void riscv_irq_enable_noop(struct irq_data *d)
> +{
> +     struct device_node *data = irq_data_get_irq_chip_data(d);
> +     u32 hart;
> +
> +     if (!of_property_read_u32(data, "reg", &hart))
> +             printk(
> +               KERN_WARNING "enabled interrupt %d for missing hart %d (this 
> interrupt has no handler)\n",

Has no handler? I really have a hard time to understand the logic here.

> +               (int)d->hwirq, hart);
> +}
> +
> +static struct irq_chip riscv_noop_chip = {
> +     .name = "riscv,cpu-intc,noop",
> +     .irq_mask = riscv_irq_mask_noop,
> +     .irq_unmask = riscv_irq_unmask_noop,
> +     .irq_enable = riscv_irq_enable_noop,

Please write that in tabular fashion:

        .name           = "riscv,cpu-intc,noop",
        .irq_mask       = riscv_irq_mask_noop,

> +};
> +
> +static int riscv_irqdomain_map_noop(struct irq_domain *d, unsigned int irq,
> +                                 irq_hw_number_t hwirq)
> +{
> +     struct device_node *data = d->host_data;
> +
> +     irq_set_chip_and_handler(irq, &riscv_noop_chip, handle_simple_irq);
> +     irq_set_chip_data(irq, data);
> +     return 0;
> +}
> +
> +static const struct irq_domain_ops riscv_irqdomain_ops_noop = {
> +     .map    = riscv_irqdomain_map_noop,
> +     .xlate  = irq_domain_xlate_onecell,
> +};
> +
> +static int riscv_intc_init(struct device_node *node, struct device_node 
> *parent)
> +{
> +     int hart;
> +     struct riscv_irq_data *data;
> +
> +     if (parent)
> +             return 0;
> +
> +     hart = riscv_of_processor_hart(node->parent);
> +     if (hart < 0) {
> +             /* If a hart is disabled, create a no-op irq domain.  Devices
> +              * may still have interrupts connected to those harts.  This is
> +              * not wrong... unless they actually load a driver that needs
> +              * it!
> +              */
> +             irq_domain_add_linear(
> +                     node,
> +                     8*sizeof(uintptr_t),
> +                     &riscv_irqdomain_ops_noop,
> +                     node->parent);
> +             return 0;

I have a hard time to understand the logic here. Why do you need an
interrupt domain for something which does not exist? That does not make any
sense.

> +     }
> +
> +     data = &per_cpu(riscv_irq_data, hart);
> +     snprintf(data->name, sizeof(data->name), "riscv,cpu_intc,%d", hart);
> +     data->hart = hart;
> +     data->chip.name = data->name;
> +     data->chip.irq_mask = riscv_irq_mask;
> +     data->chip.irq_unmask = riscv_irq_unmask;
> +     data->chip.irq_enable = riscv_irq_enable;
> +     data->chip.irq_disable = riscv_irq_disable;
> +     data->domain = irq_domain_add_linear(
> +             node,
> +             8*sizeof(uintptr_t),
> +             &riscv_irqdomain_ops,
> +             data);
> +     WARN_ON(!data->domain);

That warn_on is great. You warn and then continue as if nothing
happened. Machine will crash later dereferencing a NULL pointer.

Some more epxlanations about the inner workings of all of this would be
appreciated.

Thanks,

        tglx



Reply via email to