What's the performance impact of this?  If you run this test with --fp,
--altivec or --vector what is the impact of adding this patch?

http://ozlabs.org/~anton/junkcode/context_switch2.c

eg 
  ./context_switch2 --fp 0 0 

Mikey

On Thu, 2015-07-09 at 15:16 +0530, Anshuman Khandual wrote:
> This patch enables facility unavailable exceptions for generic facility,
> FPU, ALTIVEC and VSX in /proc/interrupts listing by incrementing their
> newly added IRQ statistical counters as and when these exceptions happen.
> This also adds couple of helper functions which will be called from within
> the interrupt handler context to update their statistics. Similarly this
> patch also enables alignment and program check exceptions as well.
> 
>       With this patch being applied, /proc/interrupts looks something
> like this after running various workloads which create these exceptions.
> 
> --------------------------------------------------------------
>            CPU0       CPU1
>  16:      28477      35288      XICS   2 Level     IPI
>  17:          0          0      XICS 4101 Level     virtio0
>  18:          0          0      XICS 4100 Level     ohci_hcd:usb1
>  19:     288146          0      XICS 4099 Level     virtio1
>  20:          0          0      XICS 4096 Level     RAS_EPOW
>  21:       6241      17364      XICS 4102 Level     ibmvscsi
>  22:        133          0      XICS 4103 Level     hvc_console
> LOC:      12617      24509   Local timer interrupts for timer event device
> LOC:         98         73   Local timer interrupts for others
> SPU:          0          0   Spurious interrupts
> PMI:          0          0   Performance monitoring interrupts
> MCE:          0          0   Machine check exceptions
> DBL:          0          0   Doorbell interrupts
> ALN:          0          0   Alignment exceptions
> PRG:          0          0   Program check exceptions
> FAC:          0          0   Facility unavailable exceptions
> FPU:      12736       2458   FPU unavailable exceptions
> ALT:     108313      24507   ALTIVEC unavailable exceptions
> VSX:     408590    4943568   VSX unavailable exceptions
> --------------------------------------------------------------
> 
> Signed-off-by: Anshuman Khandual <khand...@linux.vnet.ibm.com>
> ---
> Changes in V2:
> - Fixed some typos in the final /proc/interrupts output
> - Added support for alignment and program check exceptions
> 
>  arch/powerpc/include/asm/hardirq.h   |  6 ++++++
>  arch/powerpc/kernel/exceptions-64s.S |  2 ++
>  arch/powerpc/kernel/irq.c            | 35 +++++++++++++++++++++++++++++++++++
>  arch/powerpc/kernel/traps.c          | 28 ++++++++++++++++++++++++++++
>  4 files changed, 71 insertions(+)
> 
> diff --git a/arch/powerpc/include/asm/hardirq.h 
> b/arch/powerpc/include/asm/hardirq.h
> index 8add8b8..ba51d3e 100644
> --- a/arch/powerpc/include/asm/hardirq.h
> +++ b/arch/powerpc/include/asm/hardirq.h
> @@ -15,6 +15,12 @@ typedef struct {
>  #ifdef CONFIG_PPC_DOORBELL
>       unsigned int doorbell_irqs;
>  #endif
> +     unsigned int alignment_exceptions;
> +     unsigned int program_exceptions;
> +     unsigned int fac_unav_exceptions;
> +     unsigned int fpu_unav_exceptions;
> +     unsigned int altivec_unav_exceptions;
> +     unsigned int vsx_unav_exceptions;
>  } ____cacheline_aligned irq_cpustat_t;
>  
>  DECLARE_PER_CPU_SHARED_ALIGNED(irq_cpustat_t, irq_stat);
> diff --git a/arch/powerpc/kernel/exceptions-64s.S 
> b/arch/powerpc/kernel/exceptions-64s.S
> index 0a0399c2..a86180c 100644
> --- a/arch/powerpc/kernel/exceptions-64s.S
> +++ b/arch/powerpc/kernel/exceptions-64s.S
> @@ -1158,6 +1158,7 @@ BEGIN_FTR_SECTION
>  END_FTR_SECTION_IFSET(CPU_FTR_TM)
>  #endif
>       bl      load_up_fpu
> +     bl      fpu_unav_exceptions_count
>       b       fast_exception_return
>  #ifdef CONFIG_PPC_TRANSACTIONAL_MEM
>  2:   /* User process was in a transaction */
> @@ -1184,6 +1185,7 @@ BEGIN_FTR_SECTION
>    END_FTR_SECTION_NESTED(CPU_FTR_TM, CPU_FTR_TM, 69)
>  #endif
>       bl      load_up_altivec
> +     bl      altivec_unav_exceptions_count
>       b       fast_exception_return
>  #ifdef CONFIG_PPC_TRANSACTIONAL_MEM
>  2:   /* User process was in a transaction */
> diff --git a/arch/powerpc/kernel/irq.c b/arch/powerpc/kernel/irq.c
> index 4509603..8b4d928 100644
> --- a/arch/powerpc/kernel/irq.c
> +++ b/arch/powerpc/kernel/irq.c
> @@ -397,6 +397,35 @@ int arch_show_interrupts(struct seq_file *p, int prec)
>               seq_printf(p, "  Doorbell interrupts\n");
>       }
>  #endif
> +     seq_printf(p, "%*s: ", prec, "ALN");
> +     for_each_online_cpu(j)
> +             seq_printf(p, "%10u ", per_cpu(irq_stat, 
> j).alignment_exceptions);
> +     seq_printf(p, "  Alignment exceptions\n");
> +
> +     seq_printf(p, "%*s: ", prec, "PRG");
> +     for_each_online_cpu(j)
> +             seq_printf(p, "%10u ", per_cpu(irq_stat, j).program_exceptions);
> +     seq_printf(p, "  Program check exceptions\n");
> +
> +     seq_printf(p, "%*s: ", prec, "FAC");
> +     for_each_online_cpu(j)
> +             seq_printf(p, "%10u ", per_cpu(irq_stat, 
> j).fac_unav_exceptions);
> +     seq_printf(p, "  Facility unavailable exceptions\n");
> +
> +     seq_printf(p, "%*s: ", prec, "FPU");
> +     for_each_online_cpu(j)
> +             seq_printf(p, "%10u ", per_cpu(irq_stat, 
> j).fpu_unav_exceptions);
> +     seq_printf(p, "  FPU unavailable exceptions\n");
> +
> +     seq_printf(p, "%*s: ", prec, "ALT");
> +     for_each_online_cpu(j)
> +             seq_printf(p, "%10u ", per_cpu(irq_stat, 
> j).altivec_unav_exceptions);
> +     seq_printf(p, "  ALTIVEC unavailable exceptions\n");
> +
> +     seq_printf(p, "%*s: ", prec, "VSX");
> +     for_each_online_cpu(j)
> +             seq_printf(p, "%10u ", per_cpu(irq_stat, 
> j).vsx_unav_exceptions);
> +     seq_printf(p, "  VSX unavailable exceptions\n");
>  
>       return 0;
>  }
> @@ -416,6 +445,12 @@ u64 arch_irq_stat_cpu(unsigned int cpu)
>  #ifdef CONFIG_PPC_DOORBELL
>       sum += per_cpu(irq_stat, cpu).doorbell_irqs;
>  #endif
> +     sum += per_cpu(irq_stat, cpu).alignment_exceptions;
> +     sum += per_cpu(irq_stat, cpu).program_exceptions;
> +     sum += per_cpu(irq_stat, cpu).fac_unav_exceptions;
> +     sum += per_cpu(irq_stat, cpu).fpu_unav_exceptions;
> +     sum += per_cpu(irq_stat, cpu).altivec_unav_exceptions;
> +     sum += per_cpu(irq_stat, cpu).vsx_unav_exceptions;
>  
>       return sum;
>  }
> diff --git a/arch/powerpc/kernel/traps.c b/arch/powerpc/kernel/traps.c
> index 6530f1b..9b6511c 100644
> --- a/arch/powerpc/kernel/traps.c
> +++ b/arch/powerpc/kernel/traps.c
> @@ -1137,6 +1137,8 @@ void __kprobes program_check_exception(struct pt_regs 
> *regs)
>       enum ctx_state prev_state = exception_enter();
>       unsigned int reason = get_reason(regs);
>  
> +     __this_cpu_inc(irq_stat.program_exceptions);
> +
>       /* We can now get here via a FP Unavailable exception if the core
>        * has no FPU, in that case the reason flags will be 0 */
>  
> @@ -1260,6 +1262,8 @@ void alignment_exception(struct pt_regs *regs)
>       enum ctx_state prev_state = exception_enter();
>       int sig, code, fixed = 0;
>  
> +     __this_cpu_inc(irq_stat.alignment_exceptions);
> +
>       /* We restore the interrupt state now */
>       if (!arch_irq_disabled_regs(regs))
>               local_irq_enable();
> @@ -1322,6 +1326,8 @@ void kernel_fp_unavailable_exception(struct pt_regs 
> *regs)
>  {
>       enum ctx_state prev_state = exception_enter();
>  
> +     __this_cpu_inc(irq_stat.fpu_unav_exceptions);
> +
>       printk(KERN_EMERG "Unrecoverable FP Unavailable Exception "
>                         "%lx at %lx\n", regs->trap, regs->nip);
>       die("Unrecoverable FP Unavailable Exception", regs, SIGABRT);
> @@ -1333,6 +1339,8 @@ void altivec_unavailable_exception(struct pt_regs *regs)
>  {
>       enum ctx_state prev_state = exception_enter();
>  
> +     __this_cpu_inc(irq_stat.altivec_unav_exceptions);
> +
>       if (user_mode(regs)) {
>               /* A user program has executed an altivec instruction,
>                  but this kernel doesn't support altivec. */
> @@ -1350,6 +1358,8 @@ bail:
>  
>  void vsx_unavailable_exception(struct pt_regs *regs)
>  {
> +     __this_cpu_inc(irq_stat.vsx_unav_exceptions);
> +
>       if (user_mode(regs)) {
>               /* A user program has executed an vsx instruction,
>                  but this kernel doesn't support vsx. */
> @@ -1381,6 +1391,8 @@ void facility_unavailable_exception(struct pt_regs 
> *regs)
>       u8 status;
>       bool hv;
>  
> +     __this_cpu_inc(irq_stat.fac_unav_exceptions);
> +
>       hv = (regs->trap == 0xf80);
>       if (hv)
>               value = mfspr(SPRN_HFSCR);
> @@ -1453,10 +1465,22 @@ void facility_unavailable_exception(struct pt_regs 
> *regs)
>  }
>  #endif
>  
> +void fpu_unav_exceptions_count(void)
> +{
> +     __this_cpu_inc(irq_stat.fpu_unav_exceptions);
> +}
> +
> +void altivec_unav_exceptions_count(void)
> +{
> +     __this_cpu_inc(irq_stat.altivec_unav_exceptions);
> +}
> +
>  #ifdef CONFIG_PPC_TRANSACTIONAL_MEM
>  
>  void fp_unavailable_tm(struct pt_regs *regs)
>  {
> +     __this_cpu_inc(irq_stat.fpu_unav_exceptions);
> +
>       /* Note:  This does not handle any kind of FP laziness. */
>  
>       TM_DEBUG("FP Unavailable trap whilst transactional at 0x%lx, MSR=%lx\n",
> @@ -1493,6 +1517,8 @@ void fp_unavailable_tm(struct pt_regs *regs)
>  
>  void altivec_unavailable_tm(struct pt_regs *regs)
>  {
> +     __this_cpu_inc(irq_stat.altivec_unav_exceptions);
> +
>       /* See the comments in fp_unavailable_tm().  This function operates
>        * the same way.
>        */
> @@ -1515,6 +1541,8 @@ void vsx_unavailable_tm(struct pt_regs *regs)
>  {
>       unsigned long orig_msr = regs->msr;
>  
> +     __this_cpu_inc(irq_stat.vsx_unav_exceptions);
> +
>       /* See the comments in fp_unavailable_tm().  This works similarly,
>        * though we're loading both FP and VEC registers in here.
>        *

_______________________________________________
Linuxppc-dev mailing list
Linuxppc-dev@lists.ozlabs.org
https://lists.ozlabs.org/listinfo/linuxppc-dev

Reply via email to