On 2016/02/15 04:07PM, Cyril Bur wrote:
> Test that the non volatile floating point and Altivec registers get
> correctly preserved across the fork() syscall.
> 
> fork() works nicely for this purpose, the registers should be the same for
> both parent and child
> 
> Signed-off-by: Cyril Bur <cyril...@gmail.com>
> ---
>  tools/testing/selftests/powerpc/Makefile           |   3 +-
>  tools/testing/selftests/powerpc/basic_asm.h        |  30 ++++
>  tools/testing/selftests/powerpc/math/.gitignore    |   2 +
>  tools/testing/selftests/powerpc/math/Makefile      |  14 ++
>  tools/testing/selftests/powerpc/math/fpu_asm.S     | 161 +++++++++++++++++
>  tools/testing/selftests/powerpc/math/fpu_syscall.c |  90 ++++++++++
>  tools/testing/selftests/powerpc/math/vmx_asm.S     | 193 
> +++++++++++++++++++++
>  tools/testing/selftests/powerpc/math/vmx_syscall.c |  92 ++++++++++
>  8 files changed, 584 insertions(+), 1 deletion(-)
>  create mode 100644 tools/testing/selftests/powerpc/basic_asm.h
>  create mode 100644 tools/testing/selftests/powerpc/math/.gitignore
>  create mode 100644 tools/testing/selftests/powerpc/math/Makefile
>  create mode 100644 tools/testing/selftests/powerpc/math/fpu_asm.S
>  create mode 100644 tools/testing/selftests/powerpc/math/fpu_syscall.c
>  create mode 100644 tools/testing/selftests/powerpc/math/vmx_asm.S
>  create mode 100644 tools/testing/selftests/powerpc/math/vmx_syscall.c
> 
> diff --git a/tools/testing/selftests/powerpc/Makefile 
> b/tools/testing/selftests/powerpc/Makefile
> index 0c2706b..19e8191 100644
> --- a/tools/testing/selftests/powerpc/Makefile
> +++ b/tools/testing/selftests/powerpc/Makefile
> @@ -22,7 +22,8 @@ SUB_DIRS = benchmarks               \
>          switch_endian        \
>          syscalls             \
>          tm                   \
> -        vphn
> +        vphn         \
> +        math
>  
>  endif
>  
> diff --git a/tools/testing/selftests/powerpc/basic_asm.h 
> b/tools/testing/selftests/powerpc/basic_asm.h
> new file mode 100644
> index 0000000..f243da0
> --- /dev/null
> +++ b/tools/testing/selftests/powerpc/basic_asm.h
> @@ -0,0 +1,30 @@
> +#include <ppc-asm.h>
> +#include <asm/unistd.h>
> +
> +#define LOAD_REG_IMMEDIATE(reg,expr) \
> +     lis     reg,(expr)@highest;     \
> +     ori     reg,reg,(expr)@higher;  \
> +     rldicr  reg,reg,32,31;  \
> +     oris    reg,reg,(expr)@high;    \
> +     ori     reg,reg,(expr)@l;
> +
> +/* It is very important to note here that _extra is the extra amount of
> + * stack space needed.
> + * This space must be accessed at sp + 32!

This looks to be specific to ABIv2. Is this series limited to ppc64le?  
If so, you might want to ensure this only builds there.

Also:
#define PPC_ABIV2_MIN_STACK_SIZE 32

or just:
#define PPC_MIN_STACK   32

... is helpful. And, you might want to base the rest of your code that 
use PUSH_BASIC_STACK() on that. If we ever want to have these tests run 
anywhere else, that'll help a lot. (See further below)

> + */
> +#define PUSH_BASIC_STACK(_extra) \
> +     mflr    r0; \
> +     std     r0,16(sp); \
> +     stdu    sp,-(_extra + 32)(sp); \
> +     mfcr    r0; \
> +     stw     r0,8(sp); \
> +     std     2,24(sp);
                ^^
Better to use r2 here and below.

> +
> +#define POP_BASIC_STACK(_extra) \
> +     ld      2,24(sp); \
> +     lwz     r0,8(sp); \
> +     mtcr    r0; \
> +     addi    sp,sp,(_extra + 32); \
> +     ld      r0,16(sp); \
> +     mtlr    r0;
> +
> diff --git a/tools/testing/selftests/powerpc/math/.gitignore 
> b/tools/testing/selftests/powerpc/math/.gitignore
> new file mode 100644
> index 0000000..b19b269
> --- /dev/null
> +++ b/tools/testing/selftests/powerpc/math/.gitignore
> @@ -0,0 +1,2 @@
> +fpu_syscall
> +vmx_syscall
> diff --git a/tools/testing/selftests/powerpc/math/Makefile 
> b/tools/testing/selftests/powerpc/math/Makefile
> new file mode 100644
> index 0000000..418bef1
> --- /dev/null
> +++ b/tools/testing/selftests/powerpc/math/Makefile
> @@ -0,0 +1,14 @@
> +TEST_PROGS := fpu_syscall vmx_syscall
> +
> +all: $(TEST_PROGS)
> +
> +$(TEST_PROGS): ../harness.c
> +$(TEST_PROGS): CFLAGS += -O2 -g -pthread -m64 -maltivec
> +
> +fpu_syscall: fpu_asm.S
> +vmx_syscall: vmx_asm.S
> +
> +include ../../lib.mk
> +
> +clean:
> +     rm -f $(TEST_PROGS) *.o
> diff --git a/tools/testing/selftests/powerpc/math/fpu_asm.S 
> b/tools/testing/selftests/powerpc/math/fpu_asm.S
> new file mode 100644
> index 0000000..8733874
> --- /dev/null
> +++ b/tools/testing/selftests/powerpc/math/fpu_asm.S
> @@ -0,0 +1,161 @@
> +/*
> + * Copyright 2015, Cyril Bur, IBM Corp.
> + *
> + * This program is free software; you can redistribute it and/or
> + * modify it under the terms of the GNU General Public License
> + * as published by the Free Software Foundation; either version
> + * 2 of the License, or (at your option) any later version.
> + */
> +
> +#include "../basic_asm.h"
> +
> +#define PUSH_FPU(pos) \
> +     stfd    f14,pos(sp); \
> +     stfd    f15,pos+8(sp); \
> +     stfd    f16,pos+16(sp); \
> +     stfd    f17,pos+24(sp); \
> +     stfd    f18,pos+32(sp); \
> +     stfd    f19,pos+40(sp); \
> +     stfd    f20,pos+48(sp); \
> +     stfd    f21,pos+56(sp); \
> +     stfd    f22,pos+64(sp); \
> +     stfd    f23,pos+72(sp); \
> +     stfd    f24,pos+80(sp); \
> +     stfd    f25,pos+88(sp); \
> +     stfd    f26,pos+96(sp); \
> +     stfd    f27,pos+104(sp); \
> +     stfd    f28,pos+112(sp); \
> +     stfd    f29,pos+120(sp); \
> +     stfd    f30,pos+128(sp); \
> +     stfd    f31,pos+136(sp);
> +
> +#define POP_FPU(pos) \
> +     lfd     f14,pos(sp); \
> +     lfd     f15,pos+8(sp); \
> +     lfd     f16,pos+16(sp); \
> +     lfd     f17,pos+24(sp); \
> +     lfd     f18,pos+32(sp); \
> +     lfd     f19,pos+40(sp); \
> +     lfd     f20,pos+48(sp); \
> +     lfd     f21,pos+56(sp); \
> +     lfd     f22,pos+64(sp); \
> +     lfd     f23,pos+72(sp); \
> +     lfd     f24,pos+80(sp); \
> +     lfd     f25,pos+88(sp); \
> +     lfd     f26,pos+96(sp); \
> +     lfd     f27,pos+104(sp); \
> +     lfd     f28,pos+112(sp); \
> +     lfd     f29,pos+120(sp); \
> +     lfd     f30,pos+128(sp); \
> +     lfd     f31,pos+136(sp);
> +
> +#Careful calling this, it will 'clobber' fpu (by design)
> +#Don't call this from C
> +FUNC_START(load_fpu)
> +     lfd     f14,0(r3)
> +     lfd     f15,8(r3)
> +     lfd     f16,16(r3)
> +     lfd     f17,24(r3)
> +     lfd     f18,32(r3)
> +     lfd     f19,40(r3)
> +     lfd     f20,48(r3)
> +     lfd     f21,56(r3)
> +     lfd     f22,64(r3)
> +     lfd     f23,72(r3)
> +     lfd     f24,80(r3)
> +     lfd     f25,88(r3)
> +     lfd     f26,96(r3)
> +     lfd     f27,104(r3)
> +     lfd     f28,112(r3)
> +     lfd     f29,120(r3)
> +     lfd     f30,128(r3)
> +     lfd     f31,136(r3)
> +     blr
> +FUNC_END(load_fpu)
> +
> +FUNC_START(check_fpu)
> +     mr r4,r3
> +     li      r3,1 #assume a bad result
> +     lfd     f0,0(r4)
> +     fcmpu   cr1,f0,f14
> +     bne     cr1,1f
> +     lfd     f0,8(r4)
> +     fcmpu   cr1,f0,f15
> +     bne     cr1,1f
> +     lfd     f0,16(r4)
> +     fcmpu   cr1,f0,f16
> +     bne     cr1,1f
> +     lfd     f0,24(r4)
> +     fcmpu   cr1,f0,f17
> +     bne     cr1,1f
> +     lfd     f0,32(r4)
> +     fcmpu   cr1,f0,f18
> +     bne     cr1,1f
> +     lfd     f0,40(r4)
> +     fcmpu   cr1,f0,f19
> +     bne     cr1,1f
> +     lfd     f0,48(r4)
> +     fcmpu   cr1,f0,f20
> +     bne     cr1,1f
> +     lfd     f0,56(r4)
> +     fcmpu   cr1,f0,f21
> +     bne     cr1,1f
> +     lfd     f0,64(r4)
> +     fcmpu   cr1,f0,f22
> +     bne     cr1,1f
> +     lfd     f0,72(r4)
> +     fcmpu   cr1,f0,f23
> +     bne     cr1,1f
> +     lfd     f0,80(r4)
> +     fcmpu   cr1,f0,f24
> +     bne     cr1,1f
> +     lfd     f0,88(r4)
> +     fcmpu   cr1,f0,f25
> +     bne     cr1,1f
> +     lfd     f0,96(r4)
> +     fcmpu   cr1,f0,f26
> +     bne     cr1,1f
> +     lfd     f0,104(r4)
> +     fcmpu   cr1,f0,f27
> +     bne     cr1,1f
> +     lfd     f0,112(r4)
> +     fcmpu   cr1,f0,f28
> +     bne     cr1,1f
> +     lfd     f0,120(r4)
> +     fcmpu   cr1,f0,f29
> +     bne     cr1,1f
> +     lfd     f0,128(r4)
> +     fcmpu   cr1,f0,f30
> +     bne     cr1,1f
> +     lfd     f0,136(r4)
> +     fcmpu   cr1,f0,f31
> +     bne     cr1,1f
> +     li      r3,0 #Sucess!!!
> +1:   blr
> +
> +FUNC_START(test_fpu)
> +     #r3 holds pointer to where to put the result of fork
> +     #r4 holds pointer to the pid
> +     #f14-f31 are non volatiles
> +     PUSH_BASIC_STACK(256)
> +     std     r3,40(sp) #Address of darray

So, this could be:
        PUSH_BASIC_STACK(256)
        std     r3,PPC_MIN_STACK+8(sp)

... though I wonder why there is +8 here?


- Naveen

_______________________________________________
Linuxppc-dev mailing list
Linuxppc-dev@lists.ozlabs.org
https://lists.ozlabs.org/listinfo/linuxppc-dev

Reply via email to