http://gcc.gnu.org/bugzilla/show_bug.cgi?id=46716

           Summary: bad code generated with -mno-sse2 -m64
           Product: gcc
           Version: 4.4.1
            Status: UNCONFIRMED
          Severity: normal
          Priority: P3
         Component: c
        AssignedTo: unassig...@gcc.gnu.org
        ReportedBy: mat...@caltech.edu


The following small program generates incorrect output when compiled with
the flags -mno-sse2 -m64 on a 64 bit system.  Output is correct for -m32
or -msse2 -m64.  The problem manifests as the lower double of the second
parameter passed into test() being replaced by the value of the second double
from the first parameter.

% cat /etc/release
Mandriva Linux release 2010.0 (Official) for x86_64
% cat /proc/cpuinfo | head -10
processor       : 0
vendor_id       : AuthenticAMD
cpu family      : 15
model           : 33
model name      : Dual Core AMD Opteron(tm) Processor 280
stepping        : 2
cpu MHz         : 1000.000
cache size      : 1024 KB
physical id     : 0
siblings        : 2
% gcc --version
gcc (GCC) 4.4.1

example:

% gcc -msse -mno-sse2 -I. -m64   -o foo gccprob2.c
% ./foo
s1      1.000000 2.000000
test s1 1.000000 2.000000
test s2 2.000000 2.000000
% gcc -msse -mno-sse2 -I. -m32   -o foo gccprob2.c
OR
% gcc -msse -msse2 -I. -m64   -o foo gccprob2.c
s1      1.000000 2.000000
test s1 1.000000 2.000000
test s2 1.000000 2.000000

*************************************************
#include <stdio.h> /* for printf */
typedef double    __m128d __attribute__ ((__vector_size__ (16),
__may_alias__));
typedef union
{
  __m128d x;
  double a[2];
} union128d;
#define EMM_FLT8(a)    ((double *)&(a))

void test ( __m128d s1, __m128d s2)
{
printf("test s1 %lf %lf\n",EMM_FLT8(s1)[0],EMM_FLT8(s1)[1]);
printf("test s2 %lf %lf\n",EMM_FLT8(s2)[0],EMM_FLT8(s2)[1]);
}

int main (void)
{
__attribute__ ((aligned (16)))  union128d s1;
  s1.a[0] = 1.0;
  s1.a[1] = 2.0;
printf("s1      %lf %lf\n",s1.a[0],s1.a[1]);
  test (s1.x, s1.x);
}
**************************************************

Reply via email to