https://gcc.gnu.org/bugzilla/show_bug.cgi?id=111333
Bug ID: 111333 Summary: Runtime failure for fcmulcph instrinsic Product: gcc Version: 14.0 Status: UNCONFIRMED Severity: normal Priority: P3 Component: target Assignee: unassigned at gcc dot gnu.org Reporter: crazylht at gmail dot com Target Milestone: --- cat main.cpp #include <immintrin.h> #include <cstdio> __attribute__((optimize("O0"))) auto func0(_Float16 *a, _Float16 *b, int n, _Float16 *c) { __m512h rA = _mm512_loadu_ph(a); for (int i = 0; i < n; i += 32) { __m512h rB = _mm512_loadu_ph(b + i); _mm512_storeu_ph(c + i, _mm512_fcmul_pch(rB, rA)); } } __attribute__((optimize("O2"))) auto func1(_Float16 *a, _Float16 *b, int n, _Float16 *c) { __m512h rA = _mm512_loadu_ph(a); for (int i = 0; i < n; i += 32) { __m512h rB = _mm512_loadu_ph(b + i); _mm512_storeu_ph(c + i, _mm512_fcmul_pch(rB, rA)); } } int main() { int n = 32; _Float16 a[n], b[n], c[n]; for (int i = 1; i <= n; i++) { a[i - 1] = i & 1 ? -i : i; b[i - 1] = i; } printf("a = %f + %fi \n", (float)a[0], (float)a[1]); printf("b = %f + %fi \n", (float)b[0], (float)b[1]); printf("b * conj(a) = %f + %fi \n\n", (float)(a[0]*b[0] + a[1]*b[1]), (float)(a[0]*b[1] - a[1]*b[0])); func0(a, b, n, c); for (int i = 0; i < n / 32 * 2; i++) { printf("%f ", (float)c[i]); } printf("\n"); func1(a, b, n, c); for (int i = 0; i < n / 32 * 2; i++) { printf("%f ", (float)c[i]); } printf("\n"); return 0; } g++ -march=sapphirerapids main.cpp -o test sde -spr-- ./test a = -1.000000 + 2.000000i b = 1.000000 + 2.000000i b * conj(a) = 3.000000 + -4.000000i 3.000000 -4.000000 3.000000 4.000000