Issue 140917
Summary Missed DCE of the arg1 == 1 branch when taking the popcount of a product of two integers (-march=icelake-client)
Labels new issue
Assignees
Reporter BreadTom
    [Godbolt](https://godbolt.org/z/nGesTMMK4)
Flags were -O3 -Wall -Wextra -march=icelake-client
```
#include <stdint.h>

/* Baseline reproducer: returns the popcount of the value that
 * __builtin_mul_overflow stores in tmp0 for arg0 * arg1.
 * Both `if` guards are optimizer hints (__builtin_unreachable), not runtime
 * checks. */
int f0(uint64_t arg0, uint64_t arg1){
    uint64_t tmp0;
    int tmp1;
 /* Hint: arg1 is odd; the even case is declared unreachable. */
 if(arg1 % 2 == 0)
        __builtin_unreachable();
 /* Note the negation: the path where the multiplication does NOT overflow is
  * the one declared unreachable, so the compiler may assume it overflows. */
 if(!__builtin_mul_overflow(arg0, arg1, &tmp0))
 __builtin_unreachable();
    tmp1 = __builtin_popcountg(tmp0);
    return tmp1;
}

/* Variant of the reproducer with an extra `arg1 == 1` early return that
 * takes the popcount of arg0 directly. It has the same two
 * __builtin_unreachable hints (arg1 odd, multiplication overflows) before
 * the extra branch. */
int f0_slow(uint64_t arg0, uint64_t arg1){
    uint64_t tmp0;
 int tmp1;
    /* Hint: arg1 is odd; the even case is declared unreachable. */
    if(arg1 % 2 == 0)
        __builtin_unreachable();
 /* Note the negation: the non-overflowing path is the one declared
  * unreachable, so the compiler may assume the multiplication overflows. */
 if(!__builtin_mul_overflow(arg0, arg1, &tmp0))
 __builtin_unreachable();
    /* This is the branch the report expects to be eliminated. Given the
     * overflow assumption above, arg1 == 1 cannot hold here (arg0 * 1 never
     * overflows), so this return is dead code. */
    if(arg1 == 1)
        return __builtin_popcountg(arg0);
    tmp1 = __builtin_popcountg(tmp0);
    return tmp1;
}
```
```
; IR for f0: a single ctpop of the low 64 bits of arg0 * arg1, truncated to i32.
define dso_local range(i32 0, 65) i32 @f0(i64 noundef %arg0, i64 noundef %arg1) local_unnamed_addr {
entry:
  ; Assume the low bit of %arg1 is set (arg1 is odd).
  %rem = and i64 %arg1, 1
  %cmp = icmp ne i64 %rem, 0
  tail call void @llvm.assume(i1 %cmp)
  %0 = tail call { i64, i1 } @llvm.umul.with.overflow.i64(i64 %arg0, i64 %arg1)
  ; %1 is the overflow flag, %2 is the product value.
  %1 = extractvalue { i64, i1 } %0, 1
  %2 = extractvalue { i64, i1 } %0, 0
  ; Assume the multiplication overflowed.
  tail call void @llvm.assume(i1 %1)
  %3 = tail call range(i64 0, 65) i64 @llvm.ctpop.i64(i64 %2)
  %cast = trunc nuw nsw i64 %3 to i32
 ret i32 %cast
}

declare { i64, i1 } @llvm.umul.with.overflow.i64(i64, i64) #1

declare i64 @llvm.ctpop.i64(i64) #1

; IR for f0_slow: both ctpop calls survive and a select picks between them on
; arg1 == 1. This is the missed optimization the report describes.
define dso_local range(i32 0, 65) i32 @f0_slow(i64 noundef %arg0, i64 noundef %arg1) local_unnamed_addr {
entry:
  ; Assume the low bit of %arg1 is set (arg1 is odd).
  %rem = and i64 %arg1, 1
  %cmp = icmp ne i64 %rem, 0
  tail call void @llvm.assume(i1 %cmp)
  %0 = tail call { i64, i1 } @llvm.umul.with.overflow.i64(i64 %arg0, i64 %arg1)
  ; %1 is the overflow flag; it is assumed to be true.
  %1 = extractvalue { i64, i1 } %0, 1
  tail call void @llvm.assume(i1 %1)
  ; The arg1 == 1 comparison is still present.
  %cmp3 = icmp eq i64 %arg1, 1
  ; First popcount: of %arg0 (the early-return path in the C source).
  %2 = tail call range(i64 0, 65) i64 @llvm.ctpop.i64(i64 %arg0)
 %3 = extractvalue { i64, i1 } %0, 0
  ; Second popcount: of the product value.
  %4 = tail call range(i64 0, 65) i64 @llvm.ctpop.i64(i64 %3)
  %retval.0.in = select i1 %cmp3, i64 %2, i64 %4
 %retval.0 = trunc nuw nsw i64 %retval.0.in to i32
  ret i32 %retval.0
}

declare void @llvm.assume(i1 noundef) #2
```
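GCC uses only one popcnt, but LLVM does not eliminate the `if(arg1 == 1)` branch in `f0_slow`: its IR keeps two `llvm.ctpop.i64` calls and a `select` between them. Since the multiplication is assumed to overflow, `arg1 == 1` is impossible (`arg0 * 1` cannot overflow), so that branch is dead code and `f0_slow` should compile to the same code as `f0`.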
_______________________________________________
llvm-bugs mailing list
llvm-bugs@lists.llvm.org
https://lists.llvm.org/cgi-bin/mailman/listinfo/llvm-bugs

Reply via email to