Skip to content

Commit 4cf5576

Browse files
AmrDeveloper authored and lanza committed
[CIR][CIRGen][Builtin][Neon] Lower neon vcaled_f64 (#1495)
Lower neon vcaled_f64
1 parent 1b1a832 commit 4cf5576

File tree

2 files changed

+12
-7
lines changed

2 files changed

+12
-7
lines changed

clang/lib/CIR/CodeGen/CIRGenBuiltinAArch64.cpp

+2-1
Original file line number | Diff line number | Diff line change
@@ -2709,7 +2709,8 @@ static mlir::Value emitCommonNeonSISDBuiltinExpr(
27092709
return emitNeonCall(builder, {argTy}, ops, "aarch64.neon.facgt", resultTy,
27102710
loc);
27112711
case NEON::BI__builtin_neon_vcaled_f64:
2712-
llvm_unreachable(" neon_vcaled_f64 NYI ");
2712+
return emitNeonCall(builder, {argTy}, ops, "aarch64.neon.facge", resultTy,
2713+
loc);
27132714
case NEON::BI__builtin_neon_vcales_f32:
27142715
llvm_unreachable(" neon_vcales_f32 NYI ");
27152716
case NEON::BI__builtin_neon_vcaltd_f64:

clang/test/CIR/CodeGen/AArch64/neon.c

+10-6
Original file line number | Diff line number | Diff line change
@@ -15163,12 +15163,16 @@ uint64_t test_vcagtd_f64(float64_t a, float64_t b) {
1516315163
// return (uint32_t)vcales_f32(a, b);
1516415164
// }
1516515165

15166-
// NYI-LABEL: @test_vcaled_f64(
15167-
// NYI: [[VCALED_F64_I:%.*]] = call i64 @llvm.aarch64.neon.facge.i64.f64(double %b, double %a)
15168-
// NYI: ret i64 [[VCALED_F64_I]]
15169-
// uint64_t test_vcaled_f64(float64_t a, float64_t b) {
15170-
// return (uint64_t)vcaled_f64(a, b);
15171-
// }
15166+
uint64_t test_vcaled_f64(float64_t a, float64_t b) {
15167+
return (uint64_t)vcaled_f64(a, b);
15168+
15169+
// CIR-LABEL: vcaled_f64
15170+
// CIR: [[TMP0:%.*]] = cir.llvm.intrinsic "aarch64.neon.facge" {{.*}}, {{.*}} : (!cir.double, !cir.double) -> !u64i
15171+
15172+
// LLVM-LABEL: @test_vcaled_f64(
15173+
// LLVM: [[VCALED_F64_I:%.*]] = call i64 @llvm.aarch64.neon.facge.i64.f64(double %0, double %1)
15174+
// LLVM: ret i64 [[VCALED_F64_I]]
15175+
}
1517215176

1517315177
// NYI-LABEL: @test_vcalts_f32(
1517415178
// NYI: [[VCALTS_F32_I:%.*]] = call i32 @llvm.aarch64.neon.facgt.i32.f32(float %b, float %a)

0 commit comments

Comments
 (0)