77 lines
2.8 KiB
LLVM
77 lines
2.8 KiB
LLVM
; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
|
|
; RUN: llc -mtriple=aarch64 < %s | FileCheck %s
|
|
|
|
; All tests are doing unordered vector comparisons on vectors larger than a
|
|
; Neon vector.
|
|
|
|
define i1 @unordered_floating_point_compare_on_v8f32(<8 x float> %a_vec) {
|
|
; CHECK-LABEL: unordered_floating_point_compare_on_v8f32:
|
|
; CHECK: // %bb.0:
|
|
; CHECK-NEXT: fcmgt v1.4s, v1.4s, #0.0
|
|
; CHECK-NEXT: mov w8, #1
|
|
; CHECK-NEXT: fcmgt v0.4s, v0.4s, #0.0
|
|
; CHECK-NEXT: uzp1 v0.8h, v0.8h, v1.8h
|
|
; CHECK-NEXT: mvn v0.16b, v0.16b
|
|
; CHECK-NEXT: xtn v0.8b, v0.8h
|
|
; CHECK-NEXT: umaxv b0, v0.8b
|
|
; CHECK-NEXT: fmov w9, s0
|
|
; CHECK-NEXT: bic w0, w8, w9
|
|
; CHECK-NEXT: ret
|
|
%a_cmp = fcmp ule <8 x float> %a_vec, zeroinitializer
|
|
%cmp_result = bitcast <8 x i1> %a_cmp to i8
|
|
%all_zero = icmp eq i8 %cmp_result, 0
|
|
ret i1 %all_zero
|
|
}
|
|
|
|
define i1 @unordered_floating_point_compare_on_v16f32(<16 x float> %a_vec) {
|
|
; CHECK-LABEL: unordered_floating_point_compare_on_v16f32:
|
|
; CHECK: // %bb.0:
|
|
; CHECK-NEXT: fcmgt v3.4s, v3.4s, #0.0
|
|
; CHECK-NEXT: mov w8, #1
|
|
; CHECK-NEXT: fcmgt v2.4s, v2.4s, #0.0
|
|
; CHECK-NEXT: fcmgt v1.4s, v1.4s, #0.0
|
|
; CHECK-NEXT: fcmgt v0.4s, v0.4s, #0.0
|
|
; CHECK-NEXT: uzp1 v2.8h, v2.8h, v3.8h
|
|
; CHECK-NEXT: uzp1 v0.8h, v0.8h, v1.8h
|
|
; CHECK-NEXT: uzp1 v0.16b, v0.16b, v2.16b
|
|
; CHECK-NEXT: mvn v0.16b, v0.16b
|
|
; CHECK-NEXT: umaxv b0, v0.16b
|
|
; CHECK-NEXT: fmov w9, s0
|
|
; CHECK-NEXT: bic w0, w8, w9
|
|
; CHECK-NEXT: ret
|
|
%a_cmp = fcmp ule <16 x float> %a_vec, zeroinitializer
|
|
%cmp_result = bitcast <16 x i1> %a_cmp to i16
|
|
%all_zero = icmp eq i16 %cmp_result, 0
|
|
ret i1 %all_zero
|
|
}
|
|
|
|
define i1 @unordered_floating_point_compare_on_v32f32(<32 x float> %a_vec) {
|
|
; CHECK-LABEL: unordered_floating_point_compare_on_v32f32:
|
|
; CHECK: // %bb.0:
|
|
; CHECK-NEXT: fcmgt v3.4s, v3.4s, #0.0
|
|
; CHECK-NEXT: mov w9, #1
|
|
; CHECK-NEXT: fcmgt v2.4s, v2.4s, #0.0
|
|
; CHECK-NEXT: fcmgt v1.4s, v1.4s, #0.0
|
|
; CHECK-NEXT: fcmgt v0.4s, v0.4s, #0.0
|
|
; CHECK-NEXT: fcmgt v7.4s, v7.4s, #0.0
|
|
; CHECK-NEXT: fcmgt v6.4s, v6.4s, #0.0
|
|
; CHECK-NEXT: fcmgt v5.4s, v5.4s, #0.0
|
|
; CHECK-NEXT: fcmgt v4.4s, v4.4s, #0.0
|
|
; CHECK-NEXT: uzp1 v2.8h, v2.8h, v3.8h
|
|
; CHECK-NEXT: uzp1 v0.8h, v0.8h, v1.8h
|
|
; CHECK-NEXT: uzp1 v6.8h, v6.8h, v7.8h
|
|
; CHECK-NEXT: uzp1 v1.8h, v4.8h, v5.8h
|
|
; CHECK-NEXT: uzp1 v0.16b, v0.16b, v2.16b
|
|
; CHECK-NEXT: uzp1 v1.16b, v1.16b, v6.16b
|
|
; CHECK-NEXT: mvn v0.16b, v0.16b
|
|
; CHECK-NEXT: orn v0.16b, v0.16b, v1.16b
|
|
; CHECK-NEXT: umaxv b0, v0.16b
|
|
; CHECK-NEXT: fmov w8, s0
|
|
; CHECK-NEXT: bic w0, w9, w8
|
|
; CHECK-NEXT: ret
|
|
%a_cmp = fcmp ule <32 x float> %a_vec, zeroinitializer
|
|
%cmp_result = bitcast <32 x i1> %a_cmp to i32
|
|
%all_zero = icmp eq i32 %cmp_result, 0
|
|
ret i1 %all_zero
|
|
}
|