; Source-viewer banner (not part of the test itself): 65 lines, 3.3 KiB, LLVM
; NOTE: Assertions have been autogenerated by utils/update_test_checks.py
; RUN: opt -interleaved-load-combine -S -verify-memoryssa %s | FileCheck %s

; Runs the interleaved-load-combine pass through opt with MemorySSA
; verification switched on, prints the resulting IR (-S), and compares it
; against the assertions embedded in the function below.
; NOTE(review): the pass is requested with the legacy `-<pass-name>` flag
; spelling; newer opt builds may expect `-passes=<pass-name>` instead --
; confirm against the toolchain in use.

target triple = "arm64-apple-darwin"

; External function, declared only. The test function passes each
; <2 x double> shuffle result to it.
declare void @clobber(<2 x double>)

; @rename_uses(ptr %src, i1 %c.1, i1 %c.2)
;
; Input shape:
;   * bb -> outer.header -> inner -> outer.latch form a two-level loop nest
;     made only of branches (%c.1 controls the inner back edge, %c.2 the
;     outer back edge); no block before `exit` touches memory.
;   * `exit` loads two <4 x double> vectors from %src at element offsets 0 and
;     4 of a [12 x double] array, then builds four <2 x double> values by
;     picking lane i of the first load and lane i of the second load
;     (shuffle mask <i, i+4>), and hands each one to @clobber.
;
; Expected output, as spelled out by the assertions below:
;   * the loop nest is printed unchanged;
;   * one <8 x double> load from the offset-0 pointer is added ahead of the
;     original loads, and four new single-source shuffles of that wide load
;     (same masks, second operand poison) are added;
;   * the @clobber calls consume the new shuffles; the original loads and
;     shuffles are still printed.
;
; NOTE(review): the loop nest presumably exists to shape the CFG/MemorySSA
; state that -verify-memoryssa inspects -- confirm against the originating
; change.
define void @rename_uses(ptr %src, i1 %c.1, i1 %c.2) {
; CHECK-LABEL: @rename_uses(
; CHECK-NEXT:  bb:
; CHECK-NEXT:    br label [[OUTER_HEADER:%.*]]
; CHECK:       outer.header:
; CHECK-NEXT:    br label [[INNER:%.*]]
; CHECK:       inner:
; CHECK-NEXT:    br i1 [[C_1:%.*]], label [[OUTER_LATCH:%.*]], label [[INNER]]
; CHECK:       outer.latch:
; CHECK-NEXT:    br i1 [[C_2:%.*]], label [[EXIT:%.*]], label [[OUTER_HEADER]]
; CHECK:       exit:
; CHECK-NEXT:    [[GEP_0:%.*]] = getelementptr inbounds [12 x double], ptr [[SRC:%.*]], i64 0, i64 0
; CHECK-NEXT:    [[GEP_4:%.*]] = getelementptr [12 x double], ptr [[SRC]], i64 0, i64 4
; CHECK-NEXT:    [[INTERLEAVED_WIDE_LOAD:%.*]] = load <8 x double>, ptr [[GEP_0]], align 8
; CHECK-NEXT:    [[L_0:%.*]] = load <4 x double>, ptr [[GEP_0]], align 8
; CHECK-NEXT:    [[L_4:%.*]] = load <4 x double>, ptr [[GEP_4]], align 8
; CHECK-NEXT:    [[INTERLEAVED_SHUFFLE:%.*]] = shufflevector <8 x double> [[INTERLEAVED_WIDE_LOAD]], <8 x double> poison, <2 x i32> <i32 0, i32 4>
; CHECK-NEXT:    [[S_0:%.*]] = shufflevector <4 x double> [[L_0]], <4 x double> [[L_4]], <2 x i32> <i32 0, i32 4>
; CHECK-NEXT:    [[INTERLEAVED_SHUFFLE1:%.*]] = shufflevector <8 x double> [[INTERLEAVED_WIDE_LOAD]], <8 x double> poison, <2 x i32> <i32 1, i32 5>
; CHECK-NEXT:    [[S_1:%.*]] = shufflevector <4 x double> [[L_0]], <4 x double> [[L_4]], <2 x i32> <i32 1, i32 5>
; CHECK-NEXT:    [[INTERLEAVED_SHUFFLE2:%.*]] = shufflevector <8 x double> [[INTERLEAVED_WIDE_LOAD]], <8 x double> poison, <2 x i32> <i32 2, i32 6>
; CHECK-NEXT:    [[S_2:%.*]] = shufflevector <4 x double> [[L_0]], <4 x double> [[L_4]], <2 x i32> <i32 2, i32 6>
; CHECK-NEXT:    [[INTERLEAVED_SHUFFLE3:%.*]] = shufflevector <8 x double> [[INTERLEAVED_WIDE_LOAD]], <8 x double> poison, <2 x i32> <i32 3, i32 7>
; CHECK-NEXT:    [[S_3:%.*]] = shufflevector <4 x double> [[L_0]], <4 x double> [[L_4]], <2 x i32> <i32 3, i32 7>
; CHECK-NEXT:    call void @clobber(<2 x double> [[INTERLEAVED_SHUFFLE]])
; CHECK-NEXT:    call void @clobber(<2 x double> [[INTERLEAVED_SHUFFLE1]])
; CHECK-NEXT:    call void @clobber(<2 x double> [[INTERLEAVED_SHUFFLE2]])
; CHECK-NEXT:    call void @clobber(<2 x double> [[INTERLEAVED_SHUFFLE3]])
; CHECK-NEXT:    ret void
;
bb:
  br label %outer.header

; Outer loop header: falls straight through into the inner loop.
outer.header:
  br label %inner

; Inner loop: a single block that branches back to itself while %c.1 is false.
inner:
  br i1 %c.1, label %outer.latch, label %inner

; Outer latch: leaves the nest when %c.2 is true, otherwise restarts the
; outer loop.
outer.latch:
  br i1 %c.2, label %exit, label %outer.header

exit:
  ; Pointers to elements 0 and 4 of %src viewed as [12 x double].
  %gep.0 = getelementptr inbounds [12 x double], ptr %src, i64 0, i64 0
  %gep.4 = getelementptr [12 x double], ptr %src, i64 0, i64 4
  ; Two 4-element loads: %l.0 covers elements 0..3, %l.4 covers elements 4..7.
  %l.0 = load <4 x double>, ptr %gep.0, align 8
  %l.4 = load <4 x double>, ptr %gep.4, align 8
  ; Mask <i, i+4> selects lane i of %l.0 and lane i of %l.4 (indices 4..7
  ; address the second shuffle operand).
  %s.0 = shufflevector <4 x double> %l.0, <4 x double> %l.4, <2 x i32> <i32 0, i32 4>
  %s.1 = shufflevector <4 x double> %l.0, <4 x double> %l.4, <2 x i32> <i32 1, i32 5>
  %s.2 = shufflevector <4 x double> %l.0, <4 x double> %l.4, <2 x i32> <i32 2, i32 6>
  %s.3 = shufflevector <4 x double> %l.0, <4 x double> %l.4, <2 x i32> <i32 3, i32 7>
  ; Each shuffle result is passed to the external @clobber.
  call void @clobber(<2 x double> %s.0)
  call void @clobber(<2 x double> %s.1)
  call void @clobber(<2 x double> %s.2)
  call void @clobber(<2 x double> %s.3)
  ret void
}