@@ -51,8 +51,8 @@ define void @destroysrc(ptr %src, ptr %dst) {
51
51
52
52
define void @destroynoaliassrc (ptr noalias %src , ptr %dst ) {
53
53
; CHECK-LABEL: @destroynoaliassrc(
54
- ; CHECK-NEXT: call void @llvm.memcpy.p0.p0.i64(ptr align 8 [[DST:%.*]], ptr align 8 [[SRC]], i64 16, i1 false)
55
- ; CHECK-NEXT: call void @llvm.memset.p0.i64(ptr align 8 [[SRC:%.* ]], i8 0, i64 16, i1 false)
54
+ ; CHECK-NEXT: call void @llvm.memcpy.p0.p0.i64(ptr align 8 [[DST:%.*]], ptr align 8 [[SRC:%.* ]], i64 16, i1 false)
55
+ ; CHECK-NEXT: call void @llvm.memset.p0.i64(ptr align 8 [[SRC]], i8 0, i64 16, i1 false)
56
56
; CHECK-NEXT: ret void
57
57
;
58
58
%1 = load %S , ptr %src
@@ -79,9 +79,9 @@ define void @copyalias(ptr %src, ptr %dst) {
79
79
; sure we lift the computation as well if needed and possible.
80
80
define void @addrproducer (ptr %src , ptr %dst ) {
81
81
; CHECK-LABEL: @addrproducer(
82
- ; CHECK-NEXT: [[DST2:%.*]] = getelementptr [[S:%.*]], ptr [[DST]], i64 1
82
+ ; CHECK-NEXT: [[DST2:%.*]] = getelementptr [[S:%.*]], ptr [[DST:%.* ]], i64 1
83
83
; CHECK-NEXT: call void @llvm.memmove.p0.p0.i64(ptr align 8 [[DST2]], ptr align 8 [[SRC:%.*]], i64 16, i1 false)
84
- ; CHECK-NEXT: call void @llvm.memset.p0.i64(ptr align 8 [[DST:%.* ]], i8 undef, i64 16, i1 false)
84
+ ; CHECK-NEXT: call void @llvm.memset.p0.i64(ptr align 8 [[DST]], i8 undef, i64 16, i1 false)
85
85
; CHECK-NEXT: ret void
86
86
;
87
87
%1 = load %S , ptr %src
@@ -113,8 +113,8 @@ define void @noaliasaddrproducer(ptr %src, ptr noalias %dst, ptr noalias %dstidp
113
113
; CHECK-NEXT: [[TMP2:%.*]] = load i32, ptr [[DSTIDPTR:%.*]], align 4
114
114
; CHECK-NEXT: [[DSTINDEX:%.*]] = or i32 [[TMP2]], 1
115
115
; CHECK-NEXT: [[DST2:%.*]] = getelementptr [[S:%.*]], ptr [[DST:%.*]], i32 [[DSTINDEX]]
116
- ; CHECK-NEXT: call void @llvm.memcpy.p0.p0.i64(ptr align 8 [[DST2]], ptr align 8 [[SRC]], i64 16, i1 false)
117
- ; CHECK-NEXT: call void @llvm.memset.p0.i64(ptr align 8 [[SRC:%.* ]], i8 undef, i64 16, i1 false)
116
+ ; CHECK-NEXT: call void @llvm.memcpy.p0.p0.i64(ptr align 8 [[DST2]], ptr align 8 [[SRC:%.* ]], i64 16, i1 false)
117
+ ; CHECK-NEXT: call void @llvm.memset.p0.i64(ptr align 8 [[SRC]], i8 undef, i64 16, i1 false)
118
118
; CHECK-NEXT: ret void
119
119
;
120
120
%1 = load %S , ptr %src
@@ -130,7 +130,7 @@ define void @throwing_call(ptr noalias %src, ptr %dst) {
130
130
; CHECK-LABEL: @throwing_call(
131
131
; CHECK-NEXT: [[TMP1:%.*]] = load [[S:%.*]], ptr [[SRC:%.*]], align 8
132
132
; CHECK-NEXT: call void @llvm.memset.p0.i64(ptr align 8 [[SRC]], i8 0, i64 16, i1 false)
133
- ; CHECK-NEXT: call void @call() [[ATTR2:#.* ]]
133
+ ; CHECK-NEXT: call void @call() # [[ATTR2:[0-9]+ ]]
134
134
; CHECK-NEXT: store [[S]] [[TMP1]], ptr [[DST:%.*]], align 8
135
135
; CHECK-NEXT: ret void
136
136
;
@@ -156,4 +156,30 @@ loop:
156
156
br label %loop
157
157
}
158
158
159
+ ; There are multiple instructions that can clobber the source memory here.
160
+ ; We can move the dest write past the store to %ptr.24, but not the memcpy.
161
+ ; Make sure we don't perform fca2memcpy conversion in this case.
162
+ define void @multiple_clobbering (ptr %ptr , ptr %ptr.copy ) {
163
+ ; CHECK-LABEL: @multiple_clobbering(
164
+ ; CHECK-NEXT: [[PTR_8:%.*]] = getelementptr inbounds nuw i8, ptr [[PTR:%.*]], i64 8
165
+ ; CHECK-NEXT: [[PTR_24:%.*]] = getelementptr inbounds nuw i8, ptr [[PTR]], i64 24
166
+ ; CHECK-NEXT: [[PTR_32:%.*]] = getelementptr inbounds nuw i8, ptr [[PTR]], i64 32
167
+ ; CHECK-NEXT: [[PTR_COPY_8:%.*]] = getelementptr inbounds nuw i8, ptr [[PTR_COPY:%.*]], i64 8
168
+ ; CHECK-NEXT: [[STRUCT:%.*]] = load { i32, i64 }, ptr [[PTR_COPY_8]], align 8
169
+ ; CHECK-NEXT: call void @llvm.memcpy.p0.p0.i64(ptr [[PTR_8]], ptr [[PTR_32]], i64 12, i1 false)
170
+ ; CHECK-NEXT: store i64 1, ptr [[PTR_24]], align 8
171
+ ; CHECK-NEXT: store { i32, i64 } [[STRUCT]], ptr [[PTR_32]], align 8
172
+ ; CHECK-NEXT: ret void
173
+ ;
174
+ %ptr.8 = getelementptr inbounds nuw i8 , ptr %ptr , i64 8
175
+ %ptr.24 = getelementptr inbounds nuw i8 , ptr %ptr , i64 24
176
+ %ptr.32 = getelementptr inbounds nuw i8 , ptr %ptr , i64 32
177
+ %ptr.copy.8 = getelementptr inbounds nuw i8 , ptr %ptr.copy , i64 8
178
+ %struct = load { i32 , i64 }, ptr %ptr.copy.8 , align 8
179
+ call void @llvm.memcpy.p0.p0.i64 (ptr %ptr.8 , ptr %ptr.32 , i64 12 , i1 false )
180
+ store i64 1 , ptr %ptr.24 , align 8
181
+ store { i32 , i64 } %struct , ptr %ptr.32 , align 8
182
+ ret void
183
+ }
184
+
159
185
declare void @call ()
0 commit comments