1 //=========- MemTransferLowerTest.cpp - MemTransferLower unit tests -=========//
3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4 // See https://llvm.org/LICENSE.txt for license information.
5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
7 //===----------------------------------------------------------------------===//
9 #include "llvm/Analysis/CGSCCPassManager.h"
10 #include "llvm/Analysis/ScalarEvolution.h"
11 #include "llvm/Analysis/TargetTransformInfo.h"
12 #include "llvm/AsmParser/Parser.h"
13 #include "llvm/IR/BasicBlock.h"
14 #include "llvm/IR/Function.h"
15 #include "llvm/IR/Instructions.h"
16 #include "llvm/IR/IntrinsicInst.h"
17 #include "llvm/IR/LLVMContext.h"
18 #include "llvm/IR/Module.h"
19 #include "llvm/IR/PassManager.h"
20 #include "llvm/Passes/PassBuilder.h"
21 #include "llvm/Support/Debug.h"
22 #include "llvm/Support/SourceMgr.h"
23 #include "llvm/Testing/Support/Error.h"
24 #include "llvm/Transforms/Utils/LowerMemIntrinsics.h"
25 #include "llvm/Transforms/Vectorize/LoopVectorize.h"
27 #include "gtest/gtest-spi.h"
28 #include "gtest/gtest.h"
33 struct ForwardingPass
: public PassInfoMixin
<ForwardingPass
> {
34 template <typename T
> ForwardingPass(T
&&Arg
) : Func(std::forward
<T
>(Arg
)) {}
36 PreservedAnalyses
run(Function
&F
, FunctionAnalysisManager
&FAM
) {
40 std::function
<PreservedAnalyses(Function
&, FunctionAnalysisManager
&)> Func
;
43 struct MemTransferLowerTest
: public testing::Test
{
45 LoopAnalysisManager LAM
;
46 FunctionAnalysisManager FAM
;
47 CGSCCAnalysisManager CGAM
;
48 ModuleAnalysisManager MAM
;
49 ModulePassManager MPM
;
51 std::unique_ptr
<Module
> M
;
53 MemTransferLowerTest() {
54 // Register all the basic analyses with the managers.
55 PB
.registerModuleAnalyses(MAM
);
56 PB
.registerCGSCCAnalyses(CGAM
);
57 PB
.registerFunctionAnalyses(FAM
);
58 PB
.registerLoopAnalyses(LAM
);
59 PB
.crossRegisterProxies(LAM
, FAM
, CGAM
, MAM
);
62 BasicBlock
*getBasicBlockByName(Function
&F
, StringRef Name
) const {
63 for (BasicBlock
&BB
: F
) {
64 if (BB
.getName() == Name
)
70 Instruction
*getInstructionByOpcode(BasicBlock
&BB
, unsigned Opcode
,
71 unsigned Number
) const {
72 unsigned CurrNumber
= 0;
73 for (Instruction
&I
: BB
)
74 if (I
.getOpcode() == Opcode
) {
76 if (CurrNumber
== Number
)
82 void ParseAssembly(const char *IR
) {
84 M
= parseAssemblyString(IR
, Error
, Context
);
86 raw_string_ostream
os(errMsg
);
89 // A failure here means that the test itself is buggy.
91 report_fatal_error(os
.str().c_str());
95 // By semantics source and destination of llvm.memcpy.* intrinsic
96 // are either equal or don't overlap. Once the intrinsic is lowered
97 // to a loop it can be hard or impossible to reason about these facts.
98 // For that reason expandMemCpyAsLoop is expected to explicitly mark
99 // loads from source and stores to destination as not aliasing.
100 TEST_F(MemTransferLowerTest
, MemCpyKnownLength
) {
101 ParseAssembly("declare void @llvm.memcpy.p0i8.p0i8.i64(i8*, i8 *, i64, i1)\n"
102 "define void @foo(i8* %dst, i8* %src, i64 %n) optsize {\n"
104 " %is_not_equal = icmp ne i8* %dst, %src\n"
105 " br i1 %is_not_equal, label %memcpy, label %exit\n"
107 " call void @llvm.memcpy.p0i8.p0i8.i64(i8* %dst, i8* %src, "
108 "i64 1024, i1 false)\n"
114 FunctionPassManager FPM
;
115 FPM
.addPass(ForwardingPass(
116 [=](Function
&F
, FunctionAnalysisManager
&FAM
) -> PreservedAnalyses
{
117 TargetTransformInfo
TTI(M
->getDataLayout());
118 auto *MemCpyBB
= getBasicBlockByName(F
, "memcpy");
119 Instruction
*Inst
= &MemCpyBB
->front();
120 MemCpyInst
*MemCpyI
= cast
<MemCpyInst
>(Inst
);
121 auto &SE
= FAM
.getResult
<ScalarEvolutionAnalysis
>(F
);
122 expandMemCpyAsLoop(MemCpyI
, TTI
, &SE
);
123 auto *CopyLoopBB
= getBasicBlockByName(F
, "load-store-loop");
124 Instruction
*LoadInst
=
125 getInstructionByOpcode(*CopyLoopBB
, Instruction::Load
, 1);
126 EXPECT_NE(nullptr, LoadInst
->getMetadata(LLVMContext::MD_alias_scope
));
127 Instruction
*StoreInst
=
128 getInstructionByOpcode(*CopyLoopBB
, Instruction::Store
, 1);
129 EXPECT_NE(nullptr, StoreInst
->getMetadata(LLVMContext::MD_noalias
));
130 return PreservedAnalyses::none();
132 MPM
.addPass(createModuleToFunctionPassAdaptor(std::move(FPM
)));
137 // This test indirectly checks that loads and stores (generated as a result of
138 // llvm.memcpy lowering) doesn't alias by making sure the loop can be
139 // successfully vectorized without additional runtime checks.
140 TEST_F(MemTransferLowerTest
, VecMemCpyKnownLength
) {
141 ParseAssembly("declare void @llvm.memcpy.p0i8.p0i8.i64(i8*, i8 *, i64, i1)\n"
142 "define void @foo(i8* %dst, i8* %src, i64 %n) optsize {\n"
144 " %is_not_equal = icmp ne i8* %dst, %src\n"
145 " br i1 %is_not_equal, label %memcpy, label %exit\n"
147 " call void @llvm.memcpy.p0i8.p0i8.i64(i8* %dst, i8* %src, "
148 "i64 1024, i1 false)\n"
154 FunctionPassManager FPM
;
155 FPM
.addPass(ForwardingPass(
156 [=](Function
&F
, FunctionAnalysisManager
&FAM
) -> PreservedAnalyses
{
157 TargetTransformInfo
TTI(M
->getDataLayout());
158 auto *MemCpyBB
= getBasicBlockByName(F
, "memcpy");
159 Instruction
*Inst
= &MemCpyBB
->front();
160 MemCpyInst
*MemCpyI
= cast
<MemCpyInst
>(Inst
);
161 auto &SE
= FAM
.getResult
<ScalarEvolutionAnalysis
>(F
);
162 expandMemCpyAsLoop(MemCpyI
, TTI
, &SE
);
163 return PreservedAnalyses::none();
165 FPM
.addPass(LoopVectorizePass(LoopVectorizeOptions()));
166 FPM
.addPass(ForwardingPass(
167 [=](Function
&F
, FunctionAnalysisManager
&FAM
) -> PreservedAnalyses
{
168 auto *TargetBB
= getBasicBlockByName(F
, "vector.body");
169 EXPECT_NE(nullptr, TargetBB
);
170 return PreservedAnalyses::all();
172 MPM
.addPass(createModuleToFunctionPassAdaptor(std::move(FPM
)));
177 TEST_F(MemTransferLowerTest
, AtomicMemCpyKnownLength
) {
178 ParseAssembly("declare void "
179 "@llvm.memcpy.element.unordered.atomic.p0i32.p0i32.i64(i32*, "
181 "define void @foo(i32* %dst, i32* %src, i64 %n) optsize {\n"
183 " %is_not_equal = icmp ne i32* %dst, %src\n"
184 " br i1 %is_not_equal, label %memcpy, label %exit\n"
187 "@llvm.memcpy.element.unordered.atomic.p0i32.p0i32.i64(i32* "
195 FunctionPassManager FPM
;
196 FPM
.addPass(ForwardingPass(
197 [=](Function
&F
, FunctionAnalysisManager
&FAM
) -> PreservedAnalyses
{
198 TargetTransformInfo
TTI(M
->getDataLayout());
199 auto *MemCpyBB
= getBasicBlockByName(F
, "memcpy");
200 Instruction
*Inst
= &MemCpyBB
->front();
201 assert(isa
<AtomicMemCpyInst
>(Inst
) &&
202 "Expecting llvm.memcpy.p0i8.i64 instructon");
203 AtomicMemCpyInst
*MemCpyI
= cast
<AtomicMemCpyInst
>(Inst
);
204 auto &SE
= FAM
.getResult
<ScalarEvolutionAnalysis
>(F
);
205 expandAtomicMemCpyAsLoop(MemCpyI
, TTI
, &SE
);
206 auto *CopyLoopBB
= getBasicBlockByName(F
, "load-store-loop");
207 Instruction
*LoadInst
=
208 getInstructionByOpcode(*CopyLoopBB
, Instruction::Load
, 1);
209 EXPECT_TRUE(LoadInst
->isAtomic());
210 EXPECT_NE(LoadInst
->getMetadata(LLVMContext::MD_alias_scope
), nullptr);
211 Instruction
*StoreInst
=
212 getInstructionByOpcode(*CopyLoopBB
, Instruction::Store
, 1);
213 EXPECT_TRUE(StoreInst
->isAtomic());
214 EXPECT_NE(StoreInst
->getMetadata(LLVMContext::MD_noalias
), nullptr);
215 return PreservedAnalyses::none();
217 MPM
.addPass(createModuleToFunctionPassAdaptor(std::move(FPM
)));
222 TEST_F(MemTransferLowerTest
, AtomicMemCpyUnKnownLength
) {
223 ParseAssembly("declare void "
224 "@llvm.memcpy.element.unordered.atomic.p0i32.p0i32.i64(i32*, "
226 "define void @foo(i32* %dst, i32* %src, i64 %n) optsize {\n"
228 " %is_not_equal = icmp ne i32* %dst, %src\n"
229 " br i1 %is_not_equal, label %memcpy, label %exit\n"
232 "@llvm.memcpy.element.unordered.atomic.p0i32.p0i32.i64(i32* "
240 FunctionPassManager FPM
;
241 FPM
.addPass(ForwardingPass(
242 [=](Function
&F
, FunctionAnalysisManager
&FAM
) -> PreservedAnalyses
{
243 TargetTransformInfo
TTI(M
->getDataLayout());
244 auto *MemCpyBB
= getBasicBlockByName(F
, "memcpy");
245 Instruction
*Inst
= &MemCpyBB
->front();
246 assert(isa
<AtomicMemCpyInst
>(Inst
) &&
247 "Expecting llvm.memcpy.p0i8.i64 instructon");
248 AtomicMemCpyInst
*MemCpyI
= cast
<AtomicMemCpyInst
>(Inst
);
249 auto &SE
= FAM
.getResult
<ScalarEvolutionAnalysis
>(F
);
250 expandAtomicMemCpyAsLoop(MemCpyI
, TTI
, &SE
);
251 auto *CopyLoopBB
= getBasicBlockByName(F
, "loop-memcpy-expansion");
252 Instruction
*LoadInst
=
253 getInstructionByOpcode(*CopyLoopBB
, Instruction::Load
, 1);
254 EXPECT_TRUE(LoadInst
->isAtomic());
255 EXPECT_NE(LoadInst
->getMetadata(LLVMContext::MD_alias_scope
), nullptr);
256 Instruction
*StoreInst
=
257 getInstructionByOpcode(*CopyLoopBB
, Instruction::Store
, 1);
258 EXPECT_TRUE(StoreInst
->isAtomic());
259 EXPECT_NE(StoreInst
->getMetadata(LLVMContext::MD_noalias
), nullptr);
260 return PreservedAnalyses::none();
262 MPM
.addPass(createModuleToFunctionPassAdaptor(std::move(FPM
)));