[ThinLTO] Add code comment. NFC
[llvm-complete.git] / unittests / Support / ItaniumManglingCanonicalizerTest.cpp
blob91432899d1457204968c0208d361a735c41ba930
1 //===-------------- ItaniumManglingCanonicalizerTest.cpp ------------------===//
2 //
3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4 // See https://llvm.org/LICENSE.txt for license information.
5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6 //
7 //===----------------------------------------------------------------------===//
9 #include "llvm/Support/ItaniumManglingCanonicalizer.h"
10 #include "llvm/ADT/ArrayRef.h"
11 #include "llvm/ADT/StringRef.h"
12 #include "gtest/gtest.h"
14 #include <cstdlib>
15 #include <map>
16 #include <vector>
18 using namespace llvm;
20 namespace {
22 using EquivalenceError = llvm::ItaniumManglingCanonicalizer::EquivalenceError;
23 using FragmentKind = llvm::ItaniumManglingCanonicalizer::FragmentKind;
25 struct Equivalence {
26 FragmentKind Kind;
27 llvm::StringRef First;
28 llvm::StringRef Second;
31 // A set of manglings that should all be considered equivalent.
32 using EquivalenceClass = std::vector<llvm::StringRef>;
34 struct Testcase {
35 // A set of equivalences to register.
36 std::vector<Equivalence> Equivalences;
37 // A set of distinct equivalence classes created by registering the
38 // equivalences.
39 std::vector<EquivalenceClass> Classes;
42 // A function that returns a set of test cases.
43 static std::vector<Testcase> getTestcases() {
44 return {
45 // Three different manglings for std::string (old libstdc++, new libstdc++,
46 // libc++).
49 {FragmentKind::Type, "Ss",
50 "NSt3__112basic_stringIcNS_11char_traitsIcEENS_9allocatorIcEEEE"},
51 {FragmentKind::Type, "Ss",
52 "NSt7__cxx1112basic_stringIcSt11char_traitsIcESaIcEEE"},
55 {"_Z1fv"},
56 {"_Z1fSs",
57 "_Z1fNSt3__112basic_stringIcNS_11char_traitsIcEENS_9allocatorIcEEEE",
58 "_Z1fNSt7__cxx1112basic_stringIcSt11char_traitsIcESaIcEEE"},
59 {"_ZNKSs4sizeEv",
60 "_ZNKSt7__cxx1112basic_stringIcSt11char_traitsIcESaIcEE4sizeEv",
61 "_ZNKSt3__112basic_stringIcNS_11char_traitsIcEENS_9allocatorIcEEE4sizeEv"},
65 // Check that substitutions are properly handled.
68 // ::X <-> ::N::X<int>
69 {FragmentKind::Type, "1X", "N1N1XIiEE"},
70 // ::T<T<int, int>, T<int, int>> <-> T<int>
71 {FragmentKind::Type, "1TIS_IiiES0_E", "1TIiE"},
72 // A::B::foo <-> AB::foo
73 {FragmentKind::Name, "N1A1B3fooE", "N2AB3fooE"},
76 {"_Z1f1XPS_RS_", "_Z1fN1N1XIiEEPS1_RS1_"},
77 {"_ZN1A1B3fooE1TIS1_IiiES2_EPS3_RS3_", "_ZN2AB3fooE1TIiEPS1_RS1_"},
81 // Check that nested equivalences are properly handled.
84 // std::__1::char_traits == std::__cxx11::char_traits
85 // (Note that this is unused and should make no difference,
86 // but it should not cause us to fail to match up the cases
87 // below.)
88 {FragmentKind::Name,
89 "NSt3__111char_traitsE",
90 "NSt7__cxx1111char_traitsE"},
91 // std::__1::allocator == std::allocator
92 {FragmentKind::Name,
93 "NSt3__19allocatorE",
94 "Sa"}, // "Sa" is not strictly a <name> but we accept it as one.
95 // std::__1::vector == std::vector
96 {FragmentKind::Name,
97 "St6vector",
98 "NSt3__16vectorE"},
99 // std::__1::basic_string<
100 // char
101 // std::__1::char_traits<char>,
102 // std::__1::allocator<char>> ==
103 // std::__cxx11::basic_string<
104 // char,
105 // std::char_traits<char>,
106 // std::allocator<char>>
107 {FragmentKind::Type,
108 "NSt3__112basic_stringIcNS_11char_traitsIcEENS_9allocatorIcEEEE",
109 "NSt7__cxx1112basic_stringIcSt11char_traitsIcESaIcEEE"},
110 // X<A> <-> X<B>
111 {FragmentKind::Type, "1XI1AE", "1XI1BE"},
112 // X <-> Y
113 {FragmentKind::Name, "1X", "1Y"},
116 // f(std::string)
117 {"_Z1fNSt3__112basic_stringIcNS_11char_traitsIcEENS_9allocatorIcEEEE",
118 "_Z1fNSt7__cxx1112basic_stringIcSt11char_traitsIcESaIcEEE"},
119 // f(std::vector<int>)
120 {"_Z1fSt6vectorIiSaIiEE", "_Z1fNSt3__16vectorIiNS_9allocatorIiEEEE"},
121 // f(X<A>), f(X<B>), f(Y<A>), f(Y<B>)
122 {"_Z1f1XI1AE", "_Z1f1XI1BE", "_Z1f1YI1AE", "_Z1f1YI1BE"},
123 // f(X<C>), f(Y<C>)
124 {"_Z1f1XI1CE", "_Z1f1YI1CE"},
128 // Check namespace equivalences.
131 // std::__1 == std::__cxx11
132 {FragmentKind::Name, "St3__1", "St7__cxx11"},
133 // std::__1::allocator == std::allocator
134 {FragmentKind::Name, "NSt3__19allocatorE", "Sa"},
135 // std::vector == std::__1::vector
136 {FragmentKind::Name, "St6vector", "NSt3__16vectorE"},
137 // std::__cxx11::char_traits == std::char_traits
138 // (This indirectly means that std::__1::char_traits == std::char_traits,
139 // due to the std::__cxx11 == std::__1 equivalence, which is what we rely
140 // on below.)
141 {FragmentKind::Name, "NSt7__cxx1111char_traitsE", "St11char_traits"},
144 // f(std::foo)
145 {"_Z1fNSt7__cxx113fooE",
146 "_Z1fNSt3__13fooE"},
147 // f(std::string)
148 {"_Z1fNSt7__cxx1111char_traitsIcEE",
149 "_Z1fNSt3__111char_traitsIcEE",
150 "_Z1fSt11char_traitsIcE"},
151 // f(std::string)
152 {"_Z1fNSt3__112basic_stringIcNS_11char_traitsIcEENS_9allocatorIcEEEE",
153 "_Z1fNSt7__cxx1112basic_stringIcSt11char_traitsIcESaIcEEE"},
154 // f(std::vector<int>)
155 {"_Z1fSt6vectorIiSaIiEE", "_Z1fNSt3__16vectorIiNS_9allocatorIiEEEE"},
159 // Check namespace equivalences for namespace 'std'. We support using 'St'
160 // for this, despite it not technically being a <name>.
163 // std::__1 == std
164 {FragmentKind::Name, "St3__1", "St"},
165 // std::__1 == std::__cxx11
166 {FragmentKind::Name, "St3__1", "St7__cxx11"},
167 // FIXME: Should a 'std' equivalence also cover the predefined
168 // substitutions?
169 // std::__1::allocator == std::allocator
170 {FragmentKind::Name, "NSt3__19allocatorE", "Sa"},
173 {"_Z1fSt3foo", "_Z1fNSt3__13fooE", "_Z1fNSt7__cxx113fooE"},
174 {"_Z1fNSt3bar3bazE", "_Z1fNSt3__13bar3bazE"},
175 // f(std::string)
176 {"_Z1fNSt3__112basic_stringIcNS_11char_traitsIcEENS_9allocatorIcEEEE",
177 "_Z1fNSt7__cxx1112basic_stringIcSt11char_traitsIcESaIcEEE"},
178 // f(std::vector<int>)
179 {"_Z1fSt6vectorIiSaIiEE", "_Z1fNSt3__16vectorIiNS_9allocatorIiEEEE"},
183 // Check mutually-recursive equivalences.
186 {FragmentKind::Type, "1A", "1B"},
187 {FragmentKind::Type, "1A", "1C"},
188 {FragmentKind::Type, "1D", "1B"},
189 {FragmentKind::Type, "1C", "1E"},
192 {"_Z1f1A", "_Z1f1B", "_Z1f1C", "_Z1f1D", "_Z1f1E"},
193 {"_Z1f1F"},
197 // Check <encoding>s.
200 {FragmentKind::Encoding, "1fv", "1gv"},
203 // f(void) -> g(void)
204 {"_Z1fv", "_Z1gv"},
205 // static local 'n' in f(void) -> static local 'n' in g(void)
206 {"_ZZ1fvE1n", "_ZZ1gvE1n"},
210 // Corner case: the substitution can appear within its own expansion.
213 // X <-> Y<X>
214 {FragmentKind::Type, "1X", "1YI1XE"},
215 // A<B> <-> B
216 {FragmentKind::Type, "1AI1BE", "1B"},
219 // f(X) == f(Y<X>) == f(Y<Y<X>>) == f(Y<Y<Y<X>>>)
220 {"_Z1f1X", "_Z1f1YI1XE", "_Z1f1YIS_I1XEE", "_Z1f1YIS_IS_I1XEEE"},
221 // f(B) == f(A<B>) == f(A<A<B>>) == f(A<A<A<B>>>)
222 {"_Z1f1B", "_Z1f1AI1BE", "_Z1f1AIS_I1BEE", "_Z1f1AIS_IS_I1BEEE"},
226 // Redundant equivalences are accepted (and have no effect).
229 {FragmentKind::Name, "3std", "St"},
230 {FragmentKind::Name, "1X", "1Y"},
231 {FragmentKind::Name, "N1X1ZE", "N1Y1ZE"},
236 // Check that ctor and dtor variants are considered distinct.
239 {{"_ZN1XC1Ev"}, {"_ZN1XC2Ev"}, {"_ZN1XD1Ev"}, {"_ZN1XD2Ev"}}
242 // Ensure array types with and without bounds are handled properly.
245 {FragmentKind::Type, "A_i", "A1_f"},
248 {"_Z1fRA_i", "_Z1fRA_i", "_Z1fRA1_f"},
249 {"_Z1fRA1_i"}, {"_Z1fRA_f"},
255 // A function to get a set of test cases for forward template references.
256 static std::vector<Testcase> getForwardTemplateReferenceTestcases() {
257 return {
258 // ForwardTemplateReference does not support canonicalization.
259 // FIXME: We should consider ways of fixing this, perhaps by eliminating
260 // the ForwardTemplateReference node with a tree transformation.
263 // X::operator T() <with T = A> == Y::operator T() <with T = A>
264 {FragmentKind::Encoding, "N1XcvT_I1AEEv", "N1YcvT_I1AEEv"},
265 // A == B
266 {FragmentKind::Name, "1A", "1B"},
269 // All combinations result in unique equivalence classes.
270 {"_ZN1XcvT_I1AEEv"},
271 {"_ZN1XcvT_I1BEEv"},
272 {"_ZN1YcvT_I1AEEv"},
273 {"_ZN1YcvT_I1BEEv"},
274 // Even giving the same string twice gives a new class.
275 {"_ZN1XcvT_I1AEEv"},
281 template<bool CanonicalizeFirst>
282 static void testTestcases(ArrayRef<Testcase> Testcases) {
283 for (const auto &Testcase : Testcases) {
284 llvm::ItaniumManglingCanonicalizer Canonicalizer;
285 for (const auto &Equiv : Testcase.Equivalences) {
286 auto Result =
287 Canonicalizer.addEquivalence(Equiv.Kind, Equiv.First, Equiv.Second);
288 EXPECT_EQ(Result, EquivalenceError::Success)
289 << "couldn't add equivalence between " << Equiv.First << " and "
290 << Equiv.Second;
293 using CanonKey = llvm::ItaniumManglingCanonicalizer::Key;
295 std::map<const EquivalenceClass*, CanonKey> Keys;
296 if (CanonicalizeFirst)
297 for (const auto &Class : Testcase.Classes)
298 Keys.insert({&Class, Canonicalizer.canonicalize(*Class.begin())});
300 std::map<CanonKey, llvm::StringRef> Found;
301 for (const auto &Class : Testcase.Classes) {
302 CanonKey ClassKey = Keys[&Class];
303 for (llvm::StringRef Str : Class) {
304 // Force a copy to be made when calling lookup to test that it doesn't
305 // retain any part of the provided string.
306 CanonKey ThisKey = CanonicalizeFirst
307 ? Canonicalizer.lookup(std::string(Str))
308 : Canonicalizer.canonicalize(Str);
309 EXPECT_NE(ThisKey, CanonKey()) << "couldn't canonicalize " << Str;
310 if (ClassKey) {
311 EXPECT_EQ(ThisKey, ClassKey)
312 << Str << " not in the same class as " << *Class.begin();
313 } else {
314 ClassKey = ThisKey;
317 EXPECT_TRUE(Found.insert({ClassKey, *Class.begin()}).second)
318 << *Class.begin() << " is in the same class as " << Found[ClassKey];
323 TEST(ItaniumManglingCanonicalizerTest, TestCanonicalize) {
324 testTestcases<false>(getTestcases());
327 TEST(ItaniumManglingCanonicalizerTest, TestLookup) {
328 testTestcases<true>(getTestcases());
331 TEST(ItaniumManglingCanonicalizerTest, TestForwardTemplateReference) {
332 // lookup(...) after canonicalization (intentionally) returns different
333 // values for this testcase.
334 testTestcases<false>(getForwardTemplateReferenceTestcases());
338 TEST(ItaniumManglingCanonicalizerTest, TestInvalidManglings) {
339 llvm::ItaniumManglingCanonicalizer Canonicalizer;
340 EXPECT_EQ(Canonicalizer.addEquivalence(FragmentKind::Type, "", "1X"),
341 EquivalenceError::InvalidFirstMangling);
342 EXPECT_EQ(Canonicalizer.addEquivalence(FragmentKind::Type, "1X", "1ab"),
343 EquivalenceError::InvalidSecondMangling);
344 EXPECT_EQ(Canonicalizer.canonicalize("_Z3fooE"),
345 llvm::ItaniumManglingCanonicalizer::Key());
346 EXPECT_EQ(Canonicalizer.canonicalize("foo"),
347 llvm::ItaniumManglingCanonicalizer::Key());
349 // A reference to a template parameter ('T_' etc) cannot appear in a <name>,
350 // because we don't have template arguments to bind to it. (The arguments in
351 // an 'I ... E' construct in the <name> aren't registered as
352 // backreferenceable arguments in this sense, because they're not part of
353 // the template argument list of an <encoding>.
354 EXPECT_EQ(Canonicalizer.addEquivalence(FragmentKind::Name, "N1XcvT_I1AEE",
355 "1f"),
356 EquivalenceError::InvalidFirstMangling);
359 TEST(ItaniumManglingCanonicalizerTest, TestBadEquivalenceOrder) {
360 llvm::ItaniumManglingCanonicalizer Canonicalizer;
361 EXPECT_EQ(Canonicalizer.addEquivalence(FragmentKind::Type, "N1P1XE", "N1Q1XE"),
362 EquivalenceError::Success);
363 EXPECT_EQ(Canonicalizer.addEquivalence(FragmentKind::Type, "1P", "1Q"),
364 EquivalenceError::ManglingAlreadyUsed);
366 EXPECT_EQ(Canonicalizer.addEquivalence(FragmentKind::Type, "N1C1XE", "N1A1YE"),
367 EquivalenceError::Success);
368 EXPECT_EQ(Canonicalizer.addEquivalence(FragmentKind::Type, "1A", "1B"),
369 EquivalenceError::Success);
370 EXPECT_EQ(Canonicalizer.addEquivalence(FragmentKind::Type, "1C", "1D"),
371 EquivalenceError::Success);
372 EXPECT_EQ(Canonicalizer.addEquivalence(FragmentKind::Type, "1B", "1D"),
373 EquivalenceError::ManglingAlreadyUsed);
376 } // end anonymous namespace