blob: ba0b835ab928c635cd0c36c08700219871b219ae [file] [log] [blame]
Marcel Hlopkoe8f1c4e2021-07-28 18:12:49 +00001// Part of the Crubit project, under the Apache License v2.0 with LLVM
2// Exceptions. See /LICENSE for license information.
3// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
4
Michael Forster500b4762022-01-27 12:30:17 +00005#include "rs_bindings_from_cc/importer.h"
Marcel Hlopkoe8f1c4e2021-07-28 18:12:49 +00006
Marcel Hlopko9c150da2021-11-12 10:30:03 +00007#include <stdint.h>
8
Googler4e1bc132021-12-06 10:10:42 +00009#include <algorithm>
Devin Jeanpierre56777022022-02-03 01:57:15 +000010#include <cstddef>
Marcel Hlopko7d739792021-08-12 07:52:47 +000011#include <memory>
Marcel Hlopko20f4ce42021-11-02 08:20:00 +000012#include <optional>
Marcel Hlopkoe8f1c4e2021-07-28 18:12:49 +000013#include <string>
Michael Forster365bba12022-01-24 16:56:06 +000014#include <tuple>
Marcel Hlopko20f4ce42021-11-02 08:20:00 +000015#include <utility>
Marcel Hlopko7d739792021-08-12 07:52:47 +000016#include <vector>
Marcel Hlopkoe8f1c4e2021-07-28 18:12:49 +000017
Marcel Hlopko80441c12021-11-12 10:43:18 +000018#include "base/logging.h"
Devin Jeanpierred3f959f2021-10-27 18:47:50 +000019#include "rs_bindings_from_cc/ast_convert.h"
Marcel Hlopko80441c12021-11-12 10:43:18 +000020#include "rs_bindings_from_cc/bazel_types.h"
Marcel Hlopko7d739792021-08-12 07:52:47 +000021#include "rs_bindings_from_cc/ir.h"
Marcel Hlopko80441c12021-11-12 10:43:18 +000022#include "third_party/absl/container/flat_hash_map.h"
Marcel Hlopko7d739792021-08-12 07:52:47 +000023#include "third_party/absl/container/flat_hash_set.h"
Marcel Hlopko20f4ce42021-11-02 08:20:00 +000024#include "third_party/absl/status/status.h"
25#include "third_party/absl/status/statusor.h"
26#include "third_party/absl/strings/cord.h"
Lukasz Anforowicz0c816f12021-12-15 17:41:49 +000027#include "third_party/absl/strings/str_cat.h"
Lukasz Anforowiczc4ceb4f2022-01-28 19:29:19 +000028#include "third_party/absl/strings/str_join.h"
Marcel Hlopkoa5f59ae2021-08-24 20:38:04 +000029#include "third_party/absl/strings/string_view.h"
Michael Forster1de27b82021-09-17 07:22:22 +000030#include "third_party/absl/strings/substitute.h"
Marcel Hlopko7d739792021-08-12 07:52:47 +000031#include "third_party/llvm/llvm-project/clang/include/clang/AST/ASTContext.h"
Devin Jeanpierreb69bcae2022-02-03 09:45:50 +000032#include "third_party/llvm/llvm-project/clang/include/clang/AST/Attrs.inc"
Devin Jeanpierre56777022022-02-03 01:57:15 +000033#include "third_party/llvm/llvm-project/clang/include/clang/AST/CXXInheritance.h"
Marcel Hlopkoe8f1c4e2021-07-28 18:12:49 +000034#include "third_party/llvm/llvm-project/clang/include/clang/AST/Decl.h"
Googler2e85f342021-09-17 07:04:07 +000035#include "third_party/llvm/llvm-project/clang/include/clang/AST/DeclCXX.h"
Googler846e1fc2022-01-10 13:14:57 +000036#include "third_party/llvm/llvm-project/clang/include/clang/AST/DeclTemplate.h"
Marcel Hlopko7d739792021-08-12 07:52:47 +000037#include "third_party/llvm/llvm-project/clang/include/clang/AST/Mangle.h"
Michael Forster028800b2021-10-05 12:39:59 +000038#include "third_party/llvm/llvm-project/clang/include/clang/AST/RawCommentList.h"
Googler6986c072021-09-17 13:54:56 +000039#include "third_party/llvm/llvm-project/clang/include/clang/AST/RecordLayout.h"
Marcel Hlopko7d739792021-08-12 07:52:47 +000040#include "third_party/llvm/llvm-project/clang/include/clang/AST/Type.h"
Michael Forster7b628b12022-01-27 17:48:57 +000041#include "third_party/llvm/llvm-project/clang/include/clang/Basic/FileManager.h"
Lukasz Anforowicz49b5bbc2022-02-04 23:40:10 +000042#include "third_party/llvm/llvm-project/clang/include/clang/Basic/OperatorKinds.h"
Michael Forster6a184ad2021-10-12 13:04:05 +000043#include "third_party/llvm/llvm-project/clang/include/clang/Basic/SourceLocation.h"
Michael Forster028800b2021-10-05 12:39:59 +000044#include "third_party/llvm/llvm-project/clang/include/clang/Basic/SourceManager.h"
Googler2e85f342021-09-17 07:04:07 +000045#include "third_party/llvm/llvm-project/clang/include/clang/Basic/Specifiers.h"
Marcel Hlopko20f4ce42021-11-02 08:20:00 +000046#include "third_party/llvm/llvm-project/clang/include/clang/Sema/Sema.h"
Rosica Dejanovskad0fc2942022-01-21 11:26:00 +000047#include "third_party/llvm/llvm-project/llvm/include/llvm/ADT/Optional.h"
Devin Jeanpierre56777022022-02-03 01:57:15 +000048#include "third_party/llvm/llvm-project/llvm/include/llvm/ADT/SmallPtrSet.h"
Marcel Hlopkob4b28742021-09-15 12:45:20 +000049#include "third_party/llvm/llvm-project/llvm/include/llvm/Support/Casting.h"
Lukasz Anforowiczc4ceb4f2022-01-28 19:29:19 +000050#include "third_party/llvm/llvm-project/llvm/include/llvm/Support/Regex.h"
Marcel Hlopkoe8f1c4e2021-07-28 18:12:49 +000051
52namespace rs_bindings_from_cc {
Devin Jeanpierre56777022022-02-03 01:57:15 +000053namespace {
Marcel Hlopkoe8f1c4e2021-07-28 18:12:49 +000054
Michael Forsterb836c582022-01-21 11:20:22 +000055constexpr absl::string_view kTypeStatusPayloadUrl =
Michael Forsterdc683af2021-09-17 08:51:28 +000056 "type.googleapis.com/devtools.rust.cc_interop.rs_binding_from_cc.type";
57
Googler44e3fbc2022-01-11 10:19:26 +000058// A mapping of C++ standard types to their equivalent Rust types.
59// To produce more idiomatic results, these types receive special handling
60// instead of using the generic type mapping mechanism.
Lukasz Anforowiczb22917e2022-02-16 23:49:59 +000061std::optional<absl::string_view> MapKnownCcTypeToRsType(
62 absl::string_view cc_type) {
63 static const auto* const kWellKnownTypes =
64 new absl::flat_hash_map<absl::string_view, absl::string_view>({
65 {"ptrdiff_t", "isize"},
66 {"intptr_t", "isize"},
67 {"size_t", "usize"},
68 {"uintptr_t", "usize"},
69 {"std::ptrdiff_t", "isize"},
70 {"std::intptr_t", "isize"},
71 {"std::size_t", "usize"},
72 {"std::uintptr_t", "usize"},
Googler4e504882022-01-13 10:03:19 +000073
Lukasz Anforowiczb22917e2022-02-16 23:49:59 +000074 {"int8_t", "i8"},
75 {"int16_t", "i16"},
76 {"int32_t", "i32"},
77 {"int64_t", "i64"},
78 {"std::int8_t", "i8"},
79 {"std::int16_t", "i16"},
80 {"std::int32_t", "i32"},
81 {"std::int64_t", "i64"},
Googler4e504882022-01-13 10:03:19 +000082
Lukasz Anforowiczb22917e2022-02-16 23:49:59 +000083 {"uint8_t", "u8"},
84 {"uint16_t", "u16"},
85 {"uint32_t", "u32"},
Devin Jeanpierre56777022022-02-03 01:57:15 +000086
Lukasz Anforowiczb22917e2022-02-16 23:49:59 +000087 {"uint64_t", "u64"},
88 {"std::uint8_t", "u8"},
89 {"std::uint16_t", "u16"},
90 {"std::uint32_t", "u32"},
91 {"std::uint64_t", "u64"},
Googler4e504882022-01-13 10:03:19 +000092
Lukasz Anforowiczb22917e2022-02-16 23:49:59 +000093 {"char16_t", "u16"},
94 {"char32_t", "u32"},
95 {"wchar_t", "i32"},
96 });
97 auto it = kWellKnownTypes->find(cc_type);
98 if (it == kWellKnownTypes->end()) return std::nullopt;
99 return it->second;
100}
Googler44e3fbc2022-01-11 10:19:26 +0000101
Devin Jeanpierre56777022022-02-03 01:57:15 +0000102DeclId GenerateDeclId(const clang::Decl* decl) {
Marcel Hlopko9c150da2021-11-12 10:30:03 +0000103 return DeclId(reinterpret_cast<uintptr_t>(decl->getCanonicalDecl()));
104}
105
Devin Jeanpierre56777022022-02-03 01:57:15 +0000106std::vector<BaseClass> GetUnambiguousPublicBases(
Devin Jeanpierred652d932022-02-03 08:55:33 +0000107 const clang::CXXRecordDecl& record_decl, const clang::ASTContext& ctx) {
Devin Jeanpierre56777022022-02-03 01:57:15 +0000108 // This function is unfortunate: the only way to correctly get information
109 // about the bases is lookupInBases. It runs a complex O(N^3) algorithm for
110 // e.g. correctly determining virtual base paths, etc.
111 //
112 // However, lookupInBases does not recurse into a class once it's found.
113 // So we need to call lookupInBases once per class, making this O(N^4).
114
115 llvm::SmallPtrSet<const clang::CXXRecordDecl*, 4> seen;
116 std::vector<BaseClass> bases;
117 clang::CXXBasePaths paths;
118 // the const cast is a common pattern, apparently, see e.g.
119 // https://clang.llvm.org/doxygen/CXXInheritance_8cpp_source.html#l00074
Devin Jeanpierred652d932022-02-03 08:55:33 +0000120 paths.setOrigin(const_cast<clang::CXXRecordDecl*>(&record_decl));
Devin Jeanpierre56777022022-02-03 01:57:15 +0000121
122 auto next_class = [&]() {
123 const clang::CXXRecordDecl* found = nullptr;
124
125 // Matches the first new class it encounters (and adds it to `seen`, so
126 // that future runs don't rediscover it.)
127 auto is_new_class = [&](const clang::CXXBaseSpecifier* base_specifier,
128 clang::CXXBasePath&) {
129 const auto* record_decl = base_specifier->getType()->getAsCXXRecordDecl();
130 if (found) {
131 return record_decl == found;
132 }
133
134 if (record_decl && seen.insert(record_decl).second) {
135 found = record_decl;
136 return true;
137 }
138 return false;
139 };
Devin Jeanpierred652d932022-02-03 08:55:33 +0000140 return record_decl.lookupInBases(is_new_class, paths);
Devin Jeanpierre56777022022-02-03 01:57:15 +0000141 };
142
143 for (; next_class(); paths.clear()) {
144 for (const clang::CXXBasePath& path : paths) {
145 if (path.Access != clang::AS_public) {
146 continue;
147 }
148 const clang::CXXBaseSpecifier& base_specifier =
149 *path[path.size() - 1].Base;
150 const clang::QualType& base = base_specifier.getType();
151 if (paths.isAmbiguous(ctx.getCanonicalType(base))) {
152 continue;
153 }
154 const clang::CXXRecordDecl* base_record_decl =
155 ABSL_DIE_IF_NULL(base_specifier.getType()->getAsCXXRecordDecl());
156 std::optional<int64_t> offset = {0};
157 for (const clang::CXXBasePathElement& base_path_element : path) {
158 if (base_path_element.Base->isVirtual()) {
159 offset = std::nullopt;
160 break;
161 }
162 *offset +=
163 {ctx.getASTRecordLayout(base_path_element.Class)
164 .getBaseClassOffset(ABSL_DIE_IF_NULL(
165 base_path_element.Base->getType()->getAsCXXRecordDecl()))
166 .getQuantity()};
167 }
168 DCHECK(!offset.has_value() || *offset >= 0)
169 << "Concrete base classes should have non-negative offsets.";
170 bases.push_back(
171 BaseClass{.base_record_id = GenerateDeclId(base_record_decl),
172 .offset = offset});
173 break;
174 }
175 }
176 return bases;
177}
178} // namespace
179
Michael Forster7b628b12022-01-27 17:48:57 +0000180std::vector<clang::RawComment*> Importer::ImportFreeComments() {
Michael Forstera49d2e62022-01-28 07:26:40 +0000181 clang::SourceManager& sm = ctx_.getSourceManager();
Michael Forster7b628b12022-01-27 17:48:57 +0000182
183 // We put all comments into an ordered set in source order. Later we'll remove
184 // the comments that we don't want or that we get by other means.
185 auto source_order = [&sm](const clang::SourceLocation& a,
186 const clang::SourceLocation& b) {
187 return b.isValid() && (a.isInvalid() || sm.isBeforeInTranslationUnit(a, b));
188 };
189 auto ordered_comments = std::map<clang::SourceLocation, clang::RawComment*,
190 decltype(source_order)>(source_order);
191
Michael Forstera49d2e62022-01-28 07:26:40 +0000192 // We start off by getting the comments from all entry header files...
193 for (const auto& header : invocation_.entry_headers_) {
Michael Forster7b628b12022-01-27 17:48:57 +0000194 if (auto file = sm.getFileManager().getFile(header.IncludePath())) {
Michael Forstera49d2e62022-01-28 07:26:40 +0000195 if (auto comments = ctx_.Comments.getCommentsInFile(
Michael Forster7b628b12022-01-27 17:48:57 +0000196 sm.getOrCreateFileID(*file, clang::SrcMgr::C_User))) {
197 for (const auto& [_, comment] : *comments) {
198 ordered_comments.insert({comment->getBeginLoc(), comment});
199 }
200 }
201 }
202 }
203
204 // ... and then we remove those that "conflict" with an IR item.
205 for (const auto& [decl, result] : lookup_cache_) {
206 if (result.item()) {
207 // Remove doc comments of imported items.
Michael Forstera49d2e62022-01-28 07:26:40 +0000208 if (auto raw_comment = ctx_.getRawCommentForDeclNoCache(decl)) {
Michael Forster7b628b12022-01-27 17:48:57 +0000209 ordered_comments.erase(raw_comment->getBeginLoc());
210 }
211 // Remove comments that are within a visited decl.
212 // TODO(forster): We should retain floating comments in decls like
213 // records and namespaces.
214 ordered_comments.erase(ordered_comments.lower_bound(decl->getBeginLoc()),
215 ordered_comments.upper_bound(decl->getEndLoc()));
216 }
217 }
218
219 // Return the remaining comments as a `std::vector`.
220 std::vector<clang::RawComment*> result;
221 result.reserve(ordered_comments.size());
222 for (auto& [_, comment] : ordered_comments) {
223 result.push_back(comment);
224 }
225 return result;
226}
227
Lukasz Anforowicz49b5bbc2022-02-04 23:40:10 +0000228// Multiple IR items can be associated with the same source location (e.g. the
229// implicitly defined constructors and assignment operators). To produce
230// deterministic output, we order such items based on GetDeclOrder. The order
231// is somewhat arbitrary, but we still try to make it aesthetically pleasing
232// (e.g. constructors go before assignment operators; default constructor goes
233// first, etc.).
234static int GetDeclOrder(const clang::Decl* decl) {
235 if (clang::isa<clang::RecordDecl>(decl)) {
236 return decl->getDeclContext()->isRecord() ? 101 : 100;
237 }
238
239 if (auto* ctor = clang::dyn_cast<clang::CXXConstructorDecl>(decl)) {
240 return ctor->isDefaultConstructor() ? 202
241 : ctor->isCopyConstructor() ? 203
242 : ctor->isMoveConstructor() ? 204
243 : 299;
244 }
245
246 if (clang::isa<clang::CXXDestructorDecl>(decl)) {
247 return 306;
248 }
249
250 if (auto* method = clang::dyn_cast<clang::CXXMethodDecl>(decl)) {
251 return method->isCopyAssignmentOperator() ? 401
252 : method->isMoveAssignmentOperator() ? 402
253 : 499;
254 }
255
256 return 999;
257}
258
Michael Forstera49d2e62022-01-28 07:26:40 +0000259void Importer::Import(clang::TranslationUnitDecl* translation_unit_decl) {
260 ImportDeclsFromDeclContext(translation_unit_decl);
261
Lukasz Anforowiczbdf70d32022-01-26 19:06:21 +0000262 using OrderedItem = std::tuple<clang::SourceRange, int, IR::Item>;
Michael Forstera49d2e62022-01-28 07:26:40 +0000263 clang::SourceManager& sm = ctx_.getSourceManager();
Lukasz Anforowiczbdf70d32022-01-26 19:06:21 +0000264 auto is_less_than = [&sm](const OrderedItem& a, const OrderedItem& b) {
265 auto a_range = std::get<0>(a);
266 auto b_range = std::get<0>(b);
Lukasz Anforowiczbdf70d32022-01-26 19:06:21 +0000267 if (!a_range.isValid() || !b_range.isValid()) {
268 if (a_range.isValid() != b_range.isValid())
269 return !a_range.isValid() && b_range.isValid();
270 } else {
271 if (a_range.getBegin() != b_range.getBegin()) {
272 return sm.isBeforeInTranslationUnit(a_range.getBegin(),
273 b_range.getBegin());
274 }
275 if (a_range.getEnd() != b_range.getEnd()) {
276 return sm.isBeforeInTranslationUnit(a_range.getEnd(), b_range.getEnd());
277 }
278 }
Lukasz Anforowicz49b5bbc2022-02-04 23:40:10 +0000279
280 auto a_decl_order = std::get<1>(a);
281 auto b_decl_order = std::get<1>(b);
282 if (a_decl_order != b_decl_order) return a_decl_order < b_decl_order;
283
284 // A single FunctionDecl can be associated with multiple UnsupportedItems.
285 // Comparing the fields allows deterministic order between items like:
286 // Non-trivial_abi type '...' is not supported by value as a parameter.
287 // Non-trivial_abi type '...' is not supported by value as a return type.
288 const auto& a_variant = std::get<2>(a);
289 const auto& b_variant = std::get<2>(b);
290 const auto* a_unsupported = std::get_if<UnsupportedItem>(&a_variant);
291 const auto* b_unsupported = std::get_if<UnsupportedItem>(&b_variant);
292 if (a_unsupported && b_unsupported) {
293 if (a_unsupported->name != b_unsupported->name)
294 return a_unsupported->name < b_unsupported->name;
295 return a_unsupported->message < b_unsupported->message;
296 }
297
298 return false;
299 };
300 auto are_equal = [&is_less_than](const OrderedItem& a, const OrderedItem& b) {
301 return !is_less_than(a, b) && !is_less_than(b, a);
Lukasz Anforowiczbdf70d32022-01-26 19:06:21 +0000302 };
Michael Forster365bba12022-01-24 16:56:06 +0000303
304 // We emit IR items in the order of the decls they were generated for.
305 // For decls that emit multiple items we use a stable, but arbitrary order.
Lukasz Anforowiczbdf70d32022-01-26 19:06:21 +0000306 std::vector<OrderedItem> items;
Michael Forster500b4762022-01-27 12:30:17 +0000307 for (const auto& [decl, result] : lookup_cache_) {
Michael Forster500b4762022-01-27 12:30:17 +0000308 auto item = result.item();
309 if (item) {
Michael Forster365bba12022-01-24 16:56:06 +0000310 items.push_back(
Lukasz Anforowicz49b5bbc2022-02-04 23:40:10 +0000311 std::make_tuple(decl->getSourceRange(), GetDeclOrder(decl), *item));
Michael Forster500b4762022-01-27 12:30:17 +0000312 }
313 if (IsFromCurrentTarget(decl)) {
Lukasz Anforowicz49b5bbc2022-02-04 23:40:10 +0000314 std::string name = "unnamed";
315 if (const auto* named_decl = clang::dyn_cast<clang::NamedDecl>(decl)) {
316 name = named_decl->getQualifiedNameAsString();
317 }
318 SourceLoc source_loc = ConvertSourceLocation(decl->getBeginLoc());
Michael Forster500b4762022-01-27 12:30:17 +0000319 for (const auto& error : result.errors()) {
Michael Forster500b4762022-01-27 12:30:17 +0000320 items.push_back(std::make_tuple(
Lukasz Anforowicz49b5bbc2022-02-04 23:40:10 +0000321 decl->getSourceRange(), GetDeclOrder(decl),
Michael Forster500b4762022-01-27 12:30:17 +0000322 UnsupportedItem{
Lukasz Anforowicz49b5bbc2022-02-04 23:40:10 +0000323 .name = name, .message = error, .source_loc = source_loc}));
Michael Forster500b4762022-01-27 12:30:17 +0000324 }
Michael Forster365bba12022-01-24 16:56:06 +0000325 }
326 }
Michael Forster500b4762022-01-27 12:30:17 +0000327
Michael Forster7b628b12022-01-27 17:48:57 +0000328 for (auto comment : ImportFreeComments()) {
Michael Forster365bba12022-01-24 16:56:06 +0000329 items.push_back(std::make_tuple(
Lukasz Anforowicz49b5bbc2022-02-04 23:40:10 +0000330 comment->getSourceRange(), 0 /* decl_order */,
Michael Forster365bba12022-01-24 16:56:06 +0000331 Comment{.text = comment->getFormattedText(sm, sm.getDiagnostics())}));
332 }
Lukasz Anforowicz49b5bbc2022-02-04 23:40:10 +0000333 std::sort(items.begin(), items.end(), is_less_than);
Michael Forster365bba12022-01-24 16:56:06 +0000334
Lukasz Anforowicz49b5bbc2022-02-04 23:40:10 +0000335 for (size_t i = 0; i < items.size(); i++) {
336 const auto& item = items[i];
337 if (i > 0) {
338 const auto& prev = items[i - 1];
339 if (are_equal(item, prev)) {
340 std::string prev_json =
341 std::visit([&](auto&& item) { return item.ToJson().dump(); },
342 std::get<2>(prev));
343 std::string curr_json =
344 std::visit([&](auto&& item) { return item.ToJson().dump(); },
345 std::get<2>(item));
346 if (prev_json != curr_json) {
347 LOG(FATAL) << "Non-deterministic order of IR items: " << prev_json
348 << " -VS- " << curr_json;
349 } else {
350 // TODO(lukasza): Avoid generating duplicate IR items. Currently
351 // known example: UnsupportedItem: name=std::signbit; message=
352 // Items contained in namespaces are not supported yet.
353 LOG(WARNING) << "Duplicated IR item: " << curr_json;
354 continue;
355 }
356 }
357 }
Michael Forstera49d2e62022-01-28 07:26:40 +0000358 invocation_.ir_.items.push_back(std::get<2>(item));
Michael Forster365bba12022-01-24 16:56:06 +0000359 }
360}
361
Michael Forster500b4762022-01-27 12:30:17 +0000362void Importer::ImportDeclsFromDeclContext(
363 const clang::DeclContext* decl_context) {
364 for (auto decl : decl_context->decls()) {
Michael Forster500b4762022-01-27 12:30:17 +0000365 LookupDecl(decl->getCanonicalDecl());
366
367 if (auto* nested_context = clang::dyn_cast<clang::DeclContext>(decl)) {
368 if (nested_context->isNamespace())
369 ImportDeclsFromDeclContext(nested_context);
370 }
371 }
372}
373
374Importer::LookupResult Importer::LookupDecl(clang::Decl* decl) {
375 if (!lookup_cache_.contains(decl)) {
376 lookup_cache_.insert({decl, ImportDecl(decl)});
377 }
378
379 return lookup_cache_[decl];
380}
381
382Importer::LookupResult Importer::ImportDecl(clang::Decl* decl) {
383 if (decl->getDeclContext()->isNamespace()) {
384 return LookupResult("Items contained in namespaces are not supported yet");
385 }
386
387 if (auto* function_decl = clang::dyn_cast<clang::FunctionDecl>(decl)) {
388 return ImportFunction(function_decl);
389 } else if (auto* function_template_decl =
390 clang::dyn_cast<clang::FunctionTemplateDecl>(decl)) {
391 return ImportFunction(function_template_decl->getTemplatedDecl());
Devin Jeanpierred652d932022-02-03 08:55:33 +0000392 } else if (auto* record_decl = clang::dyn_cast<clang::CXXRecordDecl>(decl)) {
Michael Forster500b4762022-01-27 12:30:17 +0000393 auto result = ImportRecord(record_decl);
394 // TODO(forster): Should we even visit the nested decl if we couldn't
395 // import the parent? For now we have tests that check that we generate
396 // error messages for those decls, so we're visiting.
397 ImportDeclsFromDeclContext(record_decl);
398 return result;
399 } else if (auto* typedef_name_decl =
400 clang::dyn_cast<clang::TypedefNameDecl>(decl)) {
401 return ImportTypedefName(typedef_name_decl);
402 } else if (clang::isa<clang::ClassTemplateDecl>(decl)) {
403 return LookupResult("Class templates are not supported yet");
404 } else {
405 return LookupResult();
406 }
407}
408
409Importer::LookupResult Importer::ImportFunction(
410 clang::FunctionDecl* function_decl) {
411 if (!IsFromCurrentTarget(function_decl)) return LookupResult();
412 if (function_decl->isDeleted()) return LookupResult();
Marcel Hlopko3df195b2022-01-26 14:15:03 +0000413 if (function_decl->isTemplated()) {
Michael Forster500b4762022-01-27 12:30:17 +0000414 return LookupResult("Function templates are not supported yet");
Marcel Hlopko3df195b2022-01-26 14:15:03 +0000415 }
Marcel Hlopko36ced2d2021-12-02 10:47:37 +0000416
Googler4e1bc132021-12-06 10:10:42 +0000417 devtools_rust::LifetimeSymbolTable lifetime_symbol_table;
418 llvm::Expected<devtools_rust::FunctionLifetimes> lifetimes =
Michael Forstera49d2e62022-01-28 07:26:40 +0000419 devtools_rust::GetLifetimeAnnotations(function_decl,
420 *invocation_.lifetime_context_,
Googler4e1bc132021-12-06 10:10:42 +0000421 &lifetime_symbol_table);
422 llvm::DenseSet<devtools_rust::Lifetime> all_lifetimes;
423
Marcel Hlopko7d739792021-08-12 07:52:47 +0000424 std::vector<FuncParam> params;
Lukasz Anforowicz49b5bbc2022-02-04 23:40:10 +0000425 std::set<std::string> errors;
426 auto add_error = [&errors, function_decl](std::string msg) {
427 auto result = errors.insert(std::move(msg));
428 CHECK(result.second) << "Duplicated error message for "
429 << function_decl->getNameAsString() << ": "
430 << *result.first;
431 };
Michael Forster500b4762022-01-27 12:30:17 +0000432 if (auto* method_decl =
433 clang::dyn_cast<clang::CXXMethodDecl>(function_decl)) {
Marcel Hlopkoa5a18732022-01-27 09:58:53 +0000434 if (!known_type_decls_.contains(
435 method_decl->getParent()->getCanonicalDecl())) {
Michael Forster500b4762022-01-27 12:30:17 +0000436 return LookupResult("Couldn't import the parent");
Marcel Hlopkoa5a18732022-01-27 09:58:53 +0000437 }
438
439 // non-static member functions receive an implicit `this` parameter.
Devin Jeanpierred4dde0e2021-10-13 20:48:25 +0000440 if (method_decl->isInstance()) {
Googler4e1bc132021-12-06 10:10:42 +0000441 std::optional<devtools_rust::TypeLifetimes> this_lifetimes;
442 if (lifetimes) {
443 this_lifetimes = lifetimes->this_lifetimes;
444 all_lifetimes.insert(this_lifetimes->begin(), this_lifetimes->end());
445 }
446 auto param_type = ConvertType(method_decl->getThisType(), this_lifetimes,
447 /*nullable=*/false);
Devin Jeanpierred4dde0e2021-10-13 20:48:25 +0000448 if (!param_type.ok()) {
Lukasz Anforowicz49b5bbc2022-02-04 23:40:10 +0000449 add_error(absl::StrCat("`this` parameter is not supported: ",
450 param_type.status().message()));
Devin Jeanpierrefecf5472021-10-27 10:52:30 +0000451 } else {
452 params.push_back({*std::move(param_type), Identifier("__this")});
Devin Jeanpierred4dde0e2021-10-13 20:48:25 +0000453 }
Devin Jeanpierred4dde0e2021-10-13 20:48:25 +0000454 }
455 }
Michael Forster523dbd42021-10-12 11:05:44 +0000456
Googler4e1bc132021-12-06 10:10:42 +0000457 if (lifetimes) {
458 CHECK_EQ(lifetimes->param_lifetimes.size(), function_decl->getNumParams());
459 }
460 for (unsigned i = 0; i < function_decl->getNumParams(); ++i) {
461 const clang::ParmVarDecl* param = function_decl->getParamDecl(i);
462 std::optional<devtools_rust::TypeLifetimes> param_lifetimes;
463 if (lifetimes) {
464 param_lifetimes = lifetimes->param_lifetimes[i];
465 all_lifetimes.insert(param_lifetimes->begin(), param_lifetimes->end());
466 }
467 auto param_type = ConvertType(param->getType(), param_lifetimes);
Michael Forsterdc683af2021-09-17 08:51:28 +0000468 if (!param_type.ok()) {
Lukasz Anforowicz49b5bbc2022-02-04 23:40:10 +0000469 add_error(absl::Substitute("Parameter #$0 is not supported: $1", i,
470 param_type.status().message()));
Michael Forster523dbd42021-10-12 11:05:44 +0000471 continue;
Michael Forster1de27b82021-09-17 07:22:22 +0000472 }
Devin Jeanpierrebf0d5602021-10-13 20:47:39 +0000473
474 if (const clang::RecordType* record_type =
Michael Forster500b4762022-01-27 12:30:17 +0000475 clang::dyn_cast<clang::RecordType>(param->getType())) {
Devin Jeanpierrebf0d5602021-10-13 20:47:39 +0000476 if (clang::RecordDecl* record_decl =
Michael Forster500b4762022-01-27 12:30:17 +0000477 clang::dyn_cast<clang::RecordDecl>(record_type->getDecl())) {
Devin Jeanpierrebf0d5602021-10-13 20:47:39 +0000478 // TODO(b/200067242): non-trivial_abi structs, when passed by value,
479 // have a different representation which needs special support. We
480 // currently do not support it.
481 if (!record_decl->canPassInRegisters()) {
Lukasz Anforowicz49b5bbc2022-02-04 23:40:10 +0000482 add_error(
Marcel Hlopko3df72542021-11-30 09:38:36 +0000483 absl::Substitute("Non-trivial_abi type '$0' is not "
Lukasz Anforowicz49b5bbc2022-02-04 23:40:10 +0000484 "supported by value as parameter #$1",
485 param->getType().getAsString(), i));
Devin Jeanpierrebf0d5602021-10-13 20:47:39 +0000486 }
487 }
488 }
489
Devin Jeanpierref2ec8712021-10-13 20:47:16 +0000490 std::optional<Identifier> param_name = GetTranslatedIdentifier(param);
Lukasz Anforowicz0c816f12021-12-15 17:41:49 +0000491 CHECK(param_name.has_value()); // No known cases where the above can fail.
Devin Jeanpierree78b2fb2021-10-05 11:40:33 +0000492 params.push_back({*param_type, *std::move(param_name)});
Marcel Hlopko7d739792021-08-12 07:52:47 +0000493 }
494
Devin Jeanpierrebf0d5602021-10-13 20:47:39 +0000495 if (const clang::RecordType* record_return_type =
Michael Forster500b4762022-01-27 12:30:17 +0000496 clang::dyn_cast<clang::RecordType>(function_decl->getReturnType())) {
Devin Jeanpierrebf0d5602021-10-13 20:47:39 +0000497 if (clang::RecordDecl* record_decl =
Michael Forster500b4762022-01-27 12:30:17 +0000498 clang::dyn_cast<clang::RecordDecl>(record_return_type->getDecl())) {
Devin Jeanpierrebf0d5602021-10-13 20:47:39 +0000499 // TODO(b/200067242): non-trivial_abi structs, when passed by value,
500 // have a different representation which needs special support. We
501 // currently do not support it.
502 if (!record_decl->canPassInRegisters()) {
Lukasz Anforowicz49b5bbc2022-02-04 23:40:10 +0000503 add_error(
Marcel Hlopko3df72542021-11-30 09:38:36 +0000504 absl::Substitute("Non-trivial_abi type '$0' is not supported "
505 "by value as a return type",
Michael Forster500b4762022-01-27 12:30:17 +0000506 function_decl->getReturnType().getAsString()));
Devin Jeanpierrebf0d5602021-10-13 20:47:39 +0000507 }
508 }
509 }
510
Googler4e1bc132021-12-06 10:10:42 +0000511 std::optional<devtools_rust::TypeLifetimes> return_lifetimes;
512 if (lifetimes) {
513 return_lifetimes = lifetimes->return_lifetimes;
514 all_lifetimes.insert(return_lifetimes->begin(), return_lifetimes->end());
515 }
516 auto return_type =
517 ConvertType(function_decl->getReturnType(), return_lifetimes);
Michael Forsterdc683af2021-09-17 08:51:28 +0000518 if (!return_type.ok()) {
Lukasz Anforowicz49b5bbc2022-02-04 23:40:10 +0000519 add_error(absl::StrCat("Return type is not supported: ",
520 return_type.status().message()));
Michael Forster1de27b82021-09-17 07:22:22 +0000521 }
Devin Jeanpierrec6877bb2021-10-13 20:47:54 +0000522
Googler4e1bc132021-12-06 10:10:42 +0000523 std::vector<Lifetime> lifetime_params;
524 for (devtools_rust::Lifetime lifetime : all_lifetimes) {
525 std::optional<llvm::StringRef> name =
526 lifetime_symbol_table.LookupLifetime(lifetime);
527 CHECK(name.has_value());
528 lifetime_params.push_back(
529 {.name = name->str(), .id = LifetimeId(lifetime.Id())});
530 }
531 std::sort(
532 lifetime_params.begin(), lifetime_params.end(),
533 [](const Lifetime& l1, const Lifetime& l2) { return l1.name < l2.name; });
534
Devin Jeanpierrec6877bb2021-10-13 20:47:54 +0000535 std::optional<MemberFuncMetadata> member_func_metadata;
Michael Forster500b4762022-01-27 12:30:17 +0000536 if (auto* method_decl =
537 clang::dyn_cast<clang::CXXMethodDecl>(function_decl)) {
Lukasz Anforowicz57331cf2021-12-16 02:57:19 +0000538 switch (method_decl->getAccess()) {
539 case clang::AS_public:
540 break;
541 case clang::AS_protected:
542 case clang::AS_private:
543 case clang::AS_none:
544 // No need for IR to include Func representing private methods.
545 // TODO(lukasza): Revisit this for protected methods.
Michael Forster500b4762022-01-27 12:30:17 +0000546 return LookupResult();
Lukasz Anforowicz57331cf2021-12-16 02:57:19 +0000547 }
Devin Jeanpierre96839c12021-12-14 00:27:38 +0000548 std::optional<MemberFuncMetadata::InstanceMethodMetadata> instance_metadata;
549 if (method_decl->isInstance()) {
550 MemberFuncMetadata::ReferenceQualification reference;
551 switch (method_decl->getRefQualifier()) {
552 case clang::RQ_LValue:
553 reference = MemberFuncMetadata::kLValue;
554 break;
555 case clang::RQ_RValue:
556 reference = MemberFuncMetadata::kRValue;
557 break;
558 case clang::RQ_None:
559 reference = MemberFuncMetadata::kUnqualified;
560 break;
Devin Jeanpierrec6877bb2021-10-13 20:47:54 +0000561 }
Devin Jeanpierre96839c12021-12-14 00:27:38 +0000562 instance_metadata = MemberFuncMetadata::InstanceMethodMetadata{
563 .reference = reference,
564 .is_const = method_decl->isConst(),
565 .is_virtual = method_decl->isVirtual(),
Lukasz Anforowicz71716b72022-01-26 17:05:05 +0000566 .is_explicit_ctor = false,
Devin Jeanpierre96839c12021-12-14 00:27:38 +0000567 };
Lukasz Anforowicz71716b72022-01-26 17:05:05 +0000568 if (auto* ctor_decl =
Michael Forster500b4762022-01-27 12:30:17 +0000569 clang::dyn_cast<clang::CXXConstructorDecl>(function_decl)) {
Lukasz Anforowicz71716b72022-01-26 17:05:05 +0000570 instance_metadata->is_explicit_ctor = ctor_decl->isExplicit();
571 }
Devin Jeanpierrec6877bb2021-10-13 20:47:54 +0000572 }
Devin Jeanpierre96839c12021-12-14 00:27:38 +0000573
574 member_func_metadata = MemberFuncMetadata{
575 .record_id = GenerateDeclId(method_decl->getParent()),
576 .instance_method_metadata = instance_metadata};
Devin Jeanpierrec6877bb2021-10-13 20:47:54 +0000577 }
578
Michael Forster500b4762022-01-27 12:30:17 +0000579 if (!errors.empty()) {
580 return LookupResult(errors);
581 }
582
Devin Jeanpierref2ec8712021-10-13 20:47:16 +0000583 std::optional<UnqualifiedIdentifier> translated_name =
584 GetTranslatedName(function_decl);
Michael Forster277ff952022-01-27 18:14:56 +0000585 CHECK(return_type.ok()); // Silence ClangTidy, checked above.
Michael Forster500b4762022-01-27 12:30:17 +0000586 if (translated_name.has_value()) {
587 return LookupResult(Func{
Devin Jeanpierref2ec8712021-10-13 20:47:16 +0000588 .name = *translated_name,
Marcel Hlopko80441c12021-11-12 10:43:18 +0000589 .owning_target = GetOwningTarget(function_decl),
Michael Forster523dbd42021-10-12 11:05:44 +0000590 .doc_comment = GetComment(function_decl),
591 .mangled_name = GetMangledName(function_decl),
592 .return_type = *return_type,
593 .params = std::move(params),
Googler4e1bc132021-12-06 10:10:42 +0000594 .lifetime_params = std::move(lifetime_params),
Michael Forster523dbd42021-10-12 11:05:44 +0000595 .is_inline = function_decl->isInlined(),
Devin Jeanpierrec6877bb2021-10-13 20:47:54 +0000596 .member_func_metadata = std::move(member_func_metadata),
Googler95f29a12022-01-07 07:47:26 +0000597 .source_loc = ConvertSourceLocation(function_decl->getBeginLoc()),
Michael Forster523dbd42021-10-12 11:05:44 +0000598 });
Devin Jeanpierree78b2fb2021-10-05 11:40:33 +0000599 }
Michael Forster500b4762022-01-27 12:30:17 +0000600 return LookupResult();
Marcel Hlopkoe8f1c4e2021-07-28 18:12:49 +0000601}
602
Michael Forster500b4762022-01-27 12:30:17 +0000603BlazeLabel Importer::GetOwningTarget(const clang::Decl* decl) const {
Michael Forstera49d2e62022-01-28 07:26:40 +0000604 clang::SourceManager& source_manager = ctx_.getSourceManager();
Rosica Dejanovskad0fc2942022-01-21 11:26:00 +0000605 auto source_location = decl->getLocation();
Marcel Hlopko80441c12021-11-12 10:43:18 +0000606
Rosica Dejanovskad0fc2942022-01-21 11:26:00 +0000607 // If the header this decl comes from is not associated with a target we
608 // consider it a textual header. In that case we go up the include stack
609 // until we find a header that has an owning target.
610
Rosica Dejanovska381d1032022-02-03 22:19:54 +0000611 while (source_location.isValid()) {
Rosica Dejanovska503d7dd2022-02-01 20:37:49 +0000612 if (source_location.isMacroID()) {
613 source_location = source_manager.getExpansionLoc(source_location);
614 }
615 auto id = source_manager.getFileID(source_location);
Rosica Dejanovskad0fc2942022-01-21 11:26:00 +0000616 llvm::Optional<llvm::StringRef> filename =
617 source_manager.getNonBuiltinFilenameForID(id);
618 if (!filename) {
619 return BlazeLabel("//:builtin");
620 }
621 if (filename->startswith("./")) {
622 filename = filename->substr(2);
623 }
Michael Forstera49d2e62022-01-28 07:26:40 +0000624
625 if (auto target = invocation_.header_target(HeaderName(filename->str()))) {
626 return *target;
Rosica Dejanovskad0fc2942022-01-21 11:26:00 +0000627 }
628 source_location = source_manager.getIncludeLoc(id);
Marcel Hlopko4c660dd2021-12-02 09:52:47 +0000629 }
Rosica Dejanovskad0fc2942022-01-21 11:26:00 +0000630
631 return BlazeLabel("//:virtual_clang_resource_dir_target");
Marcel Hlopko80441c12021-11-12 10:43:18 +0000632}
633
Michael Forster500b4762022-01-27 12:30:17 +0000634bool Importer::IsFromCurrentTarget(const clang::Decl* decl) const {
Michael Forstera49d2e62022-01-28 07:26:40 +0000635 return invocation_.target_ == GetOwningTarget(decl);
Marcel Hlopko4c660dd2021-12-02 09:52:47 +0000636}
637
Devin Jeanpierred652d932022-02-03 08:55:33 +0000638Importer::LookupResult Importer::ImportRecord(
639 clang::CXXRecordDecl* record_decl) {
Googler21351fc2021-10-19 08:58:04 +0000640 const clang::DeclContext* decl_context = record_decl->getDeclContext();
Dmitri Gribenko14627692022-01-31 09:37:00 +0000641 if (decl_context->isFunctionOrMethod()) {
642 return LookupResult();
643 }
644 if (record_decl->isInjectedClassName()) {
645 return LookupResult();
Googler21351fc2021-10-19 08:58:04 +0000646 }
Michael Forster500b4762022-01-27 12:30:17 +0000647 if (decl_context->isRecord()) {
648 return LookupResult("Nested classes are not supported yet");
649 }
Marcel Hlopko872df5e2022-01-25 21:18:55 +0000650 if (record_decl->isUnion()) {
Michael Forster500b4762022-01-27 12:30:17 +0000651 return LookupResult("Unions are not supported yet");
Marcel Hlopko872df5e2022-01-25 21:18:55 +0000652 }
Googler8173f592022-01-04 13:57:32 +0000653 // Make sure the record has a definition that we'll be able to call
654 // ASTContext::getASTRecordLayout() on.
655 record_decl = record_decl->getDefinition();
656 if (!record_decl || record_decl->isInvalidDecl() ||
657 !record_decl->isCompleteDefinition()) {
Michael Forster500b4762022-01-27 12:30:17 +0000658 return LookupResult();
Googler8173f592022-01-04 13:57:32 +0000659 }
660
Devin Jeanpierrec80e6242022-02-03 01:56:40 +0000661 // To compute the memory layout of the record, it needs to be a concrete type,
662 // not a template.
Devin Jeanpierred652d932022-02-03 08:55:33 +0000663 if (record_decl->getDescribedClassTemplate() ||
664 clang::isa<clang::ClassTemplateSpecializationDecl>(record_decl)) {
Devin Jeanpierrec80e6242022-02-03 01:56:40 +0000665 return LookupResult("Class templates are not supported yet");
666 }
667
Devin Jeanpierred652d932022-02-03 08:55:33 +0000668 sema_.ForceDeclarationOfImplicitMembers(record_decl);
669
Devin Jeanpierrec80e6242022-02-03 01:56:40 +0000670 const clang::ASTRecordLayout& layout = ctx_.getASTRecordLayout(record_decl);
Devin Jeanpierred652d932022-02-03 08:55:33 +0000671
Devin Jeanpierrec80e6242022-02-03 01:56:40 +0000672 std::optional<size_t> base_size = std::nullopt;
Marcel Hlopko14ee3c82022-02-09 09:46:23 +0000673 bool override_alignment = record_decl->hasAttr<clang::AlignedAttr>();
Devin Jeanpierred652d932022-02-03 08:55:33 +0000674 if (record_decl->getNumBases() != 0) {
675 // The size of the base class subobjects is easy to compute, so long as we
676 // know that fields start after the base class subobjects. (This is not
677 // guaranteed by the standard, but is true on the ABIs we work with.)
678 base_size = layout.getFieldCount() == 0
679 ? static_cast<size_t>(layout.getDataSize().getQuantity())
680 : layout.getFieldOffset(0) / 8;
681 // Ideally, we'd only include an alignment adjustment if one of the base
682 // classes is more-aligned than any of the fields, but it is simpler do it
683 // whenever there are any base classes at all.
684 override_alignment = true;
Googler2e85f342021-09-17 07:04:07 +0000685 }
Devin Jeanpierred652d932022-02-03 08:55:33 +0000686
Googler279eca32022-01-04 14:03:44 +0000687 std::optional<Identifier> record_name = GetTranslatedIdentifier(record_decl);
688 if (!record_name.has_value()) {
Michael Forster500b4762022-01-27 12:30:17 +0000689 return LookupResult();
Googler279eca32022-01-04 14:03:44 +0000690 }
691 // Provisionally assume that we know this RecordDecl so that we'll be able
692 // to import fields whose type contains the record itself.
Googlerdcca7f72022-01-10 12:30:43 +0000693 known_type_decls_.insert(record_decl);
Devin Jeanpierred652d932022-02-03 08:55:33 +0000694 absl::StatusOr<std::vector<Field>> fields = ImportFields(record_decl);
Michael Forster500b4762022-01-27 12:30:17 +0000695 if (!fields.ok()) {
Googler279eca32022-01-04 14:03:44 +0000696 // Importing a field failed, so note that we didn't import this RecordDecl
697 // after all.
Googlerdcca7f72022-01-10 12:30:43 +0000698 known_type_decls_.erase(record_decl);
Michael Forster500b4762022-01-27 12:30:17 +0000699 return LookupResult("Importing field failed");
Devin Jeanpierree78b2fb2021-10-05 11:40:33 +0000700 }
Michael Forster500b4762022-01-27 12:30:17 +0000701
Devin Jeanpierreb69bcae2022-02-03 09:45:50 +0000702 for (const Field& field : *fields) {
703 if (field.is_no_unique_address) {
704 override_alignment = true;
705 break;
706 }
707 }
708
Devin Jeanpierre56777022022-02-03 01:57:15 +0000709 return LookupResult(Record{
710 .identifier = *record_name,
711 .id = GenerateDeclId(record_decl),
712 .owning_target = GetOwningTarget(record_decl),
713 .doc_comment = GetComment(record_decl),
714 .unambiguous_public_bases = GetUnambiguousPublicBases(*record_decl, ctx_),
715 .fields = *std::move(fields),
716 .size = layout.getSize().getQuantity(),
717 .alignment = layout.getAlignment().getQuantity(),
718 .base_size = base_size,
719 .override_alignment = override_alignment,
720 .copy_constructor = GetCopyCtorSpecialMemberFunc(*record_decl),
721 .move_constructor = GetMoveCtorSpecialMemberFunc(*record_decl),
722 .destructor = GetDestructorSpecialMemberFunc(*record_decl),
723 .is_trivial_abi = record_decl->canPassInRegisters(),
Devin Jeanpierred652d932022-02-03 08:55:33 +0000724 .is_final = record_decl->isEffectivelyFinal()});
Marcel Hlopkob4b28742021-09-15 12:45:20 +0000725}
726
Michael Forster500b4762022-01-27 12:30:17 +0000727Importer::LookupResult Importer::ImportTypedefName(
Googler68346992022-01-05 06:11:31 +0000728 clang::TypedefNameDecl* typedef_name_decl) {
Googlerdcca7f72022-01-10 12:30:43 +0000729 const clang::DeclContext* decl_context = typedef_name_decl->getDeclContext();
730 if (decl_context) {
731 if (decl_context->isFunctionOrMethod()) {
Michael Forster500b4762022-01-27 12:30:17 +0000732 return LookupResult();
Googlerdcca7f72022-01-10 12:30:43 +0000733 }
734 if (decl_context->isRecord()) {
Michael Forster500b4762022-01-27 12:30:17 +0000735 return LookupResult("Typedefs nested in classes are not supported yet");
Googlerdcca7f72022-01-10 12:30:43 +0000736 }
737 }
738
Googler44e3fbc2022-01-11 10:19:26 +0000739 clang::QualType type =
740 typedef_name_decl->getASTContext().getTypedefType(typedef_name_decl);
Lukasz Anforowiczb22917e2022-02-16 23:49:59 +0000741 if (MapKnownCcTypeToRsType(type.getAsString()).has_value()) {
Michael Forster500b4762022-01-27 12:30:17 +0000742 return LookupResult();
Googler44e3fbc2022-01-11 10:19:26 +0000743 }
744
Googlerdcca7f72022-01-10 12:30:43 +0000745 std::optional<Identifier> identifier =
746 GetTranslatedIdentifier(typedef_name_decl);
747 if (!identifier.has_value()) {
748 // This should never happen.
749 LOG(FATAL) << "Couldn't get identifier for TypedefNameDecl";
Googlerdcca7f72022-01-10 12:30:43 +0000750 }
751 absl::StatusOr<MappedType> underlying_type =
752 ConvertType(typedef_name_decl->getUnderlyingType());
753 if (underlying_type.ok()) {
754 known_type_decls_.insert(typedef_name_decl);
Michael Forster500b4762022-01-27 12:30:17 +0000755 return LookupResult(
Googlerdcca7f72022-01-10 12:30:43 +0000756 TypeAlias{.identifier = *identifier,
757 .id = GenerateDeclId(typedef_name_decl),
758 .owning_target = GetOwningTarget(typedef_name_decl),
759 .underlying_type = *underlying_type});
760 } else {
Michael Forster500b4762022-01-27 12:30:17 +0000761 return LookupResult(std::string(underlying_type.status().message()));
Googlerdcca7f72022-01-10 12:30:43 +0000762 }
Googler68346992022-01-05 06:11:31 +0000763}
764
Lukasz Anforowiczc4ceb4f2022-01-28 19:29:19 +0000765static bool ShouldKeepCommentLine(absl::string_view line) {
766 // Based on https://clang.llvm.org/extra/clang-tidy/:
767 llvm::Regex patterns_to_ignore(
768 "^[[:space:]/]*" // Whitespace, or extra //
769 "(NOLINT|NOLINTNEXTLINE|NOLINTBEGIN|NOLINTEND)"
770 "(\\([^)[:space:]]*\\)?)?" // Optional (...)
771 "[[:space:]]*$"); // Whitespace
772 return !patterns_to_ignore.match(line);
773}
774
Michael Forster500b4762022-01-27 12:30:17 +0000775std::optional<std::string> Importer::GetComment(const clang::Decl* decl) const {
Michael Forster409d9412021-10-07 08:35:29 +0000776 // This does currently not distinguish between different types of comments.
777 // In general it is not possible in C++ to reliably only extract doc comments.
778 // This is going to be a heuristic that needs to be tuned over time.
779
Michael Forstera49d2e62022-01-28 07:26:40 +0000780 clang::SourceManager& sm = ctx_.getSourceManager();
781 clang::RawComment* raw_comment = ctx_.getRawCommentForDeclNoCache(decl);
Michael Forstercc5941a2021-10-07 07:12:24 +0000782
783 if (raw_comment == nullptr) {
784 return {};
Michael Forstercc5941a2021-10-07 07:12:24 +0000785 }
Lukasz Anforowiczc4ceb4f2022-01-28 19:29:19 +0000786
787 std::string raw_comment_text =
788 raw_comment->getFormattedText(sm, sm.getDiagnostics());
789 std::string cleaned_comment_text = absl::StrJoin(
790 absl::StrSplit(raw_comment_text, '\n', ShouldKeepCommentLine), "\n");
791 return cleaned_comment_text.empty()
792 ? std::nullopt
793 : std::optional<std::string>(std::move(cleaned_comment_text));
Michael Forstercc5941a2021-10-07 07:12:24 +0000794}
795
Michael Forster500b4762022-01-27 12:30:17 +0000796SourceLoc Importer::ConvertSourceLocation(clang::SourceLocation loc) const {
Michael Forstera49d2e62022-01-28 07:26:40 +0000797 auto& sm = ctx_.getSourceManager();
Michael Forsterd3ef1e92021-10-12 16:15:31 +0000798
Googlerc8a8e732021-10-19 07:49:24 +0000799 clang::StringRef filename = sm.getFilename(loc);
Michael Forsterd3ef1e92021-10-12 16:15:31 +0000800 if (filename.startswith("./")) {
801 filename = filename.substr(2);
802 }
803
804 return SourceLoc{.filename = filename.str(),
805 .line = sm.getSpellingLineNumber(loc),
806 .column = sm.getSpellingColumnNumber(loc)};
807}
808
Michael Forster500b4762022-01-27 12:30:17 +0000809absl::StatusOr<MappedType> Importer::ConvertType(
Googler4e1bc132021-12-06 10:10:42 +0000810 clang::QualType qual_type,
811 std::optional<devtools_rust::TypeLifetimes> lifetimes,
812 bool nullable) const {
Devin Jeanpierre09c6f452021-09-29 07:34:24 +0000813 std::optional<MappedType> type = std::nullopt;
Googlerdb111532022-01-05 06:12:13 +0000814 // When converting the type to a string, don't include qualifiers -- we handle
815 // these separately.
816 std::string type_string = qual_type.getUnqualifiedType().getAsString();
Michael Forsterdc683af2021-09-17 08:51:28 +0000817
Lukasz Anforowiczb22917e2022-02-16 23:49:59 +0000818 if (auto maybe_mapped_type = MapKnownCcTypeToRsType(type_string);
819 maybe_mapped_type.has_value()) {
820 type = MappedType::Simple(std::string(*maybe_mapped_type), type_string);
Googler06f2c9a2022-01-05 12:00:47 +0000821 } else if (const auto* pointer_type =
822 qual_type->getAs<clang::PointerType>()) {
Googler4e1bc132021-12-06 10:10:42 +0000823 std::optional<LifetimeId> lifetime;
824 if (lifetimes.has_value()) {
825 CHECK(!lifetimes->empty());
826 lifetime = LifetimeId(lifetimes->back().Id());
827 lifetimes->pop_back();
828 }
829 auto pointee_type = ConvertType(pointer_type->getPointeeType(), lifetimes);
Michael Forsterdc683af2021-09-17 08:51:28 +0000830 if (pointee_type.ok()) {
Googler4e1bc132021-12-06 10:10:42 +0000831 type = MappedType::PointerTo(*pointee_type, lifetime, nullable);
Michael Forster1de27b82021-09-17 07:22:22 +0000832 }
Googler61dce3b2021-12-02 09:16:32 +0000833 } else if (const auto* lvalue_ref_type =
834 qual_type->getAs<clang::LValueReferenceType>()) {
Googler4e1bc132021-12-06 10:10:42 +0000835 std::optional<LifetimeId> lifetime;
836 if (lifetimes.has_value()) {
837 CHECK(!lifetimes->empty());
838 lifetime = LifetimeId(lifetimes->back().Id());
839 lifetimes->pop_back();
840 }
841 auto pointee_type =
842 ConvertType(lvalue_ref_type->getPointeeType(), lifetimes);
Googler61dce3b2021-12-02 09:16:32 +0000843 if (pointee_type.ok()) {
Googler4e1bc132021-12-06 10:10:42 +0000844 type = MappedType::LValueReferenceTo(*pointee_type, lifetime);
Googler61dce3b2021-12-02 09:16:32 +0000845 }
Googlerb6c0fe02021-12-01 10:55:31 +0000846 } else if (const auto* builtin_type =
Googler06f2c9a2022-01-05 12:00:47 +0000847 // Use getAsAdjusted instead of getAs so we don't desugar
848 // typedefs.
849 qual_type->getAsAdjusted<clang::BuiltinType>()) {
Michael Forster51da81a2021-09-20 07:14:23 +0000850 switch (builtin_type->getKind()) {
851 case clang::BuiltinType::Bool:
Devin Jeanpierre09c6f452021-09-29 07:34:24 +0000852 type = MappedType::Simple("bool", "bool");
Michael Forster51da81a2021-09-20 07:14:23 +0000853 break;
854 case clang::BuiltinType::Float:
Michael Forsterc7976ec2021-10-01 10:05:16 +0000855 type = MappedType::Simple("f32", "float");
Michael Forster51da81a2021-09-20 07:14:23 +0000856 break;
857 case clang::BuiltinType::Double:
Michael Forsterc7976ec2021-10-01 10:05:16 +0000858 type = MappedType::Simple("f64", "double");
Michael Forster51da81a2021-09-20 07:14:23 +0000859 break;
860 case clang::BuiltinType::Void:
Devin Jeanpierre09c6f452021-09-29 07:34:24 +0000861 type = MappedType::Void();
Michael Forster51da81a2021-09-20 07:14:23 +0000862 break;
863 default:
864 if (builtin_type->isIntegerType()) {
Michael Forstera49d2e62022-01-28 07:26:40 +0000865 auto size = ctx_.getTypeSize(builtin_type);
Googler06f2c9a2022-01-05 12:00:47 +0000866 if (size == 8 || size == 16 || size == 32 || size == 64) {
Devin Jeanpierre09c6f452021-09-29 07:34:24 +0000867 type = MappedType::Simple(
Michael Forster51da81a2021-09-20 07:14:23 +0000868 absl::Substitute(
869 "$0$1", builtin_type->isSignedInteger() ? 'i' : 'u', size),
Devin Jeanpierre09c6f452021-09-29 07:34:24 +0000870 type_string);
Michael Forster51da81a2021-09-20 07:14:23 +0000871 }
872 }
Marcel Hlopko7d739792021-08-12 07:52:47 +0000873 }
Michael Forster365bba12022-01-24 16:56:06 +0000874 } else if (const auto* tag_type =
Googler6a0a5252022-01-11 14:08:09 +0000875 qual_type->getAsAdjusted<clang::TagType>()) {
Devin Jeanpierrebf0d5602021-10-13 20:47:39 +0000876 clang::TagDecl* tag_decl = tag_type->getDecl();
877
Googlerdcca7f72022-01-10 12:30:43 +0000878 if (known_type_decls_.contains(tag_decl)) {
Googler279eca32022-01-04 14:03:44 +0000879 if (std::optional<Identifier> id = GetTranslatedIdentifier(tag_decl)) {
880 std::string ident(id->Ident());
881 DeclId decl_id = GenerateDeclId(tag_decl);
882 type = MappedType::WithDeclIds(ident, decl_id, ident, decl_id);
883 }
Devin Jeanpierrebf0d5602021-10-13 20:47:39 +0000884 }
Michael Forster365bba12022-01-24 16:56:06 +0000885 } else if (const auto* typedef_type =
Googler6a0a5252022-01-11 14:08:09 +0000886 qual_type->getAsAdjusted<clang::TypedefType>()) {
Googlerdcca7f72022-01-10 12:30:43 +0000887 clang::TypedefNameDecl* typedef_name_decl = typedef_type->getDecl();
888
889 if (known_type_decls_.contains(typedef_name_decl)) {
890 if (std::optional<Identifier> id =
891 GetTranslatedIdentifier(typedef_name_decl)) {
892 std::string ident(id->Ident());
893 DeclId decl_id = GenerateDeclId(typedef_name_decl);
894 type = MappedType::WithDeclIds(ident, decl_id, ident, decl_id);
895 }
896 }
Marcel Hlopko7d739792021-08-12 07:52:47 +0000897 }
Devin Jeanpierre184f9ac2021-09-17 13:47:03 +0000898
899 if (!type.has_value()) {
900 absl::Status error = absl::UnimplementedError(
901 absl::Substitute("Unsupported type '$0'", type_string));
902 error.SetPayload(kTypeStatusPayloadUrl, absl::Cord(type_string));
903 return error;
904 }
905
Lukasz Anforowicz0c3f8b22022-02-15 14:56:40 +0000906 // Handle cv-qualification.
Devin Jeanpierre09c6f452021-09-29 07:34:24 +0000907 type->cc_type.is_const = qual_type.isConstQualified();
Lukasz Anforowicz0c3f8b22022-02-15 14:56:40 +0000908 if (qual_type.isVolatileQualified()) {
909 return absl::UnimplementedError(
910 absl::StrCat("Unsupported `volatile` qualifier: ", type_string));
911 }
Devin Jeanpierre184f9ac2021-09-17 13:47:03 +0000912
913 return *std::move(type);
Marcel Hlopko7d739792021-08-12 07:52:47 +0000914}
915
Michael Forster500b4762022-01-27 12:30:17 +0000916absl::StatusOr<std::vector<Field>> Importer::ImportFields(
Devin Jeanpierred652d932022-02-03 08:55:33 +0000917 clang::CXXRecordDecl* record_decl) {
918 clang::AccessSpecifier default_access =
919 record_decl->isClass() ? clang::AS_private : clang::AS_public;
Googlere3434c32021-10-19 10:28:35 +0000920 std::vector<Field> fields;
Michael Forstera49d2e62022-01-28 07:26:40 +0000921 const clang::ASTRecordLayout& layout = ctx_.getASTRecordLayout(record_decl);
Googlere3434c32021-10-19 10:28:35 +0000922 for (const clang::FieldDecl* field_decl : record_decl->fields()) {
923 auto type = ConvertType(field_decl->getType());
924 if (!type.ok()) {
Michael Forster500b4762022-01-27 12:30:17 +0000925 return absl::UnimplementedError(
926 absl::Substitute("Field type '$0' is not supported",
927 field_decl->getType().getAsString()));
Googlere3434c32021-10-19 10:28:35 +0000928 }
929 clang::AccessSpecifier access = field_decl->getAccess();
930 if (access == clang::AS_none) {
931 access = default_access;
932 }
933
934 std::optional<Identifier> field_name = GetTranslatedIdentifier(field_decl);
935 if (!field_name.has_value()) {
Michael Forster500b4762022-01-27 12:30:17 +0000936 return absl::UnimplementedError(
Googler279eca32022-01-04 14:03:44 +0000937 absl::Substitute("Cannot translate name for field '$0'",
Michael Forster500b4762022-01-27 12:30:17 +0000938 field_decl->getNameAsString()));
Googlere3434c32021-10-19 10:28:35 +0000939 }
940 fields.push_back(
941 {.identifier = *std::move(field_name),
942 .doc_comment = GetComment(field_decl),
943 .type = *type,
944 .access = TranslateAccessSpecifier(access),
Devin Jeanpierreb69bcae2022-02-03 09:45:50 +0000945 .offset = layout.getFieldOffset(field_decl->getFieldIndex()),
946 .is_no_unique_address =
947 field_decl->hasAttr<clang::NoUniqueAddressAttr>()});
Googlere3434c32021-10-19 10:28:35 +0000948 }
949 return fields;
950}
951
Michael Forster500b4762022-01-27 12:30:17 +0000952std::string Importer::GetMangledName(const clang::NamedDecl* named_decl) const {
Devin Jeanpierref2ec8712021-10-13 20:47:16 +0000953 clang::GlobalDecl decl;
954
955 // There are only three named decl types that don't work with the GlobalDecl
956 // unary constructor: GPU kernels (which do not exist in standard C++, so we
957 // ignore), constructors, and destructors. GlobalDecl does not support
958 // constructors and destructors from the unary constructor because there is
959 // more than one global declaration for a given constructor or destructor!
960 //
961 // * (Ctor|Dtor)_Complete is a function which constructs / destroys the
962 // entire object. This is what we want. :)
963 // * Dtor_Deleting is a function which additionally calls operator delete.
964 // * (Ctor|Dtor)_Base is a function which constructs/destroys the object but
965 // NOT including virtual base class subobjects.
966 // * (Ctor|Dtor)_Comdat: I *believe* this is the identifier used to
967 // deduplicate inline functions, and is not callable.
968 // * Dtor_(Copying|Default)Closure: These only exist in the MSVC++ ABI,
969 // which we don't support for now. I don't know when they are used.
970 //
971 // It was hard to piece this together, so writing it down here to explain why
972 // we magically picked the *_Complete variants.
Michael Forster500b4762022-01-27 12:30:17 +0000973 if (auto dtor = clang::dyn_cast<clang::CXXDestructorDecl>(named_decl)) {
Devin Jeanpierref2ec8712021-10-13 20:47:16 +0000974 decl = clang::GlobalDecl(dtor, clang::CXXDtorType::Dtor_Complete);
975 } else if (auto ctor =
Michael Forster500b4762022-01-27 12:30:17 +0000976 clang::dyn_cast<clang::CXXConstructorDecl>(named_decl)) {
Devin Jeanpierref2ec8712021-10-13 20:47:16 +0000977 decl = clang::GlobalDecl(ctor, clang::CXXCtorType::Ctor_Complete);
978 } else {
979 decl = clang::GlobalDecl(named_decl);
980 }
981
Marcel Hlopko7d739792021-08-12 07:52:47 +0000982 std::string name;
983 llvm::raw_string_ostream stream(name);
Devin Jeanpierref2ec8712021-10-13 20:47:16 +0000984 mangler_->mangleName(decl, stream);
Marcel Hlopko7d739792021-08-12 07:52:47 +0000985 stream.flush();
Marcel Hlopkoa5f59ae2021-08-24 20:38:04 +0000986 return name;
Marcel Hlopko7d739792021-08-12 07:52:47 +0000987}
988
Michael Forster500b4762022-01-27 12:30:17 +0000989std::optional<UnqualifiedIdentifier> Importer::GetTranslatedName(
Marcel Hlopko7d739792021-08-12 07:52:47 +0000990 const clang::NamedDecl* named_decl) const {
Devin Jeanpierref2ec8712021-10-13 20:47:16 +0000991 switch (named_decl->getDeclName().getNameKind()) {
992 case clang::DeclarationName::Identifier: {
993 auto name = std::string(named_decl->getName());
994 if (name.empty()) {
Lukasz Anforowicz0c816f12021-12-15 17:41:49 +0000995 if (const clang::ParmVarDecl* param_decl =
996 clang::dyn_cast<clang::ParmVarDecl>(named_decl)) {
997 int param_pos = param_decl->getFunctionScopeIndex();
998 return {Identifier(absl::StrCat("__param_", param_pos))};
999 }
1000 // TODO(lukasza): Handle anonymous structs (probably this won't be an
1001 // issue until nested types are handled - b/200067824).
Devin Jeanpierref2ec8712021-10-13 20:47:16 +00001002 return std::nullopt;
1003 }
1004 return {Identifier(std::move(name))};
1005 }
1006 case clang::DeclarationName::CXXConstructorName:
1007 return {SpecialName::kConstructor};
1008 case clang::DeclarationName::CXXDestructorName:
1009 return {SpecialName::kDestructor};
Lukasz Anforowiczfae90a12022-02-03 20:58:15 +00001010 case clang::DeclarationName::CXXOperatorName:
1011 switch (named_decl->getDeclName().getCXXOverloadedOperator()) {
1012 case clang::OO_None:
1013 LOG(FATAL) << "No OO_None expected under CXXOperatorName branch";
1014 return std::nullopt;
1015 case clang::NUM_OVERLOADED_OPERATORS:
1016 LOG(FATAL) << "No NUM_OVERLOADED_OPERATORS expected at runtime";
1017 return std::nullopt;
1018 // clang-format off
1019 #define OVERLOADED_OPERATOR(name, spelling, ...) \
1020 case clang::OO_##name: { \
Lukasz Anforowicz9c663ca2022-02-09 01:33:31 +00001021 return {Operator(spelling)}; \
Lukasz Anforowiczfae90a12022-02-03 20:58:15 +00001022 }
1023 #include "third_party/llvm/llvm-project/clang/include/clang/Basic/OperatorKinds.def"
1024 #undef OVERLOADED_OPERATOR
1025 // clang-format on
1026 }
1027 LOG(FATAL) << "The `switch` above should handle all cases and `return`";
Devin Jeanpierref2ec8712021-10-13 20:47:16 +00001028 default:
Lukasz Anforowiczfae90a12022-02-03 20:58:15 +00001029 // To be implemented later: CXXConversionFunctionName.
Devin Jeanpierref2ec8712021-10-13 20:47:16 +00001030 // There are also e.g. literal operators, deduction guides, etc., but
1031 // we might not need to implement them at all. Full list at:
1032 // https://clang.llvm.org/doxygen/classclang_1_1DeclarationName.html#a9ab322d434446b43379d39e41af5cbe3
1033 return std::nullopt;
Devin Jeanpierree78b2fb2021-10-05 11:40:33 +00001034 }
Marcel Hlopkoe8f1c4e2021-07-28 18:12:49 +00001035}
1036
Marcel Hlopkoe8f1c4e2021-07-28 18:12:49 +00001037} // namespace rs_bindings_from_cc