thunk.cpp 21 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496
  1. // Part of the Carbon Language project, under the Apache License v2.0 with LLVM
  2. // Exceptions. See /LICENSE for license information.
  3. // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
  4. #include "toolchain/check/thunk.h"
  5. #include <utility>
  6. #include "toolchain/base/kind_switch.h"
  7. #include "toolchain/check/call.h"
  8. #include "toolchain/check/convert.h"
  9. #include "toolchain/check/cpp/operators.h"
  10. #include "toolchain/check/deferred_definition_worklist.h"
  11. #include "toolchain/check/diagnostic_helpers.h"
  12. #include "toolchain/check/function.h"
  13. #include "toolchain/check/generic.h"
  14. #include "toolchain/check/inst.h"
  15. #include "toolchain/check/member_access.h"
  16. #include "toolchain/check/name_ref.h"
  17. #include "toolchain/check/pattern.h"
  18. #include "toolchain/check/pattern_match.h"
  19. #include "toolchain/check/pointer_dereference.h"
  20. #include "toolchain/check/return.h"
  21. #include "toolchain/check/type.h"
  22. #include "toolchain/diagnostics/diagnostic.h"
  23. #include "toolchain/sem_ir/function.h"
  24. #include "toolchain/sem_ir/generic.h"
  25. #include "toolchain/sem_ir/ids.h"
  26. #include "toolchain/sem_ir/inst.h"
  27. #include "toolchain/sem_ir/pattern.h"
  28. #include "toolchain/sem_ir/typed_insts.h"
  29. namespace Carbon::Check {
  30. // Adds a pattern instruction for a thunk, copying the location from an existing
  31. // instruction.
  32. static auto RebuildPatternInst(Context& context, SemIR::InstId orig_inst_id,
  33. SemIR::Inst new_inst) -> SemIR::InstId {
  34. // Ensure we built the same kind of instruction. In particular, this ensures
  35. // that the location of the old instruction can be reused for the new one.
  36. CARBON_CHECK(context.insts().Get(orig_inst_id).kind() == new_inst.kind(),
  37. "Rebuilt pattern with the wrong kind: {0} -> {1}",
  38. context.insts().Get(orig_inst_id), new_inst);
  39. return AddInst(context,
  40. SemIR::LocIdAndInst::RuntimeVerified(
  41. context.sem_ir(), SemIR::LocId(orig_inst_id), new_inst));
  42. }
  43. // Wrapper to allow the type to be specified as a template argument for API
  44. // consistency with `AddInst`.
  45. template <typename InstT>
  46. static auto RebuildPatternInst(Context& context, SemIR::InstId orig_inst_id,
  47. InstT new_inst) -> SemIR::InstId {
  48. return RebuildPatternInst(context, orig_inst_id, SemIR::Inst(new_inst));
  49. }
  50. // Makes a copy of the given binding pattern, with its type adjusted to be
  51. // `new_pattern_type_id`.
  52. static auto CloneBindingPattern(Context& context, SemIR::InstId pattern_id,
  53. SemIR::AnyBindingPattern pattern,
  54. SemIR::TypeId new_pattern_type_id)
  55. -> SemIR::InstId {
  56. auto entity_name = context.entity_names().Get(pattern.entity_name_id);
  57. CARBON_CHECK((pattern.kind == SemIR::SymbolicBindingPattern::Kind) ==
  58. entity_name.bind_index().has_value());
  59. CARBON_CHECK(pattern.kind != SemIR::FormBindingPattern::Kind);
  60. // Get the transformed type of the binding.
  61. if (new_pattern_type_id == SemIR::ErrorInst::TypeId) {
  62. return SemIR::ErrorInst::InstId;
  63. }
  64. pattern.type_id = new_pattern_type_id;
  65. auto phase = BindingPhase::Runtime;
  66. if (pattern.kind == SemIR::SymbolicBindingPattern::Kind) {
  67. phase = entity_name.is_template ? BindingPhase::Template
  68. : BindingPhase::Symbolic;
  69. }
  70. pattern.entity_name_id = AddBindingEntityName(context, entity_name.name_id,
  71. /*form_id=*/SemIR::InstId::None,
  72. entity_name.is_unused, phase);
  73. if (pattern.kind == SemIR::WrapperBindingPattern::Kind) {
  74. auto subpattern = context.insts().GetAs<SemIR::AnyLeafParamPattern>(
  75. pattern.subpattern_id);
  76. if (subpattern.kind == SemIR::FormParamPattern::Kind) {
  77. context.TODO(pattern_id, "Support for cloning form bindings");
  78. return SemIR::ErrorInst::InstId;
  79. }
  80. pattern.subpattern_id = RebuildPatternInst<SemIR::AnyLeafParamPattern>(
  81. context, pattern.subpattern_id,
  82. {.kind = subpattern.kind,
  83. .type_id = new_pattern_type_id,
  84. .pretty_name_id = entity_name.name_id});
  85. }
  86. // Rebuild the binding pattern.
  87. return AddBindingPattern(context, SemIR::LocId(pattern_id),
  88. SemIR::ExprRegionId::None, pattern)
  89. .pattern_id;
  90. }
  91. // Makes a copy of the given pattern instruction, substituting values from a
  92. // specific as needed. The resulting pattern behaves like a newly-created
  93. // pattern, so is suitable for running `CalleePatternMatch` against.
  94. static auto ClonePattern(Context& context, SemIR::SpecificId specific_id,
  95. SemIR::InstId pattern_id) -> SemIR::InstId {
  96. if (!pattern_id.has_value()) {
  97. return SemIR::InstId::None;
  98. }
  99. auto get_type = [&](SemIR::InstId inst_id) -> SemIR::TypeId {
  100. return SemIR::GetTypeOfInstInSpecific(context.sem_ir(), specific_id,
  101. inst_id);
  102. };
  103. auto pattern = context.insts().Get(pattern_id);
  104. // Decompose the pattern. The forms we allow for patterns in a function
  105. // parameter list are currently fairly restrictive.
  106. // Optional var parameter pattern.
  107. auto [var_param, var_param_id] = context.insts().TryUnwrap(
  108. pattern, pattern_id, &SemIR::VarParamPattern::subpattern_id);
  109. // Finally, either a binding pattern or a return slot pattern.
  110. auto new_pattern_id = SemIR::InstId::None;
  111. if (auto binding = pattern.TryAs<SemIR::AnyBindingPattern>()) {
  112. new_pattern_id = CloneBindingPattern(context, pattern_id, *binding,
  113. get_type(pattern_id));
  114. } else if (auto return_slot = pattern.TryAs<SemIR::ReturnSlotPattern>()) {
  115. auto new_subpattern_id = RebuildPatternInst<SemIR::OutParamPattern>(
  116. context, return_slot->subpattern_id,
  117. {.type_id = get_type(return_slot->subpattern_id),
  118. .pretty_name_id = SemIR::NameId::ReturnSlot});
  119. new_pattern_id = RebuildPatternInst<SemIR::ReturnSlotPattern>(
  120. context, pattern_id,
  121. {.type_id = get_type(pattern_id),
  122. .subpattern_id = new_subpattern_id,
  123. .type_inst_id = SemIR::TypeInstId::None});
  124. } else {
  125. CARBON_CHECK(pattern.Is<SemIR::ErrorInst>(),
  126. "Unexpected pattern {0} in function signature", pattern);
  127. return SemIR::ErrorInst::InstId;
  128. }
  129. // Rebuild parameter.
  130. if (var_param && new_pattern_id != SemIR::ErrorInst::InstId) {
  131. new_pattern_id = RebuildPatternInst<SemIR::VarParamPattern>(
  132. context, var_param_id,
  133. {.type_id = get_type(var_param_id), .subpattern_id = new_pattern_id});
  134. }
  135. return new_pattern_id;
  136. }
  137. static auto ClonePatternBlock(Context& context, SemIR::SpecificId specific_id,
  138. SemIR::InstBlockId inst_block_id)
  139. -> SemIR::InstBlockId {
  140. if (!inst_block_id.has_value()) {
  141. return SemIR::InstBlockId::None;
  142. }
  143. return context.inst_blocks().Transform(
  144. inst_block_id, [&](SemIR::InstId inst_id) {
  145. return ClonePattern(context, specific_id, inst_id);
  146. });
  147. }
  148. static auto CloneInstId(Context& context, SemIR::SpecificId specific_id,
  149. SemIR::InstId inst_id) -> SemIR::InstId {
  150. if (!inst_id.has_value()) {
  151. return SemIR::InstId::None;
  152. }
  153. return GetOrAddInst<SemIR::SpecificConstant>(
  154. context, SemIR::LocId(inst_id),
  155. {.type_id = SemIR::TypeType::TypeId,
  156. .inst_id = inst_id,
  157. .specific_id = specific_id});
  158. }
  159. static auto CloneTypeInstId(Context& context, SemIR::SpecificId specific_id,
  160. SemIR::TypeInstId inst_id) -> SemIR::TypeInstId {
  161. if (!inst_id.has_value()) {
  162. return SemIR::TypeInstId::None;
  163. }
  164. return context.types().GetAsTypeInstId(
  165. CloneInstId(context, specific_id, inst_id));
  166. }
  167. static auto CloneFunctionDecl(Context& context, SemIR::LocId loc_id,
  168. SemIR::FunctionId signature_id,
  169. SemIR::SpecificId signature_specific_id,
  170. SemIR::FunctionId callee_id)
  171. -> std::pair<SemIR::FunctionId, SemIR::InstId> {
  172. StartGenericDecl(context);
  173. const auto& signature = context.functions().Get(signature_id);
  174. // Clone the signature.
  175. context.pattern_block_stack().Push();
  176. auto implicit_param_patterns_id = ClonePatternBlock(
  177. context, signature_specific_id, signature.implicit_param_patterns_id);
  178. auto param_patterns_id = ClonePatternBlock(context, signature_specific_id,
  179. signature.param_patterns_id);
  180. auto return_patterns_id = ClonePatternBlock(context, signature_specific_id,
  181. signature.return_patterns_id);
  182. auto return_type_inst_id = CloneTypeInstId(context, signature_specific_id,
  183. signature.return_type_inst_id);
  184. auto return_form_inst_id = CloneInstId(context, signature_specific_id,
  185. signature.return_form_inst_id);
  186. auto self_param_id = FindSelfPattern(context, implicit_param_patterns_id);
  187. auto pattern_block_id = context.pattern_block_stack().Pop();
  188. // Perform callee-side pattern matching to rebuild the parameter list.
  189. context.inst_block_stack().Push();
  190. auto match_results =
  191. CalleePatternMatch(context, implicit_param_patterns_id, param_patterns_id,
  192. return_patterns_id);
  193. auto decl_block_id = context.inst_block_stack().Pop();
  194. // Create the `FunctionDecl` instruction.
  195. auto& callee = context.functions().Get(callee_id);
  196. auto [decl_id, function_id] = MakeFunctionDecl(
  197. context, loc_id, decl_block_id, /*build_generic=*/true,
  198. /*is_definition=*/true,
  199. SemIR::Function{
  200. {
  201. .name_id = signature.name_id,
  202. .parent_scope_id = callee.parent_scope_id,
  203. // Set by `MakeFunctionDecl`.
  204. .generic_id = SemIR::GenericId::None,
  205. .first_param_node_id = signature.first_param_node_id,
  206. .last_param_node_id = signature.last_param_node_id,
  207. .pattern_block_id = pattern_block_id,
  208. .implicit_param_patterns_id = implicit_param_patterns_id,
  209. .param_patterns_id = param_patterns_id,
  210. .is_extern = false,
  211. .extern_library_id = SemIR::LibraryNameId::None,
  212. .non_owning_decl_id = SemIR::InstId::None,
  213. // Set by `MakeFunctionDecl`.
  214. .first_owning_decl_id = SemIR::InstId::None,
  215. },
  216. {
  217. .call_param_patterns_id = match_results.call_param_patterns_id,
  218. .call_params_id = match_results.call_params_id,
  219. .call_param_ranges = match_results.param_ranges,
  220. .return_type_inst_id = return_type_inst_id,
  221. .return_form_inst_id = return_form_inst_id,
  222. .return_patterns_id = return_patterns_id,
  223. .virtual_modifier = callee.virtual_modifier,
  224. .virtual_index = callee.virtual_index,
  225. .evaluation_mode = signature.evaluation_mode,
  226. .self_param_id = self_param_id,
  227. }});
  228. context.inst_block_stack().AddInstId(decl_id);
  229. return {function_id, decl_id};
  230. }
  231. static auto HasDeclaredReturnType(Context& context,
  232. SemIR::FunctionId function_id) -> bool {
  233. return context.functions().Get(function_id).return_type_inst_id.has_value();
  234. }
  235. auto PerformThunkCall(Context& context, SemIR::LocId loc_id,
  236. SemIR::FunctionId function_id,
  237. llvm::ArrayRef<SemIR::InstId> param_pattern_ids,
  238. llvm::ArrayRef<SemIR::InstId> call_arg_ids,
  239. SemIR::InstId callee_id) -> SemIR::InstId {
  240. auto& function = context.functions().Get(function_id);
  241. auto [args_vec, ignored_call_args] = ThunkPatternMatch(
  242. context, function.self_param_id, param_pattern_ids, call_arg_ids);
  243. llvm::ArrayRef<SemIR::InstId> args = args_vec;
  244. // If we have a self parameter, form `self.<callee_id>` if needed.
  245. // When calling a C++ constructor to implement `Copy`, or calling a C++
  246. // non-method operator to implement a Carbon operator, the interface has a
  247. // `self` parameter but C++ models that parameter as an explicit argument
  248. // instead, so add the `self` to the argument list instead in that case.
  249. if (function.self_param_id.has_value() &&
  250. !IsCppConstructorOrNonMethodOperator(context, callee_id)) {
  251. callee_id = PerformCompoundMemberAccess(context, loc_id,
  252. args.consume_front(), callee_id);
  253. }
  254. return PerformCall(context, loc_id, callee_id, args);
  255. }
  256. // Build a call to a function that forwards the arguments of the enclosing
  257. // function, for use when constructing a thunk.
  258. static auto BuildThunkCall(Context& context, SemIR::FunctionId function_id,
  259. SemIR::InstId callee_id,
  260. llvm::ArrayRef<SemIR::InstId> param_pattern_ids,
  261. llvm::ArrayRef<SemIR::InstId> call_arg_ids)
  262. -> SemIR::InstId {
  263. auto& function = context.functions().Get(function_id);
  264. // Build a `NameRef` naming the callee, and a `SpecificConstant` if needed.
  265. auto loc_id = SemIR::LocId(callee_id);
  266. auto callee_type = context.types().GetAs<SemIR::FunctionType>(
  267. context.insts().Get(callee_id).type_id());
  268. callee_id = BuildNameRef(context, loc_id, function.name_id, callee_id,
  269. callee_type.specific_id);
  270. return PerformThunkCall(context, loc_id, function_id, param_pattern_ids,
  271. call_arg_ids, callee_id);
  272. }
  273. static auto StartThunkFunctionDefinition(Context& context,
  274. SemIR::FunctionId function_id,
  275. SemIR::InstId thunk_id,
  276. SemIR::InstId callee_id) {
  277. // The check below produces diagnostics referring to the signature, so also
  278. // note the callee.
  279. Diagnostics::AnnotationScope annot_scope(
  280. &context.emitter(), [&](DiagnosticBuilder& builder) {
  281. CARBON_DIAGNOSTIC(ThunkCallee, Note,
  282. "while building thunk calling this function");
  283. builder.Note(callee_id, ThunkCallee);
  284. });
  285. StartFunctionDefinition(context, thunk_id, function_id);
  286. }
  287. // Given a declaration of a thunk and the function that it should call, build
  288. // the thunk body.
  289. static auto BuildThunkDefinition(Context& context,
  290. SemIR::FunctionId signature_id,
  291. SemIR::FunctionId function_id,
  292. SemIR::InstId thunk_id,
  293. SemIR::InstId callee_id) -> void {
  294. // TODO: Improve the diagnostics produced here. Specifically, it would likely
  295. // be better for the primary error message to be that we tried to produce a
  296. // thunk because of a type mismatch, but couldn't, with notes explaining
  297. // why, rather than the primary error message being whatever went wrong
  298. // building the thunk.
  299. StartThunkFunctionDefinition(context, function_id, thunk_id, callee_id);
  300. // The checks below produce diagnostics pointing at the callee, so also note
  301. // the signature.
  302. Diagnostics::AnnotationScope annot_scope(
  303. &context.emitter(), [&](DiagnosticBuilder& builder) {
  304. CARBON_DIAGNOSTIC(
  305. ThunkSignature, Note,
  306. "while building thunk to match the signature of this function");
  307. builder.Note(context.functions().Get(signature_id).first_owning_decl_id,
  308. ThunkSignature);
  309. });
  310. const auto& function = context.functions().Get(function_id);
  311. llvm::ArrayRef<SemIR::InstId> param_pattern_ids;
  312. if (function.param_patterns_id.has_value()) {
  313. param_pattern_ids = context.inst_blocks().Get(function.param_patterns_id);
  314. }
  315. auto call_param_ids = context.inst_blocks().Get(function.call_params_id);
  316. auto call_id = BuildThunkCall(context, function_id, callee_id,
  317. param_pattern_ids, call_param_ids);
  318. if (HasDeclaredReturnType(context, function_id)) {
  319. BuildReturnWithExpr(context, SemIR::LocId(callee_id), call_id);
  320. } else {
  321. DiscardExpr(context, call_id);
  322. BuildReturnWithNoExpr(context, SemIR::LocId(callee_id));
  323. }
  324. FinishFunctionDefinition(context, function_id);
  325. }
  326. auto BuildThunkDefinitionForExport(Context& context,
  327. SemIR::FunctionId thunk_function_id,
  328. SemIR::FunctionId callee_function_id,
  329. SemIR::InstId thunk_id,
  330. SemIR::InstId callee_id) -> void {
  331. auto& thunk_function = context.functions().Get(thunk_function_id);
  332. auto& callee_function = context.functions().Get(callee_function_id);
  333. StartThunkFunctionDefinition(context, thunk_function_id, thunk_id, callee_id);
  334. const bool thunk_has_return_param =
  335. callee_function.return_type_inst_id != SemIR::TypeInstId::None;
  336. llvm::ArrayRef<SemIR::InstId> param_pattern_ids;
  337. if (thunk_function.param_patterns_id.has_value()) {
  338. param_pattern_ids =
  339. context.inst_blocks().Get(thunk_function.param_patterns_id);
  340. }
  341. auto call_param_ids =
  342. context.inst_blocks().Get(thunk_function.call_params_id);
  343. if (thunk_has_return_param) {
  344. param_pattern_ids = param_pattern_ids.drop_back();
  345. call_param_ids = call_param_ids.drop_back();
  346. }
  347. auto call_id = BuildThunkCall(context, thunk_function_id, callee_id,
  348. param_pattern_ids, call_param_ids);
  349. if (thunk_has_return_param) {
  350. auto out_param_id =
  351. context.inst_blocks().Get(thunk_function.call_params_id).back();
  352. SemIR::LocId loc_id(out_param_id);
  353. auto init_id =
  354. Initialize(context, loc_id, out_param_id, call_id, /*for_return=*/true);
  355. AddInst(context, loc_id,
  356. SemIR::Assign{
  357. .lhs_id = out_param_id,
  358. .rhs_id = init_id,
  359. });
  360. } else {
  361. DiscardExpr(context, call_id);
  362. }
  363. BuildReturnWithNoExpr(context, SemIR::LocId(callee_id));
  364. FinishFunctionDefinition(context, thunk_function_id);
  365. }
  366. auto BuildThunkDefinition(Context& context,
  367. DeferredDefinitionWorklist::DefineThunk&& task)
  368. -> void {
  369. context.scope_stack().Restore(std::move(task.scope));
  370. BuildThunkDefinition(context, task.info.signature_id, task.info.function_id,
  371. task.info.decl_id, task.info.callee_id);
  372. context.scope_stack().Pop();
  373. }
  374. auto BuildThunk(Context& context, SemIR::FunctionId signature_id,
  375. SemIR::SpecificId signature_specific_id,
  376. SemIR::InstId callee_id, bool defer_definition)
  377. -> SemIR::InstId {
  378. auto callee = SemIR::GetCalleeAsFunction(context.sem_ir(), callee_id);
  379. // Check whether we can use the given function without a thunk.
  380. // TODO: For virtual functions, we want different rules for checking `self`.
  381. // TODO: This is too strict; for example, we should not compare parameter
  382. // names here.
  383. if (CheckFunctionTypeMatches(
  384. context, context.functions().Get(callee.function_id),
  385. context.functions().Get(signature_id), signature_specific_id,
  386. /*check_syntax=*/false, /*check_self=*/true, /*diagnose=*/false)) {
  387. return callee_id;
  388. }
  389. // From P3763:
  390. // If the function in the interface does not have a return type, the
  391. // program is invalid if the function in the impl specifies a return type.
  392. //
  393. // Call into the redeclaration checking logic to produce a suitable error.
  394. //
  395. // TODO: Consider a different rule: always use an explicit return type for the
  396. // thunk, and always convert the result of the wrapped call to the return type
  397. // of the thunk.
  398. if (!HasDeclaredReturnType(context, signature_id) &&
  399. HasDeclaredReturnType(context, callee.function_id)) {
  400. bool success = CheckFunctionReturnTypeMatches(
  401. context, context.functions().Get(callee.function_id),
  402. context.functions().Get(signature_id), signature_specific_id);
  403. CARBON_CHECK(!success, "Return type unexpectedly matches");
  404. return SemIR::ErrorInst::InstId;
  405. }
  406. // Create a scope for the function's parameters and generic parameters.
  407. context.scope_stack().PushForDeclName();
  408. // We can't use the function directly. Build a thunk.
  409. // TODO: Check for and diagnose obvious reasons why this will fail, such as
  410. // arity mismatch, before trying to build the thunk.
  411. auto [function_id, thunk_id] =
  412. CloneFunctionDecl(context, SemIR::LocId(callee_id), signature_id,
  413. signature_specific_id, callee.function_id);
  414. // Track that this function is a thunk.
  415. context.functions().Get(function_id).SetThunk(callee_id);
  416. if (defer_definition) {
  417. // Register the thunk to be defined when we reach the end of the enclosing
  418. // deferred definition scope, for example an `impl` or `class` definition,
  419. // as if the thunk's body were written inline in this location.
  420. context.deferred_definition_worklist().SuspendThunkAndPush(
  421. context, {
  422. .signature_id = signature_id,
  423. .function_id = function_id,
  424. .decl_id = thunk_id,
  425. .callee_id = callee_id,
  426. });
  427. } else {
  428. BuildThunkDefinition(context, signature_id, function_id, thunk_id,
  429. callee_id);
  430. context.scope_stack().Pop();
  431. }
  432. return thunk_id;
  433. }
  434. } // namespace Carbon::Check