function_context.cpp 18 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487
  1. // Part of the Carbon Language project, under the Apache License v2.0 with LLVM
  2. // Exceptions. See /LICENSE for license information.
  3. // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
  4. #include "toolchain/lower/function_context.h"
  5. #include "common/pretty_stack_trace_function.h"
  6. #include "common/vlog.h"
  7. #include "toolchain/base/kind_switch.h"
  8. #include "toolchain/sem_ir/diagnostic_loc_converter.h"
  9. #include "toolchain/sem_ir/file.h"
  10. #include "toolchain/sem_ir/generic.h"
  11. namespace Carbon::Lower {
  12. FunctionContext::FunctionContext(
  13. FileContext& file_context, llvm::Function* function,
  14. FileContext& specific_file_context, SemIR::SpecificId specific_id,
  15. SpecificCoalescer::SpecificFunctionFingerprint* function_fingerprint,
  16. llvm::DISubprogram* di_subprogram, llvm::raw_ostream* vlog_stream)
  17. : file_context_(&file_context),
  18. function_(function),
  19. specific_file_context_(&specific_file_context),
  20. specific_id_(specific_id),
  21. builder_(file_context.llvm_context(), llvm::ConstantFolder(),
  22. Inserter(file_context.inst_namer())),
  23. di_subprogram_(di_subprogram),
  24. vlog_stream_(vlog_stream),
  25. function_fingerprint_(function_fingerprint) {
  26. function_->setSubprogram(di_subprogram_);
  27. }
  28. auto FunctionContext::GetBlock(SemIR::InstBlockId block_id)
  29. -> llvm::BasicBlock* {
  30. auto result = blocks_.Insert(block_id, [&] {
  31. llvm::StringRef label_name;
  32. if (const auto* inst_namer = file_context_->inst_namer()) {
  33. label_name = inst_namer->GetUnscopedLabelFor(block_id);
  34. }
  35. return llvm::BasicBlock::Create(llvm_context(), label_name, function_);
  36. });
  37. return result.value();
  38. }
  39. auto FunctionContext::TryToReuseBlock(SemIR::InstBlockId block_id,
  40. llvm::BasicBlock* block) -> bool {
  41. if (!blocks_.Insert(block_id, block).is_inserted()) {
  42. return false;
  43. }
  44. if (block == synthetic_block_) {
  45. synthetic_block_ = nullptr;
  46. }
  47. if (const auto* inst_namer = file_context_->inst_namer()) {
  48. block->setName(inst_namer->GetUnscopedLabelFor(block_id));
  49. }
  50. return true;
  51. }
  52. auto FunctionContext::LowerBlockContents(SemIR::InstBlockId block_id) -> void {
  53. auto inst_id_for_stack_trace = SemIR::InstId::None;
  54. // On crash, report the instruction we were lowering.
  55. PrettyStackTraceFunction stack_trace_entry([&](llvm::raw_ostream& output) {
  56. SemIR::DiagnosticLocConverter converter(
  57. &file_context_->context().tree_and_subtrees_getters(), &sem_ir());
  58. auto converted = converter.Convert(SemIR::LocId(inst_id_for_stack_trace),
  59. /*token_only=*/false);
  60. converted.loc.FormatLocation(output);
  61. // TODO: Format SemIR for the instruction we were lowering?
  62. output << "Lowering "
  63. << sem_ir().insts().Get(inst_id_for_stack_trace).kind().ir_name()
  64. << "\n";
  65. // Crash output has a tab indent; try to indent slightly past that.
  66. converted.loc.FormatSnippet(output, /*indent=*/10);
  67. });
  68. for (auto inst_id : sem_ir().inst_blocks().Get(block_id)) {
  69. inst_id_for_stack_trace = inst_id;
  70. LowerInst(inst_id);
  71. }
  72. }
  73. // Handles typed instructions for LowerInst. Many instructions lower using
  74. // HandleInst, but others are unsupported or have trivial lowering.
  75. //
  76. // This only calls HandleInst for versions that should have implementations. A
  77. // different approach would be to have the logic below implemented as HandleInst
  78. // overloads. However, forward declarations of HandleInst exist for all `InstT`
  79. // types, which would make getting the right overload resolution complex.
  80. template <typename InstT>
  81. static auto LowerInstHelper(FunctionContext& context, SemIR::InstId inst_id,
  82. InstT inst) -> void {
  83. if constexpr (!InstT::Kind.is_lowered()) {
  84. CARBON_FATAL(
  85. "Encountered an instruction that isn't expected to lower. It's "
  86. "possible that logic needs to be changed in order to stop showing this "
  87. "instruction in lowered contexts. Instruction: {0}",
  88. inst);
  89. } else if constexpr (InstT::Kind.constant_kind() ==
  90. SemIR::InstConstantKind::Always ||
  91. InstT::Kind.constant_kind() ==
  92. SemIR::InstConstantKind::AlwaysUnique) {
  93. CARBON_FATAL("Missing constant value for constant instruction {0}", inst);
  94. } else if constexpr (InstT::Kind.is_type() == SemIR::InstIsType::Always) {
  95. // For instructions that are always of type `type`, produce the trivial
  96. // runtime representation of type `type`.
  97. context.SetLocal(inst_id, context.GetTypeAsValue());
  98. } else {
  99. HandleInst(context, inst_id, inst);
  100. }
  101. }
  102. // TODO: Consider renaming Handle##Name, instead relying on typed_inst overload
  103. // resolution. That would allow putting the nonexistent handler implementations
  104. // in `requires`-style overloads.
  105. // NOLINTNEXTLINE(readability-function-size): The define confuses lint.
  106. auto FunctionContext::LowerInst(SemIR::InstId inst_id) -> void {
  107. // Skip over constants. `FileContext::GetGlobal` lowers them as needed.
  108. if (sem_ir().constant_values().Get(inst_id).is_constant()) {
  109. return;
  110. }
  111. auto inst = sem_ir().insts().Get(inst_id);
  112. CARBON_VLOG("Lowering {0}: {1}\n", inst_id, inst);
  113. builder_.getInserter().SetCurrentInstId(inst_id);
  114. auto debug_loc = GetDebugLoc(inst_id);
  115. if (debug_loc) {
  116. builder_.SetCurrentDebugLocation(debug_loc);
  117. }
  118. CARBON_KIND_SWITCH(inst) {
  119. #define CARBON_SEM_IR_INST_KIND(Name) \
  120. case CARBON_KIND(SemIR::Name typed_inst): { \
  121. LowerInstHelper(*this, inst_id, typed_inst); \
  122. break; \
  123. }
  124. #include "toolchain/sem_ir/inst_kind.def"
  125. }
  126. if (debug_loc) {
  127. builder_.SetCurrentDebugLocation(llvm::DebugLoc());
  128. }
  129. builder_.getInserter().SetCurrentInstId(SemIR::InstId::None);
  130. }
  131. auto FunctionContext::GetBlockArg(SemIR::InstBlockId block_id, TypeInFile type)
  132. -> llvm::PHINode* {
  133. llvm::BasicBlock* block = GetBlock(block_id);
  134. // Find the existing phi, if any.
  135. auto phis = block->phis();
  136. if (!phis.empty()) {
  137. CARBON_CHECK(std::next(phis.begin()) == phis.end(),
  138. "Expected at most one phi, found {0}",
  139. std::distance(phis.begin(), phis.end()));
  140. return &*phis.begin();
  141. }
  142. // The number of predecessor slots to reserve.
  143. static constexpr unsigned NumReservedPredecessors = 2;
  144. auto* phi = llvm::PHINode::Create(GetType(type), NumReservedPredecessors);
  145. phi->insertInto(block, block->begin());
  146. return phi;
  147. }
  148. auto FunctionContext::GetValue(SemIR::InstId inst_id) -> llvm::Value* {
  149. // All builtins are types, with the same empty lowered value.
  150. if (SemIR::IsSingletonInstId(inst_id)) {
  151. return GetTypeAsValue();
  152. }
  153. if (auto result = locals_.Lookup(inst_id)) {
  154. return result.value();
  155. }
  156. if (auto result = file_context_->global_variables().Lookup(inst_id)) {
  157. return result.value();
  158. }
  159. auto [const_ir, const_id] = GetConstantValueInSpecific(
  160. specific_sem_ir(), specific_id_, sem_ir(), inst_id);
  161. CARBON_CHECK(const_ir == &sem_ir() || const_ir == &specific_sem_ir());
  162. CARBON_CHECK(const_id.is_concrete(),
  163. "Missing value: {0} {1} in {2} has non-concrete value {3}",
  164. inst_id, sem_ir().insts().Get(inst_id), specific_id_, const_id);
  165. // We can only pass on the InstId if it refers to the file in which the
  166. // constant value was provided.
  167. auto* global = GetFileContext(const_ir).GetConstant(
  168. const_id, const_ir == &sem_ir() ? inst_id : SemIR::InstId::None);
  169. AddGlobalToCurrentFingerprint(global);
  170. return global;
  171. }
  172. auto FunctionContext::MakeSyntheticBlock() -> llvm::BasicBlock* {
  173. synthetic_block_ = llvm::BasicBlock::Create(llvm_context(), "", function_);
  174. return synthetic_block_;
  175. }
  176. auto FunctionContext::CreateAlloca(llvm::Type* type, const llvm::Twine& name)
  177. -> llvm::AllocaInst* {
  178. // Position the first alloca right before the start of the executable code in
  179. // the function.
  180. llvm::AllocaInst* alloca;
  181. {
  182. llvm::IRBuilderBase::InsertPointGuard guard(builder());
  183. auto debug_loc = builder().getCurrentDebugLocation();
  184. if (after_allocas_) {
  185. builder().SetInsertPoint(after_allocas_);
  186. } else {
  187. builder().SetInsertPointPastAllocas(&llvm_function());
  188. }
  189. // IRBuilder tramples over our debug location when setting the insert point,
  190. // so undo that.
  191. builder().SetCurrentDebugLocation(debug_loc);
  192. // Create an alloca for this variable in the entry block.
  193. // TODO: Compute alignment of the type, which may be greater than the
  194. // alignment computed by LLVM.
  195. alloca = builder().CreateAlloca(type, /*ArraySize=*/nullptr, name);
  196. }
  197. // Create a lifetime start intrinsic here to indicate where its scope really
  198. // begins.
  199. builder().CreateLifetimeStart(alloca);
  200. // If we just created the first alloca, there is now definitely at least one
  201. // instruction after it -- there is a lifetime start instruction if nothing
  202. // else. Use that instruction as our insert point for all future allocas.
  203. if (!after_allocas_) {
  204. auto loc = alloca->getIterator();
  205. ++loc;
  206. after_allocas_ = &*loc;
  207. }
  208. // TODO: Create a matching `@llvm.lifetime.end` intrinsic call when the
  209. // variable goes out of scope.
  210. return alloca;
  211. }
  212. auto FunctionContext::GetDebugLoc(SemIR::InstId inst_id) -> llvm::DebugLoc {
  213. if (!di_subprogram_) {
  214. return llvm::DebugLoc();
  215. }
  216. auto loc = file_context_->GetLocForDI(inst_id);
  217. if (loc.filename != di_subprogram_->getFile()->getFilename()) {
  218. // Location is from a different file. We can't represent that directly
  219. // within the scope of this function's subprogram, and we don't want to
  220. // generate a new subprogram, so just discard the location information. This
  221. // happens for thunks when emitting the portion of the thunk that is
  222. // duplicated from the original signature.
  223. //
  224. // TODO: Handle this case better.
  225. if (sem_ir().insts().Is<SemIR::Call>(inst_id)) {
  226. // Return a stub location for calls, because they may be inlineable (an
  227. // LLVM verifier issue).
  228. return llvm::DILocation::get(builder_.getContext(), -1, -1,
  229. di_subprogram_);
  230. }
  231. return llvm::DebugLoc();
  232. }
  233. return llvm::DILocation::get(builder_.getContext(), loc.line_number,
  234. loc.column_number, di_subprogram_);
  235. }
  236. auto FunctionContext::FinishInit(TypeInFile type, SemIR::InstId dest_id,
  237. SemIR::InstId source_id) -> void {
  238. switch (GetInitRepr(type).kind) {
  239. case SemIR::InitRepr::None:
  240. break;
  241. case SemIR::InitRepr::InPlace:
  242. if (sem_ir().constant_values().Get(source_id).is_constant()) {
  243. // When initializing from a constant, emission of the source doesn't
  244. // initialize the destination. Copy the constant value instead.
  245. CopyValue(type, source_id, dest_id);
  246. }
  247. break;
  248. case SemIR::InitRepr::ByCopy:
  249. CopyValue(type, source_id, dest_id);
  250. break;
  251. case SemIR::InitRepr::Incomplete:
  252. CARBON_FATAL("Lowering aggregate initialization of incomplete type {0}",
  253. type.file->types().GetAsInst(type.type_id));
  254. case SemIR::InitRepr::Dependent:
  255. CARBON_FATAL("Lowering aggregate initialization of dependent type {0}",
  256. type.file->types().GetAsInst(type.type_id));
  257. }
  258. }
  259. auto FunctionContext::GetTypeIdOfInst(SemIR::InstId inst_id) -> TypeInFile {
  260. auto [file, type_id] = SemIR::GetTypeOfInstInSpecific(
  261. specific_sem_ir(), specific_id(), sem_ir(), inst_id);
  262. return {.file = file, .type_id = type_id};
  263. }
  264. auto FunctionContext::GetValueRepr(TypeInFile type) -> ValueReprInFile {
  265. ValueReprInFile result = {
  266. .file = type.file,
  267. .repr = SemIR::ValueRepr::ForType(*type.file, type.type_id)};
  268. AddEnumToCurrentFingerprint(result.repr.kind);
  269. AddEnumToCurrentFingerprint(result.repr.aggregate_kind);
  270. return result;
  271. }
  272. auto FunctionContext::GetInitRepr(TypeInFile type) -> SemIR::InitRepr {
  273. auto result = SemIR::InitRepr::ForType(*type.file, type.type_id);
  274. AddEnumToCurrentFingerprint(result.kind);
  275. return result;
  276. }
  277. auto FunctionContext::GetReturnTypeInfo(TypeInFile type)
  278. -> ReturnTypeInfoInFile {
  279. ReturnTypeInfoInFile result = {
  280. .file = type.file,
  281. .info = SemIR::ReturnTypeInfo::ForType(*type.file, type.type_id)};
  282. AddEnumToCurrentFingerprint(result.info.init_repr.kind);
  283. return result;
  284. }
  285. // Given a type used for an LLVM value, return the type that we use to store
  286. // that value in memory. This is the same type unless the type is a
  287. // non-multiple-of-8 integer type, which we explicitly widen to a multiple of 8
  288. // for Clang compatibility and to make our generated IR easier for LLVM to
  289. // handle.
  290. static auto GetWidenedMemoryType(llvm::Type* type) -> llvm::Type* {
  291. if (auto* int_type = dyn_cast<llvm::IntegerType>(type)) {
  292. auto width = llvm::alignToPowerOf2(int_type->getBitWidth(), 8);
  293. if (width != int_type->getBitWidth()) {
  294. return llvm::IntegerType::get(type->getContext(), width);
  295. }
  296. }
  297. return type;
  298. }
  299. auto FunctionContext::LoadObject(TypeInFile type, llvm::Value* addr,
  300. llvm::Twine name) -> llvm::Value* {
  301. auto* llvm_type = GetType(type);
  302. auto* load_type = GetWidenedMemoryType(llvm_type);
  303. // TODO: Include alias and alignment information.
  304. llvm::Value* value = builder().CreateLoad(load_type, addr, name);
  305. if (load_type != llvm_type) {
  306. value = builder().CreateTrunc(value, llvm_type);
  307. }
  308. return value;
  309. }
  310. auto FunctionContext::StoreObject(TypeInFile type, llvm::Value* value,
  311. llvm::Value* addr) -> void {
  312. // TODO: Include alias and alignment information.
  313. auto* llvm_type = GetType(type);
  314. CARBON_CHECK(value->getType() == llvm_type);
  315. // Don't emit a store of `iN` if N is not a multiple of 8. See `LoadObject`.
  316. auto* store_type = GetWidenedMemoryType(llvm_type);
  317. if (store_type != llvm_type) {
  318. // TODO: Should we consider creating a sext if the value is signed?
  319. value = builder().CreateZExt(value, store_type);
  320. }
  321. builder().CreateStore(value, addr);
  322. }
  323. auto FunctionContext::CopyValue(TypeInFile type, SemIR::InstId source_id,
  324. SemIR::InstId dest_id) -> void {
  325. switch (GetValueRepr(type).repr.kind) {
  326. case SemIR::ValueRepr::Unknown:
  327. CARBON_FATAL("Attempt to copy incomplete type");
  328. case SemIR::ValueRepr::Dependent:
  329. CARBON_FATAL("Attempt to copy dependent type");
  330. case SemIR::ValueRepr::None:
  331. break;
  332. case SemIR::ValueRepr::Copy:
  333. StoreObject(type, GetValue(source_id), GetValue(dest_id));
  334. break;
  335. case SemIR::ValueRepr::Pointer:
  336. CopyObject(type, source_id, dest_id);
  337. break;
  338. case SemIR::ValueRepr::Custom:
  339. CARBON_FATAL("TODO: Add support for CopyValue with custom value rep");
  340. }
  341. }
  342. auto FunctionContext::CopyObject(TypeInFile type, SemIR::InstId source_id,
  343. SemIR::InstId dest_id) -> void {
  344. const auto& layout = llvm_module().getDataLayout();
  345. auto* llvm_type = GetType(type);
  346. // TODO: Compute known alignment of the source and destination, which may
  347. // be greater than the alignment computed by LLVM.
  348. auto align = layout.getABITypeAlign(llvm_type);
  349. // TODO: Attach !tbaa.struct metadata indicating which portions of the
  350. // type we actually need to copy and which are padding.
  351. builder().CreateMemCpy(GetValue(dest_id), align, GetValue(source_id), align,
  352. layout.getTypeAllocSize(llvm_type));
  353. }
  354. auto FunctionContext::Inserter::InsertHelper(
  355. llvm::Instruction* inst, const llvm::Twine& name,
  356. llvm::BasicBlock::iterator insert_pt) const -> void {
  357. llvm::StringRef base_name;
  358. llvm::StringRef separator;
  359. if (inst_namer_ && !inst->getType()->isVoidTy()) {
  360. base_name = inst_namer_->GetUnscopedNameFor(inst_id_);
  361. }
  362. if (!base_name.empty() && !name.isTriviallyEmpty()) {
  363. separator = ".";
  364. }
  365. IRBuilderDefaultInserter::InsertHelper(inst, base_name + separator + name,
  366. insert_pt);
  367. }
  368. auto FunctionContext::AddCallToCurrentFingerprint(SemIR::CheckIRId file_id,
  369. SemIR::FunctionId function_id,
  370. SemIR::SpecificId specific_id)
  371. -> void {
  372. if (!function_fingerprint_) {
  373. return;
  374. }
  375. RawStringOstream os;
  376. // TODO: Replace indexes with info that is translation unit independent.
  377. // Using a string that includes the `FunctionId` string and the index to
  378. // avoid possible collisions. This needs revisiting.
  379. os << "file_id" << file_id.index << "\n";
  380. os << "function_id" << function_id.index << "\n";
  381. current_fingerprint_.common_fingerprint.update(os.TakeStr());
  382. // TODO: Replace index with info that is translation unit independent.
  383. if (specific_id.has_value()) {
  384. current_fingerprint_.specific_fingerprint.update(specific_id.index);
  385. // TODO: Uses -1 as delimiter. This needs revisiting.
  386. current_fingerprint_.specific_fingerprint.update(-1);
  387. function_fingerprint_->calls.push_back(specific_id);
  388. }
  389. }
  390. auto FunctionContext::AddIntToCurrentFingerprint(uint64_t value) -> void {
  391. if (!function_fingerprint_) {
  392. return;
  393. }
  394. // TODO: Instead just include the raw bytes of the integer?
  395. RawStringOstream os;
  396. os << value << "\n";
  397. current_fingerprint_.common_fingerprint.update(os.TakeStr());
  398. }
  399. auto FunctionContext::AddTypeToCurrentFingerprint(llvm::Type* type) -> void {
  400. if (!function_fingerprint_ || !type) {
  401. return;
  402. }
  403. RawStringOstream os;
  404. type->print(os);
  405. os << "\n";
  406. current_fingerprint_.common_fingerprint.update(os.TakeStr());
  407. }
  408. auto FunctionContext::AddGlobalToCurrentFingerprint(llvm::Value* global)
  409. -> void {
  410. if (!function_fingerprint_ || !global) {
  411. return;
  412. }
  413. RawStringOstream os;
  414. global->print(os);
  415. os << "\n";
  416. current_fingerprint_.common_fingerprint.update(os.TakeStr());
  417. }
  418. auto FunctionContext::EmitFinalFingerprint() -> void {
  419. if (!function_fingerprint_) {
  420. return;
  421. }
  422. current_fingerprint_.common_fingerprint.final(
  423. function_fingerprint_->common_fingerprint);
  424. current_fingerprint_.specific_fingerprint.final(
  425. function_fingerprint_->specific_fingerprint);
  426. }
  427. } // namespace Carbon::Lower