function_context.cpp 18 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482
  1. // Part of the Carbon Language project, under the Apache License v2.0 with LLVM
  2. // Exceptions. See /LICENSE for license information.
  3. // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
  4. #include "toolchain/lower/function_context.h"
  5. #include "common/pretty_stack_trace_function.h"
  6. #include "common/vlog.h"
  7. #include "toolchain/base/kind_switch.h"
  8. #include "toolchain/sem_ir/diagnostic_loc_converter.h"
  9. #include "toolchain/sem_ir/file.h"
  10. #include "toolchain/sem_ir/generic.h"
  11. namespace Carbon::Lower {
  12. FunctionContext::FunctionContext(
  13. FileContext& file_context, llvm::Function* function,
  14. FileContext& specific_file_context, SemIR::SpecificId specific_id,
  15. SpecificCoalescer::SpecificFunctionFingerprint* function_fingerprint,
  16. llvm::DISubprogram* di_subprogram, llvm::raw_ostream* vlog_stream)
  17. : file_context_(&file_context),
  18. function_(function),
  19. specific_file_context_(&specific_file_context),
  20. specific_id_(specific_id),
  21. builder_(file_context.llvm_context(), llvm::ConstantFolder(),
  22. Inserter(file_context.inst_namer())),
  23. di_subprogram_(di_subprogram),
  24. vlog_stream_(vlog_stream),
  25. function_fingerprint_(function_fingerprint) {
  26. function_->setSubprogram(di_subprogram_);
  27. }
  28. auto FunctionContext::GetBlock(SemIR::InstBlockId block_id)
  29. -> llvm::BasicBlock* {
  30. auto result = blocks_.Insert(block_id, [&] {
  31. llvm::StringRef label_name;
  32. if (const auto* inst_namer = file_context_->inst_namer()) {
  33. label_name = inst_namer->GetUnscopedLabelFor(block_id);
  34. }
  35. return llvm::BasicBlock::Create(llvm_context(), label_name, function_);
  36. });
  37. return result.value();
  38. }
  39. auto FunctionContext::TryToReuseBlock(SemIR::InstBlockId block_id,
  40. llvm::BasicBlock* block) -> bool {
  41. if (!blocks_.Insert(block_id, block).is_inserted()) {
  42. return false;
  43. }
  44. if (block == synthetic_block_) {
  45. synthetic_block_ = nullptr;
  46. }
  47. if (const auto* inst_namer = file_context_->inst_namer()) {
  48. block->setName(inst_namer->GetUnscopedLabelFor(block_id));
  49. }
  50. return true;
  51. }
  52. auto FunctionContext::LowerBlockContents(SemIR::InstBlockId block_id) -> void {
  53. auto inst_id_for_stack_trace = SemIR::InstId::None;
  54. // On crash, report the instruction we were lowering.
  55. PrettyStackTraceFunction stack_trace_entry([&](llvm::raw_ostream& output) {
  56. SemIR::DiagnosticLocConverter converter(
  57. &file_context_->context().tree_and_subtrees_getters(), &sem_ir());
  58. auto converted = converter.Convert(SemIR::LocId(inst_id_for_stack_trace),
  59. /*token_only=*/false);
  60. converted.loc.FormatLocation(output);
  61. // TODO: Format SemIR for the instruction we were lowering?
  62. output << "Lowering "
  63. << sem_ir().insts().Get(inst_id_for_stack_trace).kind().ir_name()
  64. << "\n";
  65. // Crash output has a tab indent; try to indent slightly past that.
  66. converted.loc.FormatSnippet(output, /*indent=*/10);
  67. });
  68. for (auto inst_id : sem_ir().inst_blocks().Get(block_id)) {
  69. inst_id_for_stack_trace = inst_id;
  70. LowerInst(inst_id);
  71. }
  72. }
  73. // Handles typed instructions for LowerInst. Many instructions lower using
  74. // HandleInst, but others are unsupported or have trivial lowering.
  75. //
  76. // This only calls HandleInst for versions that should have implementations. A
  77. // different approach would be to have the logic below implemented as HandleInst
  78. // overloads. However, forward declarations of HandleInst exist for all `InstT`
  79. // types, which would make getting the right overload resolution complex.
  80. template <typename InstT>
  81. static auto LowerInstHelper(FunctionContext& context, SemIR::InstId inst_id,
  82. InstT inst) -> void {
  83. if constexpr (!InstT::Kind.is_lowered()) {
  84. CARBON_FATAL(
  85. "Encountered an instruction that isn't expected to lower. It's "
  86. "possible that logic needs to be changed in order to stop showing this "
  87. "instruction in lowered contexts. Instruction: {0}",
  88. inst);
  89. } else if constexpr (InstT::Kind.constant_kind() ==
  90. SemIR::InstConstantKind::Always ||
  91. InstT::Kind.constant_kind() ==
  92. SemIR::InstConstantKind::AlwaysUnique) {
  93. CARBON_FATAL("Missing constant value for constant instruction {0}", inst);
  94. } else if constexpr (InstT::Kind.is_type() == SemIR::InstIsType::Always) {
  95. // For instructions that are always of type `type`, produce the trivial
  96. // runtime representation of type `type`.
  97. context.SetLocal(inst_id, context.GetTypeAsValue());
  98. } else {
  99. HandleInst(context, inst_id, inst);
  100. }
  101. }
  102. // TODO: Consider renaming Handle##Name, instead relying on typed_inst overload
  103. // resolution. That would allow putting the nonexistent handler implementations
  104. // in `requires`-style overloads.
  105. // NOLINTNEXTLINE(readability-function-size): The define confuses lint.
  106. auto FunctionContext::LowerInst(SemIR::InstId inst_id) -> void {
  107. // Skip over constants. `FileContext::GetGlobal` lowers them as needed.
  108. if (sem_ir().constant_values().Get(inst_id).is_constant()) {
  109. return;
  110. }
  111. auto inst = sem_ir().insts().Get(inst_id);
  112. CARBON_VLOG("Lowering {0}: {1}\n", inst_id, inst);
  113. builder_.getInserter().SetCurrentInstId(inst_id);
  114. auto debug_loc = GetDebugLoc(inst_id);
  115. if (debug_loc) {
  116. builder_.SetCurrentDebugLocation(debug_loc);
  117. }
  118. CARBON_KIND_SWITCH(inst) {
  119. #define CARBON_SEM_IR_INST_KIND(Name) \
  120. case CARBON_KIND(SemIR::Name typed_inst): { \
  121. LowerInstHelper(*this, inst_id, typed_inst); \
  122. break; \
  123. }
  124. #include "toolchain/sem_ir/inst_kind.def"
  125. }
  126. if (debug_loc) {
  127. builder_.SetCurrentDebugLocation(llvm::DebugLoc());
  128. }
  129. builder_.getInserter().SetCurrentInstId(SemIR::InstId::None);
  130. }
  131. auto FunctionContext::GetBlockArg(SemIR::InstBlockId block_id, TypeInFile type)
  132. -> llvm::PHINode* {
  133. llvm::BasicBlock* block = GetBlock(block_id);
  134. // Find the existing phi, if any.
  135. auto phis = block->phis();
  136. if (!phis.empty()) {
  137. CARBON_CHECK(std::next(phis.begin()) == phis.end(),
  138. "Expected at most one phi, found {0}",
  139. std::distance(phis.begin(), phis.end()));
  140. return &*phis.begin();
  141. }
  142. // The number of predecessor slots to reserve.
  143. static constexpr unsigned NumReservedPredecessors = 2;
  144. auto* phi = llvm::PHINode::Create(GetType(type), NumReservedPredecessors);
  145. phi->insertInto(block, block->begin());
  146. return phi;
  147. }
  148. auto FunctionContext::GetValue(SemIR::InstId inst_id) -> llvm::Value* {
  149. // All builtins are types, with the same empty lowered value.
  150. if (SemIR::IsSingletonInstId(inst_id)) {
  151. return GetTypeAsValue();
  152. }
  153. if (auto result = locals_.Lookup(inst_id)) {
  154. return result.value();
  155. }
  156. if (auto result = file_context_->global_variables().Lookup(inst_id)) {
  157. return result.value();
  158. }
  159. auto [const_ir, const_id] = GetConstantValueInSpecific(
  160. specific_sem_ir(), specific_id_, sem_ir(), inst_id);
  161. CARBON_CHECK(const_ir == &sem_ir() || const_ir == &specific_sem_ir());
  162. CARBON_CHECK(const_id.is_concrete(),
  163. "Missing value: {0} {1} in {2} has non-concrete value {3}",
  164. inst_id, sem_ir().insts().Get(inst_id), specific_id_, const_id);
  165. // We can only pass on the InstId if it refers to the file in which the
  166. // constant value was provided.
  167. auto* global = GetFileContext(const_ir).GetConstant(
  168. const_id, const_ir == &sem_ir() ? inst_id : SemIR::InstId::None);
  169. AddGlobalToCurrentFingerprint(global);
  170. return global;
  171. }
  172. auto FunctionContext::MakeSyntheticBlock() -> llvm::BasicBlock* {
  173. synthetic_block_ = llvm::BasicBlock::Create(llvm_context(), "", function_);
  174. return synthetic_block_;
  175. }
  176. auto FunctionContext::CreateAlloca(llvm::Type* type, const llvm::Twine& name)
  177. -> llvm::AllocaInst* {
  178. // Position the first alloca right before the start of the executable code in
  179. // the function.
  180. llvm::AllocaInst* alloca;
  181. {
  182. llvm::IRBuilderBase::InsertPointGuard guard(builder());
  183. auto debug_loc = builder().getCurrentDebugLocation();
  184. if (after_allocas_) {
  185. builder().SetInsertPoint(after_allocas_);
  186. } else {
  187. builder().SetInsertPointPastAllocas(&llvm_function());
  188. }
  189. // IRBuilder tramples over our debug location when setting the insert point,
  190. // so undo that.
  191. builder().SetCurrentDebugLocation(debug_loc);
  192. // Create an alloca for this variable in the entry block.
  193. // TODO: Compute alignment of the type, which may be greater than the
  194. // alignment computed by LLVM.
  195. alloca = builder().CreateAlloca(type, /*ArraySize=*/nullptr, name);
  196. }
  197. // Create a lifetime start intrinsic here to indicate where its scope really
  198. // begins.
  199. builder().CreateLifetimeStart(alloca);
  200. // If we just created the first alloca, there is now definitely at least one
  201. // instruction after it -- there is a lifetime start instruction if nothing
  202. // else. Use that instruction as our insert point for all future allocas.
  203. if (!after_allocas_) {
  204. auto loc = alloca->getIterator();
  205. ++loc;
  206. after_allocas_ = &*loc;
  207. }
  208. // TODO: Create a matching `@llvm.lifetime.end` intrinsic call when the
  209. // variable goes out of scope.
  210. return alloca;
  211. }
  212. auto FunctionContext::GetDebugLoc(SemIR::InstId inst_id) -> llvm::DebugLoc {
  213. if (!di_subprogram_) {
  214. return llvm::DebugLoc();
  215. }
  216. auto loc = file_context_->GetLocForDI(inst_id);
  217. if (loc.filename != di_subprogram_->getFile()->getFilename()) {
  218. // Location is from a different file. We can't represent that directly
  219. // within the scope of this function's subprogram, and we don't want to
  220. // generate a new subprogram, so just discard the location information. This
  221. // happens for thunks when emitting the portion of the thunk that is
  222. // duplicated from the original signature.
  223. //
  224. // TODO: Handle this case better.
  225. if (sem_ir().insts().Is<SemIR::Call>(inst_id)) {
  226. // Return a stub location for calls, because they may be inlineable (an
  227. // LLVM verifier issue).
  228. return llvm::DILocation::get(builder_.getContext(), -1, -1,
  229. di_subprogram_);
  230. }
  231. return llvm::DebugLoc();
  232. }
  233. return llvm::DILocation::get(builder_.getContext(), loc.line_number,
  234. loc.column_number, di_subprogram_);
  235. }
  236. auto FunctionContext::FinishInit(TypeInFile type, SemIR::InstId dest_id,
  237. SemIR::InstId source_id) -> void {
  238. switch (GetInitRepr(type).kind) {
  239. case SemIR::InitRepr::None:
  240. break;
  241. case SemIR::InitRepr::InPlace:
  242. if (sem_ir().constant_values().Get(source_id).is_constant()) {
  243. // When initializing from a constant, emission of the source doesn't
  244. // initialize the destination. Copy the constant value instead.
  245. CopyValue(type, source_id, dest_id);
  246. }
  247. break;
  248. case SemIR::InitRepr::ByCopy:
  249. CopyValue(type, source_id, dest_id);
  250. break;
  251. case SemIR::InitRepr::Incomplete:
  252. CARBON_FATAL("Lowering aggregate initialization of incomplete type {0}",
  253. type.file->types().GetAsInst(type.type_id));
  254. }
  255. }
  256. auto FunctionContext::GetTypeIdOfInst(SemIR::InstId inst_id) -> TypeInFile {
  257. auto [file, type_id] = SemIR::GetTypeOfInstInSpecific(
  258. specific_sem_ir(), specific_id(), sem_ir(), inst_id);
  259. return {.file = file, .type_id = type_id};
  260. }
  261. auto FunctionContext::GetValueRepr(TypeInFile type) -> ValueReprInFile {
  262. ValueReprInFile result = {
  263. .file = type.file,
  264. .repr = SemIR::ValueRepr::ForType(*type.file, type.type_id)};
  265. AddEnumToCurrentFingerprint(result.repr.kind);
  266. AddEnumToCurrentFingerprint(result.repr.aggregate_kind);
  267. return result;
  268. }
  269. auto FunctionContext::GetInitRepr(TypeInFile type) -> SemIR::InitRepr {
  270. auto result = SemIR::InitRepr::ForType(*type.file, type.type_id);
  271. AddEnumToCurrentFingerprint(result.kind);
  272. return result;
  273. }
  274. auto FunctionContext::GetReturnTypeInfo(TypeInFile type)
  275. -> ReturnTypeInfoInFile {
  276. ReturnTypeInfoInFile result = {
  277. .file = type.file,
  278. .info = SemIR::ReturnTypeInfo::ForType(*type.file, type.type_id)};
  279. AddEnumToCurrentFingerprint(result.info.init_repr.kind);
  280. return result;
  281. }
  282. // Given a type used for an LLVM value, return the type that we use to store
  283. // that value in memory. This is the same type unless the type is a
  284. // non-multiple-of-8 integer type, which we explicitly widen to a multiple of 8
  285. // for Clang compatibility and to make our generated IR easier for LLVM to
  286. // handle.
  287. static auto GetWidenedMemoryType(llvm::Type* type) -> llvm::Type* {
  288. if (auto* int_type = dyn_cast<llvm::IntegerType>(type)) {
  289. auto width = llvm::alignToPowerOf2(int_type->getBitWidth(), 8);
  290. if (width != int_type->getBitWidth()) {
  291. return llvm::IntegerType::get(type->getContext(), width);
  292. }
  293. }
  294. return type;
  295. }
  296. auto FunctionContext::LoadObject(TypeInFile type, llvm::Value* addr,
  297. llvm::Twine name) -> llvm::Value* {
  298. auto* llvm_type = GetType(type);
  299. auto* load_type = GetWidenedMemoryType(llvm_type);
  300. // TODO: Include alias and alignment information.
  301. llvm::Value* value = builder().CreateLoad(load_type, addr, name);
  302. if (load_type != llvm_type) {
  303. value = builder().CreateTrunc(value, llvm_type);
  304. }
  305. return value;
  306. }
  307. auto FunctionContext::StoreObject(TypeInFile type, llvm::Value* value,
  308. llvm::Value* addr) -> void {
  309. // TODO: Include alias and alignment information.
  310. auto* llvm_type = GetType(type);
  311. CARBON_CHECK(value->getType() == llvm_type);
  312. // Don't emit a store of `iN` if N is not a multiple of 8. See `LoadObject`.
  313. auto* store_type = GetWidenedMemoryType(llvm_type);
  314. if (store_type != llvm_type) {
  315. // TODO: Should we consider creating a sext if the value is signed?
  316. value = builder().CreateZExt(value, store_type);
  317. }
  318. builder().CreateStore(value, addr);
  319. }
  320. auto FunctionContext::CopyValue(TypeInFile type, SemIR::InstId source_id,
  321. SemIR::InstId dest_id) -> void {
  322. switch (GetValueRepr(type).repr.kind) {
  323. case SemIR::ValueRepr::Unknown:
  324. CARBON_FATAL("Attempt to copy incomplete type");
  325. case SemIR::ValueRepr::None:
  326. break;
  327. case SemIR::ValueRepr::Copy:
  328. StoreObject(type, GetValue(source_id), GetValue(dest_id));
  329. break;
  330. case SemIR::ValueRepr::Pointer:
  331. CopyObject(type, source_id, dest_id);
  332. break;
  333. case SemIR::ValueRepr::Custom:
  334. CARBON_FATAL("TODO: Add support for CopyValue with custom value rep");
  335. }
  336. }
  337. auto FunctionContext::CopyObject(TypeInFile type, SemIR::InstId source_id,
  338. SemIR::InstId dest_id) -> void {
  339. const auto& layout = llvm_module().getDataLayout();
  340. auto* llvm_type = GetType(type);
  341. // TODO: Compute known alignment of the source and destination, which may
  342. // be greater than the alignment computed by LLVM.
  343. auto align = layout.getABITypeAlign(llvm_type);
  344. // TODO: Attach !tbaa.struct metadata indicating which portions of the
  345. // type we actually need to copy and which are padding.
  346. builder().CreateMemCpy(GetValue(dest_id), align, GetValue(source_id), align,
  347. layout.getTypeAllocSize(llvm_type));
  348. }
  349. auto FunctionContext::Inserter::InsertHelper(
  350. llvm::Instruction* inst, const llvm::Twine& name,
  351. llvm::BasicBlock::iterator insert_pt) const -> void {
  352. llvm::StringRef base_name;
  353. llvm::StringRef separator;
  354. if (inst_namer_ && !inst->getType()->isVoidTy()) {
  355. base_name = inst_namer_->GetUnscopedNameFor(inst_id_);
  356. }
  357. if (!base_name.empty() && !name.isTriviallyEmpty()) {
  358. separator = ".";
  359. }
  360. IRBuilderDefaultInserter::InsertHelper(inst, base_name + separator + name,
  361. insert_pt);
  362. }
  363. auto FunctionContext::AddCallToCurrentFingerprint(SemIR::CheckIRId file_id,
  364. SemIR::FunctionId function_id,
  365. SemIR::SpecificId specific_id)
  366. -> void {
  367. if (!function_fingerprint_) {
  368. return;
  369. }
  370. RawStringOstream os;
  371. // TODO: Replace indexes with info that is translation unit independent.
  372. // Using a string that includes the `FunctionId` string and the index to
  373. // avoid possible collisions. This needs revisiting.
  374. os << "file_id" << file_id.index << "\n";
  375. os << "function_id" << function_id.index << "\n";
  376. current_fingerprint_.common_fingerprint.update(os.TakeStr());
  377. // TODO: Replace index with info that is translation unit independent.
  378. if (specific_id.has_value()) {
  379. current_fingerprint_.specific_fingerprint.update(specific_id.index);
  380. // TODO: Uses -1 as delimiter. This needs revisiting.
  381. current_fingerprint_.specific_fingerprint.update(-1);
  382. function_fingerprint_->calls.push_back(specific_id);
  383. }
  384. }
  385. auto FunctionContext::AddIntToCurrentFingerprint(uint64_t value) -> void {
  386. if (!function_fingerprint_) {
  387. return;
  388. }
  389. // TODO: Instead just include the raw bytes of the integer?
  390. RawStringOstream os;
  391. os << value << "\n";
  392. current_fingerprint_.common_fingerprint.update(os.TakeStr());
  393. }
  394. auto FunctionContext::AddTypeToCurrentFingerprint(llvm::Type* type) -> void {
  395. if (!function_fingerprint_ || !type) {
  396. return;
  397. }
  398. RawStringOstream os;
  399. type->print(os);
  400. os << "\n";
  401. current_fingerprint_.common_fingerprint.update(os.TakeStr());
  402. }
  403. auto FunctionContext::AddGlobalToCurrentFingerprint(llvm::Value* global)
  404. -> void {
  405. if (!function_fingerprint_ || !global) {
  406. return;
  407. }
  408. RawStringOstream os;
  409. global->print(os);
  410. os << "\n";
  411. current_fingerprint_.common_fingerprint.update(os.TakeStr());
  412. }
  413. auto FunctionContext::EmitFinalFingerprint() -> void {
  414. if (!function_fingerprint_) {
  415. return;
  416. }
  417. current_fingerprint_.common_fingerprint.final(
  418. function_fingerprint_->common_fingerprint);
  419. current_fingerprint_.specific_fingerprint.final(
  420. function_fingerprint_->specific_fingerprint);
  421. }
  422. } // namespace Carbon::Lower