// Part of the Carbon Language project, under the Apache License v2.0 with LLVM // Exceptions. See /LICENSE for license information. // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception #include "toolchain/sem_ir/file.h" #include "common/check.h" #include "llvm/ADT/STLExtras.h" #include "llvm/ADT/SmallVector.h" #include "toolchain/base/value_store.h" #include "toolchain/base/yaml.h" #include "toolchain/sem_ir/builtin_kind.h" #include "toolchain/sem_ir/ids.h" #include "toolchain/sem_ir/inst.h" #include "toolchain/sem_ir/inst_kind.h" namespace Carbon::SemIR { auto ValueRepr::Print(llvm::raw_ostream& out) const -> void { out << "{kind: "; switch (kind) { case Unknown: out << "unknown"; break; case None: out << "none"; break; case Copy: out << "copy"; break; case Pointer: out << "pointer"; break; case Custom: out << "custom"; break; } out << ", type: " << type_id << "}"; } auto TypeInfo::Print(llvm::raw_ostream& out) const -> void { out << "{inst: " << inst_id << ", value_rep: " << value_repr << "}"; } File::File(SharedValueStores& value_stores) : value_stores_(&value_stores), filename_(""), type_blocks_(allocator_), inst_blocks_(allocator_) { auto builtins_id = cross_ref_irs_.Add(this); CARBON_CHECK(builtins_id == CrossRefIRId::Builtins) << "Builtins must be the first IR, even if self-referential"; // Default entry for InstBlockId::Empty. inst_blocks_.AddDefaultValue(); insts_.Reserve(BuiltinKind::ValidCount); // Error uses a self-referential type so that it's not accidentally treated as // a normal type. Every other builtin is a type, including the // self-referential TypeType. #define CARBON_SEM_IR_BUILTIN_KIND(Name, ...) \ insts_.AddInNoBlock(Builtin{BuiltinKind::Name == BuiltinKind::Error \ ? TypeId::Error \ : TypeId::TypeType, \ BuiltinKind::Name}); #include "toolchain/sem_ir/builtin_kind.def" CARBON_CHECK(insts_.size() == BuiltinKind::ValidCount) << "Builtins should produce " << BuiltinKind::ValidCount << " insts, actual: " << insts_.size(); } File::File(SharedValueStores& value_stores, std::string filename, const File* builtins) : value_stores_(&value_stores), filename_(std::move(filename)), type_blocks_(allocator_), inst_blocks_(allocator_) { CARBON_CHECK(builtins != nullptr); auto builtins_id = cross_ref_irs_.Add(builtins); CARBON_CHECK(builtins_id == CrossRefIRId::Builtins) << "Builtins must be the first IR"; // Default entry for InstBlockId::Empty. inst_blocks_.AddDefaultValue(); // Copy builtins over. insts_.Reserve(BuiltinKind::ValidCount); static constexpr auto BuiltinIR = CrossRefIRId(0); for (auto [i, inst] : llvm::enumerate(builtins->insts_.array_ref())) { // We can reuse builtin type IDs because they're special-cased values. insts_.AddInNoBlock(CrossRef{inst.type_id(), BuiltinIR, SemIR::InstId(i)}); } } auto File::Verify() const -> ErrorOr { // Invariants don't necessarily hold for invalid IR. if (has_errors_) { return Success(); } // Check that every code block has a terminator sequence that appears at the // end of the block. for (const Function& function : functions_.array_ref()) { for (InstBlockId block_id : function.body_block_ids) { TerminatorKind prior_kind = TerminatorKind::NotTerminator; for (InstId inst_id : inst_blocks().Get(block_id)) { TerminatorKind inst_kind = insts().Get(inst_id).kind().terminator_kind(); if (prior_kind == TerminatorKind::Terminator) { return Error(llvm::formatv("Inst {0} in block {1} follows terminator", inst_id, block_id)); } if (prior_kind > inst_kind) { return Error( llvm::formatv("Non-terminator inst {0} in block {1} follows " "terminator sequence", inst_id, block_id)); } prior_kind = inst_kind; } if (prior_kind != TerminatorKind::Terminator) { return Error(llvm::formatv("No terminator in block {0}", block_id)); } } } // TODO: Check that an instruction only references other instructions that are // either global or that dominate it. return Success(); } auto File::OutputYaml(bool include_builtins) const -> Yaml::OutputMapping { return Yaml::OutputMapping([this, include_builtins](Yaml::OutputMapping::Map map) { map.Add("filename", filename_); map.Add("sem_ir", Yaml::OutputMapping([&](Yaml::OutputMapping::Map map) { map.Add("cross_ref_irs_size", Yaml::OutputScalar(cross_ref_irs_.size())); map.Add("functions", functions_.OutputYaml()); map.Add("classes", classes_.OutputYaml()); map.Add("types", types_.OutputYaml()); map.Add("type_blocks", type_blocks_.OutputYaml()); map.Add("insts", Yaml::OutputMapping([&](Yaml::OutputMapping::Map map) { int start = include_builtins ? 0 : BuiltinKind::ValidCount; for (int i : llvm::seq(start, insts_.size())) { auto id = InstId(i); map.Add(PrintToString(id), Yaml::OutputScalar(insts_.Get(id))); } })); map.Add("inst_blocks", inst_blocks_.OutputYaml()); })); }); } // Map an instruction kind representing a type into an integer describing the // precedence of that type's syntax. Higher numbers correspond to higher // precedence. static auto GetTypePrecedence(InstKind kind) -> int { // clang warns on unhandled enum values; clang-tidy is incorrect here. // NOLINTNEXTLINE(bugprone-switch-missing-default-case) switch (kind) { case ArrayType::Kind: case Builtin::Kind: case ClassType::Kind: case NameRef::Kind: case StructType::Kind: case TupleType::Kind: case UnboundElementType::Kind: return 0; case ConstType::Kind: return -1; case PointerType::Kind: return -2; case CrossRef::Kind: // TODO: Once we support stringification of cross-references, we'll need // to determine the precedence of the target of the cross-reference. For // now, all cross-references refer to builtin types from the prelude. return 0; case AddressOf::Kind: case ArrayIndex::Kind: case ArrayInit::Kind: case Assign::Kind: case BaseDecl::Kind: case BindName::Kind: case BindValue::Kind: case BlockArg::Kind: case BoolLiteral::Kind: case BoundMethod::Kind: case Branch::Kind: case BranchIf::Kind: case BranchWithArg::Kind: case Call::Kind: case ClassDecl::Kind: case ClassElementAccess::Kind: case ClassInit::Kind: case Converted::Kind: case Deref::Kind: case FieldDecl::Kind: case FunctionDecl::Kind: case Import::Kind: case InitializeFrom::Kind: case InterfaceDecl::Kind: case IntLiteral::Kind: case LazyImportRef::Kind: case Namespace::Kind: case NoOp::Kind: case Param::Kind: case RealLiteral::Kind: case Return::Kind: case ReturnExpr::Kind: case SelfParam::Kind: case SpliceBlock::Kind: case StringLiteral::Kind: case StructAccess::Kind: case StructTypeField::Kind: case StructLiteral::Kind: case StructInit::Kind: case StructValue::Kind: case Temporary::Kind: case TemporaryStorage::Kind: case TupleAccess::Kind: case TupleIndex::Kind: case TupleLiteral::Kind: case TupleInit::Kind: case TupleValue::Kind: case UnaryOperatorNot::Kind: case ValueAsRef::Kind: case ValueOfInitializer::Kind: case VarStorage::Kind: CARBON_FATAL() << "GetTypePrecedence for non-type inst kind " << kind; } } auto File::StringifyType(TypeId type_id) const -> std::string { return StringifyTypeExpr(types().GetInstId(type_id)); } auto File::StringifyTypeExpr(InstId outer_inst_id) const -> std::string { std::string str; llvm::raw_string_ostream out(str); struct Step { // The instruction to print. InstId inst_id; // The index into inst_id to print. Not used by all types. int index = 0; auto Next() const -> Step { return {.inst_id = inst_id, .index = index + 1}; } }; llvm::SmallVector steps = {{.inst_id = outer_inst_id}}; while (!steps.empty()) { auto step = steps.pop_back_val(); if (!step.inst_id.is_valid()) { out << ""; continue; } // Builtins have designated labels. if (step.inst_id.index < BuiltinKind::ValidCount) { out << BuiltinKind::FromInt(step.inst_id.index).label(); continue; } auto inst = insts().Get(step.inst_id); // clang warns on unhandled enum values; clang-tidy is incorrect here. // NOLINTNEXTLINE(bugprone-switch-missing-default-case) switch (inst.kind()) { case ArrayType::Kind: { auto array = inst.As(); if (step.index == 0) { out << "["; steps.push_back(step.Next()); steps.push_back( {.inst_id = types().GetInstId(array.element_type_id)}); } else if (step.index == 1) { out << "; " << GetArrayBoundValue(array.bound_id) << "]"; } break; } case ClassType::Kind: { auto class_name_id = classes().Get(inst.As().class_id).name_id; out << names().GetFormatted(class_name_id); break; } case ConstType::Kind: { if (step.index == 0) { out << "const "; // Add parentheses if required. auto inner_type_inst_id = types().GetInstId(inst.As().inner_id); if (GetTypePrecedence(insts().Get(inner_type_inst_id).kind()) < GetTypePrecedence(inst.kind())) { out << "("; steps.push_back(step.Next()); } steps.push_back({.inst_id = inner_type_inst_id}); } else if (step.index == 1) { out << ")"; } break; } case NameRef::Kind: { out << names().GetFormatted(inst.As().name_id); break; } case PointerType::Kind: { if (step.index == 0) { steps.push_back(step.Next()); steps.push_back({.inst_id = types().GetInstId( inst.As().pointee_id)}); } else if (step.index == 1) { out << "*"; } break; } case StructType::Kind: { auto refs = inst_blocks().Get(inst.As().fields_id); if (refs.empty()) { out << "{}"; break; } else if (step.index == 0) { out << "{"; } else if (step.index < static_cast(refs.size())) { out << ", "; } else { out << "}"; break; } steps.push_back(step.Next()); steps.push_back({.inst_id = refs[step.index]}); break; } case StructTypeField::Kind: { auto field = inst.As(); out << "." << names().GetFormatted(field.name_id) << ": "; steps.push_back({.inst_id = types().GetInstId(field.field_type_id)}); break; } case TupleType::Kind: { auto refs = type_blocks().Get(inst.As().elements_id); if (refs.empty()) { out << "()"; break; } else if (step.index == 0) { out << "("; } else if (step.index < static_cast(refs.size())) { out << ", "; } else { // A tuple of one element has a comma to disambiguate from an // expression. if (step.index == 1) { out << ","; } out << ")"; break; } steps.push_back(step.Next()); steps.push_back({.inst_id = types().GetInstId(refs[step.index])}); break; } case UnboundElementType::Kind: { if (step.index == 0) { out << "().class_type_id)}); } else { out << ">"; } break; } case AddressOf::Kind: case ArrayIndex::Kind: case ArrayInit::Kind: case Assign::Kind: case BaseDecl::Kind: case BindName::Kind: case BindValue::Kind: case BlockArg::Kind: case BoolLiteral::Kind: case BoundMethod::Kind: case Branch::Kind: case BranchIf::Kind: case BranchWithArg::Kind: case Builtin::Kind: case Call::Kind: case ClassDecl::Kind: case ClassElementAccess::Kind: case ClassInit::Kind: case Converted::Kind: case CrossRef::Kind: case Deref::Kind: case FieldDecl::Kind: case FunctionDecl::Kind: case Import::Kind: case InitializeFrom::Kind: case InterfaceDecl::Kind: case IntLiteral::Kind: case LazyImportRef::Kind: case Namespace::Kind: case NoOp::Kind: case Param::Kind: case RealLiteral::Kind: case Return::Kind: case ReturnExpr::Kind: case SelfParam::Kind: case SpliceBlock::Kind: case StringLiteral::Kind: case StructAccess::Kind: case StructLiteral::Kind: case StructInit::Kind: case StructValue::Kind: case Temporary::Kind: case TemporaryStorage::Kind: case TupleAccess::Kind: case TupleIndex::Kind: case TupleLiteral::Kind: case TupleInit::Kind: case TupleValue::Kind: case UnaryOperatorNot::Kind: case ValueAsRef::Kind: case ValueOfInitializer::Kind: case VarStorage::Kind: // We don't need to handle stringification for instructions that don't // show up in errors, but make it clear what's going on so that it's // clearer when stringification is needed. out << ""; break; } } return str; } auto GetExprCategory(const File& file, InstId inst_id) -> ExprCategory { const File* ir = &file; // The overall expression category if the current instruction is a value // expression. ExprCategory value_category = ExprCategory::Value; while (true) { auto inst = ir->insts().Get(inst_id); // clang warns on unhandled enum values; clang-tidy is incorrect here. // NOLINTNEXTLINE(bugprone-switch-missing-default-case) switch (inst.kind()) { case Assign::Kind: case BaseDecl::Kind: case Branch::Kind: case BranchIf::Kind: case BranchWithArg::Kind: case ClassDecl::Kind: case FieldDecl::Kind: case FunctionDecl::Kind: case Import::Kind: case InterfaceDecl::Kind: case LazyImportRef::Kind: case Namespace::Kind: case NoOp::Kind: case Return::Kind: case ReturnExpr::Kind: case StructTypeField::Kind: return ExprCategory::NotExpr; case CrossRef::Kind: { auto xref = inst.As(); ir = ir->cross_ref_irs().Get(xref.ir_id); inst_id = xref.inst_id; continue; } case NameRef::Kind: { inst_id = inst.As().value_id; continue; } case Converted::Kind: { inst_id = inst.As().result_id; continue; } case AddressOf::Kind: case ArrayType::Kind: case BindValue::Kind: case BlockArg::Kind: case BoolLiteral::Kind: case BoundMethod::Kind: case ClassType::Kind: case ConstType::Kind: case IntLiteral::Kind: case Param::Kind: case PointerType::Kind: case RealLiteral::Kind: case SelfParam::Kind: case StringLiteral::Kind: case StructValue::Kind: case StructType::Kind: case TupleValue::Kind: case TupleType::Kind: case UnaryOperatorNot::Kind: case UnboundElementType::Kind: case ValueOfInitializer::Kind: return value_category; case Builtin::Kind: { if (inst.As().builtin_kind == BuiltinKind::Error) { return ExprCategory::Error; } return value_category; } case BindName::Kind: { inst_id = inst.As().value_id; continue; } case ArrayIndex::Kind: { inst_id = inst.As().array_id; continue; } case ClassElementAccess::Kind: { inst_id = inst.As().base_id; // A value of class type is a pointer to an object representation. // Therefore, if the base is a value, the result is an ephemeral // reference. value_category = ExprCategory::EphemeralRef; continue; } case StructAccess::Kind: { inst_id = inst.As().struct_id; continue; } case TupleAccess::Kind: { inst_id = inst.As().tuple_id; continue; } case TupleIndex::Kind: { inst_id = inst.As().tuple_id; continue; } case SpliceBlock::Kind: { inst_id = inst.As().result_id; continue; } case StructLiteral::Kind: case TupleLiteral::Kind: return ExprCategory::Mixed; case ArrayInit::Kind: case Call::Kind: case InitializeFrom::Kind: case ClassInit::Kind: case StructInit::Kind: case TupleInit::Kind: return ExprCategory::Initializing; case Deref::Kind: case VarStorage::Kind: return ExprCategory::DurableRef; case Temporary::Kind: case TemporaryStorage::Kind: case ValueAsRef::Kind: return ExprCategory::EphemeralRef; } } } auto GetInitRepr(const File& file, TypeId type_id) -> InitRepr { auto value_rep = GetValueRepr(file, type_id); switch (value_rep.kind) { case ValueRepr::None: return {.kind = InitRepr::None}; case ValueRepr::Copy: // TODO: Use in-place initialization for types that have non-trivial // destructive move. return {.kind = InitRepr::ByCopy}; case ValueRepr::Pointer: case ValueRepr::Custom: return {.kind = InitRepr::InPlace}; case ValueRepr::Unknown: CARBON_FATAL() << "Attempting to perform initialization of incomplete type"; } } } // namespace Carbon::SemIR