// Part of the Carbon Language project, under the Apache License v2.0 with LLVM // Exceptions. See /LICENSE for license information. // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception #include "toolchain/sem_ir/file.h" #include "common/check.h" #include "llvm/ADT/STLExtras.h" #include "llvm/ADT/SmallVector.h" #include "toolchain/base/kind_switch.h" #include "toolchain/base/value_store.h" #include "toolchain/base/yaml.h" #include "toolchain/parse/node_ids.h" #include "toolchain/sem_ir/builtin_inst_kind.h" #include "toolchain/sem_ir/ids.h" #include "toolchain/sem_ir/inst.h" #include "toolchain/sem_ir/inst_kind.h" #include "toolchain/sem_ir/typed_insts.h" namespace Carbon::SemIR { File::File(CheckIRId check_ir_id, IdentifierId package_id, LibraryNameId library_id, SharedValueStores& value_stores, std::string filename) : check_ir_id_(check_ir_id), package_id_(package_id), library_id_(library_id), value_stores_(&value_stores), filename_(std::move(filename)), type_blocks_(allocator_), name_scopes_(&insts_), constant_values_(ConstantId::NotConstant), inst_blocks_(allocator_), constants_(*this, allocator_) { // `type` and the error type are both complete types. types_.SetValueRepr(TypeId::TypeType, {.kind = ValueRepr::Copy, .type_id = TypeId::TypeType}); types_.SetValueRepr(TypeId::Error, {.kind = ValueRepr::Copy, .type_id = TypeId::Error}); insts_.Reserve(BuiltinInstKind::ValidCount); // Error uses a self-referential type so that it's not accidentally treated as // a normal type. Every other builtin is a type, including the // self-referential TypeType. #define CARBON_SEM_IR_BUILTIN_INST_KIND(Name, ...) \ insts_.AddInNoBlock(LocIdAndInst::NoLoc( \ {.type_id = BuiltinInstKind::Name == BuiltinInstKind::Error \ ? TypeId::Error \ : TypeId::TypeType, \ .builtin_inst_kind = BuiltinInstKind::Name})); #include "toolchain/sem_ir/builtin_inst_kind.def" CARBON_CHECK(insts_.size() == BuiltinInstKind::ValidCount, "Builtins should produce {0} insts, actual: {1}", BuiltinInstKind::ValidCount, insts_.size()); for (auto i : llvm::seq(BuiltinInstKind::ValidCount)) { auto builtin_id = SemIR::InstId(i); constant_values_.Set(builtin_id, SemIR::ConstantId::ForTemplateConstant(builtin_id)); } } auto File::Verify() const -> ErrorOr { // Invariants don't necessarily hold for invalid IR. if (has_errors_) { return Success(); } // Check that every code block has a terminator sequence that appears at the // end of the block. for (const Function& function : functions_.array_ref()) { for (InstBlockId block_id : function.body_block_ids) { TerminatorKind prior_kind = TerminatorKind::NotTerminator; for (InstId inst_id : inst_blocks().Get(block_id)) { TerminatorKind inst_kind = insts().Get(inst_id).kind().terminator_kind(); if (prior_kind == TerminatorKind::Terminator) { return Error(llvm::formatv("Inst {0} in block {1} follows terminator", inst_id, block_id)); } if (prior_kind > inst_kind) { return Error( llvm::formatv("Non-terminator inst {0} in block {1} follows " "terminator sequence", inst_id, block_id)); } prior_kind = inst_kind; } if (prior_kind != TerminatorKind::Terminator) { return Error(llvm::formatv("No terminator in block {0}", block_id)); } } } // TODO: Check that an instruction only references other instructions that are // either global or that dominate it. return Success(); } auto File::OutputYaml(bool include_builtins) const -> Yaml::OutputMapping { return Yaml::OutputMapping([this, include_builtins](Yaml::OutputMapping::Map map) { map.Add("filename", filename_); map.Add( "sem_ir", Yaml::OutputMapping([&](Yaml::OutputMapping::Map map) { map.Add("import_irs", import_irs_.OutputYaml()); map.Add("import_ir_insts", import_ir_insts_.OutputYaml()); map.Add("name_scopes", name_scopes_.OutputYaml()); map.Add("entity_names", entity_names_.OutputYaml()); map.Add("functions", functions_.OutputYaml()); map.Add("classes", classes_.OutputYaml()); map.Add("generics", generics_.OutputYaml()); map.Add("specifics", specifics_.OutputYaml()); map.Add("types", types_.OutputYaml()); map.Add("type_blocks", type_blocks_.OutputYaml()); map.Add( "insts", Yaml::OutputMapping([&](Yaml::OutputMapping::Map map) { int start = include_builtins ? 0 : BuiltinInstKind::ValidCount; for (int i : llvm::seq(start, insts_.size())) { auto id = InstId(i); map.Add(PrintToString(id), Yaml::OutputScalar(insts_.Get(id))); } })); map.Add("constant_values", Yaml::OutputMapping([&](Yaml::OutputMapping::Map map) { int start = include_builtins ? 0 : BuiltinInstKind::ValidCount; for (int i : llvm::seq(start, insts_.size())) { auto id = InstId(i); auto value = constant_values_.Get(id); if (!value.is_valid() || value.is_constant()) { map.Add(PrintToString(id), Yaml::OutputScalar(value)); } } })); map.Add( "symbolic_constants", Yaml::OutputMapping([&](Yaml::OutputMapping::Map map) { for (const auto& [i, symbolic] : llvm::enumerate(constant_values().symbolic_constants())) { map.Add( PrintToString(ConstantId::ForSymbolicConstantIndex(i)), Yaml::OutputScalar(symbolic)); } })); map.Add("inst_blocks", inst_blocks_.OutputYaml()); })); }); } auto File::CollectMemUsage(MemUsage& mem_usage, llvm::StringRef label) const -> void { mem_usage.Add(MemUsage::ConcatLabel(label, "allocator_"), allocator_); mem_usage.Collect(MemUsage::ConcatLabel(label, "entity_names_"), entity_names_); mem_usage.Collect(MemUsage::ConcatLabel(label, "functions_"), functions_); mem_usage.Collect(MemUsage::ConcatLabel(label, "classes_"), classes_); mem_usage.Collect(MemUsage::ConcatLabel(label, "interfaces_"), interfaces_); mem_usage.Collect(MemUsage::ConcatLabel(label, "impls_"), impls_); mem_usage.Collect(MemUsage::ConcatLabel(label, "generics_"), generics_); mem_usage.Collect(MemUsage::ConcatLabel(label, "specifics_"), specifics_); mem_usage.Collect(MemUsage::ConcatLabel(label, "import_irs_"), import_irs_); mem_usage.Collect(MemUsage::ConcatLabel(label, "import_ir_insts_"), import_ir_insts_); mem_usage.Collect(MemUsage::ConcatLabel(label, "type_blocks_"), type_blocks_); mem_usage.Collect(MemUsage::ConcatLabel(label, "insts_"), insts_); mem_usage.Collect(MemUsage::ConcatLabel(label, "name_scopes_"), name_scopes_); mem_usage.Collect(MemUsage::ConcatLabel(label, "constant_values_"), constant_values_); mem_usage.Collect(MemUsage::ConcatLabel(label, "inst_blocks_"), inst_blocks_); mem_usage.Collect(MemUsage::ConcatLabel(label, "constants_"), constants_); mem_usage.Collect(MemUsage::ConcatLabel(label, "types_"), types_); } // Map an instruction kind representing a type into an integer describing the // precedence of that type's syntax. Higher numbers correspond to higher // precedence. static auto GetTypePrecedence(InstKind kind) -> int { CARBON_CHECK(kind.is_type() != InstIsType::Never, "Only called for kinds which can define a type."); if (kind == ConstType::Kind) { return -1; } if (kind == PointerType::Kind) { return -2; } return 0; } // Implements File::StringifyTypeExpr. Static to prevent accidental use of // member functions while traversing IRs. static auto StringifyTypeExprImpl(const SemIR::File& outer_sem_ir, InstId outer_inst_id) { std::string str; llvm::raw_string_ostream out(str); struct Step { // The instruction's file. const File& sem_ir; // The instruction to print. InstId inst_id; // The index into inst_id to print. Not used by all types. int index = 0; auto Next() const -> Step { return {.sem_ir = sem_ir, .inst_id = inst_id, .index = index + 1}; } }; llvm::SmallVector steps = { Step{.sem_ir = outer_sem_ir, .inst_id = outer_inst_id}}; while (!steps.empty()) { auto step = steps.pop_back_val(); if (!step.inst_id.is_valid()) { out << ""; continue; } // Builtins have designated labels. if (step.inst_id.is_builtin()) { out << step.inst_id.builtin_inst_kind().label(); continue; } const auto& sem_ir = step.sem_ir; // Helper for instructions with the current sem_ir. auto push_inst_id = [&](InstId inst_id) { steps.push_back({.sem_ir = sem_ir, .inst_id = inst_id}); }; auto untyped_inst = sem_ir.insts().Get(step.inst_id); CARBON_KIND_SWITCH(untyped_inst) { case CARBON_KIND(ArrayType inst): { if (step.index == 0) { out << "["; steps.push_back(step.Next()); push_inst_id(sem_ir.types().GetInstId(inst.element_type_id)); } else if (step.index == 1) { out << "; " << sem_ir.GetArrayBoundValue(inst.bound_id) << "]"; } break; } case CARBON_KIND(AssociatedEntityType inst): { if (step.index == 0) { out << ""; } break; } case BindAlias::Kind: case BindSymbolicName::Kind: case ExportDecl::Kind: { auto name_id = untyped_inst.As().entity_name_id; out << sem_ir.names().GetFormatted( sem_ir.entity_names().Get(name_id).name_id); break; } case CARBON_KIND(ClassType inst): { auto class_name_id = sem_ir.classes().Get(inst.class_id).name_id; out << sem_ir.names().GetFormatted(class_name_id); break; } case CARBON_KIND(ConstType inst): { if (step.index == 0) { out << "const "; // Add parentheses if required. auto inner_type_inst_id = sem_ir.types().GetInstId(inst.inner_id); if (GetTypePrecedence(sem_ir.insts().Get(inner_type_inst_id).kind()) < GetTypePrecedence(SemIR::ConstType::Kind)) { out << "("; steps.push_back(step.Next()); } push_inst_id(inner_type_inst_id); } else if (step.index == 1) { out << ")"; } break; } case CARBON_KIND(FacetTypeAccess inst): { // Print `T as type` as simply `T`. push_inst_id(inst.facet_id); break; } case CARBON_KIND(FloatType inst): { // TODO: Is this okay? if (step.index == 1) { out << ")"; } else if (auto width_value = sem_ir.insts().TryGetAs(inst.bit_width_id)) { out << "f"; sem_ir.ints().Get(width_value->int_id).print(out, /*isSigned=*/false); } else { out << "Core.Float("; steps.push_back(step.Next()); push_inst_id(inst.bit_width_id); } break; } case CARBON_KIND(FunctionType inst): { auto fn_name_id = sem_ir.functions().Get(inst.function_id).name_id; out << ""; break; } case CARBON_KIND(GenericClassType inst): { auto class_name_id = sem_ir.classes().Get(inst.class_id).name_id; out << ""; break; } case CARBON_KIND(GenericInterfaceType inst): { auto interface_name_id = sem_ir.interfaces().Get(inst.interface_id).name_id; out << ""; break; } case CARBON_KIND(InterfaceType inst): { auto interface_name_id = sem_ir.interfaces().Get(inst.interface_id).name_id; out << sem_ir.names().GetFormatted(interface_name_id); break; } case CARBON_KIND(IntType inst): { if (step.index == 1) { out << ")"; } else if (auto width_value = sem_ir.insts().TryGetAs(inst.bit_width_id)) { out << (inst.int_kind.is_signed() ? "i" : "u"); sem_ir.ints().Get(width_value->int_id).print(out, /*isSigned=*/false); } else { out << (inst.int_kind.is_signed() ? "Core.Int(" : "Core.UInt("); steps.push_back(step.Next()); push_inst_id(inst.bit_width_id); } break; } case CARBON_KIND(NameRef inst): { out << sem_ir.names().GetFormatted(inst.name_id); break; } case CARBON_KIND(PointerType inst): { if (step.index == 0) { steps.push_back(step.Next()); push_inst_id(sem_ir.types().GetInstId(inst.pointee_id)); } else if (step.index == 1) { out << "*"; } break; } case CARBON_KIND(StructType inst): { auto refs = sem_ir.inst_blocks().Get(inst.fields_id); if (refs.empty()) { out << "{}"; break; } else if (step.index == 0) { out << "{"; } else if (step.index < static_cast(refs.size())) { out << ", "; } else { out << "}"; break; } steps.push_back(step.Next()); push_inst_id(refs[step.index]); break; } case CARBON_KIND(StructTypeField inst): { out << "." << sem_ir.names().GetFormatted(inst.name_id) << ": "; push_inst_id(sem_ir.types().GetInstId(inst.field_type_id)); break; } case CARBON_KIND(TupleType inst): { auto refs = sem_ir.type_blocks().Get(inst.elements_id); if (refs.empty()) { out << "()"; break; } else if (step.index == 0) { out << "("; } else if (step.index < static_cast(refs.size())) { out << ", "; } else { // A tuple of one element has a comma to disambiguate from an // expression. if (step.index == 1) { out << ","; } out << ")"; break; } steps.push_back(step.Next()); push_inst_id(sem_ir.types().GetInstId(refs[step.index])); break; } case CARBON_KIND(UnboundElementType inst): { if (step.index == 0) { out << ""; } break; } case AdaptDecl::Kind: case AddrOf::Kind: case AddrPattern::Kind: case ArrayIndex::Kind: case ArrayInit::Kind: case AsCompatible::Kind: case Assign::Kind: case AssociatedConstantDecl::Kind: case AssociatedEntity::Kind: case BaseDecl::Kind: case BindName::Kind: case BindValue::Kind: case BlockArg::Kind: case BoolLiteral::Kind: case BoundMethod::Kind: case Branch::Kind: case BranchIf::Kind: case BranchWithArg::Kind: case BuiltinInst::Kind: case Call::Kind: case ClassDecl::Kind: case ClassElementAccess::Kind: case ClassInit::Kind: case CompleteTypeWitness::Kind: case Converted::Kind: case Deref::Kind: case FieldDecl::Kind: case FloatLiteral::Kind: case FunctionDecl::Kind: case ImplDecl::Kind: case ImportDecl::Kind: case ImportRefLoaded::Kind: case ImportRefUnloaded::Kind: case InitializeFrom::Kind: case SpecificConstant::Kind: case InterfaceDecl::Kind: case InterfaceWitness::Kind: case InterfaceWitnessAccess::Kind: case IntLiteral::Kind: case Namespace::Kind: case Param::Kind: case Return::Kind: case ReturnExpr::Kind: case SpliceBlock::Kind: case StringLiteral::Kind: case StructAccess::Kind: case StructLiteral::Kind: case StructInit::Kind: case StructValue::Kind: case Temporary::Kind: case TemporaryStorage::Kind: case TupleAccess::Kind: case TupleLiteral::Kind: case TupleInit::Kind: case TupleValue::Kind: case UnaryOperatorNot::Kind: case ValueAsRef::Kind: case ValueOfInitializer::Kind: case VarStorage::Kind: // We don't need to handle stringification for instructions that don't // show up in errors, but make it clear what's going on so that it's // clearer when stringification is needed. out << ""; break; } } return str; } auto File::StringifyType(TypeId type_id) const -> std::string { return StringifyTypeExprImpl(*this, types().GetInstId(type_id)); } auto File::StringifyType(ConstantId type_const_id) const -> std::string { return StringifyTypeExprImpl(*this, constant_values().GetInstId(type_const_id)); } auto File::StringifyTypeExpr(InstId outer_inst_id) const -> std::string { return StringifyTypeExprImpl(*this, outer_inst_id); } auto GetExprCategory(const File& file, InstId inst_id) -> ExprCategory { const File* ir = &file; // The overall expression category if the current instruction is a value // expression. ExprCategory value_category = ExprCategory::Value; while (true) { auto untyped_inst = ir->insts().Get(inst_id); CARBON_KIND_SWITCH(untyped_inst) { case AdaptDecl::Kind: case Assign::Kind: case BaseDecl::Kind: case Branch::Kind: case BranchIf::Kind: case BranchWithArg::Kind: case FieldDecl::Kind: case FunctionDecl::Kind: case ImplDecl::Kind: case Namespace::Kind: case Return::Kind: case ReturnExpr::Kind: case StructTypeField::Kind: return ExprCategory::NotExpr; case ImportRefUnloaded::Kind: case ImportRefLoaded::Kind: { auto import_ir_inst = ir->import_ir_insts().Get( untyped_inst.As().import_ir_inst_id); ir = ir->import_irs().Get(import_ir_inst.ir_id).sem_ir; inst_id = import_ir_inst.inst_id; continue; } case CARBON_KIND(AsCompatible inst): { inst_id = inst.source_id; continue; } case CARBON_KIND(BindAlias inst): { inst_id = inst.value_id; continue; } case CARBON_KIND(ExportDecl inst): { inst_id = inst.value_id; continue; } case CARBON_KIND(NameRef inst): { inst_id = inst.value_id; continue; } case CARBON_KIND(Converted inst): { inst_id = inst.result_id; continue; } case CARBON_KIND(SpecificConstant inst): { inst_id = inst.inst_id; continue; } case AddrOf::Kind: case AddrPattern::Kind: case ArrayType::Kind: case AssociatedConstantDecl::Kind: case AssociatedEntity::Kind: case AssociatedEntityType::Kind: case BindSymbolicName::Kind: case BindValue::Kind: case BlockArg::Kind: case BoolLiteral::Kind: case BoundMethod::Kind: case ClassDecl::Kind: case ClassType::Kind: case CompleteTypeWitness::Kind: case ConstType::Kind: case FacetTypeAccess::Kind: case FloatLiteral::Kind: case FloatType::Kind: case FunctionType::Kind: case GenericClassType::Kind: case GenericInterfaceType::Kind: case ImportDecl::Kind: case InterfaceDecl::Kind: case InterfaceType::Kind: case InterfaceWitness::Kind: case InterfaceWitnessAccess::Kind: case IntLiteral::Kind: case IntType::Kind: case Param::Kind: case PointerType::Kind: case StringLiteral::Kind: case StructValue::Kind: case StructType::Kind: case TupleValue::Kind: case TupleType::Kind: case UnaryOperatorNot::Kind: case UnboundElementType::Kind: case ValueOfInitializer::Kind: return value_category; case CARBON_KIND(BuiltinInst inst): { if (inst.builtin_inst_kind == BuiltinInstKind::Error) { return ExprCategory::Error; } return value_category; } case CARBON_KIND(BindName inst): { inst_id = inst.value_id; continue; } case CARBON_KIND(ArrayIndex inst): { inst_id = inst.array_id; continue; } case CARBON_KIND(ClassElementAccess inst): { inst_id = inst.base_id; // A value of class type is a pointer to an object representation. // Therefore, if the base is a value, the result is an ephemeral // reference. value_category = ExprCategory::EphemeralRef; continue; } case CARBON_KIND(StructAccess inst): { inst_id = inst.struct_id; continue; } case CARBON_KIND(TupleAccess inst): { inst_id = inst.tuple_id; continue; } case CARBON_KIND(SpliceBlock inst): { inst_id = inst.result_id; continue; } case StructLiteral::Kind: case TupleLiteral::Kind: return ExprCategory::Mixed; case ArrayInit::Kind: case Call::Kind: case InitializeFrom::Kind: case ClassInit::Kind: case StructInit::Kind: case TupleInit::Kind: return ExprCategory::Initializing; case Deref::Kind: case VarStorage::Kind: return ExprCategory::DurableRef; case Temporary::Kind: case TemporaryStorage::Kind: case ValueAsRef::Kind: return ExprCategory::EphemeralRef; } } } } // namespace Carbon::SemIR