// Part of the Carbon Language project, under the Apache License v2.0 with LLVM // Exceptions. See /LICENSE for license information. // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception #include "toolchain/check/check_unit.h" #include #include "llvm/ADT/IntrusiveRefCntPtr.h" #include "llvm/ADT/StringRef.h" #include "llvm/Support/VirtualFileSystem.h" #include "toolchain/base/kind_switch.h" #include "toolchain/base/pretty_stack_trace_function.h" #include "toolchain/check/generic.h" #include "toolchain/check/handle.h" #include "toolchain/check/impl.h" #include "toolchain/check/import.h" #include "toolchain/check/import_cpp.h" #include "toolchain/check/import_ref.h" #include "toolchain/check/node_id_traversal.h" namespace Carbon::Check { // Returns the number of imported IRs, to assist in Context construction. static auto GetImportedIRCount(UnitAndImports* unit_and_imports) -> int { int count = 0; for (auto& package_imports : unit_and_imports->package_imports) { count += package_imports.imports.size(); } if (!unit_and_imports->api_for_impl) { // Leave an empty slot for ImportIRId::ApiForImpl. ++count; } return count; } CheckUnit::CheckUnit(UnitAndImports* unit_and_imports, int total_ir_count, llvm::IntrusiveRefCntPtr fs, llvm::raw_ostream* vlog_stream) : unit_and_imports_(unit_and_imports), total_ir_count_(total_ir_count), fs_(std::move(fs)), vlog_stream_(vlog_stream), emitter_(*unit_and_imports_->unit->sem_ir_converter, unit_and_imports_->err_tracker), context_(&emitter_, unit_and_imports_->unit->get_parse_tree_and_subtrees, unit_and_imports_->unit->sem_ir, GetImportedIRCount(unit_and_imports), total_ir_count, vlog_stream) {} auto CheckUnit::Run() -> void { Timings::ScopedTiming timing(unit_and_imports_->unit->timings, "check"); // We can safely mark this as checked at the start. unit_and_imports_->is_checked = true; PrettyStackTraceFunction context_dumper( [&](llvm::raw_ostream& output) { context_.PrintForStackDump(output); }); // Add a block for the file. context_.inst_block_stack().Push(); InitPackageScopeAndImports(); // Eagerly import the impls declared in the api file to prepare to redeclare // them. ImportImplsFromApiFile(context_); if (!ProcessNodeIds()) { context_.sem_ir().set_has_errors(true); return; } CheckRequiredDefinitions(); context_.Finalize(); context_.VerifyOnFinish(); context_.sem_ir().set_has_errors(unit_and_imports_->err_tracker.seen_error()); #ifndef NDEBUG if (auto verify = context_.sem_ir().Verify(); !verify.ok()) { CARBON_FATAL("{0}Built invalid semantics IR: {1}\n", context_.sem_ir(), verify.error()); } #endif } auto CheckUnit::InitPackageScopeAndImports() -> void { // Importing makes many namespaces, so only canonicalize the type once. auto namespace_type_id = context_.GetSingletonType(SemIR::NamespaceType::SingletonInstId); // Define the package scope, with an instruction for `package` expressions to // reference. auto package_scope_id = context_.name_scopes().Add( SemIR::Namespace::PackageInstId, SemIR::NameId::PackageNamespace, SemIR::NameScopeId::None); CARBON_CHECK(package_scope_id == SemIR::NameScopeId::Package); auto package_inst_id = context_.AddInst( Parse::NodeId::None, {.type_id = namespace_type_id, .name_scope_id = SemIR::NameScopeId::Package, .import_id = SemIR::InstId::None}); CARBON_CHECK(package_inst_id == SemIR::Namespace::PackageInstId); // If there is an implicit `api` import, set it first so that it uses the // ImportIRId::ApiForImpl when processed for imports. if (unit_and_imports_->api_for_impl) { const auto& names = context_.parse_tree().packaging_decl()->names; auto import_decl_id = context_.AddInst( names.node_id, {.package_id = SemIR::NameId::ForIdentifier(names.package_id)}); SetApiImportIR(context_, {.decl_id = import_decl_id, .is_export = false, .sem_ir = unit_and_imports_->api_for_impl->unit->sem_ir}); } else { SetApiImportIR(context_, {.decl_id = SemIR::InstId::None, .sem_ir = nullptr}); } // Add import instructions for everything directly imported. Implicit imports // are handled separately. for (auto& package_imports : unit_and_imports_->package_imports) { CARBON_CHECK(!package_imports.import_decl_id.has_value()); package_imports.import_decl_id = context_.AddInst( package_imports.node_id, {.package_id = SemIR::NameId::ForIdentifier( package_imports.package_id)}); } // Process the imports. if (unit_and_imports_->api_for_impl) { ImportApiFile(context_, namespace_type_id, *unit_and_imports_->api_for_impl->unit->sem_ir); } ImportCurrentPackage(package_inst_id, namespace_type_id); CARBON_CHECK(context_.scope_stack().PeekIndex() == ScopeIndex::Package); ImportOtherPackages(namespace_type_id); ImportCppPackages(); } auto CheckUnit::CollectDirectImports( llvm::SmallVector& results, llvm::MutableArrayRef ir_to_result_index, SemIR::InstId import_decl_id, const PackageImports& imports, bool is_local) -> void { for (const auto& import : imports.imports) { const auto& direct_ir = *import.unit_info->unit->sem_ir; auto& index = ir_to_result_index[direct_ir.check_ir_id().index]; if (index != -1) { // This should only happen when doing API imports for an implementation // file. Don't change the entry; is_export doesn't matter. continue; } index = results.size(); results.push_back({.decl_id = import_decl_id, // Only tag exports in API files, ignoring the value in // implementation files. .is_export = is_local && import.names.is_export, .sem_ir = &direct_ir}); } } auto CheckUnit::CollectTransitiveImports(SemIR::InstId import_decl_id, const PackageImports* local_imports, const PackageImports* api_imports) -> llvm::SmallVector { llvm::SmallVector results; // Track whether an IR was imported in full, including `export import`. This // distinguishes from IRs that are indirectly added without all names being // exported to this IR. llvm::SmallVector ir_to_result_index(total_ir_count_, -1); // First add direct imports. This means that if an entity is imported both // directly and indirectly, the import path will reflect the direct import. if (local_imports) { CollectDirectImports(results, ir_to_result_index, import_decl_id, *local_imports, /*is_local=*/true); } if (api_imports) { CollectDirectImports(results, ir_to_result_index, import_decl_id, *api_imports, /*is_local=*/false); } // Loop through direct imports for any indirect exports. The underlying vector // is appended during iteration, so take the size first. const int direct_imports = results.size(); for (int direct_index : llvm::seq(direct_imports)) { bool is_export = results[direct_index].is_export; for (const auto& indirect_ir : results[direct_index].sem_ir->import_irs().array_ref()) { if (!indirect_ir.is_export) { continue; } auto& indirect_index = ir_to_result_index[indirect_ir.sem_ir->check_ir_id().index]; if (indirect_index == -1) { indirect_index = results.size(); // TODO: In the case of a recursive `export import`, this only points at // the outermost import. May want something that better reflects the // recursion. results.push_back({.decl_id = results[direct_index].decl_id, .is_export = is_export, .sem_ir = indirect_ir.sem_ir}); } else if (is_export) { results[indirect_index].is_export = true; } } } return results; } auto CheckUnit::ImportCurrentPackage(SemIR::InstId package_inst_id, SemIR::TypeId namespace_type_id) -> void { // Add imports from the current package. auto import_map_lookup = unit_and_imports_->package_imports_map.Lookup(IdentifierId::None); if (!import_map_lookup) { // Push the scope; there are no names to add. context_.scope_stack().Push(package_inst_id, SemIR::NameScopeId::Package); return; } PackageImports& self_import = unit_and_imports_->package_imports[import_map_lookup.value()]; if (self_import.has_load_error) { context_.name_scopes().Get(SemIR::NameScopeId::Package).set_has_error(); } ImportLibrariesFromCurrentPackage( context_, namespace_type_id, CollectTransitiveImports(self_import.import_decl_id, &self_import, /*api_imports=*/nullptr)); context_.scope_stack().Push( package_inst_id, SemIR::NameScopeId::Package, SemIR::SpecificId::None, context_.name_scopes().Get(SemIR::NameScopeId::Package).has_error()); } auto CheckUnit::ImportOtherPackages(SemIR::TypeId namespace_type_id) -> void { // api_imports_list is initially the size of the current file's imports, // including for API files, for simplicity in iteration. It's only really used // when processing an implementation file, in order to combine the API file // imports. // // For packages imported by the API file, the IdentifierId is the package name // and the index is into the API's import list. Otherwise, the initial // {None, -1} state remains. llvm::SmallVector> api_imports_list; api_imports_list.resize(unit_and_imports_->package_imports.size(), {IdentifierId::None, -1}); // When there's an API file, add the mapping to api_imports_list. if (unit_and_imports_->api_for_impl) { const auto& api_identifiers = unit_and_imports_->api_for_impl->unit->value_stores->identifiers(); auto& impl_identifiers = unit_and_imports_->unit->value_stores->identifiers(); for (auto [api_imports_index, api_imports] : llvm::enumerate(unit_and_imports_->api_for_impl->package_imports)) { // Skip the current package. if (!api_imports.package_id.has_value()) { continue; } // Translate the package ID from the API file to the implementation file. auto impl_package_id = impl_identifiers.Add(api_identifiers.Get(api_imports.package_id)); if (auto lookup = unit_and_imports_->package_imports_map.Lookup(impl_package_id)) { // On a hit, replace the entry to unify the API and implementation // imports. api_imports_list[lookup.value()] = {impl_package_id, api_imports_index}; } else { // On a miss, add the package as API-only. api_imports_list.push_back({impl_package_id, api_imports_index}); } } } for (auto [i, api_imports_entry] : llvm::enumerate(api_imports_list)) { // These variables are updated after figuring out which imports are present. auto import_decl_id = SemIR::InstId::None; IdentifierId package_id = IdentifierId::None; bool has_load_error = false; // Identify the local package imports if present. PackageImports* local_imports = nullptr; if (i < unit_and_imports_->package_imports.size()) { local_imports = &unit_and_imports_->package_imports[i]; if (!local_imports->package_id.has_value()) { // Skip the current package. continue; } import_decl_id = local_imports->import_decl_id; package_id = local_imports->package_id; has_load_error |= local_imports->has_load_error; } // Identify the API package imports if present. PackageImports* api_imports = nullptr; if (api_imports_entry.second != -1) { api_imports = &unit_and_imports_->api_for_impl ->package_imports[api_imports_entry.second]; if (local_imports) { CARBON_CHECK(package_id == api_imports_entry.first); } else { auto import_ir_inst_id = context_.import_ir_insts().Add( {.ir_id = SemIR::ImportIRId::ApiForImpl, .inst_id = api_imports->import_decl_id}); import_decl_id = context_.AddInst(context_.MakeImportedLocAndInst( import_ir_inst_id, {.package_id = SemIR::NameId::ForIdentifier( api_imports_entry.first)})); package_id = api_imports_entry.first; } has_load_error |= api_imports->has_load_error; } // Do the actual import. ImportLibrariesFromOtherPackage( context_, namespace_type_id, import_decl_id, package_id, CollectTransitiveImports(import_decl_id, local_imports, api_imports), has_load_error); } } auto CheckUnit::ImportCppPackages() -> void { const auto& imports = unit_and_imports_->cpp_imports; if (imports.empty()) { return; } llvm::SmallVector> import_pairs; import_pairs.reserve(imports.size()); for (const auto& import : imports) { import_pairs.push_back( {unit_and_imports_->unit->value_stores->string_literal_values().Get( import.library_id), import.node_id}); } ImportCppFiles(context_, unit_and_imports_->unit->sem_ir->filename(), import_pairs, fs_); } // Loops over all nodes in the tree. On some errors, this may return early, // for example if an unrecoverable state is encountered. // NOLINTNEXTLINE(readability-function-size) auto CheckUnit::ProcessNodeIds() -> bool { NodeIdTraversal traversal(context_, vlog_stream_); Parse::NodeId node_id = Parse::NodeId::None; // On crash, report which token we were handling. PrettyStackTraceFunction node_dumper([&](llvm::raw_ostream& output) { const auto& tree = unit_and_imports_->unit->get_parse_tree_and_subtrees(); auto converted = tree.NodeToDiagnosticLoc(node_id, /*token_only=*/false); converted.loc.FormatLocation(output); output << "checking " << context_.parse_tree().node_kind(node_id) << "\n"; // Crash output has a tab indent; try to indent slightly past that. converted.loc.FormatSnippet(output, /*indent=*/10); }); while (auto maybe_node_id = traversal.Next()) { node_id = *maybe_node_id; unit_and_imports_->unit->sem_ir_converter->AdvanceToken( context_.parse_tree().node_token(node_id)); if (context_.parse_tree().node_has_error(node_id)) { context_.TODO(node_id, "handle invalid parse trees in `check`"); return false; } bool result; auto parse_kind = context_.parse_tree().node_kind(node_id); switch (parse_kind) { #define CARBON_PARSE_NODE_KIND(Name) \ case Parse::NodeKind::Name: { \ result = HandleParseNode(context_, Parse::Name##Id(node_id)); \ break; \ } #include "toolchain/parse/node_kind.def" } if (!result) { CARBON_CHECK( unit_and_imports_->err_tracker.seen_error(), "HandleParseNode for `{0}` returned false without diagnosing.", parse_kind); return false; } traversal.Handle(parse_kind); } return true; } auto CheckUnit::CheckRequiredDefinitions() -> void { CARBON_DIAGNOSTIC(MissingDefinitionInImpl, Error, "no definition found for declaration in impl file"); // Note that more required definitions can be added during this loop. for (size_t i = 0; i != context_.definitions_required().size(); ++i) { SemIR::InstId decl_inst_id = context_.definitions_required()[i]; SemIR::Inst decl_inst = context_.insts().Get(decl_inst_id); CARBON_KIND_SWITCH(context_.insts().Get(decl_inst_id)) { case CARBON_KIND(SemIR::ClassDecl class_decl): { if (!context_.classes().Get(class_decl.class_id).is_defined()) { emitter_.Emit(decl_inst_id, MissingDefinitionInImpl); } break; } case CARBON_KIND(SemIR::FunctionDecl function_decl): { if (context_.functions().Get(function_decl.function_id).definition_id == SemIR::InstId::None) { emitter_.Emit(decl_inst_id, MissingDefinitionInImpl); } break; } case CARBON_KIND(SemIR::ImplDecl impl_decl): { auto& impl = context_.impls().Get(impl_decl.impl_id); if (!impl.is_defined()) { FillImplWitnessWithErrors(context_, impl); CARBON_DIAGNOSTIC(ImplMissingDefinition, Error, "impl declared but not defined"); emitter_.Emit(decl_inst_id, ImplMissingDefinition); } break; } case SemIR::InterfaceDecl::Kind: { // TODO: Handle `interface` as well, once we can test it without // triggering // https://github.com/carbon-language/carbon-lang/issues/4071. CARBON_FATAL("TODO: Support interfaces in DiagnoseMissingDefinitions"); } case CARBON_KIND(SemIR::SpecificFunction specific_function): { // TODO: Track a location for the use. In general we may want to track a // list of enclosing locations if this was used from a generic. SemIRLoc use_loc = decl_inst_id; if (!ResolveSpecificDefinition(context_, use_loc, specific_function.specific_id)) { CARBON_DIAGNOSTIC(MissingGenericFunctionDefinition, Error, "use of undefined generic function"); CARBON_DIAGNOSTIC(MissingGenericFunctionDefinitionHere, Note, "generic function declared here"); auto generic_decl_id = context_.generics() .Get(context_.specifics() .Get(specific_function.specific_id) .generic_id) .decl_id; emitter_.Build(decl_inst_id, MissingGenericFunctionDefinition) .Note(generic_decl_id, MissingGenericFunctionDefinitionHere) .Emit(); } break; } default: { CARBON_FATAL("Unexpected inst in definitions_required: {0}", decl_inst); } } } } } // namespace Carbon::Check