| 123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551 |
- // Part of the Carbon Language project, under the Apache License v2.0 with LLVM
- // Exceptions. See /LICENSE for license information.
- // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
- #ifndef CARBON_TOOLCHAIN_CHECK_CONTEXT_H_
- #define CARBON_TOOLCHAIN_CHECK_CONTEXT_H_
- #include <string>
- #include "common/map.h"
- #include "common/ostream.h"
- #include "llvm/ADT/SmallVector.h"
- #include "toolchain/base/canonical_value_store.h"
- #include "toolchain/base/value_store.h"
- #include "toolchain/check/core_identifier.h"
- #include "toolchain/check/cpp/context.h"
- #include "toolchain/check/decl_introducer_state.h"
- #include "toolchain/check/decl_name_stack.h"
- #include "toolchain/check/deferred_definition_worklist.h"
- #include "toolchain/check/diagnostic_helpers.h"
- #include "toolchain/check/full_pattern_stack.h"
- #include "toolchain/check/generic_region_stack.h"
- #include "toolchain/check/global_init.h"
- #include "toolchain/check/inst_block_stack.h"
- #include "toolchain/check/node_stack.h"
- #include "toolchain/check/param_and_arg_refs_stack.h"
- #include "toolchain/check/region_stack.h"
- #include "toolchain/check/require_impls_stack.h"
- #include "toolchain/check/scope_stack.h"
- #include "toolchain/diagnostics/emitter.h"
- #include "toolchain/parse/node_ids.h"
- #include "toolchain/parse/tree.h"
- #include "toolchain/parse/tree_and_subtrees.h"
- #include "toolchain/sem_ir/facet_type_info.h"
- #include "toolchain/sem_ir/file.h"
- #include "toolchain/sem_ir/ids.h"
- #include "toolchain/sem_ir/import_ir.h"
- #include "toolchain/sem_ir/inst.h"
- #include "toolchain/sem_ir/name_scope.h"
- #include "toolchain/sem_ir/specific_interface.h"
- #include "toolchain/sem_ir/typed_insts.h"
- namespace Carbon::Check {
- // Context stored during check.
- //
- // This file stores state, and members objects may provide an API. Other files
- // may also have helpers that operate on Context. To keep this file manageable,
- // please put logic into other files.
- //
- // For example, consider the API for functions:
- // - `context.functions()`: Exposes storage of `SemIR::Function` objects.
- // - `toolchain/check/function.h`: Contains helper functions which use
- // `Check::Context`.
- // - `toolchain/sem_ir/function.h`: Contains helper functions which only need
- // `SemIR` objects, for which it's helpful not to depend on `Check::Context`
- // (for example, shared with lowering).
- class Context {
- public:
- // Stores references for work.
- explicit Context(DiagnosticEmitterBase* emitter,
- Parse::GetTreeAndSubtreesFn tree_and_subtrees_getter,
- SemIR::File* sem_ir, int imported_ir_count,
- int total_ir_count, llvm::raw_ostream* vlog_stream);
- // Marks an implementation TODO. Always returns false.
- auto TODO(SemIR::LocId loc_id, std::string label) -> bool;
- auto TODO(SemIR::InstId loc_inst_id, std::string label) -> bool;
- // Runs verification that the processing cleanly finished.
- auto VerifyOnFinish() const -> void;
- // Prints information for a stack dump.
- auto PrintForStackDump(llvm::raw_ostream& output) const -> void;
- // Get the Lex::TokenKind of a node for diagnostics.
- auto token_kind(Parse::NodeId node_id) -> Lex::TokenKind {
- return tokens().GetKind(parse_tree().node_token(node_id));
- }
- auto emitter() -> DiagnosticEmitterBase& { return *emitter_; }
- auto parse_tree_and_subtrees() -> const Parse::TreeAndSubtrees& {
- return tree_and_subtrees_getter_();
- }
- auto sem_ir() -> SemIR::File& { return *sem_ir_; }
- auto sem_ir() const -> const SemIR::File& { return *sem_ir_; }
- auto cpp_context() -> CppContext* { return cpp_context_.get(); }
- // TODO: Remove this and pass the C++ context to the constructor.
- auto set_cpp_context(std::unique_ptr<CppContext> cpp_context) {
- CARBON_CHECK(!cpp_context_ || !cpp_context, "Already have a C++ context");
- cpp_context_ = std::move(cpp_context);
- }
- // Convenience functions for major phase data.
- auto parse_tree() const -> const Parse::Tree& {
- return sem_ir_->parse_tree();
- }
- auto tokens() const -> const Lex::TokenizedBuffer& {
- return parse_tree().tokens();
- }
- auto vlog_stream() -> llvm::raw_ostream* { return vlog_stream_; }
- auto node_stack() -> NodeStack& { return node_stack_; }
- auto inst_block_stack() -> InstBlockStack& { return inst_block_stack_; }
- auto pattern_block_stack() -> InstBlockStack& { return pattern_block_stack_; }
- auto param_and_arg_refs_stack() -> ParamAndArgRefsStack& {
- return param_and_arg_refs_stack_;
- }
- auto args_type_info_stack() -> InstBlockStack& {
- return args_type_info_stack_;
- }
- auto struct_type_fields_stack() -> ArrayStack<SemIR::StructTypeField>& {
- return struct_type_fields_stack_;
- }
- auto field_decls_stack() -> ArrayStack<SemIR::InstId>& {
- return field_decls_stack_;
- }
- auto require_impls_stack() -> RequireImplsStack& {
- return require_impls_stack_;
- }
- auto decl_name_stack() -> DeclNameStack& { return decl_name_stack_; }
- auto decl_introducer_state_stack() -> DeclIntroducerStateStack& {
- return decl_introducer_state_stack_;
- }
- auto scope_stack() -> ScopeStack& { return scope_stack_; }
- // Convenience functions for frequently-used `scope_stack` members.
- auto break_continue_stack()
- -> llvm::SmallVector<ScopeStack::BreakContinueScope>& {
- return scope_stack().break_continue_stack();
- }
- auto full_pattern_stack() -> FullPatternStack& {
- return scope_stack_.full_pattern_stack();
- }
- auto deferred_definition_worklist() -> DeferredDefinitionWorklist& {
- return deferred_definition_worklist_;
- }
- auto generic_region_stack() -> GenericRegionStack& {
- return generic_region_stack_;
- }
- auto vtable_stack() -> InstBlockStack& { return vtable_stack_; }
- auto exports() -> llvm::SmallVector<SemIR::InstId>& { return exports_; }
- using CheckIRToImportIRStore =
- FixedSizeValueStore<SemIR::CheckIRId, SemIR::ImportIRId>;
- auto check_ir_map() -> CheckIRToImportIRStore& { return check_ir_map_; }
- auto import_ir_constant_values()
- -> llvm::SmallVector<SemIR::ConstantValueStore, 0>& {
- return import_ir_constant_values_;
- }
- auto definitions_required_by_decl() -> llvm::SmallVector<SemIR::InstId>& {
- return definitions_required_by_decl_;
- }
- auto definitions_required_by_use()
- -> llvm::SmallVector<std::pair<SemIR::LocId, SemIR::SpecificId>>& {
- return definitions_required_by_use_;
- }
- auto global_init() -> GlobalInit& { return global_init_; }
- auto imports() -> llvm::SmallVector<SemIR::InstId>& { return imports_; }
- auto generated() -> llvm::SmallVector<SemIR::InstId>& { return generated_; }
- // Pre-computed parts of a binding pattern.
- // TODO: Consider putting this behind a narrower API to guard against emitting
- // multiple times.
- struct BindingPatternInfo {
- // The corresponding AnyBinding inst.
- SemIR::InstId bind_name_id;
- // The region of insts that computes the type of the binding.
- SemIR::ExprRegionId type_expr_region_id;
- };
- auto bind_name_map() -> Map<SemIR::InstId, BindingPatternInfo>& {
- return bind_name_map_;
- }
- auto var_storage_map() -> Map<SemIR::InstId, SemIR::InstId>& {
- return var_storage_map_;
- }
- // During Choice typechecking, each alternative turns into a name binding on
- // the Choice type, but this can't be done until the full Choice type is
- // known. This represents each binding to be done at the end of checking the
- // Choice type.
- struct ChoiceDeferredBinding {
- Parse::NodeIdOneOf<Parse::ChoiceAlternativeListCommaId,
- Parse::ChoiceDefinitionId>
- node_id;
- NameComponent name_component;
- };
- auto choice_deferred_bindings() -> llvm::SmallVector<ChoiceDeferredBinding>& {
- return choice_deferred_bindings_;
- }
- auto region_stack() -> RegionStack& { return region_stack_; }
- // An ongoing impl lookup, used to ensure termination.
- struct ImplLookupStackEntry {
- SemIR::ConstantId query_self_const_id;
- SemIR::ConstantId query_facet_type_const_id;
- // The location of the impl being looked at for the stack entry.
- SemIR::InstId impl_loc = SemIR::InstId::None;
- // TODO: If we make a proper stack class, we only need one `diagnosed_cycle`
- // field, which resets to false when the stack becomes empty.
- bool diagnosed_cycle = false;
- };
- auto impl_lookup_stack() -> llvm::SmallVector<ImplLookupStackEntry>& {
- return impl_lookup_stack_;
- }
- // A map from a (self, interface) pair to a final witness.
- using ImplLookupCacheKey =
- std::pair<SemIR::ConstantId, SemIR::SpecificInterfaceId>;
- using ImplLookupCacheMap = Map<ImplLookupCacheKey, SemIR::ConstantId>;
- auto impl_lookup_cache() -> ImplLookupCacheMap& { return impl_lookup_cache_; }
- // An impl lookup query that resulted in a concrete witness from finding an
- // `impl` declaration (not though a facet value), and its result. Used to look
- // for conflicting `impl` declarations.
- struct PoisonedConcreteImplLookupQuery {
- // The location the LookupImplWitness originated from.
- SemIR::LocId loc_id;
- // The query for a witness of an impl for an interface.
- SemIR::LookupImplWitness query;
- // The resulting final witness.
- SemIR::ConstantId witness_id;
- };
- auto poisoned_concrete_impl_lookup_queries()
- -> llvm::SmallVector<PoisonedConcreteImplLookupQuery>& {
- return poisoned_concrete_impl_lookup_queries_;
- }
- // A stack that tracks the rewrite constraints from a `where` expression being
- // checked. The back of the stack is the currently checked `where` expression.
- auto rewrites_stack()
- -> llvm::SmallVector<Map<SemIR::ConstantId, SemIR::InstId>>& {
- return rewrites_stack_;
- }
- // Data about a form expression.
- //
- // TODO: consider moving this out of Context.
- struct FormExpr {
- static const FormExpr Error;
- // The inst ID of the form expression itself. This is always a form inst,
- // such as InitForm or RefForm.
- // TODO: Consider creating an AnyForm inst category to refer to those insts.
- SemIR::InstId form_inst_id;
- // The inst ID of the form expression's type component.
- SemIR::TypeInstId type_component_inst_id;
- // The type ID corresponding to type_component_id.
- SemIR::TypeId type_component_id;
- };
- // Pushes form_expr onto the stack of return form declarations for in-progress
- // function declarations.
- //
- // Note: the "stack" currently can only have one element, but that restriction
- // can be relaxed if it becomes possible to have multiple pending return type
- // declarations.
- auto PushReturnForm(FormExpr form_expr) -> void {
- CARBON_CHECK(return_form_expr_ == std::nullopt,
- "TODO: make form_expr_ a stack if necessary");
- return_form_expr_ = form_expr;
- }
- // Pops a FormExpr off the stack of return form declarations for in-progress
- // function declarations.
- auto PopReturnForm() -> FormExpr {
- CARBON_CHECK(return_form_expr_ != std::nullopt);
- return *std::exchange(return_form_expr_, std::nullopt);
- }
- auto core_identifiers() -> CoreIdentifierCache& { return core_identifiers_; }
- // --------------------------------------------------------------------------
- // Directly expose SemIR::File data accessors for brevity in calls.
- // --------------------------------------------------------------------------
- auto identifiers() -> SharedValueStores::IdentifierStore& {
- return sem_ir().identifiers();
- }
- auto ints() -> SharedValueStores::IntStore& { return sem_ir().ints(); }
- auto reals() -> SharedValueStores::RealStore& { return sem_ir().reals(); }
- auto floats() -> SharedValueStores::FloatStore& { return sem_ir().floats(); }
- auto string_literal_values() -> SharedValueStores::StringLiteralStore& {
- return sem_ir().string_literal_values();
- }
- auto entity_names() -> SemIR::EntityNameStore& {
- return sem_ir().entity_names();
- }
- auto cpp_global_names() -> SemIR::CppGlobalVarStore& {
- return sem_ir().cpp_global_vars();
- }
- auto cpp_overload_sets() -> SemIR::CppOverloadSetStore& {
- return sem_ir().cpp_overload_sets();
- }
- auto functions() -> SemIR::FunctionStore& { return sem_ir().functions(); }
- auto classes() -> SemIR::ClassStore& { return sem_ir().classes(); }
- auto vtables() -> SemIR::VtableStore& { return sem_ir().vtables(); }
- auto interfaces() -> SemIR::InterfaceStore& { return sem_ir().interfaces(); }
- auto named_constraints() -> SemIR::NamedConstraintStore& {
- return sem_ir().named_constraints();
- }
- auto require_impls() -> SemIR::RequireImplsStore& {
- return sem_ir().require_impls();
- }
- auto require_impls_blocks() -> SemIR::RequireImplsBlockStore& {
- return sem_ir().require_impls_blocks();
- }
- auto associated_constants() -> SemIR::AssociatedConstantStore& {
- return sem_ir().associated_constants();
- }
- auto facet_types() -> SemIR::FacetTypeInfoStore& {
- return sem_ir().facet_types();
- }
- auto identified_facet_types() -> SemIR::IdentifiedFacetTypeStore& {
- return sem_ir().identified_facet_types();
- }
- auto impls() -> SemIR::ImplStore& { return sem_ir().impls(); }
- auto specific_interfaces() -> SemIR::SpecificInterfaceStore& {
- return sem_ir().specific_interfaces();
- }
- auto generics() -> SemIR::GenericStore& { return sem_ir().generics(); }
- auto specifics() -> SemIR::SpecificStore& { return sem_ir().specifics(); }
- auto import_irs() -> SemIR::ImportIRStore& { return sem_ir().import_irs(); }
- auto import_ir_insts() -> SemIR::ImportIRInstStore& {
- return sem_ir().import_ir_insts();
- }
- auto ast_context() -> clang::ASTContext& {
- return cpp_context()->ast_context();
- }
- auto clang_sema() -> clang::Sema& { return cpp_context()->sema(); }
- auto clang_decls() -> SemIR::ClangDeclStore& {
- return sem_ir().clang_decls();
- }
- auto names() -> SemIR::NameStoreWrapper { return sem_ir().names(); }
- auto name_scopes() -> SemIR::NameScopeStore& {
- return sem_ir().name_scopes();
- }
- auto struct_type_fields() -> SemIR::StructTypeFieldsStore& {
- return sem_ir().struct_type_fields();
- }
- auto custom_layouts() -> SemIR::CustomLayoutStore& {
- return sem_ir().custom_layouts();
- }
- auto types() -> SemIR::TypeStore& { return sem_ir().types(); }
- // Instructions should be added with `AddInst` or `AddInstInNoBlock` from
- // `inst.h`. This is `const` to prevent accidental misuse.
- auto insts() const -> const SemIR::InstStore& { return sem_ir().insts(); }
- auto constant_values() -> SemIR::ConstantValueStore& {
- return sem_ir().constant_values();
- }
- auto inst_blocks() -> SemIR::InstBlockStore& {
- return sem_ir().inst_blocks();
- }
- auto constants() -> SemIR::ConstantStore& { return sem_ir().constants(); }
- auto total_ir_count() const -> int { return total_ir_count_; }
- // --------------------------------------------------------------------------
- // End of SemIR::File members.
- // --------------------------------------------------------------------------
- private:
- // Handles diagnostics.
- DiagnosticEmitterBase* emitter_;
- // Returns a lazily constructed TreeAndSubtrees.
- Parse::GetTreeAndSubtreesFn tree_and_subtrees_getter_;
- // The SemIR::File being added to.
- SemIR::File* sem_ir_;
- // The total number of files.
- int total_ir_count_;
- // The C++ checking context.
- std::unique_ptr<CppContext> cpp_context_;
- // Whether to print verbose output.
- llvm::raw_ostream* vlog_stream_;
- // The stack during Build. Will contain file-level parse nodes on return.
- NodeStack node_stack_;
- // The stack of instruction blocks being used for general IR generation.
- InstBlockStack inst_block_stack_;
- // The stack of instruction blocks that contain pattern instructions.
- InstBlockStack pattern_block_stack_;
- // The stack of instruction blocks being used for param and arg ref blocks.
- ParamAndArgRefsStack param_and_arg_refs_stack_;
- // The stack of instruction blocks being used for type information while
- // processing arguments. This is used in parallel with
- // param_and_arg_refs_stack_. It's used for:
- // - Struct literals, where we need to track names for a type separate from
- // the literal arguments.
- // - The associated entries witness table, while parsing an interface.
- InstBlockStack args_type_info_stack_;
- // The stack of StructTypeFields for in-progress StructTypeLiterals.
- ArrayStack<SemIR::StructTypeField> struct_type_fields_stack_;
- // The stack of FieldDecls for in-progress Class definitions.
- ArrayStack<SemIR::InstId> field_decls_stack_;
- // The stack of RequireImpls for in-progress Interface and Constraint
- // definitions.
- RequireImplsStack require_impls_stack_;
- // The stack used for qualified declaration name construction.
- DeclNameStack decl_name_stack_;
- // The stack of declarations that could have modifiers.
- DeclIntroducerStateStack decl_introducer_state_stack_;
- // The stack of scopes we are currently within.
- ScopeStack scope_stack_;
- // The worklist of deferred definition tasks to perform at the end of the
- // enclosing deferred definition scope.
- DeferredDefinitionWorklist deferred_definition_worklist_;
- // The stack of generic regions we are currently within.
- GenericRegionStack generic_region_stack_;
- // Contains a vtable block for each `class` scope which is currently being
- // defined, regardless of whether the class can have virtual functions.
- InstBlockStack vtable_stack_;
- // Instructions which are operands to an `export` directive. This becomes
- // `InstBlockId::Exports`.
- llvm::SmallVector<SemIR::InstId> exports_;
- // Maps CheckIRId to ImportIRId.
- CheckIRToImportIRStore check_ir_map_;
- // Per-import constant values. These refer to the main IR and mainly serve as
- // a lookup table for quick access.
- //
- // Inline 0 elements because it's expected to require heap allocation.
- llvm::SmallVector<SemIR::ConstantValueStore, 0> import_ir_constant_values_;
- // Declaration instructions of entities that should have definitions by the
- // end of the current source file.
- llvm::SmallVector<SemIR::InstId> definitions_required_by_decl_;
- // Entities that should have definitions by the end of the current source
- // file, because of a generic was used a concrete specific. This is currently
- // only tracking specific functions that should have a definition emitted.
- llvm::SmallVector<std::pair<SemIR::LocId, SemIR::SpecificId>>
- definitions_required_by_use_;
- // State for global initialization.
- GlobalInit global_init_;
- // Instructions which are generated as a result of imports; both `ImportRef`s
- // and instructions they generate. For example, when a name reference resolves
- // an imported function, the `ImportRefLoaded` results in a `FunctionDecl`,
- // and both end up here. The `FunctionDecl` shouldn't use the current block on
- // inst_block_stack_ because it's not tied to the referencing scope.
- //
- // This becomes `InstBlockId::Imports`.
- llvm::SmallVector<SemIR::InstId> imports_;
- // Entities which are generated internally to the toolchain, to represent
- // builtin concepts which should be dumped as part of `SemIR`. For example,
- // when doing destruction, the `Destroy.Op` function is generated, and will be
- // found here.
- //
- // This becomes `InstBlockId::Generated`.
- llvm::SmallVector<SemIR::InstId> generated_;
- // Map from an AnyBindingPattern inst to precomputed parts of the
- // pattern-match SemIR for it.
- Map<SemIR::InstId, BindingPatternInfo> bind_name_map_;
- // Map from VarPattern insts to the corresponding VarStorage insts. The
- // VarStorage insts are allocated, emitted, and stored in the map after
- // processing the enclosing full-pattern.
- Map<SemIR::InstId, SemIR::InstId> var_storage_map_;
- // Each alternative in a Choice gets an entry here, they are stored in
- // declaration order. The vector is consumed and emptied at the end of the
- // Choice definition.
- //
- // TODO: This may need to be a stack of vectors if it becomes possible to
- // define a Choice type inside an alternative's parameter set.
- llvm::SmallVector<ChoiceDeferredBinding> choice_deferred_bindings_;
- // Stack of single-entry regions being built.
- RegionStack region_stack_;
- // Tracks all ongoing impl lookups in order to ensure that lookup terminates
- // via the acyclic rule and the termination rule.
- llvm::SmallVector<ImplLookupStackEntry> impl_lookup_stack_;
- // Tracks a mapping from (self, interface) to witness, for queries that had
- // final results.
- ImplLookupCacheMap impl_lookup_cache_;
- // Tracks impl lookup queries that lead to concrete witness results, along
- // with those results. Used to verify that the same queries produce the same
- // results at the end of the file. Any difference is diagnosed.
- llvm::SmallVector<PoisonedConcreteImplLookupQuery>
- poisoned_concrete_impl_lookup_queries_;
- // A map from an ImplWitnessAccess on the LHS of a rewrite constraint to its
- // value on the RHS. Used during checking of a `where` expression to allow
- // constraints to access values from earlier constraints.
- llvm::SmallVector<Map<SemIR::ConstantId, SemIR::InstId>> rewrites_stack_;
- // Declared return form for the in-progress function declaration, if any.
- std::optional<FormExpr> return_form_expr_;
- // See `CoreIdentifierCache` for details.
- CoreIdentifierCache core_identifiers_;
- };
- inline constexpr Context::FormExpr Context::FormExpr::Error = {
- .form_inst_id = SemIR::ErrorInst::InstId,
- .type_component_inst_id = SemIR::ErrorInst::TypeInstId,
- .type_component_id = SemIR::ErrorInst::TypeId};
- } // namespace Carbon::Check
- #endif // CARBON_TOOLCHAIN_CHECK_CONTEXT_H_
|