// scope_stack.h
  1. // Part of the Carbon Language project, under the Apache License v2.0 with LLVM
  2. // Exceptions. See /LICENSE for license information.
  3. // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
  4. #ifndef CARBON_TOOLCHAIN_CHECK_SCOPE_STACK_H_
  5. #define CARBON_TOOLCHAIN_CHECK_SCOPE_STACK_H_
  6. #include "common/array_stack.h"
  7. #include "common/move_only.h"
  8. #include "common/set.h"
  9. #include "llvm/ADT/SmallVector.h"
  10. #include "toolchain/check/full_pattern_stack.h"
  11. #include "toolchain/check/lexical_lookup.h"
  12. #include "toolchain/check/scope_index.h"
  13. #include "toolchain/sem_ir/file.h"
  14. #include "toolchain/sem_ir/ids.h"
  15. namespace Carbon::Check {
  16. // A stack of lexical and semantic scopes that we are currently performing
  17. // checking within.
  18. class ScopeStack {
  19. public:
  20. explicit ScopeStack(const SemIR::File* sem_ir)
  21. : sem_ir_(sem_ir),
  22. lexical_lookup_(sem_ir->identifiers()),
  23. full_pattern_stack_(&lexical_lookup_) {}
  24. // A scope in which `break` and `continue` can be used.
  25. struct BreakContinueScope {
  26. SemIR::InstBlockId break_target;
  27. SemIR::InstBlockId continue_target;
  28. };
  29. // A non-lexical scope in which unqualified lookup may be required.
  30. struct NonLexicalScope {
  31. // The index of the scope in the scope stack.
  32. ScopeIndex scope_index;
  33. // The corresponding name scope.
  34. SemIR::NameScopeId name_scope_id;
  35. // The corresponding specific.
  36. SemIR::SpecificId specific_id;
  37. };
  38. // Information about a scope that has been temporarily removed from the stack.
  39. // This type is large, so moves of this type should be avoided.
  40. struct SuspendedScope;
  41. // Pushes a scope for a declaration name's parameters.
  42. auto PushForDeclName() -> void;
  43. // Pushes a non-function entity scope. Functions must use
  44. // `PushForFunctionBody` instead.
  45. auto PushForEntity(SemIR::InstId scope_inst_id, SemIR::NameScopeId scope_id,
  46. SemIR::SpecificId specific_id,
  47. bool lexical_lookup_has_load_error = false) -> void;
  48. // Pushes a scope which should be in the same region as the current scope.
  49. // These can be in a function without breaking `return` scoping. For example,
  50. // this is used by struct literals and code blocks.
  51. auto PushForSameRegion() -> void;
  52. // Pushes a function scope.
  53. auto PushForFunctionBody(SemIR::InstId scope_inst_id) -> void;
  54. // Pops the top scope from scope_stack_. Removes names from lexical_lookup_.
  55. auto Pop() -> void;
  56. // Pops the top scope from scope_stack_ if it contains no names.
  57. auto PopIfEmpty() -> void {
  58. if (scope_stack_.back().num_names == 0) {
  59. Pop();
  60. }
  61. }
  62. // Pops scopes until we return to the specified scope index.
  63. auto PopTo(ScopeIndex index) -> void;
  64. // Returns the scope index associated with the current scope.
  65. auto PeekIndex() const -> ScopeIndex { return Peek().index; }
  66. // Returns the name scope associated with the current lexical scope, if any.
  67. auto PeekNameScopeId() const -> SemIR::NameScopeId { return Peek().scope_id; }
  68. // Returns the instruction associated with the current scope, or `None` if
  69. // there is no such instruction, such as for a block scope.
  70. auto PeekInstId() const -> SemIR::InstId { return Peek().scope_inst_id; }
  71. // Returns the specific associated with the innermost enclosing scope that is
  72. // associated with a specific. This will generally be the self specific of the
  73. // innermost enclosing generic, as there is no way to enter any other specific
  74. // scope.
  75. auto PeekSpecificId() const -> SemIR::SpecificId {
  76. return Peek().specific_id;
  77. }
  78. // Returns true if the current scope is inside a function scope (either the
  79. // scope itself, or a lexical scope), without an intervening entity scope.
  80. auto IsInFunctionScope() const -> bool {
  81. return !return_scope_stack_.empty() &&
  82. !return_scope_stack_.back().nested_scope_index.has_value();
  83. }
  84. // Returns the current scope, if it is of the specified kind. Otherwise,
  85. // returns nullopt.
  86. template <typename InstT>
  87. auto GetCurrentScopeAs() -> std::optional<InstT> {
  88. auto inst_id = PeekInstId();
  89. if (!inst_id.has_value()) {
  90. return std::nullopt;
  91. }
  92. return sem_ir_->insts().TryGetAs<InstT>(inst_id);
  93. }
  94. // If there is no `returned var` in scope, sets the given instruction to be
  95. // the current `returned var` and returns an `None`. If there
  96. // is already a `returned var`, returns it instead.
  97. auto SetReturnedVarOrGetExisting(SemIR::InstId inst_id) -> SemIR::InstId;
  98. // Returns the `returned var` instruction that's currently in scope, or `None`
  99. // if there isn't one.
  100. auto GetReturnedVar() -> SemIR::InstId {
  101. CARBON_CHECK(IsInFunctionScope(), "Handling return but not in a function");
  102. return return_scope_stack_.back().returned_var;
  103. }
  104. // Returns the decl ID for the current return scope.
  105. auto GetReturnScopeDeclId() -> SemIR::InstId {
  106. CARBON_CHECK(IsInFunctionScope(), "Handling return but not in a function");
  107. return return_scope_stack_.back().decl_id;
  108. }
  109. // Looks up the name `name_id` in the current scope and enclosing scopes, but
  110. // do not look past `scope_index`. Returns the existing lookup result, if any.
  111. auto LookupInLexicalScopesWithin(SemIR::NameId name_id,
  112. ScopeIndex scope_index) -> SemIR::InstId;
  113. // Looks up the name `name_id` in the current scope and related lexical
  114. // scopes. Returns the innermost lexical lookup result, if any, along with a
  115. // list of non-lexical scopes in which lookup should also be performed,
  116. // ordered from outermost to innermost.
  117. auto LookupInLexicalScopes(SemIR::NameId name_id)
  118. -> std::pair<SemIR::InstId, llvm::ArrayRef<NonLexicalScope>>;
  119. // Looks up the name `name_id` in the current scope, or in `scope_index` if
  120. // specified. Returns the existing instruction if the name is already declared
  121. // in that scope or any unfinished scope within it, and otherwise adds the
  122. // name with the value `target_id` and returns `None`.
  123. auto LookupOrAddName(SemIR::NameId name_id, SemIR::InstId target_id,
  124. ScopeIndex scope_index = ScopeIndex::None)
  125. -> SemIR::InstId;
  126. // Prepares to add a compile-time binding in the current scope, and returns
  127. // its index. The added binding must then be pushed using
  128. // `PushCompileTimeBinding`.
  129. auto AddCompileTimeBinding() -> SemIR::CompileTimeBindIndex {
  130. auto index = scope_stack_.back().next_compile_time_bind_index;
  131. ++scope_stack_.back().next_compile_time_bind_index.index;
  132. return index;
  133. }
  134. // Pushes a compile-time binding into the current scope.
  135. auto PushCompileTimeBinding(SemIR::InstId bind_id) -> void {
  136. compile_time_binding_stack_.AppendToTop(bind_id);
  137. }
  138. // Temporarily removes the top of the stack and its lexical lookup results.
  139. auto Suspend() -> SuspendedScope;
  140. // Restores a suspended scope stack entry.
  141. auto Restore(SuspendedScope&& scope) -> void;
  142. // Runs verification that the processing cleanly finished.
  143. auto VerifyOnFinish() const -> void;
  144. auto break_continue_stack() -> llvm::SmallVector<BreakContinueScope>& {
  145. return break_continue_stack_;
  146. }
  147. auto destroy_id_stack() -> ArrayStack<SemIR::InstId>& {
  148. return destroy_id_stack_;
  149. }
  150. auto compile_time_bindings_stack() -> ArrayStack<SemIR::InstId>& {
  151. return compile_time_binding_stack_;
  152. }
  153. auto full_pattern_stack() -> FullPatternStack& { return full_pattern_stack_; }
  154. private:
  155. // An entry in scope_stack_.
  156. struct ScopeStackEntry : public MoveOnly<ScopeStackEntry> {
  157. auto is_lexical_scope() const -> bool { return !scope_id.has_value(); }
  158. // The sequential index of this scope entry within the file.
  159. ScopeIndex index;
  160. // The instruction associated with this entry, if any. This can be one of:
  161. //
  162. // - A `ClassDecl`, for a class definition scope.
  163. // - A `FunctionDecl`, for the outermost scope in a function
  164. // definition.
  165. // - Invalid, for any other scope.
  166. SemIR::InstId scope_inst_id;
  167. // The name scope associated with this entry, if any.
  168. SemIR::NameScopeId scope_id;
  169. // The specific associated with this entry, if any.
  170. SemIR::SpecificId specific_id;
  171. // The next compile-time binding index to allocate in this scope.
  172. SemIR::CompileTimeBindIndex next_compile_time_bind_index;
  173. // Whether lexical_lookup_ has load errors from this scope or an ancestor
  174. // scope.
  175. bool lexical_lookup_has_load_error;
  176. // Whether a `returned var` was introduced in this scope, and needs to be
  177. // unregistered when the scope ends.
  178. bool has_returned_var = false;
  179. // Whether there are any ids in the `names` set.
  180. int num_names = 0;
  181. // Names which are registered with lexical_lookup_, and will need to be
  182. // unregistered when the scope ends.
  183. Set<SemIR::NameId> names = {};
  184. };
  185. // A scope in which `return` can be used.
  186. struct ReturnScope {
  187. // The `FunctionDecl`.
  188. SemIR::InstId decl_id;
  189. // The value corresponding to the current `returned var`, if any. Will be
  190. // set and unset as `returned var`s are declared and go out of scope.
  191. SemIR::InstId returned_var = SemIR::InstId::None;
  192. // When a nested scope interrupts a return scope, this is the index of the
  193. // outermost interrupting scope (the one closest to the function scope).
  194. // This can then be used to determine whether we're actually inside the most
  195. // recent `ReturnScope`, or inside a different entity scope.
  196. //
  197. // This won't be set for functions directly inside functions, because they
  198. // will have their own `ReturnScope`.
  199. // For example, when a `class` is inside a `fn`, it interrupts the function
  200. // body by setting this on `PushEntity`; `Pop` will set it back to `None`.
  201. ScopeIndex nested_scope_index = ScopeIndex::None;
  202. };
  203. // Pushes a scope onto scope_stack_. NameScopeId::None is used for new scopes.
  204. // lexical_lookup_has_load_error is used to limit diagnostics when a given
  205. // namespace may contain a mix of both successful and failed name imports.
  206. auto Push(SemIR::InstId scope_inst_id, SemIR::NameScopeId scope_id,
  207. SemIR::SpecificId specific_id, bool lexical_lookup_has_load_error)
  208. -> void;
  209. auto Peek() const -> const ScopeStackEntry& { return scope_stack_.back(); }
  210. // Returns whether lexical lookup currently has any load errors.
  211. auto LexicalLookupHasLoadError() const -> bool {
  212. return !scope_stack_.empty() &&
  213. scope_stack_.back().lexical_lookup_has_load_error;
  214. }
  215. // If inside a return scope, marks a nested scope (see `nested_scope_index`).
  216. // Called after pushing the new scope.
  217. auto MarkNestingIfInReturnScope() -> void {
  218. if (!return_scope_stack_.empty() &&
  219. !return_scope_stack_.back().nested_scope_index.has_value()) {
  220. return_scope_stack_.back().nested_scope_index = scope_stack_.back().index;
  221. }
  222. }
  223. // Checks that the provided scope's `next_compile_time_bind_index` matches the
  224. // full size of the current `compile_time_binding_stack_`. The values should
  225. // always match, and this is used to validate the correspondence during
  226. // significant changes.
  227. auto VerifyNextCompileTimeBindIndex(llvm::StringLiteral label,
  228. const ScopeStackEntry& scope) -> void;
  229. // The current file.
  230. const SemIR::File* sem_ir_;
  231. // A stack of scopes from which we can `return`.
  232. llvm::SmallVector<ReturnScope> return_scope_stack_;
  233. // A stack of `break` and `continue` targets.
  234. llvm::SmallVector<BreakContinueScope> break_continue_stack_;
  235. // A stack for scope context.
  236. llvm::SmallVector<ScopeStackEntry> scope_stack_;
  237. // A stack of `destroy` functions to call. This only has entries inside of
  238. // function bodies, where destruction on scope exit is required.
  239. ArrayStack<SemIR::InstId> destroy_id_stack_;
  240. // Information about non-lexical scopes. This is a subset of the entries and
  241. // the information in scope_stack_.
  242. llvm::SmallVector<NonLexicalScope> non_lexical_scope_stack_;
  243. // A stack of the current compile time bindings.
  244. ArrayStack<SemIR::InstId> compile_time_binding_stack_;
  245. // The index of the next scope that will be pushed onto scope_stack_. The
  246. // first is always the package scope.
  247. ScopeIndex next_scope_index_ = ScopeIndex::Package;
  248. // Tracks lexical lookup results.
  249. LexicalLookup lexical_lookup_;
  250. // Stack of full-patterns currently being checked.
  251. FullPatternStack full_pattern_stack_;
  252. };
  253. struct ScopeStack::SuspendedScope : public MoveOnly<SuspendedScope> {
  254. // An item that was suspended within this scope. This represents either a
  255. // lexical lookup entry in this scope, or a compile time binding entry in this
  256. // scope.
  257. //
  258. // TODO: For compile-time bindings, the common case is that they will both
  259. // have a suspended lexical lookup entry and a suspended compile time binding
  260. // entry. We should be able to store that as a single ScopeItem rather than
  261. // two.
  262. struct ScopeItem {
  263. static constexpr uint32_t IndexForCompileTimeBinding = -1;
  264. // The scope index for a LexicalLookup::SuspendedResult, or
  265. // CompileTimeBindingIndex for a suspended compile time binding.
  266. uint32_t index;
  267. // The instruction within the scope.
  268. SemIR::InstId inst_id;
  269. };
  270. // The suspended scope stack entry.
  271. ScopeStackEntry entry;
  272. // The list of items that were within this scope when it was suspended. The
  273. // inline size is an attempt to keep the size of a `SuspendedFunction`
  274. // reasonable while avoiding heap allocations most of the time.
  275. llvm::SmallVector<ScopeItem, 8> suspended_items;
  276. };
  277. } // namespace Carbon::Check
  278. #endif // CARBON_TOOLCHAIN_CHECK_SCOPE_STACK_H_