scope_stack.h 13 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347
  1. // Part of the Carbon Language project, under the Apache License v2.0 with LLVM
  2. // Exceptions. See /LICENSE for license information.
  3. // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
  4. #ifndef CARBON_TOOLCHAIN_CHECK_SCOPE_STACK_H_
  5. #define CARBON_TOOLCHAIN_CHECK_SCOPE_STACK_H_
  6. #include "common/array_stack.h"
  7. #include "common/set.h"
  8. #include "llvm/ADT/SmallVector.h"
  9. #include "toolchain/check/full_pattern_stack.h"
  10. #include "toolchain/check/lexical_lookup.h"
  11. #include "toolchain/check/scope_index.h"
  12. #include "toolchain/sem_ir/file.h"
  13. #include "toolchain/sem_ir/ids.h"
  14. namespace Carbon::Check {
  15. // A stack of lexical and semantic scopes that we are currently performing
  16. // checking within.
  17. class ScopeStack {
  18. public:
  // Constructs a scope stack for `sem_ir`. The pointer is stored and is also
  // dereferenced here to reach the identifier store, so it must be non-null.
  // `full_pattern_stack_` is handed a pointer to `lexical_lookup_`.
  19. explicit ScopeStack(const SemIR::File* sem_ir)
  20. : sem_ir_(sem_ir),
  21. lexical_lookup_(sem_ir->identifiers()),
  22. full_pattern_stack_(&lexical_lookup_) {}
  23. // A scope in which `break` and `continue` can be used.
  24. struct BreakContinueScope {
  25. SemIR::InstBlockId break_target;
  26. SemIR::InstBlockId continue_target;
  27. };
  28. // A non-lexical scope in which unqualified lookup may be required.
  29. struct NonLexicalScope {
  30. // The index of the scope in the scope stack.
  31. ScopeIndex scope_index;
  32. // The corresponding name scope.
  33. SemIR::NameScopeId name_scope_id;
  34. // The corresponding specific.
  35. SemIR::SpecificId specific_id;
  36. };
  37. // Information about a scope that has been temporarily removed from the stack.
  38. struct SuspendedScope;
  39. // Pushes a scope for a declaration name's parameters.
  40. auto PushForDeclName() -> void;
  41. // Pushes a non-function entity scope. Functions must use
  42. // `PushForFunctionBody` instead.
  43. auto PushForEntity(SemIR::InstId scope_inst_id, SemIR::NameScopeId scope_id,
  44. SemIR::SpecificId specific_id,
  45. bool lexical_lookup_has_load_error = false) -> void;
  46. // Pushes a scope which should be in the same region as the current scope.
  47. // These can be in a function without breaking `return` scoping. For example,
  48. // this is used by struct literals and code blocks.
  49. auto PushForSameRegion() -> void;
  50. // Pushes a function scope.
  51. auto PushForFunctionBody(SemIR::InstId scope_inst_id) -> void;
  52. // Pops the top scope from scope_stack_. Removes names from lexical_lookup_.
  53. auto Pop() -> void;
  54. // Pops the top scope from scope_stack_ if it contains no names.
  // Assumes scope_stack_ is non-empty: `back()` is called unconditionally.
  55. auto PopIfEmpty() -> void {
  56. if (scope_stack_.back().num_names == 0) {
  57. Pop();
  58. }
  59. }
  60. // Pops scopes until we return to the specified scope index.
  61. auto PopTo(ScopeIndex index) -> void;
  62. // Returns the scope index associated with the current scope.
  63. auto PeekIndex() const -> ScopeIndex { return Peek().index; }
  64. // Returns the name scope associated with the current lexical scope, if any.
  65. auto PeekNameScopeId() const -> SemIR::NameScopeId { return Peek().scope_id; }
  66. // Returns the instruction associated with the current scope, or `None` if
  67. // there is no such instruction, such as for a block scope.
  68. auto PeekInstId() const -> SemIR::InstId { return Peek().scope_inst_id; }
  69. // Returns the specific associated with the innermost enclosing scope that is
  70. // associated with a specific. This will generally be the self specific of the
  71. // innermost enclosing generic, as there is no way to enter any other specific
  72. // scope.
  73. auto PeekSpecificId() const -> SemIR::SpecificId {
  74. return Peek().specific_id;
  75. }
  76. // Returns true if the current scope is inside a function scope (either the
  77. // scope itself, or a lexical scope), without an intervening entity scope.
  78. auto IsInFunctionScope() const -> bool {
  79. return !return_scope_stack_.empty() &&
  80. !return_scope_stack_.back().nested_scope_index.has_value();
  81. }
  82. // Returns the current scope, if it is of the specified kind. Otherwise,
  83. // returns nullopt.
  84. template <typename InstT>
  85. auto GetCurrentScopeAs() const -> std::optional<InstT> {
  86. auto inst_id = PeekInstId();
  87. if (!inst_id.has_value()) {
  88. return std::nullopt;
  89. }
  90. return sem_ir_->insts().TryGetAs<InstT>(inst_id);
  91. }
  92. // If there is no `returned var` in scope, sets the given instruction to be
  93. // the current `returned var` and returns `None`. If there is already a
  94. // `returned var`, returns it instead.
  95. auto SetReturnedVarOrGetExisting(SemIR::InstId inst_id) -> SemIR::InstId;
  96. // Returns the `returned var` instruction that's currently in scope, or `None`
  97. // if there isn't one.
  98. auto GetReturnedVar() const -> SemIR::InstId {
  99. CARBON_CHECK(IsInFunctionScope(), "Handling return but not in a function");
  100. return return_scope_stack_.back().returned_var;
  101. }
  102. // Returns the decl ID for the current return scope.
  103. auto GetReturnScopeDeclId() const -> SemIR::InstId {
  104. CARBON_CHECK(IsInFunctionScope(), "Handling return but not in a function");
  105. return return_scope_stack_.back().decl_id;
  106. }
  107. // Looks up the name `name_id` in the current scope and enclosing scopes, but
  108. // does not look past `scope_index`. Returns the existing lookup result, if any.
  109. auto LookupInLexicalScopesWithin(SemIR::NameId name_id,
  110. ScopeIndex scope_index) -> SemIR::InstId;
  111. // Looks up the name `name_id` in the current scope and related lexical
  112. // scopes. Returns the innermost lexical lookup result, if any, along with a
  113. // list of non-lexical scopes in which lookup should also be performed,
  114. // ordered from outermost to innermost.
  115. auto LookupInLexicalScopes(SemIR::NameId name_id)
  116. -> std::pair<SemIR::InstId, llvm::ArrayRef<NonLexicalScope>>;
  117. // Looks up the name `name_id` in the current scope, or in `scope_index` if
  118. // specified. Returns the existing instruction if the name is already declared
  119. // in that scope or any unfinished scope within it, and otherwise adds the
  120. // name with the value `target_id` and returns `None`.
  121. auto LookupOrAddName(SemIR::NameId name_id, SemIR::InstId target_id,
  122. ScopeIndex scope_index = ScopeIndex::None)
  123. -> SemIR::InstId;
  124. // Prepares to add a compile-time binding in the current scope, and returns
  125. // its index. The added binding must then be pushed using
  126. // `PushCompileTimeBinding`.
  127. auto AddCompileTimeBinding() -> SemIR::CompileTimeBindIndex {
  128. auto index = scope_stack_.back().next_compile_time_bind_index;
  129. ++scope_stack_.back().next_compile_time_bind_index.index;
  130. return index;
  131. }
  132. // Pushes a compile-time binding into the current scope.
  133. auto PushCompileTimeBinding(SemIR::InstId bind_id) -> void {
  134. compile_time_binding_stack_.AppendToTop(bind_id);
  135. }
  136. // Temporarily removes the top of the stack and its lexical lookup results.
  137. auto Suspend() -> SuspendedScope;
  138. // Restores a suspended scope stack entry.
  139. auto Restore(SuspendedScope scope) -> void;
  140. // Runs verification that the processing cleanly finished.
  141. auto VerifyOnFinish() const -> void;
  // Returns a mutable reference to the stack of `break`/`continue` targets.
  142. auto break_continue_stack() -> llvm::SmallVector<BreakContinueScope>& {
  143. return break_continue_stack_;
  144. }
  // Returns a mutable reference to the stack of `destroy` functions to call.
  145. auto destroy_id_stack() -> ArrayStack<SemIR::InstId>& {
  146. return destroy_id_stack_;
  147. }
  // Returns a mutable reference to the stack of current compile time bindings.
  148. auto compile_time_bindings_stack() -> ArrayStack<SemIR::InstId>& {
  149. return compile_time_binding_stack_;
  150. }
  // Returns the stack of full-patterns currently being checked.
  151. auto full_pattern_stack() -> FullPatternStack& { return full_pattern_stack_; }
  152. private:
  153. // An entry in scope_stack_.
  154. struct ScopeStackEntry {
  // Returns true if this entry has no associated name scope.
  155. auto is_lexical_scope() const -> bool { return !scope_id.has_value(); }
  156. // The sequential index of this scope entry within the file.
  157. ScopeIndex index;
  158. // The instruction associated with this entry, if any. This can be one of:
  159. //
  160. // - A `ClassDecl`, for a class definition scope.
  161. // - A `FunctionDecl`, for the outermost scope in a function
  162. // definition.
  163. // - `None`, for any other scope.
  164. SemIR::InstId scope_inst_id;
  165. // The name scope associated with this entry, if any.
  166. SemIR::NameScopeId scope_id;
  167. // The specific associated with this entry, if any.
  168. SemIR::SpecificId specific_id;
  169. // The next compile-time binding index to allocate in this scope.
  170. SemIR::CompileTimeBindIndex next_compile_time_bind_index;
  171. // Whether lexical_lookup_ has load errors from this scope or an ancestor
  172. // scope.
  173. bool lexical_lookup_has_load_error;
  174. // Whether a `returned var` was introduced in this scope, and needs to be
  175. // unregistered when the scope ends.
  176. bool has_returned_var = false;
  177. // The number of ids in the `names` set; `PopIfEmpty` treats zero as empty.
  178. int num_names = 0;
  179. // Names which are registered with lexical_lookup_, and will need to be
  180. // unregistered when the scope ends.
  181. Set<SemIR::NameId> names = {};
  182. };
  183. // A scope in which `return` can be used.
  184. struct ReturnScope {
  185. // The `FunctionDecl`.
  186. SemIR::InstId decl_id;
  187. // The value corresponding to the current `returned var`, if any. Will be
  188. // set and unset as `returned var`s are declared and go out of scope.
  189. SemIR::InstId returned_var = SemIR::InstId::None;
  190. // When a nested scope interrupts a return scope, this is the index of the
  191. // outermost interrupting scope (the one closest to the function scope).
  192. // This can then be used to determine whether we're actually inside the most
  193. // recent `ReturnScope`, or inside a different entity scope.
  194. //
  195. // This won't be set for functions directly inside functions, because they
  196. // will have their own `ReturnScope`.
  197. // For example, when a `class` is inside a `fn`, it interrupts the function
  198. // body by setting this on `PushForEntity`; `Pop` will set it back to `None`.
  199. ScopeIndex nested_scope_index = ScopeIndex::None;
  200. };
  201. // Pushes a scope onto scope_stack_. NameScopeId::None is used for new scopes.
  202. // lexical_lookup_has_load_error is used to limit diagnostics when a given
  203. // namespace may contain a mix of both successful and failed name imports.
  204. auto Push(SemIR::InstId scope_inst_id, SemIR::NameScopeId scope_id,
  205. SemIR::SpecificId specific_id, bool lexical_lookup_has_load_error)
  206. -> void;
  // Returns the innermost scope entry. Assumes `scope_stack_` is non-empty.
  207. auto Peek() const -> const ScopeStackEntry& { return scope_stack_.back(); }
  208. // Returns whether lexical lookup currently has any load errors.
  209. auto LexicalLookupHasLoadError() const -> bool {
  210. return !scope_stack_.empty() &&
  211. scope_stack_.back().lexical_lookup_has_load_error;
  212. }
  213. // If inside a return scope, marks a nested scope (see `nested_scope_index`).
  214. // Called after pushing the new scope.
  215. auto MarkNestingIfInReturnScope() -> void {
  216. if (!return_scope_stack_.empty() &&
  217. !return_scope_stack_.back().nested_scope_index.has_value()) {
  218. return_scope_stack_.back().nested_scope_index = scope_stack_.back().index;
  219. }
  220. }
  221. // Checks that the provided scope's `next_compile_time_bind_index` matches the
  222. // full size of the current `compile_time_binding_stack_`. The values should
  223. // always match, and this is used to validate the correspondence during
  224. // significant changes.
  225. auto VerifyNextCompileTimeBindIndex(llvm::StringLiteral label,
  226. const ScopeStackEntry& scope) -> void;
  227. // The current file.
  228. const SemIR::File* sem_ir_;
  229. // A stack of scopes from which we can `return`.
  230. llvm::SmallVector<ReturnScope> return_scope_stack_;
  231. // A stack of `break` and `continue` targets.
  232. llvm::SmallVector<BreakContinueScope> break_continue_stack_;
  233. // A stack for scope context.
  234. llvm::SmallVector<ScopeStackEntry> scope_stack_;
  235. // A stack of `destroy` functions to call. This only has entries inside of
  236. // function bodies, where destruction on scope exit is required.
  237. ArrayStack<SemIR::InstId> destroy_id_stack_;
  238. // Information about non-lexical scopes. This is a subset of the entries and
  239. // the information in scope_stack_.
  240. llvm::SmallVector<NonLexicalScope> non_lexical_scope_stack_;
  241. // A stack of the current compile time bindings.
  242. ArrayStack<SemIR::InstId> compile_time_binding_stack_;
  243. // The index of the next scope that will be pushed onto scope_stack_. The
  244. // first is always the package scope.
  245. ScopeIndex next_scope_index_ = ScopeIndex::Package;
  246. // Tracks lexical lookup results.
  247. LexicalLookup lexical_lookup_;
  248. // Stack of full-patterns currently being checked.
  249. FullPatternStack full_pattern_stack_;
  250. };
  // Information about a scope that has been temporarily removed from the stack.
  // Returned by `ScopeStack::Suspend` and accepted by `ScopeStack::Restore`.
  251. struct ScopeStack::SuspendedScope {
  252. // An item that was suspended within this scope. This represents either a
  253. // lexical lookup entry in this scope, or a compile time binding entry in this
  254. // scope.
  255. //
  256. // TODO: For compile-time bindings, the common case is that they will both
  257. // have a suspended lexical lookup entry and a suspended compile time binding
  258. // entry. We should be able to store that as a single ScopeItem rather than
  259. // two.
  260. struct ScopeItem {
  // Sentinel value for `index`; `-1` converts to the maximum `uint32_t`.
  // NOTE(review): presumably marks the item as a compile time binding rather
  // than a lexical lookup entry -- confirm against `Suspend`/`Restore`.
  261. static constexpr uint32_t IndexForCompileTimeBinding = -1;
  262. // The scope index for a LexicalLookup::SuspendedResult, or
  263. // `IndexForCompileTimeBinding` for a suspended compile time binding.
  264. uint32_t index;
  265. // The instruction within the scope.
  266. SemIR::InstId inst_id;
  267. };
  268. // The suspended scope stack entry.
  269. ScopeStackEntry entry;
  270. // The list of items that were within this scope when it was suspended. The
  271. // inline size is an attempt to keep the size of a `SuspendedFunction`
  272. // reasonable while avoiding heap allocations most of the time.
  273. llvm::SmallVector<ScopeItem, 8> suspended_items;
  274. };
  275. } // namespace Carbon::Check
  276. #endif // CARBON_TOOLCHAIN_CHECK_SCOPE_STACK_H_