scope_stack.h 10 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278
// Part of the Carbon Language project, under the Apache License v2.0 with LLVM
// Exceptions. See /LICENSE for license information.
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
  4. #ifndef CARBON_TOOLCHAIN_CHECK_SCOPE_STACK_H_
  5. #define CARBON_TOOLCHAIN_CHECK_SCOPE_STACK_H_
  6. #include "common/array_stack.h"
  7. #include "common/set.h"
  8. #include "llvm/ADT/SmallVector.h"
  9. #include "toolchain/check/lexical_lookup.h"
  10. #include "toolchain/check/scope_index.h"
  11. #include "toolchain/sem_ir/file.h"
  12. #include "toolchain/sem_ir/ids.h"
  13. namespace Carbon::Check {
  14. // A stack of lexical and semantic scopes that we are currently performing
  15. // checking within.
  16. class ScopeStack {
  17. public:
  18. explicit ScopeStack(const CanonicalValueStore<IdentifierId>& identifiers)
  19. : lexical_lookup_(identifiers) {}
  20. // A scope in which `break` and `continue` can be used.
  21. struct BreakContinueScope {
  22. SemIR::InstBlockId break_target;
  23. SemIR::InstBlockId continue_target;
  24. };
  25. // A scope in which `return` can be used.
  26. struct ReturnScope {
  27. // The declaration from which we can return. Inside a function, this will
  28. // be a `FunctionDecl`.
  29. SemIR::InstId decl_id;
  30. // The value corresponding to the current `returned var`, if any. Will be
  31. // set and unset as `returned var`s are declared and go out of scope.
  32. SemIR::InstId returned_var = SemIR::InstId::Invalid;
  33. };
  34. // A non-lexical scope in which unqualified lookup may be required.
  35. struct NonLexicalScope {
  36. // The index of the scope in the scope stack.
  37. ScopeIndex scope_index;
  38. // The corresponding name scope.
  39. SemIR::NameScopeId name_scope_id;
  40. // The corresponding specific.
  41. SemIR::SpecificId specific_id;
  42. };
  43. // Information about a scope that has been temporarily removed from the stack.
  44. struct SuspendedScope;
  45. // Pushes a scope onto scope_stack_. NameScopeId::Invalid is used for new
  46. // scopes. lexical_lookup_has_load_error is used to limit diagnostics when a
  47. // given namespace may contain a mix of both successful and failed name
  48. // imports.
  49. auto Push(SemIR::InstId scope_inst_id = SemIR::InstId::Invalid,
  50. SemIR::NameScopeId scope_id = SemIR::NameScopeId::Invalid,
  51. SemIR::SpecificId specific_id = SemIR::SpecificId::Invalid,
  52. bool lexical_lookup_has_load_error = false) -> void;
  53. // Pops the top scope from scope_stack_, cleaning up names from
  54. // lexical_lookup_.
  55. auto Pop() -> void;
  56. // Pops the top scope from scope_stack_ if it contains no names.
  57. auto PopIfEmpty() -> void {
  58. if (scope_stack_.back().num_names == 0) {
  59. Pop();
  60. }
  61. }
  62. // Pops scopes until we return to the specified scope index.
  63. auto PopTo(ScopeIndex index) -> void;
  64. // Returns the scope index associated with the current scope.
  65. auto PeekIndex() const -> ScopeIndex { return Peek().index; }
  66. // Returns the name scope associated with the current lexical scope, if any.
  67. auto PeekNameScopeId() const -> SemIR::NameScopeId { return Peek().scope_id; }
  68. // Returns the instruction associated with the current scope, or Invalid if
  69. // there is no such instruction, such as for a block scope.
  70. auto PeekInstId() const -> SemIR::InstId { return Peek().scope_inst_id; }
  71. // Returns the specific associated with the innermost enclosing scope that is
  72. // associated with a specific. This will generally be the self specific of the
  73. // innermost enclosing generic, as there is no way to enter any other specific
  74. // scope.
  75. auto PeekSpecificId() const -> SemIR::SpecificId {
  76. return Peek().specific_id;
  77. }
  78. // Returns the current scope, if it is of the specified kind. Otherwise,
  79. // returns nullopt.
  80. template <typename InstT>
  81. auto GetCurrentScopeAs(const SemIR::File& sem_ir) -> std::optional<InstT> {
  82. auto inst_id = PeekInstId();
  83. if (!inst_id.is_valid()) {
  84. return std::nullopt;
  85. }
  86. return sem_ir.insts().TryGetAs<InstT>(inst_id);
  87. }
  88. // If there is no `returned var` in scope, sets the given instruction to be
  89. // the current `returned var` and returns an invalid instruction ID. If there
  90. // is already a `returned var`, returns it instead.
  91. auto SetReturnedVarOrGetExisting(SemIR::InstId inst_id) -> SemIR::InstId;
  92. // Looks up the name `name_id` in the current scope and enclosing scopes, but
  93. // do not look past `scope_index`. Returns the existing lookup result, if any.
  94. auto LookupInLexicalScopesWithin(SemIR::NameId name_id,
  95. ScopeIndex scope_index) -> SemIR::InstId;
  96. // Looks up the name `name_id` in the current scope and related lexical
  97. // scopes. Returns the innermost lexical lookup result, if any, along with a
  98. // list of non-lexical scopes in which lookup should also be performed,
  99. // ordered from outermost to innermost.
  100. auto LookupInLexicalScopes(SemIR::NameId name_id)
  101. -> std::pair<SemIR::InstId, llvm::ArrayRef<NonLexicalScope>>;
  102. // Looks up the name `name_id` in the current scope, or in `scope_index` if
  103. // specified. Returns the existing instruction if the name is already declared
  104. // in that scope or any unfinished scope within it, and otherwise adds the
  105. // name with the value `target_id` and returns Invalid.
  106. auto LookupOrAddName(SemIR::NameId name_id, SemIR::InstId target_id,
  107. ScopeIndex scope_index = ScopeIndex::Invalid)
  108. -> SemIR::InstId;
  109. // Prepares to add a compile-time binding in the current scope, and returns
  110. // its index. The added binding must then be pushed using
  111. // `PushCompileTimeBinding`.
  112. auto AddCompileTimeBinding() -> SemIR::CompileTimeBindIndex {
  113. auto index = scope_stack_.back().next_compile_time_bind_index;
  114. ++scope_stack_.back().next_compile_time_bind_index.index;
  115. return index;
  116. }
  117. // Pushes a compile-time binding into the current scope.
  118. auto PushCompileTimeBinding(SemIR::InstId bind_id) -> void {
  119. compile_time_binding_stack_.AppendToTop(bind_id);
  120. }
  121. // Temporarily removes the top of the stack and its lexical lookup results.
  122. auto Suspend() -> SuspendedScope;
  123. // Restores a suspended scope stack entry.
  124. auto Restore(SuspendedScope scope) -> void;
  125. // Runs verification that the processing cleanly finished.
  126. auto VerifyOnFinish() -> void;
  127. auto return_scope_stack() -> llvm::SmallVector<ReturnScope>& {
  128. return return_scope_stack_;
  129. }
  130. auto break_continue_stack() -> llvm::SmallVector<BreakContinueScope>& {
  131. return break_continue_stack_;
  132. }
  133. auto compile_time_bindings_stack() -> ArrayStack<SemIR::InstId>& {
  134. return compile_time_binding_stack_;
  135. }
  136. private:
  137. // An entry in scope_stack_.
  138. struct ScopeStackEntry {
  139. // The sequential index of this scope entry within the file.
  140. ScopeIndex index;
  141. // The instruction associated with this entry, if any. This can be one of:
  142. //
  143. // - A `ClassDecl`, for a class definition scope.
  144. // - A `FunctionDecl`, for the outermost scope in a function
  145. // definition.
  146. // - Invalid, for any other scope.
  147. SemIR::InstId scope_inst_id;
  148. // The name scope associated with this entry, if any.
  149. SemIR::NameScopeId scope_id;
  150. // The specific associated with this entry, if any.
  151. SemIR::SpecificId specific_id;
  152. // The next compile-time binding index to allocate in this scope.
  153. SemIR::CompileTimeBindIndex next_compile_time_bind_index;
  154. // Whether lexical_lookup_ has load errors from this scope or an ancestor
  155. // scope.
  156. bool lexical_lookup_has_load_error;
  157. // Whether a `returned var` was introduced in this scope, and needs to be
  158. // unregistered when the scope ends.
  159. bool has_returned_var = false;
  160. // Whether there are any ids in the `names` set.
  161. int num_names = 0;
  162. // Names which are registered with lexical_lookup_, and will need to be
  163. // unregistered when the scope ends.
  164. Set<SemIR::NameId> names = {};
  165. // TODO: This likely needs to track things which need to be destructed.
  166. };
  167. auto Peek() const -> const ScopeStackEntry& { return scope_stack_.back(); }
  168. // Returns whether lexical lookup currently has any load errors.
  169. auto LexicalLookupHasLoadError() const -> bool {
  170. return !scope_stack_.empty() &&
  171. scope_stack_.back().lexical_lookup_has_load_error;
  172. }
  173. // Checks that the provided scope's `next_compile_time_bind_index` matches the
  174. // full size of the current `compile_time_binding_stack_`. The values should
  175. // always match, and this is used to validate the correspondence during
  176. // significant changes.
  177. auto VerifyNextCompileTimeBindIndex(llvm::StringLiteral label,
  178. const ScopeStackEntry& scope) -> void;
  179. // A stack of scopes from which we can `return`.
  180. llvm::SmallVector<ReturnScope> return_scope_stack_;
  181. // A stack of `break` and `continue` targets.
  182. llvm::SmallVector<BreakContinueScope> break_continue_stack_;
  183. // A stack for scope context.
  184. llvm::SmallVector<ScopeStackEntry> scope_stack_;
  185. // Information about non-lexical scopes. This is a subset of the entries and
  186. // the information in scope_stack_.
  187. llvm::SmallVector<NonLexicalScope> non_lexical_scope_stack_;
  188. // A stack of the current compile time bindings.
  189. ArrayStack<SemIR::InstId> compile_time_binding_stack_;
  190. // The index of the next scope that will be pushed onto scope_stack_. The
  191. // first is always the package scope.
  192. ScopeIndex next_scope_index_ = ScopeIndex::Package;
  193. // Tracks lexical lookup results.
  194. LexicalLookup lexical_lookup_;
  195. };
  196. struct ScopeStack::SuspendedScope {
  197. // An item that was suspended within this scope. This represents either a
  198. // lexical lookup entry in this scope, or a compile time binding entry in this
  199. // scope.
  200. //
  201. // TODO: For compile-time bindings, the common case is that they will both
  202. // have a suspended lexical lookup entry and a suspended compile time binding
  203. // entry. We should be able to store that as a single ScopeItem rather than
  204. // two.
  205. struct ScopeItem {
  206. static constexpr uint32_t IndexForCompileTimeBinding = -1;
  207. // The scope index for a LexicalLookup::SuspendedResult, or
  208. // CompileTimeBindingIndex for a suspended compile time binding.
  209. uint32_t index;
  210. // The instruction within the scope.
  211. SemIR::InstId inst_id;
  212. };
  213. // The suspended scope stack entry.
  214. ScopeStackEntry entry;
  215. // The list of items that were within this scope when it was suspended. The
  216. // inline size is an attempt to keep the size of a `SuspendedFunction`
  217. // reasonable while avoiding heap allocations most of the time.
  218. llvm::SmallVector<ScopeItem, 8> suspended_items;
  219. };
  220. } // namespace Carbon::Check
  221. #endif // CARBON_TOOLCHAIN_CHECK_SCOPE_STACK_H_