context.h 14 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381
  1. // Part of the Carbon Language project, under the Apache License v2.0 with LLVM
  2. // Exceptions. See /LICENSE for license information.
  3. // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
  4. #ifndef CARBON_TOOLCHAIN_CHECK_CONTEXT_H_
  5. #define CARBON_TOOLCHAIN_CHECK_CONTEXT_H_
  6. #include "common/map.h"
  7. #include "llvm/ADT/FoldingSet.h"
  8. #include "llvm/ADT/SmallVector.h"
  9. #include "toolchain/check/decl_introducer_state.h"
  10. #include "toolchain/check/decl_name_stack.h"
  11. #include "toolchain/check/diagnostic_helpers.h"
  12. #include "toolchain/check/full_pattern_stack.h"
  13. #include "toolchain/check/generic_region_stack.h"
  14. #include "toolchain/check/global_init.h"
  15. #include "toolchain/check/inst_block_stack.h"
  16. #include "toolchain/check/node_stack.h"
  17. #include "toolchain/check/param_and_arg_refs_stack.h"
  18. #include "toolchain/check/region_stack.h"
  19. #include "toolchain/check/scope_index.h"
  20. #include "toolchain/check/scope_stack.h"
  21. #include "toolchain/parse/node_ids.h"
  22. #include "toolchain/parse/tree.h"
  23. #include "toolchain/parse/tree_and_subtrees.h"
  24. #include "toolchain/sem_ir/file.h"
  25. #include "toolchain/sem_ir/ids.h"
  26. #include "toolchain/sem_ir/import_ir.h"
  27. #include "toolchain/sem_ir/inst.h"
  28. #include "toolchain/sem_ir/name_scope.h"
  29. #include "toolchain/sem_ir/typed_insts.h"
  30. namespace Carbon::Check {
  31. // Context stored during check.
  32. //
  33. // This file stores state, and member objects may provide an API. Other files
  34. // may also have helpers that operate on Context. To keep this file manageable,
  35. // please put logic into other files.
  36. //
  37. // For example, consider the API for functions:
  38. // - `context.functions()`: Exposes storage of `SemIR::Function` objects.
  39. // - `toolchain/check/function.h`: Contains helper functions which use
  40. // `Check::Context`.
  41. // - `toolchain/sem_ir/function.h`: Contains helper functions which only need
  42. // `SemIR` objects, for which it's helpful not to depend on `Check::Context`
  43. // (for example, shared with lowering).
  44. class Context {
  45. public:
  46. using DiagnosticEmitter = Carbon::DiagnosticEmitter<SemIRLoc>;
  47. using DiagnosticBuilder = DiagnosticEmitter::DiagnosticBuilder;
  48. // A function that forms a diagnostic for some kind of problem. The
  49. // DiagnosticBuilder is returned rather than emitted so that the caller can
  50. // add contextual notes as appropriate.
  51. using BuildDiagnosticFn = llvm::function_ref<auto()->DiagnosticBuilder>;
  52. // Stores references for work.
  53. explicit Context(DiagnosticEmitter* emitter,
  54. Parse::GetTreeAndSubtreesFn tree_and_subtrees_getter,
  55. SemIR::File* sem_ir, int imported_ir_count,
  56. int total_ir_count, llvm::raw_ostream* vlog_stream);
  57. // Marks an implementation TODO. Always returns false.
  58. auto TODO(SemIRLoc loc, std::string label) -> bool;
  59. // Runs verification that the processing cleanly finished.
  60. auto VerifyOnFinish() const -> void;
  61. // Prints information for a stack dump.
  62. auto PrintForStackDump(llvm::raw_ostream& output) const -> void;
  63. // Get the Lex::TokenKind of a node for diagnostics.
  64. auto token_kind(Parse::NodeId node_id) -> Lex::TokenKind {
  65. return tokens().GetKind(parse_tree().node_token(node_id));
  66. }
  67. auto emitter() -> DiagnosticEmitter& { return *emitter_; }
  68. auto parse_tree_and_subtrees() -> const Parse::TreeAndSubtrees& {
  69. return tree_and_subtrees_getter_();
  70. }
  71. auto sem_ir() -> SemIR::File& { return *sem_ir_; }
  72. auto sem_ir() const -> const SemIR::File& { return *sem_ir_; }
  73. // Convenience functions for major phase data.
  74. auto parse_tree() const -> const Parse::Tree& {
  75. return sem_ir_->parse_tree();
  76. }
  77. auto tokens() const -> const Lex::TokenizedBuffer& {
  78. return parse_tree().tokens();
  79. }
  80. auto vlog_stream() -> llvm::raw_ostream* { return vlog_stream_; }
  81. auto node_stack() -> NodeStack& { return node_stack_; }
  82. auto inst_block_stack() -> InstBlockStack& { return inst_block_stack_; }
  83. auto pattern_block_stack() -> InstBlockStack& { return pattern_block_stack_; }
  84. auto param_and_arg_refs_stack() -> ParamAndArgRefsStack& {
  85. return param_and_arg_refs_stack_;
  86. }
  87. auto args_type_info_stack() -> InstBlockStack& {
  88. return args_type_info_stack_;
  89. }
  90. auto struct_type_fields_stack() -> ArrayStack<SemIR::StructTypeField>& {
  91. return struct_type_fields_stack_;
  92. }
  93. auto field_decls_stack() -> ArrayStack<SemIR::InstId>& {
  94. return field_decls_stack_;
  95. }
  96. auto decl_name_stack() -> DeclNameStack& { return decl_name_stack_; }
  97. auto decl_introducer_state_stack() -> DeclIntroducerStateStack& {
  98. return decl_introducer_state_stack_;
  99. }
  100. auto scope_stack() -> ScopeStack& { return scope_stack_; }
  101. // Conveneicne functions for frequently-used `scope_stack` members.
  102. auto return_scope_stack() -> llvm::SmallVector<ScopeStack::ReturnScope>& {
  103. return scope_stack().return_scope_stack();
  104. }
  105. auto break_continue_stack()
  106. -> llvm::SmallVector<ScopeStack::BreakContinueScope>& {
  107. return scope_stack().break_continue_stack();
  108. }
  109. auto full_pattern_stack() -> FullPatternStack& {
  110. return scope_stack_.full_pattern_stack();
  111. }
  112. auto generic_region_stack() -> GenericRegionStack& {
  113. return generic_region_stack_;
  114. }
  115. auto vtable_stack() -> InstBlockStack& { return vtable_stack_; }
  116. auto exports() -> llvm::SmallVector<SemIR::InstId>& { return exports_; }
  117. auto check_ir_map() -> llvm::MutableArrayRef<SemIR::ImportIRId> {
  118. return check_ir_map_;
  119. }
  120. auto import_ir_constant_values()
  121. -> llvm::SmallVector<SemIR::ConstantValueStore, 0>& {
  122. return import_ir_constant_values_;
  123. }
  124. auto definitions_required() -> llvm::SmallVector<SemIR::InstId>& {
  125. return definitions_required_;
  126. }
  127. auto global_init() -> GlobalInit& { return global_init_; }
  128. auto import_ref_ids() -> llvm::SmallVector<SemIR::InstId>& {
  129. return import_ref_ids_;
  130. }
  131. // Pre-computed parts of a binding pattern.
  132. // TODO: Consider putting this behind a narrower API to guard against emitting
  133. // multiple times.
  134. struct BindingPatternInfo {
  135. // The corresponding AnyBindName inst.
  136. SemIR::InstId bind_name_id;
  137. // The region of insts that computes the type of the binding.
  138. SemIR::ExprRegionId type_expr_region_id;
  139. };
  140. auto bind_name_map() -> Map<SemIR::InstId, BindingPatternInfo>& {
  141. return bind_name_map_;
  142. }
  143. auto var_storage_map() -> Map<SemIR::InstId, SemIR::InstId>& {
  144. return var_storage_map_;
  145. }
  146. // During Choice typechecking, each alternative turns into a name binding on
  147. // the Choice type, but this can't be done until the full Choice type is
  148. // known. This represents each binding to be done at the end of checking the
  149. // Choice type.
  150. struct ChoiceDeferredBinding {
  151. Parse::NodeId node_id;
  152. NameComponent name_component;
  153. };
  154. auto choice_deferred_bindings() -> llvm::SmallVector<ChoiceDeferredBinding>& {
  155. return choice_deferred_bindings_;
  156. }
  157. auto region_stack() -> RegionStack& { return region_stack_; }
  158. // An ongoing impl lookup, used to ensure termination.
  159. struct ImplLookupStackEntry {
  160. SemIR::ConstantId type_const_id;
  161. SemIR::ConstantId interface_const_id;
  162. };
  163. auto impl_lookup_stack() -> llvm::SmallVector<ImplLookupStackEntry>& {
  164. return impl_lookup_stack_;
  165. }
  166. // --------------------------------------------------------------------------
  167. // Directly expose SemIR::File data accessors for brevity in calls.
  168. // --------------------------------------------------------------------------
  169. auto identifiers() -> SharedValueStores::IdentifierStore& {
  170. return sem_ir().identifiers();
  171. }
  172. auto ints() -> SharedValueStores::IntStore& { return sem_ir().ints(); }
  173. auto reals() -> SharedValueStores::RealStore& { return sem_ir().reals(); }
  174. auto floats() -> SharedValueStores::FloatStore& { return sem_ir().floats(); }
  175. auto string_literal_values() -> SharedValueStores::StringLiteralStore& {
  176. return sem_ir().string_literal_values();
  177. }
  178. auto entity_names() -> SemIR::EntityNameStore& {
  179. return sem_ir().entity_names();
  180. }
  181. auto functions() -> ValueStore<SemIR::FunctionId>& {
  182. return sem_ir().functions();
  183. }
  184. auto classes() -> ValueStore<SemIR::ClassId>& { return sem_ir().classes(); }
  185. auto interfaces() -> ValueStore<SemIR::InterfaceId>& {
  186. return sem_ir().interfaces();
  187. }
  188. auto associated_constants() -> ValueStore<SemIR::AssociatedConstantId>& {
  189. return sem_ir().associated_constants();
  190. }
  191. auto facet_types() -> CanonicalValueStore<SemIR::FacetTypeId>& {
  192. return sem_ir().facet_types();
  193. }
  194. auto complete_facet_types() -> SemIR::File::CompleteFacetTypeStore& {
  195. return sem_ir().complete_facet_types();
  196. }
  197. auto impls() -> SemIR::ImplStore& { return sem_ir().impls(); }
  198. auto generics() -> SemIR::GenericStore& { return sem_ir().generics(); }
  199. auto specifics() -> SemIR::SpecificStore& { return sem_ir().specifics(); }
  200. auto import_irs() -> ValueStore<SemIR::ImportIRId>& {
  201. return sem_ir().import_irs();
  202. }
  203. auto import_ir_insts() -> ValueStore<SemIR::ImportIRInstId>& {
  204. return sem_ir().import_ir_insts();
  205. }
  206. auto names() -> SemIR::NameStoreWrapper { return sem_ir().names(); }
  207. auto name_scopes() -> SemIR::NameScopeStore& {
  208. return sem_ir().name_scopes();
  209. }
  210. auto struct_type_fields() -> SemIR::StructTypeFieldsStore& {
  211. return sem_ir().struct_type_fields();
  212. }
  213. auto types() -> SemIR::TypeStore& { return sem_ir().types(); }
  214. auto type_blocks() -> SemIR::BlockValueStore<SemIR::TypeBlockId>& {
  215. return sem_ir().type_blocks();
  216. }
  217. // Instructions should be added with `AddInst` or `AddInstInNoBlock` from
  218. // `inst.h`. This is `const` to prevent accidental misuse.
  219. auto insts() -> const SemIR::InstStore& { return sem_ir().insts(); }
  220. auto constant_values() -> SemIR::ConstantValueStore& {
  221. return sem_ir().constant_values();
  222. }
  223. auto inst_blocks() -> SemIR::InstBlockStore& {
  224. return sem_ir().inst_blocks();
  225. }
  226. auto constants() -> SemIR::ConstantStore& { return sem_ir().constants(); }
  227. // --------------------------------------------------------------------------
  228. // End of SemIR::File members.
  229. // --------------------------------------------------------------------------
  230. private:
  231. // Handles diagnostics.
  232. DiagnosticEmitter* emitter_;
  233. // Returns a lazily constructed TreeAndSubtrees.
  234. Parse::GetTreeAndSubtreesFn tree_and_subtrees_getter_;
  235. // The SemIR::File being added to.
  236. SemIR::File* sem_ir_;
  237. // Whether to print verbose output.
  238. llvm::raw_ostream* vlog_stream_;
  239. // The stack during Build. Will contain file-level parse nodes on return.
  240. NodeStack node_stack_;
  241. // The stack of instruction blocks being used for general IR generation.
  242. InstBlockStack inst_block_stack_;
  243. // The stack of instruction blocks that contain pattern instructions.
  244. InstBlockStack pattern_block_stack_;
  245. // The stack of instruction blocks being used for param and arg ref blocks.
  246. ParamAndArgRefsStack param_and_arg_refs_stack_;
  247. // The stack of instruction blocks being used for type information while
  248. // processing arguments. This is used in parallel with
  249. // param_and_arg_refs_stack_. It's currently only used for struct literals,
  250. // where we need to track names for a type separate from the literal
  251. // arguments.
  252. InstBlockStack args_type_info_stack_;
  253. // The stack of StructTypeFields for in-progress StructTypeLiterals.
  254. ArrayStack<SemIR::StructTypeField> struct_type_fields_stack_;
  255. // The stack of FieldDecls for in-progress Class definitions.
  256. ArrayStack<SemIR::InstId> field_decls_stack_;
  257. // The stack used for qualified declaration name construction.
  258. DeclNameStack decl_name_stack_;
  259. // The stack of declarations that could have modifiers.
  260. DeclIntroducerStateStack decl_introducer_state_stack_;
  261. // The stack of scopes we are currently within.
  262. ScopeStack scope_stack_;
  263. // The stack of generic regions we are currently within.
  264. GenericRegionStack generic_region_stack_;
  265. // Contains a vtable block for each `class` scope which is currently being
  266. // defined, regardless of whether the class can have virtual functions.
  267. InstBlockStack vtable_stack_;
  268. // The list which will form NodeBlockId::Exports.
  269. llvm::SmallVector<SemIR::InstId> exports_;
  270. // Maps CheckIRId to ImportIRId.
  271. llvm::SmallVector<SemIR::ImportIRId> check_ir_map_;
  272. // Per-import constant values. These refer to the main IR and mainly serve as
  273. // a lookup table for quick access.
  274. //
  275. // Inline 0 elements because it's expected to require heap allocation.
  276. llvm::SmallVector<SemIR::ConstantValueStore, 0> import_ir_constant_values_;
  277. // Declaration instructions of entities that should have definitions by the
  278. // end of the current source file.
  279. llvm::SmallVector<SemIR::InstId> definitions_required_;
  280. // State for global initialization.
  281. GlobalInit global_init_;
  282. // A list of import refs which can't be inserted into their current context.
  283. // They're typically added during name lookup or import ref resolution, where
  284. // the current block on inst_block_stack_ is unrelated.
  285. //
  286. // These are instead added here because they're referenced by other
  287. // instructions and needs to be visible in textual IR.
  288. // FinalizeImportRefBlock() will produce an inst block for them.
  289. llvm::SmallVector<SemIR::InstId> import_ref_ids_;
  290. // Map from an AnyBindingPattern inst to precomputed parts of the
  291. // pattern-match SemIR for it.
  292. Map<SemIR::InstId, BindingPatternInfo> bind_name_map_;
  293. // Map from VarPattern insts to the corresponding VarStorage insts. The
  294. // VarStorage insts are allocated, emitted, and stored in the map after
  295. // processing the enclosing full-pattern.
  296. Map<SemIR::InstId, SemIR::InstId> var_storage_map_;
  297. // Each alternative in a Choice gets an entry here, they are stored in
  298. // declaration order. The vector is consumed and emptied at the end of the
  299. // Choice definition.
  300. //
  301. // TODO: This may need to be a stack of vectors if it becomes possible to
  302. // define a Choice type inside an alternative's parameter set.
  303. llvm::SmallVector<ChoiceDeferredBinding> choice_deferred_bindings_;
  304. // Stack of single-entry regions being built.
  305. RegionStack region_stack_;
  306. // Tracks all ongoing impl lookups in order to ensure that lookup terminates
  307. // via the acyclic rule and the termination rule.
  308. llvm::SmallVector<ImplLookupStackEntry> impl_lookup_stack_;
  309. };
  310. } // namespace Carbon::Check
  311. #endif // CARBON_TOOLCHAIN_CHECK_CONTEXT_H_