parser.cpp 56 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
37047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126112711281129113011311132113311341135113611371138113911401141114211431144114511461147114811491150115111521153115411551156115711581159116011611162116311641165116611671168116911701171117211731174117511761177117811791180118111821183118411851186118711881189119011911192119311941195119611971198119912001201120212031204120512061207120812091210121112121213121412151216121712181219122012211222122312241225122612271228122912301231123212331234123512361237123812391240124112421243124412451246124712481249125012511252125312541255125612571258125912601261126212631264126512661267126812691270127112721273127412751276127
71278127912801281128212831284128512861287128812891290129112921293129412951296129712981299130013011302130313041305130613071308130913101311131213131314131513161317131813191320132113221323132413251326132713281329133013311332133313341335133613371338133913401341134213431344134513461347134813491350135113521353135413551356135713581359136013611362136313641365136613671368136913701371137213731374137513761377137813791380138113821383138413851386138713881389139013911392139313941395139613971398139914001401140214031404140514061407140814091410141114121413141414151416141714181419142014211422142314241425142614271428142914301431143214331434143514361437143814391440144114421443144414451446144714481449145014511452145314541455145614571458145914601461146214631464146514661467146814691470147114721473147414751476147714781479148014811482148314841485148614871488148914901491149214931494149514961497149814991500150115021503150415051506150715081509151015111512151315141515151615171518151915201521152215231524152515261527152815291530153115321533153415351536153715381539154015411542154315441545154615471548154915501551155215531554155515561557155815591560156115621563156415651566156715681569157015711572157315741575157615771578157915801581158215831584158515861587158815891590159115921593159415951596159715981599160016011602160316041605160616071608160916101611161216131614161516161617161816191620162116221623162416251626162716281629163016311632163316341635163616371638163916401641164216431644164516461647164816491650165116521653165416551656165716581659166016611662166316641665166616671668166916701671167216731674167516761677167816791680168116821683168416851686168716881689169016911692169316941695169616971698169917001701170217031704170517061707170817091710171117121713171417151716171717181719172017211722172317241725172617271728172917301731173217331734173517361737173817391740
  1. // Part of the Carbon Language project, under the Apache License v2.0 with LLVM
  2. // Exceptions. See /LICENSE for license information.
  3. // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
  4. #include "toolchain/parser/parser.h"
  5. #include <cstdlib>
  6. #include <memory>
  7. #include <optional>
  8. #include "common/check.h"
  9. #include "llvm/Support/PrettyStackTrace.h"
  10. #include "toolchain/lexer/token_kind.h"
  11. #include "toolchain/lexer/tokenized_buffer.h"
  12. #include "toolchain/parser/parse_node_kind.h"
  13. #include "toolchain/parser/parse_tree.h"
  14. namespace Carbon {
  15. // May be emitted a couple different ways as part of operator parsing.
  16. CARBON_DIAGNOSTIC(
  17. OperatorRequiresParentheses, Error,
  18. "Parentheses are required to disambiguate operator precedence.");
  19. CARBON_DIAGNOSTIC(ExpectedParenAfter, Error, "Expected `(` after `{0}`.",
  20. TokenKind);
  21. CARBON_DIAGNOSTIC(ExpectedSemiAfterExpression, Error,
  22. "Expected `;` after expression.");
  // Describes where something sits relative to a character in an error
  // message. Used as a formatting argument for diagnostics.
  enum class RelativeLocation : int8_t {
    Around = 0,
    After = 1,
    Before = 2,
  };
  29. // Adapts RelativeLocation for use with formatv.
  30. static auto operator<<(llvm::raw_ostream& out, RelativeLocation loc)
  31. -> llvm::raw_ostream& {
  32. switch (loc) {
  33. case RelativeLocation::Around:
  34. out << "around";
  35. break;
  36. case RelativeLocation::After:
  37. out << "after";
  38. break;
  39. case RelativeLocation::Before:
  40. out << "before";
  41. break;
  42. }
  43. return out;
  44. }
  45. class Parser::PrettyStackTraceParseState : public llvm::PrettyStackTraceEntry {
  46. public:
  47. explicit PrettyStackTraceParseState(const Parser* parser) : parser_(parser) {}
  48. ~PrettyStackTraceParseState() override = default;
  49. auto print(llvm::raw_ostream& output) const -> void override {
  50. output << "Parser stack:\n";
  51. for (int i = 0; i < static_cast<int>(parser_->state_stack_.size()); ++i) {
  52. const auto& entry = parser_->state_stack_[i];
  53. output << "\t" << i << ".\t" << entry.state;
  54. Print(output, entry.token);
  55. }
  56. output << "\tcursor\tposition_";
  57. Print(output, *parser_->position_);
  58. }
  59. private:
  60. auto Print(llvm::raw_ostream& output, TokenizedBuffer::Token token) const
  61. -> void {
  62. auto line = parser_->tokens_->GetLine(token);
  63. output << " @ " << parser_->tokens_->GetLineNumber(line) << ":"
  64. << parser_->tokens_->GetColumnNumber(token) << ":"
  65. << " token " << token << " : "
  66. << parser_->tokens_->GetKind(token).Name() << "\n";
  67. }
  68. const Parser* parser_;
  69. };
  70. Parser::Parser(ParseTree& tree, TokenizedBuffer& tokens,
  71. TokenDiagnosticEmitter& emitter, llvm::raw_ostream* vlog_stream)
  72. : tree_(&tree),
  73. tokens_(&tokens),
  74. emitter_(&emitter),
  75. vlog_stream_(vlog_stream),
  76. position_(tokens_->tokens().begin()),
  77. end_(tokens_->tokens().end()) {
  78. CARBON_CHECK(position_ != end_) << "Empty TokenizedBuffer";
  79. --end_;
  80. CARBON_CHECK(tokens_->GetKind(*end_) == TokenKind::EndOfFile())
  81. << "TokenizedBuffer should end with EndOfFile, ended with "
  82. << tokens_->GetKind(*end_).Name();
  83. }
  84. auto Parser::AddLeafNode(ParseNodeKind kind, TokenizedBuffer::Token token,
  85. bool has_error) -> void {
  86. tree_->node_impls_.push_back(
  87. ParseTree::NodeImpl(kind, has_error, token, /*subtree_size=*/1));
  88. if (has_error) {
  89. tree_->has_errors_ = true;
  90. }
  91. }
  92. auto Parser::AddNode(ParseNodeKind kind, TokenizedBuffer::Token token,
  93. int subtree_start, bool has_error) -> void {
  94. int subtree_size = tree_->size() - subtree_start + 1;
  95. tree_->node_impls_.push_back(
  96. ParseTree::NodeImpl(kind, has_error, token, subtree_size));
  97. if (has_error) {
  98. tree_->has_errors_ = true;
  99. }
  100. }
  101. auto Parser::ConsumeAndAddOpenParen(TokenizedBuffer::Token default_token,
  102. ParseNodeKind start_kind) -> void {
  103. if (auto open_paren = ConsumeIf(TokenKind::OpenParen())) {
  104. AddLeafNode(start_kind, *open_paren, /*has_error=*/false);
  105. } else {
  106. emitter_->Emit(*position_, ExpectedParenAfter,
  107. tokens_->GetKind(default_token));
  108. AddLeafNode(start_kind, default_token, /*has_error=*/true);
  109. }
  110. }
  111. auto Parser::ConsumeAndAddCloseParen(StateStackEntry state,
  112. ParseNodeKind close_kind) -> void {
  113. // state.token should point at the introducer, with the paren one after the
  114. // introducer.
  115. auto expected_paren = *(TokenizedBuffer::TokenIterator(state.token) + 1);
  116. if (tokens_->GetKind(expected_paren) != TokenKind::OpenParen()) {
  117. AddNode(close_kind, state.token, state.subtree_start, /*has_error=*/true);
  118. } else if (auto close_token = ConsumeIf(TokenKind::CloseParen())) {
  119. AddNode(close_kind, *close_token, state.subtree_start, state.has_error);
  120. } else {
  121. // TODO: Include the location of the matching open_paren in the diagnostic.
  122. CARBON_DIAGNOSTIC(ExpectedCloseParen, Error,
  123. "Unexpected tokens before `)`.");
  124. emitter_->Emit(*position_, ExpectedCloseParen);
  125. SkipTo(tokens_->GetMatchedClosingToken(expected_paren));
  126. AddNode(close_kind, Consume(), state.subtree_start, /*has_error=*/true);
  127. }
  128. }
  129. auto Parser::ConsumeAndAddLeafNodeIf(TokenKind token_kind,
  130. ParseNodeKind node_kind) -> bool {
  131. auto token = ConsumeIf(token_kind);
  132. if (!token) {
  133. return false;
  134. }
  135. AddLeafNode(node_kind, *token);
  136. return true;
  137. }
  138. auto Parser::ConsumeChecked(TokenKind kind) -> TokenizedBuffer::Token {
  139. CARBON_CHECK(PositionIs(kind))
  140. << "Required " << kind.Name() << ", found " << PositionKind().Name();
  141. return Consume();
  142. }
  143. auto Parser::ConsumeIf(TokenKind kind)
  144. -> std::optional<TokenizedBuffer::Token> {
  145. if (!PositionIs(kind)) {
  146. return std::nullopt;
  147. }
  148. return Consume();
  149. }
  150. auto Parser::FindNextOf(std::initializer_list<TokenKind> desired_kinds)
  151. -> std::optional<TokenizedBuffer::Token> {
  152. auto new_position = position_;
  153. while (true) {
  154. TokenizedBuffer::Token token = *new_position;
  155. TokenKind kind = tokens_->GetKind(token);
  156. if (kind.IsOneOf(desired_kinds)) {
  157. return token;
  158. }
  159. // Step to the next token at the current bracketing level.
  160. if (kind.IsClosingSymbol() || kind == TokenKind::EndOfFile()) {
  161. // There are no more tokens at this level.
  162. return std::nullopt;
  163. } else if (kind.IsOpeningSymbol()) {
  164. new_position = TokenizedBuffer::TokenIterator(
  165. tokens_->GetMatchedClosingToken(token));
  166. // Advance past the closing token.
  167. ++new_position;
  168. } else {
  169. ++new_position;
  170. }
  171. }
  172. }
  173. auto Parser::SkipMatchingGroup() -> bool {
  174. if (!PositionKind().IsOpeningSymbol()) {
  175. return false;
  176. }
  177. SkipTo(tokens_->GetMatchedClosingToken(*position_));
  178. ++position_;
  179. return true;
  180. }
  181. auto Parser::SkipPastLikelyEnd(TokenizedBuffer::Token skip_root)
  182. -> std::optional<TokenizedBuffer::Token> {
  183. if (position_ == end_) {
  184. return std::nullopt;
  185. }
  186. TokenizedBuffer::Line root_line = tokens_->GetLine(skip_root);
  187. int root_line_indent = tokens_->GetIndentColumnNumber(root_line);
  188. // We will keep scanning through tokens on the same line as the root or
  189. // lines with greater indentation than root's line.
  190. auto is_same_line_or_indent_greater_than_root =
  191. [&](TokenizedBuffer::Token t) {
  192. TokenizedBuffer::Line l = tokens_->GetLine(t);
  193. if (l == root_line) {
  194. return true;
  195. }
  196. return tokens_->GetIndentColumnNumber(l) > root_line_indent;
  197. };
  198. do {
  199. if (PositionIs(TokenKind::CloseCurlyBrace())) {
  200. // Immediately bail out if we hit an unmatched close curly, this will
  201. // pop us up a level of the syntax grouping.
  202. return std::nullopt;
  203. }
  204. // We assume that a semicolon is always intended to be the end of the
  205. // current construct.
  206. if (auto semi = ConsumeIf(TokenKind::Semi())) {
  207. return semi;
  208. }
  209. // Skip over any matching group of tokens_->
  210. if (SkipMatchingGroup()) {
  211. continue;
  212. }
  213. // Otherwise just step forward one token.
  214. ++position_;
  215. } while (position_ != end_ &&
  216. is_same_line_or_indent_greater_than_root(*position_));
  217. return std::nullopt;
  218. }
  219. auto Parser::SkipTo(TokenizedBuffer::Token t) -> void {
  220. CARBON_CHECK(t >= *position_) << "Tried to skip backwards from " << position_
  221. << " to " << TokenizedBuffer::TokenIterator(t);
  222. position_ = TokenizedBuffer::TokenIterator(t);
  223. CARBON_CHECK(position_ != end_) << "Skipped past EOF.";
  224. }
  225. auto Parser::HandleCodeBlockState() -> void {
  226. PopAndDiscardState();
  227. PushState(ParserState::CodeBlockFinish());
  228. if (ConsumeAndAddLeafNodeIf(TokenKind::OpenCurlyBrace(),
  229. ParseNodeKind::CodeBlockStart())) {
  230. PushState(ParserState::StatementScopeLoop());
  231. } else {
  232. AddLeafNode(ParseNodeKind::CodeBlockStart(), *position_,
  233. /*has_error=*/true);
  234. // Recover by parsing a single statement.
  235. CARBON_DIAGNOSTIC(ExpectedCodeBlock, Error, "Expected braced code block.");
  236. emitter_->Emit(*position_, ExpectedCodeBlock);
  237. PushState(ParserState::Statement());
  238. }
  239. }
  240. // Determines whether the given token is considered to be the start of an
  241. // operand according to the rules for infix operator parsing.
  242. static auto IsAssumedStartOfOperand(TokenKind kind) -> bool {
  243. return kind.IsOneOf({TokenKind::OpenParen(), TokenKind::Identifier(),
  244. TokenKind::IntegerLiteral(), TokenKind::RealLiteral(),
  245. TokenKind::StringLiteral()});
  246. }
  247. // Determines whether the given token is considered to be the end of an
  248. // operand according to the rules for infix operator parsing.
  249. static auto IsAssumedEndOfOperand(TokenKind kind) -> bool {
  250. return kind.IsOneOf({TokenKind::CloseParen(), TokenKind::CloseCurlyBrace(),
  251. TokenKind::CloseSquareBracket(), TokenKind::Identifier(),
  252. TokenKind::IntegerLiteral(), TokenKind::RealLiteral(),
  253. TokenKind::StringLiteral()});
  254. }
  255. // Determines whether the given token could possibly be the start of an
  256. // operand. This is conservatively correct, and will never incorrectly return
  257. // `false`, but can incorrectly return `true`.
  258. static auto IsPossibleStartOfOperand(TokenKind kind) -> bool {
  259. return !kind.IsOneOf({TokenKind::CloseParen(), TokenKind::CloseCurlyBrace(),
  260. TokenKind::CloseSquareBracket(), TokenKind::Comma(),
  261. TokenKind::Semi(), TokenKind::Colon()});
  262. }
  263. auto Parser::IsLexicallyValidInfixOperator() -> bool {
  264. CARBON_CHECK(position_ != end_) << "Expected an operator token.";
  265. bool leading_space = tokens_->HasLeadingWhitespace(*position_);
  266. bool trailing_space = tokens_->HasTrailingWhitespace(*position_);
  267. // If there's whitespace on both sides, it's an infix operator.
  268. if (leading_space && trailing_space) {
  269. return true;
  270. }
  271. // If there's whitespace on exactly one side, it's not an infix operator.
  272. if (leading_space || trailing_space) {
  273. return false;
  274. }
  275. // Otherwise, for an infix operator, the preceding token must be any close
  276. // bracket, identifier, or literal and the next token must be an open paren,
  277. // identifier, or literal.
  278. if (position_ == tokens_->tokens().begin() ||
  279. !IsAssumedEndOfOperand(tokens_->GetKind(*(position_ - 1))) ||
  280. !IsAssumedStartOfOperand(tokens_->GetKind(*(position_ + 1)))) {
  281. return false;
  282. }
  283. return true;
  284. }
  285. auto Parser::IsTrailingOperatorInfix() -> bool {
  286. if (position_ == end_) {
  287. return false;
  288. }
  289. // An operator that follows the infix operator rules is parsed as
  290. // infix, unless the next token means that it can't possibly be.
  291. if (IsLexicallyValidInfixOperator() &&
  292. IsPossibleStartOfOperand(tokens_->GetKind(*(position_ + 1)))) {
  293. return true;
  294. }
  295. // A trailing operator with leading whitespace that's not valid as infix is
  296. // not valid at all. If the next token looks like the start of an operand,
  297. // then parse as infix, otherwise as postfix. Either way we'll produce a
  298. // diagnostic later on.
  299. if (tokens_->HasLeadingWhitespace(*position_) &&
  300. IsAssumedStartOfOperand(tokens_->GetKind(*(position_ + 1)))) {
  301. return true;
  302. }
  303. return false;
  304. }
  305. auto Parser::DiagnoseOperatorFixity(OperatorFixity fixity) -> void {
  306. if (fixity == OperatorFixity::Infix) {
  307. // Infix operators must satisfy the infix operator rules.
  308. if (!IsLexicallyValidInfixOperator()) {
  309. CARBON_DIAGNOSTIC(BinaryOperatorRequiresWhitespace, Error,
  310. "Whitespace missing {0} binary operator.",
  311. RelativeLocation);
  312. emitter_->Emit(*position_, BinaryOperatorRequiresWhitespace,
  313. tokens_->HasLeadingWhitespace(*position_)
  314. ? RelativeLocation::After
  315. : (tokens_->HasTrailingWhitespace(*position_)
  316. ? RelativeLocation::Before
  317. : RelativeLocation::Around));
  318. }
  319. } else {
  320. bool prefix = fixity == OperatorFixity::Prefix;
  321. // Whitespace is not permitted between a symbolic pre/postfix operator and
  322. // its operand.
  323. if (PositionKind().IsSymbol() &&
  324. (prefix ? tokens_->HasTrailingWhitespace(*position_)
  325. : tokens_->HasLeadingWhitespace(*position_))) {
  326. CARBON_DIAGNOSTIC(UnaryOperatorHasWhitespace, Error,
  327. "Whitespace is not allowed {0} this unary operator.",
  328. RelativeLocation);
  329. emitter_->Emit(
  330. *position_, UnaryOperatorHasWhitespace,
  331. prefix ? RelativeLocation::After : RelativeLocation::Before);
  332. }
  333. // Pre/postfix operators must not satisfy the infix operator rules.
  334. if (IsLexicallyValidInfixOperator()) {
  335. CARBON_DIAGNOSTIC(UnaryOperatorRequiresWhitespace, Error,
  336. "Whitespace is required {0} this unary operator.",
  337. RelativeLocation);
  338. emitter_->Emit(
  339. *position_, UnaryOperatorRequiresWhitespace,
  340. prefix ? RelativeLocation::Before : RelativeLocation::After);
  341. }
  342. }
  343. }
  344. auto Parser::ConsumeListToken(ParseNodeKind comma_kind, TokenKind close_kind,
  345. bool already_has_error) -> ListTokenKind {
  346. if (!PositionIs(TokenKind::Comma()) && !PositionIs(close_kind)) {
  347. // Don't error a second time on the same element.
  348. if (!already_has_error) {
  349. CARBON_DIAGNOSTIC(UnexpectedTokenAfterListElement, Error,
  350. "Expected `,` or `{0}`.", TokenKind);
  351. emitter_->Emit(*position_, UnexpectedTokenAfterListElement, close_kind);
  352. ReturnErrorOnState();
  353. }
  354. // Recover from the invalid token.
  355. auto end_of_element = FindNextOf({TokenKind::Comma(), close_kind});
  356. // The lexer guarantees that parentheses are balanced.
  357. CARBON_CHECK(end_of_element)
  358. << "missing matching `" << close_kind.GetOpeningSymbol() << "` for `"
  359. << close_kind << "`";
  360. SkipTo(*end_of_element);
  361. }
  362. if (PositionIs(close_kind)) {
  363. return ListTokenKind::Close;
  364. } else {
  365. AddLeafNode(comma_kind, Consume());
  366. return PositionIs(close_kind) ? ListTokenKind::CommaClose
  367. : ListTokenKind::Comma;
  368. }
  369. }
  370. auto Parser::Parse() -> void {
  371. // Traces state_stack_. This runs even in opt because it's low overhead.
  372. PrettyStackTraceParseState pretty_stack(this);
  373. CARBON_VLOG() << "*** Parser::Parse Begin ***\n";
  374. PushState(ParserState::DeclarationLoop());
  375. while (!state_stack_.empty()) {
  376. switch (state_stack_.back().state) {
  377. #define CARBON_PARSER_STATE(Name) \
  378. case ParserState::Name(): \
  379. Handle##Name##State(); \
  380. break;
  381. #include "toolchain/parser/parser_state.def"
  382. }
  383. }
  384. AddLeafNode(ParseNodeKind::FileEnd(), *position_);
  385. CARBON_VLOG() << "*** Parser::Parse End ***\n";
  386. }
  387. auto Parser::HandleBraceExpressionState() -> void {
  388. auto state = PopState();
  389. state.state = ParserState::BraceExpressionFinishAsUnknown();
  390. PushState(state);
  391. CARBON_CHECK(ConsumeAndAddLeafNodeIf(
  392. TokenKind::OpenCurlyBrace(),
  393. ParseNodeKind::StructLiteralOrStructTypeLiteralStart()));
  394. if (!PositionIs(TokenKind::CloseCurlyBrace())) {
  395. PushState(ParserState::BraceExpressionParameterAsUnknown());
  396. }
  397. }
  398. auto Parser::BraceExpressionKindToParserState(BraceExpressionKind kind,
  399. ParserState type,
  400. ParserState value,
  401. ParserState unknown)
  402. -> ParserState {
  403. switch (kind) {
  404. case BraceExpressionKind::Type: {
  405. return type;
  406. }
  407. case BraceExpressionKind::Value: {
  408. return value;
  409. }
  410. case BraceExpressionKind::Unknown: {
  411. return unknown;
  412. }
  413. }
  414. }
  415. auto Parser::HandleBraceExpressionParameterError(StateStackEntry state,
  416. BraceExpressionKind kind)
  417. -> void {
  418. CARBON_DIAGNOSTIC(ExpectedStructLiteralField, Error, "Expected {0}{1}{2}.",
  419. llvm::StringRef, llvm::StringRef, llvm::StringRef);
  420. bool can_be_type = kind != BraceExpressionKind::Value;
  421. bool can_be_value = kind != BraceExpressionKind::Type;
  422. emitter_->Emit(*position_, ExpectedStructLiteralField,
  423. can_be_type ? "`.field: type`" : "",
  424. (can_be_type && can_be_value) ? " or " : "",
  425. can_be_value ? "`.field = value`" : "");
  426. state.state = BraceExpressionKindToParserState(
  427. kind, ParserState::BraceExpressionParameterFinishAsType(),
  428. ParserState::BraceExpressionParameterFinishAsValue(),
  429. ParserState::BraceExpressionParameterFinishAsUnknown());
  430. state.has_error = true;
  431. PushState(state);
  432. }
  433. auto Parser::HandleBraceExpressionParameter(BraceExpressionKind kind) -> void {
  434. auto state = PopState();
  435. if (!PositionIs(TokenKind::Period())) {
  436. HandleBraceExpressionParameterError(state, kind);
  437. return;
  438. }
  439. state.state = BraceExpressionKindToParserState(
  440. kind, ParserState::BraceExpressionParameterAfterDesignatorAsType(),
  441. ParserState::BraceExpressionParameterAfterDesignatorAsValue(),
  442. ParserState::BraceExpressionParameterAfterDesignatorAsUnknown());
  443. PushState(state);
  444. PushState(ParserState::DesignatorAsStruct());
  445. }
  446. auto Parser::HandleBraceExpressionParameterAsTypeState() -> void {
  447. HandleBraceExpressionParameter(BraceExpressionKind::Type);
  448. }
  449. auto Parser::HandleBraceExpressionParameterAsValueState() -> void {
  450. HandleBraceExpressionParameter(BraceExpressionKind::Value);
  451. }
  452. auto Parser::HandleBraceExpressionParameterAsUnknownState() -> void {
  453. HandleBraceExpressionParameter(BraceExpressionKind::Unknown);
  454. }
  455. auto Parser::HandleBraceExpressionParameterAfterDesignator(
  456. BraceExpressionKind kind) -> void {
  457. auto state = PopState();
  458. if (state.has_error) {
  459. auto recovery_pos = FindNextOf(
  460. {TokenKind::Equal(), TokenKind::Colon(), TokenKind::Comma()});
  461. if (!recovery_pos ||
  462. tokens_->GetKind(*recovery_pos) == TokenKind::Comma()) {
  463. state.state = BraceExpressionKindToParserState(
  464. kind, ParserState::BraceExpressionParameterFinishAsType(),
  465. ParserState::BraceExpressionParameterFinishAsValue(),
  466. ParserState::BraceExpressionParameterFinishAsUnknown());
  467. PushState(state);
  468. return;
  469. }
  470. SkipTo(*recovery_pos);
  471. }
  472. // Work out the kind of this element.
  473. auto elem_kind = BraceExpressionKind::Unknown;
  474. if (PositionIs(TokenKind::Colon())) {
  475. elem_kind = BraceExpressionKind::Type;
  476. } else if (PositionIs(TokenKind::Equal())) {
  477. elem_kind = BraceExpressionKind::Value;
  478. }
  479. // Unknown kinds and changes between type and value are errors.
  480. if (elem_kind == BraceExpressionKind::Unknown ||
  481. (kind != BraceExpressionKind::Unknown && elem_kind != kind)) {
  482. HandleBraceExpressionParameterError(state, kind);
  483. return;
  484. }
  485. // If we're setting the kind, update the BraceExpressionFinish state.
  486. if (kind == BraceExpressionKind::Unknown) {
  487. kind = elem_kind;
  488. auto finish_state = PopState();
  489. CARBON_CHECK(finish_state.state ==
  490. ParserState::BraceExpressionFinishAsUnknown());
  491. finish_state.state = BraceExpressionKindToParserState(
  492. kind, ParserState::BraceExpressionFinishAsType(),
  493. ParserState::BraceExpressionFinishAsValue(),
  494. ParserState::BraceExpressionFinishAsUnknown());
  495. PushState(finish_state);
  496. }
  497. state.state = BraceExpressionKindToParserState(
  498. kind, ParserState::BraceExpressionParameterFinishAsType(),
  499. ParserState::BraceExpressionParameterFinishAsValue(),
  500. ParserState::BraceExpressionParameterFinishAsUnknown());
  501. state.token = Consume();
  502. // Struct type fields and value fields use the same grammar except
  503. // that one has a `:` separator and the other has an `=` separator.
  504. PushState(state);
  505. PushState(ParserState::Expression());
  506. }
  507. auto Parser::HandleBraceExpressionParameterAfterDesignatorAsTypeState()
  508. -> void {
  509. HandleBraceExpressionParameterAfterDesignator(BraceExpressionKind::Type);
  510. }
  511. auto Parser::HandleBraceExpressionParameterAfterDesignatorAsValueState()
  512. -> void {
  513. HandleBraceExpressionParameterAfterDesignator(BraceExpressionKind::Value);
  514. }
  515. auto Parser::HandleBraceExpressionParameterAfterDesignatorAsUnknownState()
  516. -> void {
  517. HandleBraceExpressionParameterAfterDesignator(BraceExpressionKind::Unknown);
  518. }
  519. auto Parser::HandleBraceExpressionParameterFinish(BraceExpressionKind kind)
  520. -> void {
  521. auto state = PopState();
  522. if (state.has_error) {
  523. AddLeafNode(ParseNodeKind::StructFieldUnknown(), state.token,
  524. /*has_error=*/true);
  525. } else {
  526. AddNode(kind == BraceExpressionKind::Type
  527. ? ParseNodeKind::StructFieldType()
  528. : ParseNodeKind::StructFieldValue(),
  529. state.token, state.subtree_start, /*has_error=*/false);
  530. }
  531. if (ConsumeListToken(ParseNodeKind::StructComma(),
  532. TokenKind::CloseCurlyBrace(),
  533. state.has_error) == ListTokenKind::Comma) {
  534. PushState(BraceExpressionKindToParserState(
  535. kind, ParserState::BraceExpressionParameterAsType(),
  536. ParserState::BraceExpressionParameterAsValue(),
  537. ParserState::BraceExpressionParameterAsUnknown()));
  538. }
  539. }
  540. auto Parser::HandleBraceExpressionParameterFinishAsTypeState() -> void {
  541. HandleBraceExpressionParameterFinish(BraceExpressionKind::Type);
  542. }
  543. auto Parser::HandleBraceExpressionParameterFinishAsValueState() -> void {
  544. HandleBraceExpressionParameterFinish(BraceExpressionKind::Value);
  545. }
  546. auto Parser::HandleBraceExpressionParameterFinishAsUnknownState() -> void {
  547. HandleBraceExpressionParameterFinish(BraceExpressionKind::Unknown);
  548. }
  549. auto Parser::HandleBraceExpressionFinish(BraceExpressionKind kind) -> void {
  550. auto state = PopState();
  551. AddNode(kind == BraceExpressionKind::Type ? ParseNodeKind::StructTypeLiteral()
  552. : ParseNodeKind::StructLiteral(),
  553. Consume(), state.subtree_start, state.has_error);
  554. }
  555. auto Parser::HandleBraceExpressionFinishAsTypeState() -> void {
  556. HandleBraceExpressionFinish(BraceExpressionKind::Type);
  557. }
  558. auto Parser::HandleBraceExpressionFinishAsValueState() -> void {
  559. HandleBraceExpressionFinish(BraceExpressionKind::Value);
  560. }
  561. auto Parser::HandleBraceExpressionFinishAsUnknownState() -> void {
  562. HandleBraceExpressionFinish(BraceExpressionKind::Unknown);
  563. }
  564. auto Parser::HandleCallExpressionState() -> void {
  565. auto state = PopState();
  566. state.state = ParserState::CallExpressionFinish();
  567. PushState(state);
  568. AddNode(ParseNodeKind::CallExpressionStart(), Consume(), state.subtree_start,
  569. state.has_error);
  570. if (!PositionIs(TokenKind::CloseParen())) {
  571. PushState(ParserState::CallExpressionParameterFinish());
  572. PushState(ParserState::Expression());
  573. }
  574. }
  575. auto Parser::HandleCallExpressionParameterFinishState() -> void {
  576. auto state = PopState();
  577. if (state.has_error) {
  578. ReturnErrorOnState();
  579. }
  580. if (ConsumeListToken(ParseNodeKind::CallExpressionComma(),
  581. TokenKind::CloseParen(),
  582. state.has_error) == ListTokenKind::Comma) {
  583. PushState(ParserState::CallExpressionParameterFinish());
  584. PushState(ParserState::Expression());
  585. }
  586. }
  587. auto Parser::HandleCallExpressionFinishState() -> void {
  588. auto state = PopState();
  589. AddNode(ParseNodeKind::CallExpression(), Consume(), state.subtree_start,
  590. state.has_error);
  591. }
  592. auto Parser::HandleCodeBlockFinishState() -> void {
  593. auto state = PopState();
  594. // If the block started with an open curly, this is a close curly.
  595. if (tokens_->GetKind(state.token) == TokenKind::OpenCurlyBrace()) {
  596. AddNode(ParseNodeKind::CodeBlock(), Consume(), state.subtree_start,
  597. state.has_error);
  598. } else {
  599. AddNode(ParseNodeKind::CodeBlock(), state.token, state.subtree_start,
  600. /*has_error=*/true);
  601. }
  602. }
  603. auto Parser::HandleDeclarationLoopState() -> void {
  604. // This maintains the current state unless we're at the end of the file.
  605. switch (PositionKind()) {
  606. case TokenKind::EndOfFile(): {
  607. PopAndDiscardState();
  608. break;
  609. }
  610. case TokenKind::Fn(): {
  611. PushState(ParserState::FunctionIntroducer());
  612. AddLeafNode(ParseNodeKind::FunctionIntroducer(), Consume());
  613. break;
  614. }
  615. case TokenKind::Package(): {
  616. PushState(ParserState::Package());
  617. break;
  618. }
  619. case TokenKind::Semi(): {
  620. AddLeafNode(ParseNodeKind::EmptyDeclaration(), Consume());
  621. break;
  622. }
  623. case TokenKind::Var(): {
  624. PushState(ParserState::VarAsSemicolon());
  625. break;
  626. }
  627. case TokenKind::Interface(): {
  628. PushState(ParserState::InterfaceIntroducer());
  629. ++position_;
  630. break;
  631. }
  632. default: {
  633. CARBON_DIAGNOSTIC(UnrecognizedDeclaration, Error,
  634. "Unrecognized declaration introducer.");
  635. emitter_->Emit(*position_, UnrecognizedDeclaration);
  636. auto cursor = *position_;
  637. auto semi = SkipPastLikelyEnd(cursor);
  638. // Locate the EmptyDeclaration at the semi when found, but use the
  639. // original cursor location for an error when not.
  640. AddLeafNode(ParseNodeKind::EmptyDeclaration(), semi ? *semi : cursor,
  641. /*has_error=*/true);
  642. break;
  643. }
  644. }
  645. }
  646. auto Parser::HandleDesignator(bool as_struct) -> void {
  647. auto state = PopState();
  648. // `.` identifier
  649. auto dot = ConsumeChecked(TokenKind::Period());
  650. if (!ConsumeAndAddLeafNodeIf(TokenKind::Identifier(),
  651. ParseNodeKind::DesignatedName())) {
  652. CARBON_DIAGNOSTIC(ExpectedIdentifierAfterDot, Error,
  653. "Expected identifier after `.`.");
  654. emitter_->Emit(*position_, ExpectedIdentifierAfterDot);
  655. // If we see a keyword, assume it was intended to be the designated name.
  656. // TODO: Should keywords be valid in designators?
  657. if (PositionKind().IsKeyword()) {
  658. AddLeafNode(ParseNodeKind::DesignatedName(), Consume(),
  659. /*has_error=*/true);
  660. } else {
  661. AddLeafNode(ParseNodeKind::DesignatedName(), *position_,
  662. /*has_error=*/true);
  663. // Indicate the error to the parent state so that it can avoid producing
  664. // more errors.
  665. ReturnErrorOnState();
  666. }
  667. }
  668. AddNode(as_struct ? ParseNodeKind::StructFieldDesignator()
  669. : ParseNodeKind::DesignatorExpression(),
  670. dot, state.subtree_start, state.has_error);
  671. }
  672. auto Parser::HandleDesignatorAsExpressionState() -> void {
  673. HandleDesignator(/*as_struct=*/false);
  674. }
  675. auto Parser::HandleDesignatorAsStructState() -> void {
  676. HandleDesignator(/*as_struct=*/true);
  677. }
  678. auto Parser::HandleExpressionState() -> void {
  679. auto state = PopState();
  680. // Check for a prefix operator.
  681. if (auto operator_precedence = PrecedenceGroup::ForLeading(PositionKind())) {
  682. if (PrecedenceGroup::GetPriority(state.ambient_precedence,
  683. *operator_precedence) !=
  684. OperatorPriority::RightFirst) {
  685. // The precedence rules don't permit this prefix operator in this
  686. // context. Diagnose this, but carry on and parse it anyway.
  687. emitter_->Emit(*position_, OperatorRequiresParentheses);
  688. } else {
  689. // Check that this operator follows the proper whitespace rules.
  690. DiagnoseOperatorFixity(OperatorFixity::Prefix);
  691. }
  692. PushStateForExpressionLoop(ParserState::ExpressionLoopForPrefix(),
  693. state.ambient_precedence, *operator_precedence);
  694. ++position_;
  695. PushStateForExpression(*operator_precedence);
  696. } else {
  697. PushStateForExpressionLoop(ParserState::ExpressionLoop(),
  698. state.ambient_precedence,
  699. PrecedenceGroup::ForPostfixExpression());
  700. PushState(ParserState::ExpressionInPostfix());
  701. }
  702. }
  703. auto Parser::HandleExpressionInPostfixState() -> void {
  704. auto state = PopState();
  705. // Continue to the loop state.
  706. state.state = ParserState::ExpressionInPostfixLoop();
  707. // Parses a primary expression, which is either a terminal portion of an
  708. // expression tree, such as an identifier or literal, or a parenthesized
  709. // expression.
  710. switch (PositionKind()) {
  711. case TokenKind::Identifier(): {
  712. AddLeafNode(ParseNodeKind::NameReference(), Consume());
  713. PushState(state);
  714. break;
  715. }
  716. case TokenKind::IntegerLiteral():
  717. case TokenKind::RealLiteral():
  718. case TokenKind::StringLiteral():
  719. case TokenKind::IntegerTypeLiteral():
  720. case TokenKind::UnsignedIntegerTypeLiteral():
  721. case TokenKind::FloatingPointTypeLiteral(): {
  722. AddLeafNode(ParseNodeKind::Literal(), Consume());
  723. PushState(state);
  724. break;
  725. }
  726. case TokenKind::OpenCurlyBrace(): {
  727. PushState(state);
  728. PushState(ParserState::BraceExpression());
  729. break;
  730. }
  731. case TokenKind::OpenParen(): {
  732. PushState(state);
  733. PushState(ParserState::ParenExpression());
  734. break;
  735. }
  736. default: {
  737. CARBON_DIAGNOSTIC(ExpectedExpression, Error, "Expected expression.");
  738. emitter_->Emit(*position_, ExpectedExpression);
  739. ReturnErrorOnState();
  740. break;
  741. }
  742. }
  743. }
  744. auto Parser::HandleExpressionInPostfixLoopState() -> void {
  745. // This is a cyclic state that repeats, so this state is typically pushed back
  746. // on.
  747. auto state = PopState();
  748. state.token = *position_;
  749. switch (PositionKind()) {
  750. case TokenKind::Period(): {
  751. PushState(state);
  752. state.state = ParserState::DesignatorAsExpression();
  753. PushState(state);
  754. break;
  755. }
  756. case TokenKind::OpenParen(): {
  757. PushState(state);
  758. state.state = ParserState::CallExpression();
  759. PushState(state);
  760. break;
  761. }
  762. default: {
  763. if (state.has_error) {
  764. ReturnErrorOnState();
  765. }
  766. break;
  767. }
  768. }
  769. }
  770. auto Parser::HandleExpressionLoopState() -> void {
  771. auto state = PopState();
  772. auto trailing_operator =
  773. PrecedenceGroup::ForTrailing(PositionKind(), IsTrailingOperatorInfix());
  774. if (!trailing_operator) {
  775. if (state.has_error) {
  776. ReturnErrorOnState();
  777. }
  778. return;
  779. }
  780. auto [operator_precedence, is_binary] = *trailing_operator;
  781. // TODO: If this operator is ambiguous with either the ambient precedence
  782. // or the LHS precedence, and there's a variant with a different fixity
  783. // that would work, use that one instead for error recovery.
  784. if (PrecedenceGroup::GetPriority(state.ambient_precedence,
  785. operator_precedence) !=
  786. OperatorPriority::RightFirst) {
  787. // The precedence rules don't permit this operator in this context. Try
  788. // again in the enclosing expression context.
  789. if (state.has_error) {
  790. ReturnErrorOnState();
  791. }
  792. return;
  793. }
  794. if (PrecedenceGroup::GetPriority(state.lhs_precedence, operator_precedence) !=
  795. OperatorPriority::LeftFirst) {
  796. // Either the LHS operator and this operator are ambiguous, or the
  797. // LHS operator is a unary operator that can't be nested within
  798. // this operator. Either way, parentheses are required.
  799. emitter_->Emit(*position_, OperatorRequiresParentheses);
  800. state.has_error = true;
  801. } else {
  802. DiagnoseOperatorFixity(is_binary ? OperatorFixity::Infix
  803. : OperatorFixity::Postfix);
  804. }
  805. state.token = Consume();
  806. state.lhs_precedence = operator_precedence;
  807. if (is_binary) {
  808. state.state = ParserState::ExpressionLoopForBinary();
  809. PushState(state);
  810. PushStateForExpression(operator_precedence);
  811. } else {
  812. AddNode(ParseNodeKind::PostfixOperator(), state.token, state.subtree_start,
  813. state.has_error);
  814. state.has_error = false;
  815. PushState(state);
  816. }
  817. }
  818. auto Parser::HandleExpressionLoopForBinaryState() -> void {
  819. auto state = PopState();
  820. AddNode(ParseNodeKind::InfixOperator(), state.token, state.subtree_start,
  821. state.has_error);
  822. state.state = ParserState::ExpressionLoop();
  823. state.has_error = false;
  824. PushState(state);
  825. }
  826. auto Parser::HandleExpressionLoopForPrefixState() -> void {
  827. auto state = PopState();
  828. AddNode(ParseNodeKind::PrefixOperator(), state.token, state.subtree_start,
  829. state.has_error);
  830. state.state = ParserState::ExpressionLoop();
  831. state.has_error = false;
  832. PushState(state);
  833. }
  834. auto Parser::HandleExpressionStatementFinishState() -> void {
  835. auto state = PopState();
  836. if (auto semi = ConsumeIf(TokenKind::Semi())) {
  837. AddNode(ParseNodeKind::ExpressionStatement(), *semi, state.subtree_start,
  838. state.has_error);
  839. return;
  840. }
  841. if (!state.has_error) {
  842. emitter_->Emit(*position_, ExpectedSemiAfterExpression);
  843. }
  844. if (auto semi_token = SkipPastLikelyEnd(state.token)) {
  845. AddNode(ParseNodeKind::ExpressionStatement(), *semi_token,
  846. state.subtree_start,
  847. /*has_error=*/true);
  848. return;
  849. }
  850. // Found junk not even followed by a `;`, no node to add.
  851. ReturnErrorOnState();
  852. }
  853. auto Parser::HandleFunctionError(StateStackEntry state,
  854. bool skip_past_likely_end) -> void {
  855. auto token = state.token;
  856. if (skip_past_likely_end) {
  857. if (auto semi = SkipPastLikelyEnd(token)) {
  858. token = *semi;
  859. }
  860. }
  861. AddNode(ParseNodeKind::FunctionDeclaration(), token, state.subtree_start,
  862. /*has_error=*/true);
  863. }
  864. auto Parser::HandleFunctionIntroducerState() -> void {
  865. auto state = PopState();
  866. if (!ConsumeAndAddLeafNodeIf(TokenKind::Identifier(),
  867. ParseNodeKind::DeclaredName())) {
  868. CARBON_DIAGNOSTIC(ExpectedFunctionName, Error,
  869. "Expected function name after `fn` keyword.");
  870. emitter_->Emit(*position_, ExpectedFunctionName);
  871. // TODO: We could change the lexer to allow us to synthesize certain
  872. // kinds of tokens and try to "recover" here, but unclear that this is
  873. // really useful.
  874. HandleFunctionError(state, true);
  875. return;
  876. }
  877. if (!PositionIs(TokenKind::OpenParen())) {
  878. CARBON_DIAGNOSTIC(ExpectedFunctionParams, Error,
  879. "Expected `(` after function name.");
  880. emitter_->Emit(*position_, ExpectedFunctionParams);
  881. HandleFunctionError(state, true);
  882. return;
  883. }
  884. // Parse the parameter list as its own subtree; once that pops, resume
  885. // function parsing.
  886. state.state = ParserState::FunctionAfterParameterList();
  887. PushState(state);
  888. PushState(ParserState::FunctionParameterListFinish());
  889. AddLeafNode(ParseNodeKind::ParameterListStart(), Consume());
  890. if (!PositionIs(TokenKind::CloseParen())) {
  891. PushState(ParserState::FunctionParameter());
  892. }
  893. }
  894. auto Parser::HandleFunctionParameterState() -> void {
  895. PopAndDiscardState();
  896. PushState(ParserState::FunctionParameterFinish());
  897. PushState(ParserState::PatternAsFunctionParameter());
  898. }
  899. auto Parser::HandleFunctionParameterFinishState() -> void {
  900. auto state = PopState();
  901. if (state.has_error) {
  902. ReturnErrorOnState();
  903. }
  904. if (ConsumeListToken(ParseNodeKind::ParameterListComma(),
  905. TokenKind::CloseParen(),
  906. state.has_error) == ListTokenKind::Comma) {
  907. PushState(ParserState::PatternAsFunctionParameter());
  908. }
  909. }
  910. auto Parser::HandleFunctionParameterListFinishState() -> void {
  911. auto state = PopState();
  912. AddNode(ParseNodeKind::ParameterList(),
  913. ConsumeChecked(TokenKind::CloseParen()), state.subtree_start,
  914. state.has_error);
  915. }
  916. auto Parser::HandleFunctionAfterParameterListState() -> void {
  917. auto state = PopState();
  918. // Regardless of whether there's a return type, we'll finish the signature.
  919. state.state = ParserState::FunctionSignatureFinish();
  920. PushState(state);
  921. // If there is a return type, parse the expression before adding the return
  922. // type nod.e
  923. if (PositionIs(TokenKind::MinusGreater())) {
  924. PushState(ParserState::FunctionReturnTypeFinish());
  925. ++position_;
  926. PushStateForExpression(PrecedenceGroup::ForType());
  927. }
  928. }
  929. auto Parser::HandleFunctionReturnTypeFinishState() -> void {
  930. auto state = PopState();
  931. AddNode(ParseNodeKind::ReturnType(), state.token, state.subtree_start,
  932. state.has_error);
  933. }
  934. auto Parser::HandleFunctionSignatureFinishState() -> void {
  935. auto state = PopState();
  936. switch (PositionKind()) {
  937. case TokenKind::Semi(): {
  938. AddNode(ParseNodeKind::FunctionDeclaration(), Consume(),
  939. state.subtree_start, state.has_error);
  940. break;
  941. }
  942. case TokenKind::OpenCurlyBrace(): {
  943. AddNode(ParseNodeKind::FunctionDefinitionStart(), Consume(),
  944. state.subtree_start, state.has_error);
  945. // Any error is recorded on the FunctionDefinitionStart.
  946. state.has_error = false;
  947. state.state = ParserState::FunctionDefinitionFinish();
  948. PushState(state);
  949. PushState(ParserState::StatementScopeLoop());
  950. break;
  951. }
  952. default: {
  953. CARBON_DIAGNOSTIC(
  954. ExpectedFunctionBodyOrSemi, Error,
  955. "Expected function definition or `;` after function declaration.");
  956. emitter_->Emit(*position_, ExpectedFunctionBodyOrSemi);
  957. // Only need to skip if we've not already found a new line.
  958. bool skip_past_likely_end =
  959. tokens_->GetLine(*position_) == tokens_->GetLine(state.token);
  960. HandleFunctionError(state, skip_past_likely_end);
  961. break;
  962. }
  963. }
  964. }
  965. auto Parser::HandleFunctionDefinitionFinishState() -> void {
  966. auto state = PopState();
  967. AddNode(ParseNodeKind::FunctionDefinition(), Consume(), state.subtree_start,
  968. state.has_error);
  969. }
  970. auto Parser::HandlePackageState() -> void {
  971. auto state = PopState();
  972. AddLeafNode(ParseNodeKind::PackageIntroducer(), Consume());
  973. auto exit_on_parse_error = [&]() {
  974. auto semi_token = SkipPastLikelyEnd(state.token);
  975. return AddNode(ParseNodeKind::PackageDirective(),
  976. semi_token ? *semi_token : state.token, state.subtree_start,
  977. /*has_error=*/true);
  978. };
  979. if (!ConsumeAndAddLeafNodeIf(TokenKind::Identifier(),
  980. ParseNodeKind::DeclaredName())) {
  981. CARBON_DIAGNOSTIC(ExpectedIdentifierAfterPackage, Error,
  982. "Expected identifier after `package`.");
  983. emitter_->Emit(*position_, ExpectedIdentifierAfterPackage);
  984. exit_on_parse_error();
  985. return;
  986. }
  987. bool library_parsed = false;
  988. if (auto library_token = ConsumeIf(TokenKind::Library())) {
  989. auto library_start = tree_->size();
  990. if (!ConsumeAndAddLeafNodeIf(TokenKind::StringLiteral(),
  991. ParseNodeKind::Literal())) {
  992. CARBON_DIAGNOSTIC(
  993. ExpectedLibraryName, Error,
  994. "Expected a string literal to specify the library name.");
  995. emitter_->Emit(*position_, ExpectedLibraryName);
  996. exit_on_parse_error();
  997. return;
  998. }
  999. AddNode(ParseNodeKind::PackageLibrary(), *library_token, library_start,
  1000. /*has_error=*/false);
  1001. library_parsed = true;
  1002. }
  1003. switch (auto api_or_impl_token = tokens_->GetKind(*(position_))) {
  1004. case TokenKind::Api(): {
  1005. AddLeafNode(ParseNodeKind::PackageApi(), Consume());
  1006. break;
  1007. }
  1008. case TokenKind::Impl(): {
  1009. AddLeafNode(ParseNodeKind::PackageImpl(), Consume());
  1010. break;
  1011. }
  1012. default: {
  1013. if (!library_parsed && api_or_impl_token == TokenKind::StringLiteral()) {
  1014. // If we come acroess a string literal and we didn't parse `library
  1015. // "..."` yet, then most probably the user forgot to add `library`
  1016. // before the library name.
  1017. CARBON_DIAGNOSTIC(MissingLibraryKeyword, Error,
  1018. "Missing `library` keyword.");
  1019. emitter_->Emit(*position_, MissingLibraryKeyword);
  1020. } else {
  1021. CARBON_DIAGNOSTIC(ExpectedApiOrImpl, Error,
  1022. "Expected a `api` or `impl`.");
  1023. emitter_->Emit(*position_, ExpectedApiOrImpl);
  1024. }
  1025. exit_on_parse_error();
  1026. return;
  1027. }
  1028. }
  1029. if (!PositionIs(TokenKind::Semi())) {
  1030. CARBON_DIAGNOSTIC(ExpectedSemiToEndPackageDirective, Error,
  1031. "Expected `;` to end package directive.");
  1032. emitter_->Emit(*position_, ExpectedSemiToEndPackageDirective);
  1033. exit_on_parse_error();
  1034. return;
  1035. }
  1036. AddNode(ParseNodeKind::PackageDirective(), Consume(), state.subtree_start,
  1037. /*has_error=*/false);
  1038. }
  1039. auto Parser::HandleParenCondition(ParseNodeKind start_kind,
  1040. ParserState finish_state) -> void {
  1041. auto state = PopState();
  1042. ConsumeAndAddOpenParen(state.token, start_kind);
  1043. state.state = finish_state;
  1044. PushState(state);
  1045. PushState(ParserState::Expression());
  1046. }
  1047. auto Parser::HandleParenConditionAsIfState() -> void {
  1048. HandleParenCondition(ParseNodeKind::IfConditionStart(),
  1049. ParserState::ParenConditionFinishAsIf());
  1050. }
  1051. auto Parser::HandleParenConditionAsWhileState() -> void {
  1052. HandleParenCondition(ParseNodeKind::WhileConditionStart(),
  1053. ParserState::ParenConditionFinishAsWhile());
  1054. }
  1055. auto Parser::HandleParenConditionFinishAsIfState() -> void {
  1056. auto state = PopState();
  1057. ConsumeAndAddCloseParen(state, ParseNodeKind::IfCondition());
  1058. }
  1059. auto Parser::HandleParenConditionFinishAsWhileState() -> void {
  1060. auto state = PopState();
  1061. ConsumeAndAddCloseParen(state, ParseNodeKind::WhileCondition());
  1062. }
  1063. auto Parser::HandleParenExpressionState() -> void {
  1064. auto state = PopState();
  1065. // Advance past the open paren.
  1066. AddLeafNode(ParseNodeKind::ParenExpressionOrTupleLiteralStart(),
  1067. ConsumeChecked(TokenKind::OpenParen()));
  1068. if (PositionIs(TokenKind::CloseParen())) {
  1069. state.state = ParserState::ParenExpressionFinishAsTuple();
  1070. PushState(state);
  1071. } else {
  1072. state.state = ParserState::ParenExpressionFinish();
  1073. PushState(state);
  1074. PushState(ParserState::ParenExpressionParameterFinishAsUnknown());
  1075. PushState(ParserState::Expression());
  1076. }
  1077. }
  1078. auto Parser::HandleParenExpressionParameterFinish(bool as_tuple) -> void {
  1079. auto state = PopState();
  1080. auto list_token_kind =
  1081. ConsumeListToken(ParseNodeKind::TupleLiteralComma(),
  1082. TokenKind::CloseParen(), state.has_error);
  1083. if (list_token_kind == ListTokenKind::Close) {
  1084. return;
  1085. }
  1086. // If this is the first item and a comma was found, switch to tuple handling.
  1087. // Note this could be `(expr,)` so we may not reuse the current state, but
  1088. // it's still necessary to switch the parent.
  1089. if (!as_tuple) {
  1090. state.state = ParserState::ParenExpressionParameterFinishAsTuple();
  1091. auto finish_state = PopState();
  1092. CARBON_CHECK(finish_state.state == ParserState::ParenExpressionFinish())
  1093. << "Unexpected parent state, found: " << finish_state.state;
  1094. finish_state.state = ParserState::ParenExpressionFinishAsTuple();
  1095. PushState(finish_state);
  1096. }
  1097. // On a comma, push another expression handler.
  1098. if (list_token_kind == ListTokenKind::Comma) {
  1099. PushState(state);
  1100. PushState(ParserState::Expression());
  1101. }
  1102. }
  1103. auto Parser::HandleParenExpressionParameterFinishAsUnknownState() -> void {
  1104. HandleParenExpressionParameterFinish(/*as_tuple=*/false);
  1105. }
  1106. auto Parser::HandleParenExpressionParameterFinishAsTupleState() -> void {
  1107. HandleParenExpressionParameterFinish(/*as_tuple=*/true);
  1108. }
  1109. auto Parser::HandleParenExpressionFinishState() -> void {
  1110. auto state = PopState();
  1111. AddNode(ParseNodeKind::ParenExpression(), Consume(), state.subtree_start,
  1112. state.has_error);
  1113. }
  1114. auto Parser::HandleParenExpressionFinishAsTupleState() -> void {
  1115. auto state = PopState();
  1116. AddNode(ParseNodeKind::TupleLiteral(), Consume(), state.subtree_start,
  1117. state.has_error);
  1118. }
  1119. auto Parser::HandlePattern(PatternKind pattern_kind) -> void {
  1120. auto state = PopState();
  1121. // Ensure the finish state always follows.
  1122. state.state = ParserState::PatternFinish();
  1123. // Handle an invalid pattern introducer.
  1124. if (!PositionIs(TokenKind::Identifier()) ||
  1125. tokens_->GetKind(*(position_ + 1)) != TokenKind::Colon()) {
  1126. switch (pattern_kind) {
  1127. case PatternKind::Parameter: {
  1128. CARBON_DIAGNOSTIC(ExpectedParameterName, Error,
  1129. "Expected parameter declaration.");
  1130. emitter_->Emit(*position_, ExpectedParameterName);
  1131. break;
  1132. }
  1133. case PatternKind::Variable: {
  1134. CARBON_DIAGNOSTIC(ExpectedVariableName, Error,
  1135. "Expected pattern in `var` declaration.");
  1136. emitter_->Emit(*position_, ExpectedVariableName);
  1137. break;
  1138. }
  1139. }
  1140. state.has_error = true;
  1141. PushState(state);
  1142. return;
  1143. }
  1144. // Switch the context token to the colon, so that it'll be used for the root
  1145. // node.
  1146. state.token = *(position_ + 1);
  1147. PushState(state);
  1148. PushStateForExpression(PrecedenceGroup::ForType());
  1149. AddLeafNode(ParseNodeKind::DeclaredName(), *position_);
  1150. position_ += 2;
  1151. }
  1152. auto Parser::HandlePatternAsFunctionParameterState() -> void {
  1153. HandlePattern(PatternKind::Parameter);
  1154. }
  1155. auto Parser::HandlePatternAsVariableState() -> void {
  1156. HandlePattern(PatternKind::Variable);
  1157. }
  1158. auto Parser::HandlePatternFinishState() -> void {
  1159. auto state = PopState();
  1160. // If an error was encountered, propagate it without adding a node.
  1161. if (state.has_error) {
  1162. ReturnErrorOnState();
  1163. return;
  1164. }
  1165. // TODO: may need to mark has_error if !type.
  1166. AddNode(ParseNodeKind::PatternBinding(), state.token, state.subtree_start,
  1167. /*has_error=*/false);
  1168. }
  1169. auto Parser::HandleStatementState() -> void {
  1170. PopAndDiscardState();
  1171. switch (PositionKind()) {
  1172. case TokenKind::Break(): {
  1173. PushState(ParserState::StatementBreakFinish());
  1174. AddLeafNode(ParseNodeKind::BreakStatementStart(), Consume());
  1175. break;
  1176. }
  1177. case TokenKind::Continue(): {
  1178. PushState(ParserState::StatementContinueFinish());
  1179. AddLeafNode(ParseNodeKind::ContinueStatementStart(), Consume());
  1180. break;
  1181. }
  1182. case TokenKind::For(): {
  1183. PushState(ParserState::StatementForFinish());
  1184. PushState(ParserState::StatementForHeader());
  1185. ++position_;
  1186. break;
  1187. }
  1188. case TokenKind::If(): {
  1189. PushState(ParserState::StatementIf());
  1190. break;
  1191. }
  1192. case TokenKind::Return(): {
  1193. PushState(ParserState::StatementReturn());
  1194. break;
  1195. }
  1196. case TokenKind::Var(): {
  1197. PushState(ParserState::VarAsSemicolon());
  1198. break;
  1199. }
  1200. case TokenKind::While(): {
  1201. PushState(ParserState::StatementWhile());
  1202. break;
  1203. }
  1204. default: {
  1205. PushState(ParserState::ExpressionStatementFinish());
  1206. PushState(ParserState::Expression());
  1207. break;
  1208. }
  1209. }
  1210. }
  1211. auto Parser::HandleStatementBreakFinishState() -> void {
  1212. HandleStatementKeywordFinish(ParseNodeKind::BreakStatement());
  1213. }
  1214. auto Parser::HandleStatementContinueFinishState() -> void {
  1215. HandleStatementKeywordFinish(ParseNodeKind::ContinueStatement());
  1216. }
  1217. auto Parser::HandleStatementForHeaderState() -> void {
  1218. auto state = PopState();
  1219. ConsumeAndAddOpenParen(state.token, ParseNodeKind::ForHeaderStart());
  1220. state.state = ParserState::StatementForHeaderIn();
  1221. if (PositionIs(TokenKind::Var())) {
  1222. PushState(state);
  1223. PushState(ParserState::VarAsFor());
  1224. } else {
  1225. CARBON_DIAGNOSTIC(ExpectedVariableDeclaration, Error,
  1226. "Expected `var` declaration.");
  1227. emitter_->Emit(*position_, ExpectedVariableDeclaration);
  1228. if (auto next_in = FindNextOf({TokenKind::In()})) {
  1229. SkipTo(*next_in);
  1230. ++position_;
  1231. }
  1232. state.has_error = true;
  1233. PushState(state);
  1234. }
  1235. }
  1236. auto Parser::HandleStatementForHeaderInState() -> void {
  1237. auto state = PopState();
  1238. state.state = ParserState::StatementForHeaderFinish();
  1239. PushState(state);
  1240. PushState(ParserState::Expression());
  1241. }
  1242. auto Parser::HandleStatementForHeaderFinishState() -> void {
  1243. auto state = PopState();
  1244. ConsumeAndAddCloseParen(state, ParseNodeKind::ForHeader());
  1245. PushState(ParserState::CodeBlock());
  1246. }
  1247. auto Parser::HandleStatementForFinishState() -> void {
  1248. auto state = PopState();
  1249. AddNode(ParseNodeKind::ForStatement(), state.token, state.subtree_start,
  1250. state.has_error);
  1251. }
  1252. auto Parser::HandleStatementIfState() -> void {
  1253. PopAndDiscardState();
  1254. PushState(ParserState::StatementIfConditionFinish());
  1255. PushState(ParserState::ParenConditionAsIf());
  1256. ++position_;
  1257. }
  1258. auto Parser::HandleStatementIfConditionFinishState() -> void {
  1259. auto state = PopState();
  1260. state.state = ParserState::StatementIfThenBlockFinish();
  1261. PushState(state);
  1262. PushState(ParserState::CodeBlock());
  1263. }
  1264. auto Parser::HandleStatementIfThenBlockFinishState() -> void {
  1265. auto state = PopState();
  1266. if (ConsumeAndAddLeafNodeIf(TokenKind::Else(),
  1267. ParseNodeKind::IfStatementElse())) {
  1268. state.state = ParserState::StatementIfElseBlockFinish();
  1269. PushState(state);
  1270. // `else if` is permitted as a special case.
  1271. PushState(PositionIs(TokenKind::If()) ? ParserState::StatementIf()
  1272. : ParserState::CodeBlock());
  1273. } else {
  1274. AddNode(ParseNodeKind::IfStatement(), state.token, state.subtree_start,
  1275. state.has_error);
  1276. }
  1277. }
  1278. auto Parser::HandleStatementIfElseBlockFinishState() -> void {
  1279. auto state = PopState();
  1280. AddNode(ParseNodeKind::IfStatement(), state.token, state.subtree_start,
  1281. state.has_error);
  1282. }
  1283. auto Parser::HandleStatementKeywordFinish(ParseNodeKind node_kind) -> void {
  1284. auto state = PopState();
  1285. auto semi = ConsumeIf(TokenKind::Semi());
  1286. if (!semi) {
  1287. CARBON_DIAGNOSTIC(ExpectedSemiAfter, Error, "Expected `;` after `{0}`.",
  1288. TokenKind);
  1289. emitter_->Emit(*position_, ExpectedSemiAfter,
  1290. tokens_->GetKind(state.token));
  1291. state.has_error = true;
  1292. // Recover to the next semicolon if possible, otherwise indicate the
  1293. // keyword for the error.
  1294. semi = SkipPastLikelyEnd(state.token);
  1295. if (!semi) {
  1296. semi = state.token;
  1297. }
  1298. }
  1299. AddNode(node_kind, *semi, state.subtree_start, state.has_error);
  1300. }
  1301. auto Parser::HandleStatementReturnState() -> void {
  1302. auto state = PopState();
  1303. state.state = ParserState::StatementReturnFinish();
  1304. PushState(state);
  1305. AddLeafNode(ParseNodeKind::ReturnStatementStart(), Consume());
  1306. if (!PositionIs(TokenKind::Semi())) {
  1307. PushState(ParserState::Expression());
  1308. }
  1309. }
  1310. auto Parser::HandleStatementReturnFinishState() -> void {
  1311. HandleStatementKeywordFinish(ParseNodeKind::ReturnStatement());
  1312. }
  1313. auto Parser::HandleStatementScopeLoopState() -> void {
  1314. // This maintains the current state until we're at the end of the scope.
  1315. auto token_kind = PositionKind();
  1316. if (token_kind == TokenKind::CloseCurlyBrace()) {
  1317. auto state = PopState();
  1318. if (state.has_error) {
  1319. ReturnErrorOnState();
  1320. }
  1321. } else {
  1322. PushState(ParserState::Statement());
  1323. }
  1324. }
  1325. auto Parser::HandleStatementWhileState() -> void {
  1326. PopAndDiscardState();
  1327. PushState(ParserState::StatementWhileConditionFinish());
  1328. PushState(ParserState::ParenConditionAsWhile());
  1329. ++position_;
  1330. }
  1331. auto Parser::HandleStatementWhileConditionFinishState() -> void {
  1332. auto state = PopState();
  1333. state.state = ParserState::StatementWhileBlockFinish();
  1334. PushState(state);
  1335. PushState(ParserState::CodeBlock());
  1336. }
  1337. auto Parser::HandleStatementWhileBlockFinishState() -> void {
  1338. auto state = PopState();
  1339. AddNode(ParseNodeKind::WhileStatement(), state.token, state.subtree_start,
  1340. state.has_error);
  1341. }
  1342. auto Parser::HandleVar(ParserState finish_state) -> void {
  1343. PopAndDiscardState();
  1344. // These will start at the `var`.
  1345. PushState(finish_state);
  1346. PushState(ParserState::VarAfterPattern());
  1347. AddLeafNode(ParseNodeKind::VariableIntroducer(), Consume());
  1348. // This will start at the pattern.
  1349. PushState(ParserState::PatternAsVariable());
  1350. }
  1351. auto Parser::HandleVarAsSemicolonState() -> void {
  1352. HandleVar(ParserState::VarFinishAsSemicolon());
  1353. }
  1354. auto Parser::HandleVarAsForState() -> void {
  1355. HandleVar(ParserState::VarFinishAsFor());
  1356. }
  1357. auto Parser::HandleVarAfterPatternState() -> void {
  1358. auto state = PopState();
  1359. if (state.has_error) {
  1360. if (auto after_pattern =
  1361. FindNextOf({TokenKind::Equal(), TokenKind::Semi()})) {
  1362. SkipTo(*after_pattern);
  1363. }
  1364. }
  1365. if (PositionIs(TokenKind::Equal())) {
  1366. PushState(ParserState::VarAfterInitializer());
  1367. ++position_;
  1368. PushState(ParserState::Expression());
  1369. return;
  1370. }
  1371. }
  1372. auto Parser::HandleVarAfterInitializerState() -> void {
  1373. auto state = PopState();
  1374. AddNode(ParseNodeKind::VariableInitializer(), state.token,
  1375. state.subtree_start, state.has_error);
  1376. }
  1377. auto Parser::HandleVarFinishAsSemicolonState() -> void {
  1378. auto state = PopState();
  1379. auto end_token = state.token;
  1380. if (PositionIs(TokenKind::Semi())) {
  1381. end_token = Consume();
  1382. } else {
  1383. emitter_->Emit(*position_, ExpectedSemiAfterExpression);
  1384. state.has_error = true;
  1385. if (auto semi_token = SkipPastLikelyEnd(state.token)) {
  1386. end_token = *semi_token;
  1387. }
  1388. }
  1389. AddNode(ParseNodeKind::VariableDeclaration(), end_token, state.subtree_start,
  1390. state.has_error);
  1391. }
  1392. auto Parser::HandleVarFinishAsForState() -> void {
  1393. auto state = PopState();
  1394. auto end_token = state.token;
  1395. if (PositionIs(TokenKind::In())) {
  1396. end_token = Consume();
  1397. } else if (PositionIs(TokenKind::Colon())) {
  1398. CARBON_DIAGNOSTIC(ExpectedIn, Error, "`:` should be replaced by `in`.");
  1399. emitter_->Emit(*position_, ExpectedIn);
  1400. state.has_error = true;
  1401. end_token = Consume();
  1402. } else {
  1403. CARBON_DIAGNOSTIC(ExpectedIn, Error,
  1404. "Expected `in` after loop `var` declaration.");
  1405. emitter_->Emit(*position_, ExpectedIn);
  1406. state.has_error = true;
  1407. }
  1408. AddNode(ParseNodeKind::ForIn(), end_token, state.subtree_start,
  1409. state.has_error);
  1410. }
  1411. auto Parser::HandleInterfaceIntroducerState() -> void {
  1412. auto state = PopState();
  1413. if (!ConsumeAndAddLeafNodeIf(TokenKind::Identifier(),
  1414. ParseNodeKind::DeclaredName())) {
  1415. CARBON_DIAGNOSTIC(ExpectedInterfaceName, Error,
  1416. "Expected interface name after `interface` keyword.");
  1417. emitter_->Emit(*position_, ExpectedInterfaceName);
  1418. state.has_error = true;
  1419. // Add a name node even when it's not present because it's used for subtree
  1420. // bracketing on interfaces.
  1421. // TODO: Either fix this or normalize it, still deciding on the right
  1422. // approach.
  1423. AddLeafNode(ParseNodeKind::DeclaredName(), state.token, /*has_error=*/true);
  1424. }
  1425. bool parse_body = true;
  1426. if (!PositionIs(TokenKind::OpenCurlyBrace())) {
  1427. CARBON_DIAGNOSTIC(ExpectedInterfaceOpenCurlyBrace, Error,
  1428. "Expected `{{` to start interface definition.");
  1429. emitter_->Emit(*position_, ExpectedInterfaceOpenCurlyBrace);
  1430. state.has_error = true;
  1431. SkipPastLikelyEnd(state.token);
  1432. parse_body = false;
  1433. }
  1434. state.state = ParserState::InterfaceDefinitionFinish();
  1435. PushState(state);
  1436. if (parse_body) {
  1437. PushState(ParserState::InterfaceDefinitionLoop());
  1438. AddLeafNode(ParseNodeKind::InterfaceBodyStart(), Consume());
  1439. }
  1440. }
  1441. auto Parser::HandleInterfaceDefinitionLoopState() -> void {
  1442. // This maintains the current state unless we're at the end of the interface
  1443. // definition.
  1444. switch (PositionKind()) {
  1445. case TokenKind::CloseCurlyBrace(): {
  1446. auto state = PopState();
  1447. AddNode(ParseNodeKind::InterfaceBody(), Consume(), state.subtree_start,
  1448. state.has_error);
  1449. break;
  1450. }
  1451. // TODO: Handle possible declarations inside interface body.
  1452. default: {
  1453. CARBON_DIAGNOSTIC(UnrecognizedDeclaration, Error,
  1454. "Unrecognized declaration introducer.");
  1455. emitter_->Emit(*position_, UnrecognizedDeclaration);
  1456. if (auto semi = SkipPastLikelyEnd(*position_)) {
  1457. AddLeafNode(ParseNodeKind::EmptyDeclaration(), *semi,
  1458. /*has_error=*/true);
  1459. } else {
  1460. ReturnErrorOnState();
  1461. }
  1462. break;
  1463. }
  1464. }
  1465. }
  1466. auto Parser::HandleInterfaceDefinitionFinishState() -> void {
  1467. auto state = PopState();
  1468. AddNode(ParseNodeKind::InterfaceDefinition(), state.token,
  1469. state.subtree_start, state.has_error);
  1470. }
  1471. } // namespace Carbon