parser.cpp 53 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
37047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126112711281129113011311132113311341135113611371138113911401141114211431144114511461147114811491150115111521153115411551156115711581159116011611162116311641165116611671168116911701171117211731174117511761177117811791180118111821183118411851186118711881189119011911192119311941195119611971198119912001201120212031204120512061207120812091210121112121213121412151216121712181219122012211222122312241225122612271228122912301231123212331234123512361237123812391240124112421243124412451246124712481249125012511252125312541255125612571258125912601261126212631264126512661267126812691270127112721273127412751276127
712781279128012811282128312841285128612871288128912901291129212931294129512961297129812991300130113021303130413051306130713081309131013111312131313141315131613171318131913201321132213231324132513261327132813291330133113321333133413351336133713381339134013411342134313441345134613471348134913501351135213531354135513561357135813591360136113621363136413651366136713681369137013711372137313741375137613771378137913801381138213831384138513861387138813891390139113921393139413951396139713981399140014011402140314041405140614071408140914101411141214131414141514161417141814191420142114221423142414251426142714281429143014311432143314341435143614371438143914401441144214431444144514461447144814491450145114521453145414551456145714581459146014611462146314641465146614671468146914701471147214731474147514761477147814791480148114821483148414851486148714881489149014911492149314941495149614971498149915001501150215031504150515061507150815091510151115121513151415151516151715181519152015211522152315241525152615271528152915301531153215331534153515361537153815391540154115421543154415451546154715481549155015511552155315541555155615571558155915601561156215631564156515661567156815691570157115721573157415751576157715781579158015811582158315841585158615871588158915901591159215931594159515961597159815991600160116021603160416051606160716081609161016111612161316141615161616171618161916201621162216231624162516261627162816291630163116321633163416351636163716381639164016411642164316441645164616471648164916501651165216531654165516561657
  1. // Part of the Carbon Language project, under the Apache License v2.0 with LLVM
  2. // Exceptions. See /LICENSE for license information.
  3. // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
  4. #include "toolchain/parser/parser.h"
  5. #include <cstdlib>
  6. #include <memory>
  7. #include "common/check.h"
  8. #include "llvm/ADT/Optional.h"
  9. #include "llvm/Support/PrettyStackTrace.h"
  10. #include "toolchain/lexer/token_kind.h"
  11. #include "toolchain/lexer/tokenized_buffer.h"
  12. #include "toolchain/parser/parse_node_kind.h"
  13. #include "toolchain/parser/parse_tree.h"
  14. namespace Carbon {
  15. // May be emitted a couple different ways as part of operator parsing.
  16. CARBON_DIAGNOSTIC(
  17. OperatorRequiresParentheses, Error,
  18. "Parentheses are required to disambiguate operator precedence.");
  19. CARBON_DIAGNOSTIC(ExpectedSemiAfterExpression, Error,
  20. "Expected `;` after expression.");
  // Describes where something sits relative to a token; used as a format
  // argument in whitespace diagnostics ("around", "after", "before").
  enum class RelativeLocation : int8_t {
    Around = 0,
    After = 1,
    Before = 2,
  };
  27. // Adapts RelativeLocation for use with formatv.
  28. static auto operator<<(llvm::raw_ostream& out, RelativeLocation loc)
  29. -> llvm::raw_ostream& {
  30. switch (loc) {
  31. case RelativeLocation::Around:
  32. out << "around";
  33. break;
  34. case RelativeLocation::After:
  35. out << "after";
  36. break;
  37. case RelativeLocation::Before:
  38. out << "before";
  39. break;
  40. }
  41. return out;
  42. }
  43. class Parser::PrettyStackTraceParseState : public llvm::PrettyStackTraceEntry {
  44. public:
  45. explicit PrettyStackTraceParseState(const Parser* parser) : parser_(parser) {}
  46. ~PrettyStackTraceParseState() override = default;
  47. auto print(llvm::raw_ostream& output) const -> void override {
  48. output << "Parser stack:\n";
  49. for (int i = 0; i < static_cast<int>(parser_->state_stack_.size()); ++i) {
  50. const auto& entry = parser_->state_stack_[i];
  51. output << "\t" << i << ".\t" << entry.state;
  52. Print(output, entry.token);
  53. }
  54. output << "\tcursor\tposition_";
  55. Print(output, *parser_->position_);
  56. }
  57. private:
  58. auto Print(llvm::raw_ostream& output, TokenizedBuffer::Token token) const
  59. -> void {
  60. auto line = parser_->tokens_.GetLine(token);
  61. output << " @ " << parser_->tokens_.GetLineNumber(line) << ":"
  62. << parser_->tokens_.GetColumnNumber(token) << ":"
  63. << " token " << token << " : "
  64. << parser_->tokens_.GetKind(token).Name() << "\n";
  65. }
  66. const Parser* parser_;
  67. };
  68. Parser::Parser(ParseTree& tree_arg, TokenizedBuffer& tokens_arg,
  69. TokenDiagnosticEmitter& emitter)
  70. : tree_(tree_arg),
  71. tokens_(tokens_arg),
  72. emitter_(emitter),
  73. position_(tokens_.tokens().begin()),
  74. end_(tokens_.tokens().end()) {
  75. CARBON_CHECK(position_ != end_) << "Empty TokenizedBuffer";
  76. --end_;
  77. CARBON_CHECK(tokens_.GetKind(*end_) == TokenKind::EndOfFile())
  78. << "TokenizedBuffer should end with EndOfFile, ended with "
  79. << tokens_.GetKind(*end_).Name();
  80. }
  81. auto Parser::AddLeafNode(ParseNodeKind kind, TokenizedBuffer::Token token,
  82. bool has_error) -> void {
  83. tree_.node_impls_.push_back(
  84. ParseTree::NodeImpl(kind, has_error, token, /*subtree_size=*/1));
  85. if (has_error) {
  86. tree_.has_errors_ = true;
  87. }
  88. }
  89. auto Parser::AddNode(ParseNodeKind kind, TokenizedBuffer::Token token,
  90. int subtree_start, bool has_error) -> void {
  91. int subtree_size = tree_.size() - subtree_start + 1;
  92. tree_.node_impls_.push_back(
  93. ParseTree::NodeImpl(kind, has_error, token, subtree_size));
  94. if (has_error) {
  95. tree_.has_errors_ = true;
  96. }
  97. }
  98. auto Parser::ConsumeAndAddCloseParen(TokenizedBuffer::Token open_paren,
  99. ParseNodeKind close_kind) -> bool {
  100. if (ConsumeAndAddLeafNodeIf(TokenKind::CloseParen(), close_kind)) {
  101. return true;
  102. }
  103. // TODO: Include the location of the matching open_paren in the diagnostic.
  104. CARBON_DIAGNOSTIC(ExpectedCloseParen, Error, "Unexpected tokens before `)`.");
  105. emitter_.Emit(*position_, ExpectedCloseParen);
  106. SkipTo(tokens_.GetMatchedClosingToken(open_paren));
  107. AddLeafNode(close_kind, Consume());
  108. return false;
  109. }
  110. auto Parser::ConsumeAndAddLeafNodeIf(TokenKind token_kind,
  111. ParseNodeKind node_kind) -> bool {
  112. auto token = ConsumeIf(token_kind);
  113. if (!token) {
  114. return false;
  115. }
  116. AddLeafNode(node_kind, *token);
  117. return true;
  118. }
  119. auto Parser::ConsumeIf(TokenKind kind)
  120. -> llvm::Optional<TokenizedBuffer::Token> {
  121. if (!PositionIs(kind)) {
  122. return llvm::None;
  123. }
  124. return Consume();
  125. }
  126. auto Parser::FindNextOf(std::initializer_list<TokenKind> desired_kinds)
  127. -> llvm::Optional<TokenizedBuffer::Token> {
  128. auto new_position = position_;
  129. while (true) {
  130. TokenizedBuffer::Token token = *new_position;
  131. TokenKind kind = tokens_.GetKind(token);
  132. if (kind.IsOneOf(desired_kinds)) {
  133. return token;
  134. }
  135. // Step to the next token at the current bracketing level.
  136. if (kind.IsClosingSymbol() || kind == TokenKind::EndOfFile()) {
  137. // There are no more tokens at this level.
  138. return llvm::None;
  139. } else if (kind.IsOpeningSymbol()) {
  140. new_position =
  141. TokenizedBuffer::TokenIterator(tokens_.GetMatchedClosingToken(token));
  142. // Advance past the closing token.
  143. ++new_position;
  144. } else {
  145. ++new_position;
  146. }
  147. }
  148. }
  149. auto Parser::SkipMatchingGroup() -> bool {
  150. if (!PositionKind().IsOpeningSymbol()) {
  151. return false;
  152. }
  153. SkipTo(tokens_.GetMatchedClosingToken(*position_));
  154. ++position_;
  155. return true;
  156. }
  157. auto Parser::SkipPastLikelyEnd(TokenizedBuffer::Token skip_root)
  158. -> llvm::Optional<TokenizedBuffer::Token> {
  159. if (position_ == end_) {
  160. return llvm::None;
  161. }
  162. TokenizedBuffer::Line root_line = tokens_.GetLine(skip_root);
  163. int root_line_indent = tokens_.GetIndentColumnNumber(root_line);
  164. // We will keep scanning through tokens on the same line as the root or
  165. // lines with greater indentation than root's line.
  166. auto is_same_line_or_indent_greater_than_root =
  167. [&](TokenizedBuffer::Token t) {
  168. TokenizedBuffer::Line l = tokens_.GetLine(t);
  169. if (l == root_line) {
  170. return true;
  171. }
  172. return tokens_.GetIndentColumnNumber(l) > root_line_indent;
  173. };
  174. do {
  175. if (PositionIs(TokenKind::CloseCurlyBrace())) {
  176. // Immediately bail out if we hit an unmatched close curly, this will
  177. // pop us up a level of the syntax grouping.
  178. return llvm::None;
  179. }
  180. // We assume that a semicolon is always intended to be the end of the
  181. // current construct.
  182. if (auto semi = ConsumeIf(TokenKind::Semi())) {
  183. return semi;
  184. }
  185. // Skip over any matching group of tokens_.
  186. if (SkipMatchingGroup()) {
  187. continue;
  188. }
  189. // Otherwise just step forward one token.
  190. ++position_;
  191. } while (position_ != end_ &&
  192. is_same_line_or_indent_greater_than_root(*position_));
  193. return llvm::None;
  194. }
  195. auto Parser::SkipTo(TokenizedBuffer::Token t) -> void {
  196. CARBON_CHECK(t >= *position_) << "Tried to skip backwards from " << position_
  197. << " to " << TokenizedBuffer::TokenIterator(t);
  198. position_ = TokenizedBuffer::TokenIterator(t);
  199. CARBON_CHECK(position_ != end_) << "Skipped past EOF.";
  200. }
  201. auto Parser::HandleCodeBlockState() -> void {
  202. PopAndDiscardState();
  203. PushState(ParserState::CodeBlockFinish());
  204. if (ConsumeAndAddLeafNodeIf(TokenKind::OpenCurlyBrace(),
  205. ParseNodeKind::CodeBlockStart())) {
  206. PushState(ParserState::StatementScopeLoop());
  207. } else {
  208. AddLeafNode(ParseNodeKind::CodeBlockStart(), *position_,
  209. /*has_error=*/true);
  210. // Recover by parsing a single statement.
  211. CARBON_DIAGNOSTIC(ExpectedCodeBlock, Error, "Expected braced code block.");
  212. emitter_.Emit(*position_, ExpectedCodeBlock);
  213. PushState(ParserState::Statement());
  214. }
  215. }
  216. // Determines whether the given token is considered to be the start of an
  217. // operand according to the rules for infix operator parsing.
  218. static auto IsAssumedStartOfOperand(TokenKind kind) -> bool {
  219. return kind.IsOneOf({TokenKind::OpenParen(), TokenKind::Identifier(),
  220. TokenKind::IntegerLiteral(), TokenKind::RealLiteral(),
  221. TokenKind::StringLiteral()});
  222. }
  223. // Determines whether the given token is considered to be the end of an
  224. // operand according to the rules for infix operator parsing.
  225. static auto IsAssumedEndOfOperand(TokenKind kind) -> bool {
  226. return kind.IsOneOf({TokenKind::CloseParen(), TokenKind::CloseCurlyBrace(),
  227. TokenKind::CloseSquareBracket(), TokenKind::Identifier(),
  228. TokenKind::IntegerLiteral(), TokenKind::RealLiteral(),
  229. TokenKind::StringLiteral()});
  230. }
  231. // Determines whether the given token could possibly be the start of an
  232. // operand. This is conservatively correct, and will never incorrectly return
  233. // `false`, but can incorrectly return `true`.
  234. static auto IsPossibleStartOfOperand(TokenKind kind) -> bool {
  235. return !kind.IsOneOf({TokenKind::CloseParen(), TokenKind::CloseCurlyBrace(),
  236. TokenKind::CloseSquareBracket(), TokenKind::Comma(),
  237. TokenKind::Semi(), TokenKind::Colon()});
  238. }
  239. auto Parser::IsLexicallyValidInfixOperator() -> bool {
  240. CARBON_CHECK(position_ != end_) << "Expected an operator token.";
  241. bool leading_space = tokens_.HasLeadingWhitespace(*position_);
  242. bool trailing_space = tokens_.HasTrailingWhitespace(*position_);
  243. // If there's whitespace on both sides, it's an infix operator.
  244. if (leading_space && trailing_space) {
  245. return true;
  246. }
  247. // If there's whitespace on exactly one side, it's not an infix operator.
  248. if (leading_space || trailing_space) {
  249. return false;
  250. }
  251. // Otherwise, for an infix operator, the preceding token must be any close
  252. // bracket, identifier, or literal and the next token must be an open paren,
  253. // identifier, or literal.
  254. if (position_ == tokens_.tokens().begin() ||
  255. !IsAssumedEndOfOperand(tokens_.GetKind(*(position_ - 1))) ||
  256. !IsAssumedStartOfOperand(tokens_.GetKind(*(position_ + 1)))) {
  257. return false;
  258. }
  259. return true;
  260. }
  261. auto Parser::IsTrailingOperatorInfix() -> bool {
  262. if (position_ == end_) {
  263. return false;
  264. }
  265. // An operator that follows the infix operator rules is parsed as
  266. // infix, unless the next token means that it can't possibly be.
  267. if (IsLexicallyValidInfixOperator() &&
  268. IsPossibleStartOfOperand(tokens_.GetKind(*(position_ + 1)))) {
  269. return true;
  270. }
  271. // A trailing operator with leading whitespace that's not valid as infix is
  272. // not valid at all. If the next token looks like the start of an operand,
  273. // then parse as infix, otherwise as postfix. Either way we'll produce a
  274. // diagnostic later on.
  275. if (tokens_.HasLeadingWhitespace(*position_) &&
  276. IsAssumedStartOfOperand(tokens_.GetKind(*(position_ + 1)))) {
  277. return true;
  278. }
  279. return false;
  280. }
  281. auto Parser::DiagnoseOperatorFixity(OperatorFixity fixity) -> void {
  282. if (fixity == OperatorFixity::Infix) {
  283. // Infix operators must satisfy the infix operator rules.
  284. if (!IsLexicallyValidInfixOperator()) {
  285. CARBON_DIAGNOSTIC(BinaryOperatorRequiresWhitespace, Error,
  286. "Whitespace missing {0} binary operator.",
  287. RelativeLocation);
  288. emitter_.Emit(*position_, BinaryOperatorRequiresWhitespace,
  289. tokens_.HasLeadingWhitespace(*position_)
  290. ? RelativeLocation::After
  291. : (tokens_.HasTrailingWhitespace(*position_)
  292. ? RelativeLocation::Before
  293. : RelativeLocation::Around));
  294. }
  295. } else {
  296. bool prefix = fixity == OperatorFixity::Prefix;
  297. // Whitespace is not permitted between a symbolic pre/postfix operator and
  298. // its operand.
  299. if (PositionKind().IsSymbol() &&
  300. (prefix ? tokens_.HasTrailingWhitespace(*position_)
  301. : tokens_.HasLeadingWhitespace(*position_))) {
  302. CARBON_DIAGNOSTIC(UnaryOperatorHasWhitespace, Error,
  303. "Whitespace is not allowed {0} this unary operator.",
  304. RelativeLocation);
  305. emitter_.Emit(
  306. *position_, UnaryOperatorHasWhitespace,
  307. prefix ? RelativeLocation::After : RelativeLocation::Before);
  308. }
  309. // Pre/postfix operators must not satisfy the infix operator rules.
  310. if (IsLexicallyValidInfixOperator()) {
  311. CARBON_DIAGNOSTIC(UnaryOperatorRequiresWhitespace, Error,
  312. "Whitespace is required {0} this unary operator.",
  313. RelativeLocation);
  314. emitter_.Emit(
  315. *position_, UnaryOperatorRequiresWhitespace,
  316. prefix ? RelativeLocation::Before : RelativeLocation::After);
  317. }
  318. }
  319. }
  320. auto Parser::ConsumeListToken(ParseNodeKind comma_kind, TokenKind close_kind,
  321. bool already_has_error) -> ListTokenKind {
  322. if (!PositionIs(TokenKind::Comma()) && !PositionIs(close_kind)) {
  323. // Don't error a second time on the same element.
  324. if (!already_has_error) {
  325. CARBON_DIAGNOSTIC(UnexpectedTokenAfterListElement, Error,
  326. "Expected `,` or `{0}`.", TokenKind);
  327. emitter_.Emit(*position_, UnexpectedTokenAfterListElement, close_kind);
  328. ReturnErrorOnState();
  329. }
  330. // Recover from the invalid token.
  331. auto end_of_element = FindNextOf({TokenKind::Comma(), close_kind});
  332. // The lexer guarantees that parentheses are balanced.
  333. CARBON_CHECK(end_of_element)
  334. << "missing matching `" << close_kind.GetOpeningSymbol() << "` for `"
  335. << close_kind << "`";
  336. SkipTo(*end_of_element);
  337. }
  338. if (PositionIs(close_kind)) {
  339. return ListTokenKind::Close;
  340. } else {
  341. AddLeafNode(comma_kind, Consume());
  342. return PositionIs(close_kind) ? ListTokenKind::CommaClose
  343. : ListTokenKind::Comma;
  344. }
  345. }
  346. auto Parser::Parse() -> void {
  347. // Traces state_stack_. This runs even in opt because it's low overhead.
  348. PrettyStackTraceParseState pretty_stack(this);
  349. PushState(ParserState::DeclarationLoop());
  350. while (!state_stack_.empty()) {
  351. switch (state_stack_.back().state) {
  352. #define CARBON_PARSER_STATE(Name) \
  353. case ParserState::Name(): \
  354. Handle##Name##State(); \
  355. break;
  356. #include "toolchain/parser/parser_state.def"
  357. }
  358. }
  359. AddLeafNode(ParseNodeKind::FileEnd(), *position_);
  360. }
  361. auto Parser::HandleBraceExpressionState() -> void {
  362. auto state = PopState();
  363. state.state = ParserState::BraceExpressionFinishAsUnknown();
  364. PushState(state);
  365. CARBON_CHECK(ConsumeAndAddLeafNodeIf(
  366. TokenKind::OpenCurlyBrace(),
  367. ParseNodeKind::StructLiteralOrStructTypeLiteralStart()));
  368. if (!PositionIs(TokenKind::CloseCurlyBrace())) {
  369. PushState(ParserState::BraceExpressionParameterAsUnknown());
  370. }
  371. }
  372. auto Parser::BraceExpressionKindToParserState(BraceExpressionKind kind,
  373. ParserState type,
  374. ParserState value,
  375. ParserState unknown)
  376. -> ParserState {
  377. switch (kind) {
  378. case BraceExpressionKind::Type: {
  379. return type;
  380. }
  381. case BraceExpressionKind::Value: {
  382. return value;
  383. }
  384. case BraceExpressionKind::Unknown: {
  385. return unknown;
  386. }
  387. }
  388. }
  389. auto Parser::HandleBraceExpressionParameterError(StateStackEntry state,
  390. BraceExpressionKind kind)
  391. -> void {
  392. CARBON_DIAGNOSTIC(ExpectedStructLiteralField, Error, "Expected {0}{1}{2}.",
  393. llvm::StringRef, llvm::StringRef, llvm::StringRef);
  394. bool can_be_type = kind != BraceExpressionKind::Value;
  395. bool can_be_value = kind != BraceExpressionKind::Type;
  396. emitter_.Emit(*position_, ExpectedStructLiteralField,
  397. can_be_type ? "`.field: type`" : "",
  398. (can_be_type && can_be_value) ? " or " : "",
  399. can_be_value ? "`.field = value`" : "");
  400. state.state = BraceExpressionKindToParserState(
  401. kind, ParserState::BraceExpressionParameterFinishAsType(),
  402. ParserState::BraceExpressionParameterFinishAsValue(),
  403. ParserState::BraceExpressionParameterFinishAsUnknown());
  404. state.has_error = true;
  405. PushState(state);
  406. }
  407. auto Parser::HandleBraceExpressionParameter(BraceExpressionKind kind) -> void {
  408. auto state = PopState();
  409. if (!PositionIs(TokenKind::Period())) {
  410. HandleBraceExpressionParameterError(state, kind);
  411. return;
  412. }
  413. state.state = BraceExpressionKindToParserState(
  414. kind, ParserState::BraceExpressionParameterAfterDesignatorAsType(),
  415. ParserState::BraceExpressionParameterAfterDesignatorAsValue(),
  416. ParserState::BraceExpressionParameterAfterDesignatorAsUnknown());
  417. PushState(state);
  418. PushState(ParserState::DesignatorAsStruct());
  419. }
  420. auto Parser::HandleBraceExpressionParameterAsTypeState() -> void {
  421. HandleBraceExpressionParameter(BraceExpressionKind::Type);
  422. }
  423. auto Parser::HandleBraceExpressionParameterAsValueState() -> void {
  424. HandleBraceExpressionParameter(BraceExpressionKind::Value);
  425. }
  426. auto Parser::HandleBraceExpressionParameterAsUnknownState() -> void {
  427. HandleBraceExpressionParameter(BraceExpressionKind::Unknown);
  428. }
  429. auto Parser::HandleBraceExpressionParameterAfterDesignator(
  430. BraceExpressionKind kind) -> void {
  431. auto state = PopState();
  432. if (state.has_error) {
  433. auto recovery_pos = FindNextOf(
  434. {TokenKind::Equal(), TokenKind::Colon(), TokenKind::Comma()});
  435. if (!recovery_pos || tokens_.GetKind(*recovery_pos) == TokenKind::Comma()) {
  436. state.state = BraceExpressionKindToParserState(
  437. kind, ParserState::BraceExpressionParameterFinishAsType(),
  438. ParserState::BraceExpressionParameterFinishAsValue(),
  439. ParserState::BraceExpressionParameterFinishAsUnknown());
  440. PushState(state);
  441. return;
  442. }
  443. SkipTo(*recovery_pos);
  444. }
  445. // Work out the kind of this element.
  446. auto elem_kind = BraceExpressionKind::Unknown;
  447. if (PositionIs(TokenKind::Colon())) {
  448. elem_kind = BraceExpressionKind::Type;
  449. } else if (PositionIs(TokenKind::Equal())) {
  450. elem_kind = BraceExpressionKind::Value;
  451. }
  452. // Unknown kinds and changes between type and value are errors.
  453. if (elem_kind == BraceExpressionKind::Unknown ||
  454. (kind != BraceExpressionKind::Unknown && elem_kind != kind)) {
  455. HandleBraceExpressionParameterError(state, kind);
  456. return;
  457. }
  458. // If we're setting the kind, update the BraceExpressionFinish state.
  459. if (kind == BraceExpressionKind::Unknown) {
  460. kind = elem_kind;
  461. auto finish_state = PopState();
  462. CARBON_CHECK(finish_state.state ==
  463. ParserState::BraceExpressionFinishAsUnknown());
  464. finish_state.state = BraceExpressionKindToParserState(
  465. kind, ParserState::BraceExpressionFinishAsType(),
  466. ParserState::BraceExpressionFinishAsValue(),
  467. ParserState::BraceExpressionFinishAsUnknown());
  468. PushState(finish_state);
  469. }
  470. state.state = BraceExpressionKindToParserState(
  471. kind, ParserState::BraceExpressionParameterFinishAsType(),
  472. ParserState::BraceExpressionParameterFinishAsValue(),
  473. ParserState::BraceExpressionParameterFinishAsUnknown());
  474. state.token = Consume();
  475. // Struct type fields and value fields use the same grammar except
  476. // that one has a `:` separator and the other has an `=` separator.
  477. PushState(state);
  478. PushState(ParserState::Expression());
  479. }
  480. auto Parser::HandleBraceExpressionParameterAfterDesignatorAsTypeState()
  481. -> void {
  482. HandleBraceExpressionParameterAfterDesignator(BraceExpressionKind::Type);
  483. }
  484. auto Parser::HandleBraceExpressionParameterAfterDesignatorAsValueState()
  485. -> void {
  486. HandleBraceExpressionParameterAfterDesignator(BraceExpressionKind::Value);
  487. }
  488. auto Parser::HandleBraceExpressionParameterAfterDesignatorAsUnknownState()
  489. -> void {
  490. HandleBraceExpressionParameterAfterDesignator(BraceExpressionKind::Unknown);
  491. }
  492. auto Parser::HandleBraceExpressionParameterFinish(BraceExpressionKind kind)
  493. -> void {
  494. auto state = PopState();
  495. AddNode(kind == BraceExpressionKind::Type ? ParseNodeKind::StructFieldType()
  496. : ParseNodeKind::StructFieldValue(),
  497. state.token, state.subtree_start, state.has_error);
  498. if (ConsumeListToken(ParseNodeKind::StructComma(),
  499. TokenKind::CloseCurlyBrace(),
  500. state.has_error) == ListTokenKind::Comma) {
  501. PushState(BraceExpressionKindToParserState(
  502. kind, ParserState::BraceExpressionParameterAsType(),
  503. ParserState::BraceExpressionParameterAsValue(),
  504. ParserState::BraceExpressionParameterAsUnknown()));
  505. }
  506. }
  507. auto Parser::HandleBraceExpressionParameterFinishAsTypeState() -> void {
  508. HandleBraceExpressionParameterFinish(BraceExpressionKind::Type);
  509. }
  510. auto Parser::HandleBraceExpressionParameterFinishAsValueState() -> void {
  511. HandleBraceExpressionParameterFinish(BraceExpressionKind::Value);
  512. }
  513. auto Parser::HandleBraceExpressionParameterFinishAsUnknownState() -> void {
  514. HandleBraceExpressionParameterFinish(BraceExpressionKind::Unknown);
  515. }
  516. auto Parser::HandleBraceExpressionFinish(BraceExpressionKind kind) -> void {
  517. auto state = PopState();
  518. AddNode(kind == BraceExpressionKind::Type ? ParseNodeKind::StructTypeLiteral()
  519. : ParseNodeKind::StructLiteral(),
  520. Consume(), state.subtree_start, state.has_error);
  521. }
  522. auto Parser::HandleBraceExpressionFinishAsTypeState() -> void {
  523. HandleBraceExpressionFinish(BraceExpressionKind::Type);
  524. }
  525. auto Parser::HandleBraceExpressionFinishAsValueState() -> void {
  526. HandleBraceExpressionFinish(BraceExpressionKind::Value);
  527. }
  528. auto Parser::HandleBraceExpressionFinishAsUnknownState() -> void {
  529. HandleBraceExpressionFinish(BraceExpressionKind::Unknown);
  530. }
  531. auto Parser::HandleCallExpressionState() -> void {
  532. auto state = PopState();
  533. // TODO: When swapping () start/end, this should AddLeafNode the open before
  534. // continuing.
  535. state.state = ParserState::CallExpressionFinish();
  536. PushState(state);
  537. // Advance past the open paren.
  538. ++position_;
  539. if (!PositionIs(TokenKind::CloseParen())) {
  540. PushState(ParserState::CallExpressionParameterFinish());
  541. PushState(ParserState::Expression());
  542. }
  543. }
  544. auto Parser::HandleCallExpressionParameterFinishState() -> void {
  545. auto state = PopState();
  546. if (state.has_error) {
  547. ReturnErrorOnState();
  548. }
  549. if (ConsumeListToken(ParseNodeKind::CallExpressionComma(),
  550. TokenKind::CloseParen(),
  551. state.has_error) == ListTokenKind::Comma) {
  552. PushState(ParserState::CallExpressionParameterFinish());
  553. PushState(ParserState::Expression());
  554. }
  555. }
  556. auto Parser::HandleCallExpressionFinishState() -> void {
  557. auto state = PopState();
  558. AddLeafNode(ParseNodeKind::CallExpressionEnd(), Consume());
  559. AddNode(ParseNodeKind::CallExpression(), state.token, state.subtree_start,
  560. state.has_error);
  561. }
  562. auto Parser::HandleCodeBlockFinishState() -> void {
  563. auto state = PopState();
  564. // If the block started with an open curly, this is a close curly.
  565. if (tokens_.GetKind(state.token) == TokenKind::OpenCurlyBrace()) {
  566. AddNode(ParseNodeKind::CodeBlock(), Consume(), state.subtree_start,
  567. state.has_error);
  568. } else {
  569. AddNode(ParseNodeKind::CodeBlock(), state.token, state.subtree_start,
  570. /*has_error=*/true);
  571. }
  572. }
  573. auto Parser::HandleDeclarationLoopState() -> void {
  574. // This maintains the current state unless we're at the end of the file.
  575. switch (PositionKind()) {
  576. case TokenKind::EndOfFile(): {
  577. PopAndDiscardState();
  578. break;
  579. }
  580. case TokenKind::Fn(): {
  581. PushState(ParserState::FunctionIntroducer());
  582. AddLeafNode(ParseNodeKind::FunctionIntroducer(), Consume());
  583. break;
  584. }
  585. case TokenKind::Package(): {
  586. PushState(ParserState::Package());
  587. ++position_;
  588. break;
  589. }
  590. case TokenKind::Semi(): {
  591. AddLeafNode(ParseNodeKind::EmptyDeclaration(), Consume());
  592. break;
  593. }
  594. case TokenKind::Var(): {
  595. PushState(ParserState::VarAsRequireSemicolon());
  596. break;
  597. }
  598. default: {
  599. CARBON_DIAGNOSTIC(UnrecognizedDeclaration, Error,
  600. "Unrecognized declaration introducer.");
  601. emitter_.Emit(*position_, UnrecognizedDeclaration);
  602. tree_.has_errors_ = true;
  603. if (auto semi = SkipPastLikelyEnd(*position_)) {
  604. AddLeafNode(ParseNodeKind::EmptyDeclaration(), *semi,
  605. /*has_error=*/true);
  606. }
  607. break;
  608. }
  609. }
  610. }
  611. auto Parser::HandleDesignator(bool as_struct) -> void {
  612. auto state = PopState();
  613. // `.` identifier
  614. auto dot = ConsumeIf(TokenKind::Period());
  615. CARBON_CHECK(dot);
  616. if (!ConsumeAndAddLeafNodeIf(TokenKind::Identifier(),
  617. ParseNodeKind::DesignatedName())) {
  618. CARBON_DIAGNOSTIC(ExpectedIdentifierAfterDot, Error,
  619. "Expected identifier after `.`.");
  620. emitter_.Emit(*position_, ExpectedIdentifierAfterDot);
  621. // If we see a keyword, assume it was intended to be the designated name.
  622. // TODO: Should keywords be valid in designators?
  623. if (PositionKind().IsKeyword()) {
  624. AddLeafNode(ParseNodeKind::DesignatedName(), Consume(),
  625. /*has_error=*/true);
  626. } else {
  627. state.has_error = true;
  628. ReturnErrorOnState();
  629. }
  630. }
  631. AddNode(as_struct ? ParseNodeKind::StructFieldDesignator()
  632. : ParseNodeKind::DesignatorExpression(),
  633. *dot, state.subtree_start, state.has_error);
  634. }
  635. auto Parser::HandleDesignatorAsExpressionState() -> void {
  636. HandleDesignator(/*as_struct=*/false);
  637. }
  638. auto Parser::HandleDesignatorAsStructState() -> void {
  639. HandleDesignator(/*as_struct=*/true);
  640. }
  641. auto Parser::HandleExpressionState() -> void {
  642. auto state = PopState();
  643. // Check for a prefix operator.
  644. if (auto operator_precedence = PrecedenceGroup::ForLeading(PositionKind())) {
  645. if (PrecedenceGroup::GetPriority(state.ambient_precedence,
  646. *operator_precedence) !=
  647. OperatorPriority::RightFirst) {
  648. // The precedence rules don't permit this prefix operator in this
  649. // context. Diagnose this, but carry on and parse it anyway.
  650. emitter_.Emit(*position_, OperatorRequiresParentheses);
  651. } else {
  652. // Check that this operator follows the proper whitespace rules.
  653. DiagnoseOperatorFixity(OperatorFixity::Prefix);
  654. }
  655. PushStateForExpressionLoop(ParserState::ExpressionLoopForPrefix(),
  656. state.ambient_precedence, *operator_precedence);
  657. ++position_;
  658. PushStateForExpression(*operator_precedence);
  659. } else {
  660. PushStateForExpressionLoop(ParserState::ExpressionLoop(),
  661. state.ambient_precedence,
  662. PrecedenceGroup::ForPostfixExpression());
  663. PushState(ParserState::ExpressionInPostfix());
  664. }
  665. }
  666. auto Parser::HandleExpressionInPostfixState() -> void {
  667. auto state = PopState();
  668. // Continue to the loop state.
  669. state.state = ParserState::ExpressionInPostfixLoop();
  670. // Parses a primary expression, which is either a terminal portion of an
  671. // expression tree, such as an identifier or literal, or a parenthesized
  672. // expression.
  673. switch (PositionKind()) {
  674. case TokenKind::Identifier(): {
  675. AddLeafNode(ParseNodeKind::NameReference(), Consume());
  676. PushState(state);
  677. break;
  678. }
  679. case TokenKind::IntegerLiteral():
  680. case TokenKind::RealLiteral():
  681. case TokenKind::StringLiteral():
  682. case TokenKind::IntegerTypeLiteral():
  683. case TokenKind::UnsignedIntegerTypeLiteral():
  684. case TokenKind::FloatingPointTypeLiteral(): {
  685. AddLeafNode(ParseNodeKind::Literal(), Consume());
  686. PushState(state);
  687. break;
  688. }
  689. case TokenKind::OpenCurlyBrace(): {
  690. PushState(state);
  691. PushState(ParserState::BraceExpression());
  692. break;
  693. }
  694. case TokenKind::OpenParen(): {
  695. PushState(state);
  696. PushState(ParserState::ParenExpression());
  697. break;
  698. }
  699. default: {
  700. CARBON_DIAGNOSTIC(ExpectedExpression, Error, "Expected expression.");
  701. emitter_.Emit(*position_, ExpectedExpression);
  702. ReturnErrorOnState();
  703. break;
  704. }
  705. }
  706. }
  707. auto Parser::HandleExpressionInPostfixLoopState() -> void {
  708. // This is a cyclic state that repeats, so this state is typically pushed back
  709. // on.
  710. auto state = PopState();
  711. state.token = *position_;
  712. switch (PositionKind()) {
  713. case TokenKind::Period(): {
  714. PushState(state);
  715. state.state = ParserState::DesignatorAsExpression();
  716. PushState(state);
  717. break;
  718. }
  719. case TokenKind::OpenParen(): {
  720. PushState(state);
  721. state.state = ParserState::CallExpression();
  722. PushState(state);
  723. break;
  724. }
  725. default: {
  726. if (state.has_error) {
  727. ReturnErrorOnState();
  728. }
  729. break;
  730. }
  731. }
  732. }
  733. auto Parser::HandleExpressionLoopState() -> void {
  734. auto state = PopState();
  735. auto trailing_operator =
  736. PrecedenceGroup::ForTrailing(PositionKind(), IsTrailingOperatorInfix());
  737. if (!trailing_operator) {
  738. if (state.has_error) {
  739. ReturnErrorOnState();
  740. }
  741. return;
  742. }
  743. auto [operator_precedence, is_binary] = *trailing_operator;
  744. // TODO: If this operator is ambiguous with either the ambient precedence
  745. // or the LHS precedence, and there's a variant with a different fixity
  746. // that would work, use that one instead for error recovery.
  747. if (PrecedenceGroup::GetPriority(state.ambient_precedence,
  748. operator_precedence) !=
  749. OperatorPriority::RightFirst) {
  750. // The precedence rules don't permit this operator in this context. Try
  751. // again in the enclosing expression context.
  752. if (state.has_error) {
  753. ReturnErrorOnState();
  754. }
  755. return;
  756. }
  757. if (PrecedenceGroup::GetPriority(state.lhs_precedence, operator_precedence) !=
  758. OperatorPriority::LeftFirst) {
  759. // Either the LHS operator and this operator are ambiguous, or the
  760. // LHS operator is a unary operator that can't be nested within
  761. // this operator. Either way, parentheses are required.
  762. emitter_.Emit(*position_, OperatorRequiresParentheses);
  763. state.has_error = true;
  764. } else {
  765. DiagnoseOperatorFixity(is_binary ? OperatorFixity::Infix
  766. : OperatorFixity::Postfix);
  767. }
  768. state.token = Consume();
  769. state.lhs_precedence = operator_precedence;
  770. if (is_binary) {
  771. state.state = ParserState::ExpressionLoopForBinary();
  772. PushState(state);
  773. PushStateForExpression(operator_precedence);
  774. } else {
  775. AddNode(ParseNodeKind::PostfixOperator(), state.token, state.subtree_start,
  776. state.has_error);
  777. state.has_error = false;
  778. PushState(state);
  779. }
  780. }
  781. auto Parser::HandleExpressionLoopForBinaryState() -> void {
  782. auto state = PopState();
  783. AddNode(ParseNodeKind::InfixOperator(), state.token, state.subtree_start,
  784. state.has_error);
  785. state.state = ParserState::ExpressionLoop();
  786. state.has_error = false;
  787. PushState(state);
  788. }
  789. auto Parser::HandleExpressionLoopForPrefixState() -> void {
  790. auto state = PopState();
  791. AddNode(ParseNodeKind::PrefixOperator(), state.token, state.subtree_start,
  792. state.has_error);
  793. state.state = ParserState::ExpressionLoop();
  794. state.has_error = false;
  795. PushState(state);
  796. }
  797. auto Parser::HandleExpressionStatementFinishState() -> void {
  798. auto state = PopState();
  799. if (auto semi = ConsumeIf(TokenKind::Semi())) {
  800. AddNode(ParseNodeKind::ExpressionStatement(), *semi, state.subtree_start,
  801. state.has_error);
  802. return;
  803. }
  804. if (!state.has_error) {
  805. emitter_.Emit(*position_, ExpectedSemiAfterExpression);
  806. }
  807. if (auto semi_token = SkipPastLikelyEnd(state.token)) {
  808. AddNode(ParseNodeKind::ExpressionStatement(), *semi_token,
  809. state.subtree_start,
  810. /*has_error=*/true);
  811. return;
  812. }
  813. // Found junk not even followed by a `;`, no node to add.
  814. ReturnErrorOnState();
  815. }
  816. auto Parser::HandleFunctionError(StateStackEntry state,
  817. bool skip_past_likely_end) -> void {
  818. auto token = state.token;
  819. if (skip_past_likely_end) {
  820. if (auto semi = SkipPastLikelyEnd(token)) {
  821. token = *semi;
  822. }
  823. }
  824. AddNode(ParseNodeKind::FunctionDeclaration(), token, state.subtree_start,
  825. /*has_error=*/true);
  826. }
  827. auto Parser::HandleFunctionIntroducerState() -> void {
  828. auto state = PopState();
  829. if (!ConsumeAndAddLeafNodeIf(TokenKind::Identifier(),
  830. ParseNodeKind::DeclaredName())) {
  831. CARBON_DIAGNOSTIC(ExpectedFunctionName, Error,
  832. "Expected function name after `fn` keyword.");
  833. emitter_.Emit(*position_, ExpectedFunctionName);
  834. // TODO: We could change the lexer to allow us to synthesize certain
  835. // kinds of tokens and try to "recover" here, but unclear that this is
  836. // really useful.
  837. HandleFunctionError(state, true);
  838. return;
  839. }
  840. if (!PositionIs(TokenKind::OpenParen())) {
  841. CARBON_DIAGNOSTIC(ExpectedFunctionParams, Error,
  842. "Expected `(` after function name.");
  843. emitter_.Emit(*position_, ExpectedFunctionParams);
  844. HandleFunctionError(state, true);
  845. return;
  846. }
  847. // Parse the parameter list as its own subtree; once that pops, resume
  848. // function parsing.
  849. state.state = ParserState::FunctionAfterParameterList();
  850. PushState(state);
  851. PushState(ParserState::FunctionParameterListFinish());
  852. AddLeafNode(ParseNodeKind::ParameterListStart(), Consume());
  853. if (!PositionIs(TokenKind::CloseParen())) {
  854. PushState(ParserState::FunctionParameter());
  855. }
  856. }
  857. auto Parser::HandleFunctionParameterState() -> void {
  858. PopAndDiscardState();
  859. PushState(ParserState::FunctionParameterFinish());
  860. PushState(ParserState::PatternAsFunctionParameter());
  861. }
  862. auto Parser::HandleFunctionParameterFinishState() -> void {
  863. auto state = PopState();
  864. if (state.has_error) {
  865. ReturnErrorOnState();
  866. }
  867. if (ConsumeListToken(ParseNodeKind::ParameterListComma(),
  868. TokenKind::CloseParen(),
  869. state.has_error) == ListTokenKind::Comma) {
  870. PushState(ParserState::PatternAsFunctionParameter());
  871. }
  872. }
  873. auto Parser::HandleFunctionParameterListFinishState() -> void {
  874. auto state = PopState();
  875. CARBON_CHECK(PositionIs(TokenKind::CloseParen())) << PositionKind().Name();
  876. AddNode(ParseNodeKind::ParameterList(), Consume(), state.subtree_start,
  877. state.has_error);
  878. }
  879. auto Parser::HandleFunctionAfterParameterListState() -> void {
  880. auto state = PopState();
  881. // Regardless of whether there's a return type, we'll finish the signature.
  882. state.state = ParserState::FunctionSignatureFinish();
  883. PushState(state);
  884. // If there is a return type, parse the expression before adding the return
  885. // type nod.e
  886. if (PositionIs(TokenKind::MinusGreater())) {
  887. PushState(ParserState::FunctionReturnTypeFinish());
  888. ++position_;
  889. PushStateForExpression(PrecedenceGroup::ForType());
  890. }
  891. }
  892. auto Parser::HandleFunctionReturnTypeFinishState() -> void {
  893. auto state = PopState();
  894. AddNode(ParseNodeKind::ReturnType(), state.token, state.subtree_start,
  895. state.has_error);
  896. }
  897. auto Parser::HandleFunctionSignatureFinishState() -> void {
  898. auto state = PopState();
  899. switch (PositionKind()) {
  900. case TokenKind::Semi(): {
  901. AddNode(ParseNodeKind::FunctionDeclaration(), Consume(),
  902. state.subtree_start, state.has_error);
  903. break;
  904. }
  905. case TokenKind::OpenCurlyBrace(): {
  906. AddNode(ParseNodeKind::FunctionDefinitionStart(), Consume(),
  907. state.subtree_start, state.has_error);
  908. // Any error is recorded on the FunctionDefinitionStart.
  909. state.has_error = false;
  910. state.state = ParserState::FunctionDefinitionFinish();
  911. PushState(state);
  912. PushState(ParserState::StatementScopeLoop());
  913. break;
  914. }
  915. default: {
  916. CARBON_DIAGNOSTIC(
  917. ExpectedFunctionBodyOrSemi, Error,
  918. "Expected function definition or `;` after function declaration.");
  919. emitter_.Emit(*position_, ExpectedFunctionBodyOrSemi);
  920. // Only need to skip if we've not already found a new line.
  921. bool skip_past_likely_end =
  922. tokens_.GetLine(*position_) == tokens_.GetLine(state.token);
  923. HandleFunctionError(state, skip_past_likely_end);
  924. break;
  925. }
  926. }
  927. }
  928. auto Parser::HandleFunctionDefinitionFinishState() -> void {
  929. auto state = PopState();
  930. AddNode(ParseNodeKind::FunctionDefinition(), Consume(), state.subtree_start,
  931. state.has_error);
  932. }
  933. auto Parser::HandlePackageState() -> void {
  934. auto state = PopState();
  935. auto exit_on_parse_error = [&]() {
  936. if (auto semi_token = SkipPastLikelyEnd(state.token)) {
  937. AddLeafNode(ParseNodeKind::PackageEnd(), *semi_token);
  938. }
  939. return AddNode(ParseNodeKind::PackageDirective(), state.token,
  940. state.subtree_start, /*has_error=*/true);
  941. };
  942. if (!ConsumeAndAddLeafNodeIf(TokenKind::Identifier(),
  943. ParseNodeKind::DeclaredName())) {
  944. CARBON_DIAGNOSTIC(ExpectedIdentifierAfterPackage, Error,
  945. "Expected identifier after `package`.");
  946. emitter_.Emit(*position_, ExpectedIdentifierAfterPackage);
  947. exit_on_parse_error();
  948. return;
  949. }
  950. bool library_parsed = false;
  951. if (auto library_token = ConsumeIf(TokenKind::Library())) {
  952. auto library_start = tree_.size();
  953. if (!ConsumeAndAddLeafNodeIf(TokenKind::StringLiteral(),
  954. ParseNodeKind::Literal())) {
  955. CARBON_DIAGNOSTIC(
  956. ExpectedLibraryName, Error,
  957. "Expected a string literal to specify the library name.");
  958. emitter_.Emit(*position_, ExpectedLibraryName);
  959. exit_on_parse_error();
  960. return;
  961. }
  962. AddNode(ParseNodeKind::PackageLibrary(), *library_token, library_start,
  963. /*has_error=*/false);
  964. library_parsed = true;
  965. }
  966. switch (auto api_or_impl_token = tokens_.GetKind(*(position_))) {
  967. case TokenKind::Api(): {
  968. AddLeafNode(ParseNodeKind::PackageApi(), Consume());
  969. break;
  970. }
  971. case TokenKind::Impl(): {
  972. AddLeafNode(ParseNodeKind::PackageImpl(), Consume());
  973. break;
  974. }
  975. default: {
  976. if (!library_parsed && api_or_impl_token == TokenKind::StringLiteral()) {
  977. // If we come acroess a string literal and we didn't parse `library
  978. // "..."` yet, then most probably the user forgot to add `library`
  979. // before the library name.
  980. CARBON_DIAGNOSTIC(MissingLibraryKeyword, Error,
  981. "Missing `library` keyword.");
  982. emitter_.Emit(*position_, MissingLibraryKeyword);
  983. } else {
  984. CARBON_DIAGNOSTIC(ExpectedApiOrImpl, Error,
  985. "Expected a `api` or `impl`.");
  986. emitter_.Emit(*position_, ExpectedApiOrImpl);
  987. }
  988. exit_on_parse_error();
  989. return;
  990. }
  991. }
  992. if (!ConsumeAndAddLeafNodeIf(TokenKind::Semi(),
  993. ParseNodeKind::PackageEnd())) {
  994. CARBON_DIAGNOSTIC(ExpectedSemiToEndPackageDirective, Error,
  995. "Expected `;` to end package directive.");
  996. emitter_.Emit(*position_, ExpectedSemiToEndPackageDirective);
  997. exit_on_parse_error();
  998. return;
  999. }
  1000. AddNode(ParseNodeKind::PackageDirective(), state.token, state.subtree_start,
  1001. /*has_error=*/false);
  1002. }
  1003. auto Parser::HandleParenConditionState() -> void {
  1004. auto state = PopState();
  1005. auto open_paren = ConsumeIf(TokenKind::OpenParen());
  1006. if (open_paren) {
  1007. state.token = *open_paren;
  1008. } else {
  1009. CARBON_DIAGNOSTIC(ExpectedParenAfter, Error, "Expected `(` after `{0}`.",
  1010. TokenKind);
  1011. emitter_.Emit(*position_, ExpectedParenAfter, tokens_.GetKind(state.token));
  1012. }
  1013. // TODO: This should be adding a ConditionStart here instead of ConditionEnd
  1014. // later, so this does state modification instead of a simpler push.
  1015. state.state = ParserState::ParenConditionFinish();
  1016. PushState(state);
  1017. PushState(ParserState::Expression());
  1018. }
  1019. auto Parser::HandleParenConditionFinishState() -> void {
  1020. auto state = PopState();
  1021. if (tokens_.GetKind(state.token) != TokenKind::OpenParen()) {
  1022. // Don't expect a matching closing paren if there wasn't an opening paren.
  1023. // TODO: Should probably push nodes on this state in order to have the
  1024. // condition wrapped, but it wasn't before, so not doing it for consistency.
  1025. ReturnErrorOnState();
  1026. return;
  1027. }
  1028. bool close_paren =
  1029. ConsumeAndAddCloseParen(state.token, ParseNodeKind::ConditionEnd());
  1030. return AddNode(ParseNodeKind::Condition(), state.token, state.subtree_start,
  1031. /*has_error=*/state.has_error || !close_paren);
  1032. }
  1033. auto Parser::HandleParenExpressionState() -> void {
  1034. auto state = PopState();
  1035. // TODO: When swapping () start/end, this should AddLeafNode the open before
  1036. // continuing.
  1037. // Advance past the open paren.
  1038. CARBON_CHECK(PositionIs(TokenKind::OpenParen()));
  1039. ++position_;
  1040. if (PositionIs(TokenKind::CloseParen())) {
  1041. state.state = ParserState::ParenExpressionFinishAsTuple();
  1042. PushState(state);
  1043. } else {
  1044. state.state = ParserState::ParenExpressionFinish();
  1045. PushState(state);
  1046. PushState(ParserState::ParenExpressionParameterFinishAsUnknown());
  1047. PushState(ParserState::Expression());
  1048. }
  1049. }
  1050. auto Parser::HandleParenExpressionParameterFinish(bool as_tuple) -> void {
  1051. auto state = PopState();
  1052. auto list_token_kind =
  1053. ConsumeListToken(ParseNodeKind::TupleLiteralComma(),
  1054. TokenKind::CloseParen(), state.has_error);
  1055. if (list_token_kind == ListTokenKind::Close) {
  1056. return;
  1057. }
  1058. // If this is the first item and a comma was found, switch to tuple handling.
  1059. // Note this could be `(expr,)` so we may not reuse the current state, but
  1060. // it's still necessary to switch the parent.
  1061. if (!as_tuple) {
  1062. state.state = ParserState::ParenExpressionParameterFinishAsTuple();
  1063. auto finish_state = PopState();
  1064. CARBON_CHECK(finish_state.state == ParserState::ParenExpressionFinish())
  1065. << "Unexpected parent state, found: " << finish_state.state;
  1066. finish_state.state = ParserState::ParenExpressionFinishAsTuple();
  1067. PushState(finish_state);
  1068. }
  1069. // On a comma, push another expression handler.
  1070. if (list_token_kind == ListTokenKind::Comma) {
  1071. PushState(state);
  1072. PushState(ParserState::Expression());
  1073. }
  1074. }
  1075. auto Parser::HandleParenExpressionParameterFinishAsUnknownState() -> void {
  1076. HandleParenExpressionParameterFinish(/*as_tuple=*/false);
  1077. }
  1078. auto Parser::HandleParenExpressionParameterFinishAsTupleState() -> void {
  1079. HandleParenExpressionParameterFinish(/*as_tuple=*/true);
  1080. }
  1081. auto Parser::HandleParenExpressionFinishState() -> void {
  1082. auto state = PopState();
  1083. AddLeafNode(ParseNodeKind::ParenExpressionEnd(), Consume());
  1084. AddNode(ParseNodeKind::ParenExpression(), state.token, state.subtree_start,
  1085. state.has_error);
  1086. }
  1087. auto Parser::HandleParenExpressionFinishAsTupleState() -> void {
  1088. auto state = PopState();
  1089. AddLeafNode(ParseNodeKind::TupleLiteralEnd(), Consume());
  1090. AddNode(ParseNodeKind::TupleLiteral(), state.token, state.subtree_start,
  1091. state.has_error);
  1092. }
  1093. auto Parser::HandlePattern(PatternKind pattern_kind) -> void {
  1094. auto state = PopState();
  1095. // Ensure the finish state always follows.
  1096. state.state = ParserState::PatternFinish();
  1097. // Handle an invalid pattern introducer.
  1098. if (!PositionIs(TokenKind::Identifier()) ||
  1099. tokens_.GetKind(*(position_ + 1)) != TokenKind::Colon()) {
  1100. switch (pattern_kind) {
  1101. case PatternKind::Parameter: {
  1102. CARBON_DIAGNOSTIC(ExpectedParameterName, Error,
  1103. "Expected parameter declaration.");
  1104. emitter_.Emit(*position_, ExpectedParameterName);
  1105. break;
  1106. }
  1107. case PatternKind::Variable: {
  1108. CARBON_DIAGNOSTIC(ExpectedVariableName, Error,
  1109. "Expected pattern in `var` declaration.");
  1110. emitter_.Emit(*position_, ExpectedVariableName);
  1111. break;
  1112. }
  1113. }
  1114. state.has_error = true;
  1115. PushState(state);
  1116. return;
  1117. }
  1118. // Switch the context token to the colon, so that it'll be used for the root
  1119. // node.
  1120. state.token = *(position_ + 1);
  1121. PushState(state);
  1122. PushStateForExpression(PrecedenceGroup::ForType());
  1123. AddLeafNode(ParseNodeKind::DeclaredName(), *position_);
  1124. position_ += 2;
  1125. }
  1126. auto Parser::HandlePatternAsFunctionParameterState() -> void {
  1127. HandlePattern(PatternKind::Parameter);
  1128. }
  1129. auto Parser::HandlePatternAsVariableState() -> void {
  1130. HandlePattern(PatternKind::Variable);
  1131. }
  1132. auto Parser::HandlePatternFinishState() -> void {
  1133. auto state = PopState();
  1134. // If an error was encountered, propagate it without adding a node.
  1135. if (state.has_error) {
  1136. ReturnErrorOnState();
  1137. return;
  1138. }
  1139. // TODO: may need to mark has_error if !type.
  1140. AddNode(ParseNodeKind::PatternBinding(), state.token, state.subtree_start,
  1141. /*has_error=*/false);
  1142. }
  1143. auto Parser::HandleStatementState() -> void {
  1144. PopAndDiscardState();
  1145. switch (PositionKind()) {
  1146. case TokenKind::Break(): {
  1147. PushState(ParserState::StatementBreakFinish());
  1148. AddLeafNode(ParseNodeKind::BreakStatementStart(), Consume());
  1149. break;
  1150. }
  1151. case TokenKind::Continue(): {
  1152. PushState(ParserState::StatementContinueFinish());
  1153. AddLeafNode(ParseNodeKind::ContinueStatementStart(), Consume());
  1154. break;
  1155. }
  1156. case TokenKind::For(): {
  1157. // Process the header as a child of the for so that we can get consistent
  1158. // starts.
  1159. // TODO: When reorganizing components, we can probably make this flatter.
  1160. PushState(ParserState::StatementForFinish());
  1161. ++position_;
  1162. PushState(ParserState::StatementForHeader());
  1163. break;
  1164. }
  1165. case TokenKind::If(): {
  1166. PushState(ParserState::StatementIf());
  1167. break;
  1168. }
  1169. case TokenKind::Return(): {
  1170. PushState(ParserState::StatementReturn());
  1171. break;
  1172. }
  1173. case TokenKind::Var(): {
  1174. PushState(ParserState::VarAsRequireSemicolon());
  1175. break;
  1176. }
  1177. case TokenKind::While(): {
  1178. PushState(ParserState::StatementWhile());
  1179. break;
  1180. }
  1181. default: {
  1182. PushState(ParserState::ExpressionStatementFinish());
  1183. PushState(ParserState::Expression());
  1184. break;
  1185. }
  1186. }
  1187. }
  1188. auto Parser::HandleStatementBreakFinishState() -> void {
  1189. HandleStatementKeywordFinish(ParseNodeKind::BreakStatement());
  1190. }
  1191. auto Parser::HandleStatementContinueFinishState() -> void {
  1192. HandleStatementKeywordFinish(ParseNodeKind::ContinueStatement());
  1193. }
  1194. auto Parser::HandleStatementForHeaderState() -> void {
  1195. auto state = PopState();
  1196. auto open_paren = ConsumeIf(TokenKind::OpenParen());
  1197. if (!open_paren) {
  1198. CARBON_DIAGNOSTIC(ExpectedParenAfter, Error,
  1199. "Expected `(` after `{0}`. Recovering from missing `(` "
  1200. "not implemented yet!",
  1201. TokenKind);
  1202. emitter_.Emit(*position_, ExpectedParenAfter, TokenKind::For());
  1203. // TODO: A proper recovery strategy is needed here. For now, I assume
  1204. // that all brackets are properly balanced (i.e. each open bracket has a
  1205. // closing one).
  1206. // This is temporary until we come to a conclusion regarding the
  1207. // recovery tokens strategy.
  1208. ReturnErrorOnState();
  1209. PushState(ParserState::CodeBlock());
  1210. return;
  1211. }
  1212. state.state = ParserState::StatementForHeaderIn();
  1213. if (PositionIs(TokenKind::Var())) {
  1214. PushState(state);
  1215. PushState(ParserState::VarAsNoSemicolon());
  1216. } else {
  1217. CARBON_DIAGNOSTIC(ExpectedVariableDeclaration, Error,
  1218. "Expected `var` declaration.");
  1219. emitter_.Emit(*position_, ExpectedVariableDeclaration);
  1220. if (auto next_in = FindNextOf({TokenKind::In()})) {
  1221. SkipTo(*next_in);
  1222. }
  1223. state.has_error = true;
  1224. PushState(state);
  1225. }
  1226. }
  1227. auto Parser::HandleStatementForHeaderInState() -> void {
  1228. auto state = PopState();
  1229. state.state = ParserState::StatementForHeaderFinish();
  1230. if (!ConsumeAndAddLeafNodeIf(TokenKind::In(), ParseNodeKind::ForIn())) {
  1231. if (auto colon = ConsumeIf(TokenKind::Colon())) {
  1232. CARBON_DIAGNOSTIC(ExpectedIn, Error, "`:` should be replaced by `in`.");
  1233. emitter_.Emit(*colon, ExpectedIn);
  1234. AddLeafNode(ParseNodeKind::ForIn(), *colon, /*has_error=*/true);
  1235. } else {
  1236. CARBON_DIAGNOSTIC(ExpectedIn, Error,
  1237. "Expected `in` after loop `var` declaration.");
  1238. emitter_.Emit(*position_, ExpectedIn);
  1239. SkipTo(tokens_.GetMatchedClosingToken(state.token));
  1240. state.has_error = true;
  1241. PushState(state);
  1242. return;
  1243. }
  1244. }
  1245. PushState(state);
  1246. PushState(ParserState::Expression());
  1247. }
  1248. auto Parser::HandleStatementForHeaderFinishState() -> void {
  1249. auto state = PopState();
  1250. if (!ConsumeAndAddCloseParen(state.token, ParseNodeKind::ForHeaderEnd())) {
  1251. state.has_error = true;
  1252. }
  1253. AddNode(ParseNodeKind::ForHeader(), state.token, state.subtree_start,
  1254. state.has_error);
  1255. PushState(ParserState::CodeBlock());
  1256. }
  1257. auto Parser::HandleStatementForFinishState() -> void {
  1258. auto state = PopState();
  1259. AddNode(ParseNodeKind::ForStatement(), state.token, state.subtree_start,
  1260. state.has_error);
  1261. }
  1262. auto Parser::HandleStatementIfState() -> void {
  1263. PopAndDiscardState();
  1264. PushState(ParserState::StatementIfConditionFinish());
  1265. PushState(ParserState::ParenCondition());
  1266. ++position_;
  1267. }
  1268. auto Parser::HandleStatementIfConditionFinishState() -> void {
  1269. auto state = PopState();
  1270. state.state = ParserState::StatementIfThenBlockFinish();
  1271. PushState(state);
  1272. PushState(ParserState::CodeBlock());
  1273. }
  1274. auto Parser::HandleStatementIfThenBlockFinishState() -> void {
  1275. auto state = PopState();
  1276. if (ConsumeAndAddLeafNodeIf(TokenKind::Else(),
  1277. ParseNodeKind::IfStatementElse())) {
  1278. state.state = ParserState::StatementIfElseBlockFinish();
  1279. PushState(state);
  1280. // `else if` is permitted as a special case.
  1281. PushState(PositionIs(TokenKind::If()) ? ParserState::StatementIf()
  1282. : ParserState::CodeBlock());
  1283. } else {
  1284. AddNode(ParseNodeKind::IfStatement(), state.token, state.subtree_start,
  1285. state.has_error);
  1286. }
  1287. }
  1288. auto Parser::HandleStatementIfElseBlockFinishState() -> void {
  1289. auto state = PopState();
  1290. AddNode(ParseNodeKind::IfStatement(), state.token, state.subtree_start,
  1291. state.has_error);
  1292. }
  1293. auto Parser::HandleStatementKeywordFinish(ParseNodeKind node_kind) -> void {
  1294. auto state = PopState();
  1295. auto semi = ConsumeIf(TokenKind::Semi());
  1296. if (!semi) {
  1297. CARBON_DIAGNOSTIC(ExpectedSemiAfter, Error, "Expected `;` after `{0}`.",
  1298. TokenKind);
  1299. emitter_.Emit(*position_, ExpectedSemiAfter, tokens_.GetKind(state.token));
  1300. state.has_error = true;
  1301. // Recover to the next semicolon if possible, otherwise indicate the
  1302. // keyword for the error.
  1303. semi = SkipPastLikelyEnd(state.token);
  1304. if (!semi) {
  1305. semi = state.token;
  1306. }
  1307. }
  1308. AddNode(node_kind, *semi, state.subtree_start, state.has_error);
  1309. }
  1310. auto Parser::HandleStatementReturnState() -> void {
  1311. auto state = PopState();
  1312. state.state = ParserState::StatementReturnFinish();
  1313. PushState(state);
  1314. AddLeafNode(ParseNodeKind::ReturnStatementStart(), Consume());
  1315. if (!PositionIs(TokenKind::Semi())) {
  1316. PushState(ParserState::Expression());
  1317. }
  1318. }
  1319. auto Parser::HandleStatementReturnFinishState() -> void {
  1320. HandleStatementKeywordFinish(ParseNodeKind::ReturnStatement());
  1321. }
  1322. auto Parser::HandleStatementScopeLoopState() -> void {
  1323. // This maintains the current state until we're at the end of the scope.
  1324. auto token_kind = PositionKind();
  1325. if (token_kind == TokenKind::CloseCurlyBrace()) {
  1326. auto state = PopState();
  1327. if (state.has_error) {
  1328. ReturnErrorOnState();
  1329. }
  1330. } else {
  1331. PushState(ParserState::Statement());
  1332. }
  1333. }
  1334. auto Parser::HandleStatementWhileState() -> void {
  1335. PopAndDiscardState();
  1336. PushState(ParserState::StatementWhileConditionFinish());
  1337. PushState(ParserState::ParenCondition());
  1338. ++position_;
  1339. }
  1340. auto Parser::HandleStatementWhileConditionFinishState() -> void {
  1341. auto state = PopState();
  1342. state.state = ParserState::StatementWhileBlockFinish();
  1343. PushState(state);
  1344. PushState(ParserState::CodeBlock());
  1345. }
  1346. auto Parser::HandleStatementWhileBlockFinishState() -> void {
  1347. auto state = PopState();
  1348. AddNode(ParseNodeKind::WhileStatement(), state.token, state.subtree_start,
  1349. state.has_error);
  1350. }
  1351. auto Parser::HandleVar(bool require_semicolon) -> void {
  1352. PopAndDiscardState();
  1353. PushState(require_semicolon ? ParserState::VarFinishAsRequireSemicolon()
  1354. : ParserState::VarFinishAsNoSemicolon());
  1355. PushState(ParserState::VarAfterPattern());
  1356. ++position_;
  1357. PushState(ParserState::PatternAsVariable());
  1358. }
  1359. auto Parser::HandleVarAsRequireSemicolonState() -> void {
  1360. HandleVar(/*require_semicolon=*/true);
  1361. }
  1362. auto Parser::HandleVarAsNoSemicolonState() -> void {
  1363. HandleVar(/*require_semicolon=*/false);
  1364. }
  1365. auto Parser::HandleVarAfterPatternState() -> void {
  1366. auto state = PopState();
  1367. if (state.has_error) {
  1368. if (auto after_pattern =
  1369. FindNextOf({TokenKind::Equal(), TokenKind::Semi()})) {
  1370. SkipTo(*after_pattern);
  1371. }
  1372. }
  1373. if (PositionIs(TokenKind::Equal())) {
  1374. PushState(ParserState::VarAfterInitializer());
  1375. ++position_;
  1376. PushState(ParserState::Expression());
  1377. return;
  1378. }
  1379. }
  1380. auto Parser::HandleVarAfterInitializerState() -> void {
  1381. auto state = PopState();
  1382. AddNode(ParseNodeKind::VariableInitializer(), state.token,
  1383. state.subtree_start, state.has_error);
  1384. }
  1385. auto Parser::HandleVarFinish(bool require_semicolon) -> void {
  1386. auto state = PopState();
  1387. if (require_semicolon) {
  1388. auto semi = ConsumeAndAddLeafNodeIf(TokenKind::Semi(),
  1389. ParseNodeKind::DeclarationEnd());
  1390. if (!semi) {
  1391. emitter_.Emit(*position_, ExpectedSemiAfterExpression);
  1392. if (auto semi_token = SkipPastLikelyEnd(state.token)) {
  1393. AddLeafNode(ParseNodeKind::DeclarationEnd(), *semi_token,
  1394. /*has_error=*/true);
  1395. } else {
  1396. state.has_error = true;
  1397. }
  1398. }
  1399. }
  1400. return AddNode(ParseNodeKind::VariableDeclaration(), state.token,
  1401. state.subtree_start, state.has_error);
  1402. }
  1403. auto Parser::HandleVarFinishAsRequireSemicolonState() -> void {
  1404. HandleVarFinish(/*require_semicolon=*/true);
  1405. }
  1406. auto Parser::HandleVarFinishAsNoSemicolonState() -> void {
  1407. HandleVarFinish(/*require_semicolon=*/false);
  1408. }
  1409. } // namespace Carbon