parser.cpp 56 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
37047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126112711281129113011311132113311341135113611371138113911401141114211431144114511461147114811491150115111521153115411551156115711581159116011611162116311641165116611671168116911701171117211731174117511761177117811791180118111821183118411851186118711881189119011911192119311941195119611971198119912001201120212031204120512061207120812091210121112121213121412151216121712181219122012211222122312241225122612271228122912301231123212331234123512361237123812391240124112421243124412451246124712481249125012511252125312541255125612571258125912601261126212631264126512661267126812691270127112721273127412751276127
712781279128012811282128312841285128612871288128912901291129212931294129512961297129812991300130113021303130413051306130713081309131013111312131313141315131613171318131913201321132213231324132513261327132813291330133113321333133413351336133713381339134013411342134313441345134613471348134913501351135213531354135513561357135813591360136113621363136413651366136713681369137013711372137313741375137613771378137913801381138213831384138513861387138813891390139113921393139413951396139713981399140014011402140314041405140614071408140914101411141214131414141514161417141814191420142114221423142414251426142714281429143014311432143314341435143614371438143914401441144214431444144514461447144814491450145114521453145414551456145714581459146014611462146314641465146614671468146914701471147214731474147514761477147814791480148114821483148414851486148714881489149014911492149314941495149614971498149915001501150215031504150515061507150815091510151115121513151415151516151715181519152015211522152315241525152615271528152915301531153215331534153515361537153815391540154115421543154415451546154715481549155015511552155315541555155615571558155915601561156215631564156515661567156815691570157115721573157415751576157715781579158015811582158315841585158615871588158915901591159215931594159515961597159815991600160116021603160416051606160716081609161016111612161316141615161616171618161916201621162216231624162516261627162816291630163116321633163416351636163716381639164016411642164316441645164616471648164916501651165216531654165516561657165816591660166116621663166416651666166716681669167016711672167316741675167616771678167916801681168216831684168516861687168816891690169116921693169416951696169716981699170017011702170317041705170617071708170917101711171217131714171517161717171817191720172117221723172417251726172717281729173017311732173317341735
  1. // Part of the Carbon Language project, under the Apache License v2.0 with LLVM
  2. // Exceptions. See /LICENSE for license information.
  3. // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
  4. #include "toolchain/parser/parser.h"
  5. #include <cstdlib>
  6. #include <memory>
  7. #include "common/check.h"
  8. #include "llvm/ADT/Optional.h"
  9. #include "llvm/Support/PrettyStackTrace.h"
  10. #include "toolchain/lexer/token_kind.h"
  11. #include "toolchain/lexer/tokenized_buffer.h"
  12. #include "toolchain/parser/parse_node_kind.h"
  13. #include "toolchain/parser/parse_tree.h"
  14. namespace Carbon {
  15. // May be emitted a couple different ways as part of operator parsing.
  16. CARBON_DIAGNOSTIC(
  17. OperatorRequiresParentheses, Error,
  18. "Parentheses are required to disambiguate operator precedence.");
  19. CARBON_DIAGNOSTIC(ExpectedParenAfter, Error, "Expected `(` after `{0}`.",
  20. TokenKind);
  21. CARBON_DIAGNOSTIC(ExpectedSemiAfterExpression, Error,
  22. "Expected `;` after expression.");
  // Where something sits relative to a character mentioned in an error
  // message. The enumerator values are spelled out; they match the implicit
  // numbering.
  enum class RelativeLocation : int8_t {
    Around = 0,
    After = 1,
    Before = 2,
  };
  29. // Adapts RelativeLocation for use with formatv.
  30. static auto operator<<(llvm::raw_ostream& out, RelativeLocation loc)
  31. -> llvm::raw_ostream& {
  32. switch (loc) {
  33. case RelativeLocation::Around:
  34. out << "around";
  35. break;
  36. case RelativeLocation::After:
  37. out << "after";
  38. break;
  39. case RelativeLocation::Before:
  40. out << "before";
  41. break;
  42. }
  43. return out;
  44. }
  45. class Parser::PrettyStackTraceParseState : public llvm::PrettyStackTraceEntry {
  46. public:
  47. explicit PrettyStackTraceParseState(const Parser* parser) : parser_(parser) {}
  48. ~PrettyStackTraceParseState() override = default;
  49. auto print(llvm::raw_ostream& output) const -> void override {
  50. output << "Parser stack:\n";
  51. for (int i = 0; i < static_cast<int>(parser_->state_stack_.size()); ++i) {
  52. const auto& entry = parser_->state_stack_[i];
  53. output << "\t" << i << ".\t" << entry.state;
  54. Print(output, entry.token);
  55. }
  56. output << "\tcursor\tposition_";
  57. Print(output, *parser_->position_);
  58. }
  59. private:
  60. auto Print(llvm::raw_ostream& output, TokenizedBuffer::Token token) const
  61. -> void {
  62. auto line = parser_->tokens_->GetLine(token);
  63. output << " @ " << parser_->tokens_->GetLineNumber(line) << ":"
  64. << parser_->tokens_->GetColumnNumber(token) << ":"
  65. << " token " << token << " : "
  66. << parser_->tokens_->GetKind(token).Name() << "\n";
  67. }
  68. const Parser* parser_;
  69. };
  70. Parser::Parser(ParseTree& tree, TokenizedBuffer& tokens,
  71. TokenDiagnosticEmitter& emitter)
  72. : tree_(&tree),
  73. tokens_(&tokens),
  74. emitter_(&emitter),
  75. position_(tokens_->tokens().begin()),
  76. end_(tokens_->tokens().end()) {
  77. CARBON_CHECK(position_ != end_) << "Empty TokenizedBuffer";
  78. --end_;
  79. CARBON_CHECK(tokens_->GetKind(*end_) == TokenKind::EndOfFile())
  80. << "TokenizedBuffer should end with EndOfFile, ended with "
  81. << tokens_->GetKind(*end_).Name();
  82. }
  83. auto Parser::AddLeafNode(ParseNodeKind kind, TokenizedBuffer::Token token,
  84. bool has_error) -> void {
  85. tree_->node_impls_.push_back(
  86. ParseTree::NodeImpl(kind, has_error, token, /*subtree_size=*/1));
  87. if (has_error) {
  88. tree_->has_errors_ = true;
  89. }
  90. }
  91. auto Parser::AddNode(ParseNodeKind kind, TokenizedBuffer::Token token,
  92. int subtree_start, bool has_error) -> void {
  93. int subtree_size = tree_->size() - subtree_start + 1;
  94. tree_->node_impls_.push_back(
  95. ParseTree::NodeImpl(kind, has_error, token, subtree_size));
  96. if (has_error) {
  97. tree_->has_errors_ = true;
  98. }
  99. }
  100. auto Parser::ConsumeAndAddOpenParen(TokenizedBuffer::Token default_token,
  101. ParseNodeKind start_kind) -> void {
  102. if (auto open_paren = ConsumeIf(TokenKind::OpenParen())) {
  103. AddLeafNode(start_kind, *open_paren, /*has_error=*/false);
  104. } else {
  105. emitter_->Emit(*position_, ExpectedParenAfter,
  106. tokens_->GetKind(default_token));
  107. AddLeafNode(start_kind, default_token, /*has_error=*/true);
  108. }
  109. }
  110. auto Parser::ConsumeAndAddCloseParen(StateStackEntry state,
  111. ParseNodeKind close_kind) -> void {
  112. // state.token should point at the introducer, with the paren one after the
  113. // introducer.
  114. auto expected_paren = *(TokenizedBuffer::TokenIterator(state.token) + 1);
  115. if (tokens_->GetKind(expected_paren) != TokenKind::OpenParen()) {
  116. AddNode(close_kind, state.token, state.subtree_start, /*has_error=*/true);
  117. } else if (auto close_token = ConsumeIf(TokenKind::CloseParen())) {
  118. AddNode(close_kind, *close_token, state.subtree_start, state.has_error);
  119. } else {
  120. // TODO: Include the location of the matching open_paren in the diagnostic.
  121. CARBON_DIAGNOSTIC(ExpectedCloseParen, Error,
  122. "Unexpected tokens before `)`.");
  123. emitter_->Emit(*position_, ExpectedCloseParen);
  124. SkipTo(tokens_->GetMatchedClosingToken(expected_paren));
  125. AddNode(close_kind, Consume(), state.subtree_start, /*has_error=*/true);
  126. }
  127. }
  128. auto Parser::ConsumeAndAddLeafNodeIf(TokenKind token_kind,
  129. ParseNodeKind node_kind) -> bool {
  130. auto token = ConsumeIf(token_kind);
  131. if (!token) {
  132. return false;
  133. }
  134. AddLeafNode(node_kind, *token);
  135. return true;
  136. }
  137. auto Parser::ConsumeChecked(TokenKind kind) -> TokenizedBuffer::Token {
  138. CARBON_CHECK(PositionIs(kind))
  139. << "Required " << kind.Name() << ", found " << PositionKind().Name();
  140. return Consume();
  141. }
  142. auto Parser::ConsumeIf(TokenKind kind)
  143. -> llvm::Optional<TokenizedBuffer::Token> {
  144. if (!PositionIs(kind)) {
  145. return llvm::None;
  146. }
  147. return Consume();
  148. }
  149. auto Parser::FindNextOf(std::initializer_list<TokenKind> desired_kinds)
  150. -> llvm::Optional<TokenizedBuffer::Token> {
  151. auto new_position = position_;
  152. while (true) {
  153. TokenizedBuffer::Token token = *new_position;
  154. TokenKind kind = tokens_->GetKind(token);
  155. if (kind.IsOneOf(desired_kinds)) {
  156. return token;
  157. }
  158. // Step to the next token at the current bracketing level.
  159. if (kind.IsClosingSymbol() || kind == TokenKind::EndOfFile()) {
  160. // There are no more tokens at this level.
  161. return llvm::None;
  162. } else if (kind.IsOpeningSymbol()) {
  163. new_position = TokenizedBuffer::TokenIterator(
  164. tokens_->GetMatchedClosingToken(token));
  165. // Advance past the closing token.
  166. ++new_position;
  167. } else {
  168. ++new_position;
  169. }
  170. }
  171. }
  172. auto Parser::SkipMatchingGroup() -> bool {
  173. if (!PositionKind().IsOpeningSymbol()) {
  174. return false;
  175. }
  176. SkipTo(tokens_->GetMatchedClosingToken(*position_));
  177. ++position_;
  178. return true;
  179. }
  180. auto Parser::SkipPastLikelyEnd(TokenizedBuffer::Token skip_root)
  181. -> llvm::Optional<TokenizedBuffer::Token> {
  182. if (position_ == end_) {
  183. return llvm::None;
  184. }
  185. TokenizedBuffer::Line root_line = tokens_->GetLine(skip_root);
  186. int root_line_indent = tokens_->GetIndentColumnNumber(root_line);
  187. // We will keep scanning through tokens on the same line as the root or
  188. // lines with greater indentation than root's line.
  189. auto is_same_line_or_indent_greater_than_root =
  190. [&](TokenizedBuffer::Token t) {
  191. TokenizedBuffer::Line l = tokens_->GetLine(t);
  192. if (l == root_line) {
  193. return true;
  194. }
  195. return tokens_->GetIndentColumnNumber(l) > root_line_indent;
  196. };
  197. do {
  198. if (PositionIs(TokenKind::CloseCurlyBrace())) {
  199. // Immediately bail out if we hit an unmatched close curly, this will
  200. // pop us up a level of the syntax grouping.
  201. return llvm::None;
  202. }
  203. // We assume that a semicolon is always intended to be the end of the
  204. // current construct.
  205. if (auto semi = ConsumeIf(TokenKind::Semi())) {
  206. return semi;
  207. }
  208. // Skip over any matching group of tokens_->
  209. if (SkipMatchingGroup()) {
  210. continue;
  211. }
  212. // Otherwise just step forward one token.
  213. ++position_;
  214. } while (position_ != end_ &&
  215. is_same_line_or_indent_greater_than_root(*position_));
  216. return llvm::None;
  217. }
  218. auto Parser::SkipTo(TokenizedBuffer::Token t) -> void {
  219. CARBON_CHECK(t >= *position_) << "Tried to skip backwards from " << position_
  220. << " to " << TokenizedBuffer::TokenIterator(t);
  221. position_ = TokenizedBuffer::TokenIterator(t);
  222. CARBON_CHECK(position_ != end_) << "Skipped past EOF.";
  223. }
  224. auto Parser::HandleCodeBlockState() -> void {
  225. PopAndDiscardState();
  226. PushState(ParserState::CodeBlockFinish());
  227. if (ConsumeAndAddLeafNodeIf(TokenKind::OpenCurlyBrace(),
  228. ParseNodeKind::CodeBlockStart())) {
  229. PushState(ParserState::StatementScopeLoop());
  230. } else {
  231. AddLeafNode(ParseNodeKind::CodeBlockStart(), *position_,
  232. /*has_error=*/true);
  233. // Recover by parsing a single statement.
  234. CARBON_DIAGNOSTIC(ExpectedCodeBlock, Error, "Expected braced code block.");
  235. emitter_->Emit(*position_, ExpectedCodeBlock);
  236. PushState(ParserState::Statement());
  237. }
  238. }
  239. // Determines whether the given token is considered to be the start of an
  240. // operand according to the rules for infix operator parsing.
  241. static auto IsAssumedStartOfOperand(TokenKind kind) -> bool {
  242. return kind.IsOneOf({TokenKind::OpenParen(), TokenKind::Identifier(),
  243. TokenKind::IntegerLiteral(), TokenKind::RealLiteral(),
  244. TokenKind::StringLiteral()});
  245. }
  246. // Determines whether the given token is considered to be the end of an
  247. // operand according to the rules for infix operator parsing.
  248. static auto IsAssumedEndOfOperand(TokenKind kind) -> bool {
  249. return kind.IsOneOf({TokenKind::CloseParen(), TokenKind::CloseCurlyBrace(),
  250. TokenKind::CloseSquareBracket(), TokenKind::Identifier(),
  251. TokenKind::IntegerLiteral(), TokenKind::RealLiteral(),
  252. TokenKind::StringLiteral()});
  253. }
  254. // Determines whether the given token could possibly be the start of an
  255. // operand. This is conservatively correct, and will never incorrectly return
  256. // `false`, but can incorrectly return `true`.
  257. static auto IsPossibleStartOfOperand(TokenKind kind) -> bool {
  258. return !kind.IsOneOf({TokenKind::CloseParen(), TokenKind::CloseCurlyBrace(),
  259. TokenKind::CloseSquareBracket(), TokenKind::Comma(),
  260. TokenKind::Semi(), TokenKind::Colon()});
  261. }
  262. auto Parser::IsLexicallyValidInfixOperator() -> bool {
  263. CARBON_CHECK(position_ != end_) << "Expected an operator token.";
  264. bool leading_space = tokens_->HasLeadingWhitespace(*position_);
  265. bool trailing_space = tokens_->HasTrailingWhitespace(*position_);
  266. // If there's whitespace on both sides, it's an infix operator.
  267. if (leading_space && trailing_space) {
  268. return true;
  269. }
  270. // If there's whitespace on exactly one side, it's not an infix operator.
  271. if (leading_space || trailing_space) {
  272. return false;
  273. }
  274. // Otherwise, for an infix operator, the preceding token must be any close
  275. // bracket, identifier, or literal and the next token must be an open paren,
  276. // identifier, or literal.
  277. if (position_ == tokens_->tokens().begin() ||
  278. !IsAssumedEndOfOperand(tokens_->GetKind(*(position_ - 1))) ||
  279. !IsAssumedStartOfOperand(tokens_->GetKind(*(position_ + 1)))) {
  280. return false;
  281. }
  282. return true;
  283. }
  284. auto Parser::IsTrailingOperatorInfix() -> bool {
  285. if (position_ == end_) {
  286. return false;
  287. }
  288. // An operator that follows the infix operator rules is parsed as
  289. // infix, unless the next token means that it can't possibly be.
  290. if (IsLexicallyValidInfixOperator() &&
  291. IsPossibleStartOfOperand(tokens_->GetKind(*(position_ + 1)))) {
  292. return true;
  293. }
  294. // A trailing operator with leading whitespace that's not valid as infix is
  295. // not valid at all. If the next token looks like the start of an operand,
  296. // then parse as infix, otherwise as postfix. Either way we'll produce a
  297. // diagnostic later on.
  298. if (tokens_->HasLeadingWhitespace(*position_) &&
  299. IsAssumedStartOfOperand(tokens_->GetKind(*(position_ + 1)))) {
  300. return true;
  301. }
  302. return false;
  303. }
  304. auto Parser::DiagnoseOperatorFixity(OperatorFixity fixity) -> void {
  305. if (fixity == OperatorFixity::Infix) {
  306. // Infix operators must satisfy the infix operator rules.
  307. if (!IsLexicallyValidInfixOperator()) {
  308. CARBON_DIAGNOSTIC(BinaryOperatorRequiresWhitespace, Error,
  309. "Whitespace missing {0} binary operator.",
  310. RelativeLocation);
  311. emitter_->Emit(*position_, BinaryOperatorRequiresWhitespace,
  312. tokens_->HasLeadingWhitespace(*position_)
  313. ? RelativeLocation::After
  314. : (tokens_->HasTrailingWhitespace(*position_)
  315. ? RelativeLocation::Before
  316. : RelativeLocation::Around));
  317. }
  318. } else {
  319. bool prefix = fixity == OperatorFixity::Prefix;
  320. // Whitespace is not permitted between a symbolic pre/postfix operator and
  321. // its operand.
  322. if (PositionKind().IsSymbol() &&
  323. (prefix ? tokens_->HasTrailingWhitespace(*position_)
  324. : tokens_->HasLeadingWhitespace(*position_))) {
  325. CARBON_DIAGNOSTIC(UnaryOperatorHasWhitespace, Error,
  326. "Whitespace is not allowed {0} this unary operator.",
  327. RelativeLocation);
  328. emitter_->Emit(
  329. *position_, UnaryOperatorHasWhitespace,
  330. prefix ? RelativeLocation::After : RelativeLocation::Before);
  331. }
  332. // Pre/postfix operators must not satisfy the infix operator rules.
  333. if (IsLexicallyValidInfixOperator()) {
  334. CARBON_DIAGNOSTIC(UnaryOperatorRequiresWhitespace, Error,
  335. "Whitespace is required {0} this unary operator.",
  336. RelativeLocation);
  337. emitter_->Emit(
  338. *position_, UnaryOperatorRequiresWhitespace,
  339. prefix ? RelativeLocation::Before : RelativeLocation::After);
  340. }
  341. }
  342. }
  343. auto Parser::ConsumeListToken(ParseNodeKind comma_kind, TokenKind close_kind,
  344. bool already_has_error) -> ListTokenKind {
  345. if (!PositionIs(TokenKind::Comma()) && !PositionIs(close_kind)) {
  346. // Don't error a second time on the same element.
  347. if (!already_has_error) {
  348. CARBON_DIAGNOSTIC(UnexpectedTokenAfterListElement, Error,
  349. "Expected `,` or `{0}`.", TokenKind);
  350. emitter_->Emit(*position_, UnexpectedTokenAfterListElement, close_kind);
  351. ReturnErrorOnState();
  352. }
  353. // Recover from the invalid token.
  354. auto end_of_element = FindNextOf({TokenKind::Comma(), close_kind});
  355. // The lexer guarantees that parentheses are balanced.
  356. CARBON_CHECK(end_of_element)
  357. << "missing matching `" << close_kind.GetOpeningSymbol() << "` for `"
  358. << close_kind << "`";
  359. SkipTo(*end_of_element);
  360. }
  361. if (PositionIs(close_kind)) {
  362. return ListTokenKind::Close;
  363. } else {
  364. AddLeafNode(comma_kind, Consume());
  365. return PositionIs(close_kind) ? ListTokenKind::CommaClose
  366. : ListTokenKind::Comma;
  367. }
  368. }
  369. auto Parser::Parse() -> void {
  370. // Traces state_stack_. This runs even in opt because it's low overhead.
  371. PrettyStackTraceParseState pretty_stack(this);
  372. PushState(ParserState::DeclarationLoop());
  373. while (!state_stack_.empty()) {
  374. switch (state_stack_.back().state) {
  375. #define CARBON_PARSER_STATE(Name) \
  376. case ParserState::Name(): \
  377. Handle##Name##State(); \
  378. break;
  379. #include "toolchain/parser/parser_state.def"
  380. }
  381. }
  382. AddLeafNode(ParseNodeKind::FileEnd(), *position_);
  383. }
  384. auto Parser::HandleBraceExpressionState() -> void {
  385. auto state = PopState();
  386. state.state = ParserState::BraceExpressionFinishAsUnknown();
  387. PushState(state);
  388. CARBON_CHECK(ConsumeAndAddLeafNodeIf(
  389. TokenKind::OpenCurlyBrace(),
  390. ParseNodeKind::StructLiteralOrStructTypeLiteralStart()));
  391. if (!PositionIs(TokenKind::CloseCurlyBrace())) {
  392. PushState(ParserState::BraceExpressionParameterAsUnknown());
  393. }
  394. }
  395. auto Parser::BraceExpressionKindToParserState(BraceExpressionKind kind,
  396. ParserState type,
  397. ParserState value,
  398. ParserState unknown)
  399. -> ParserState {
  400. switch (kind) {
  401. case BraceExpressionKind::Type: {
  402. return type;
  403. }
  404. case BraceExpressionKind::Value: {
  405. return value;
  406. }
  407. case BraceExpressionKind::Unknown: {
  408. return unknown;
  409. }
  410. }
  411. }
  412. auto Parser::HandleBraceExpressionParameterError(StateStackEntry state,
  413. BraceExpressionKind kind)
  414. -> void {
  415. CARBON_DIAGNOSTIC(ExpectedStructLiteralField, Error, "Expected {0}{1}{2}.",
  416. llvm::StringRef, llvm::StringRef, llvm::StringRef);
  417. bool can_be_type = kind != BraceExpressionKind::Value;
  418. bool can_be_value = kind != BraceExpressionKind::Type;
  419. emitter_->Emit(*position_, ExpectedStructLiteralField,
  420. can_be_type ? "`.field: type`" : "",
  421. (can_be_type && can_be_value) ? " or " : "",
  422. can_be_value ? "`.field = value`" : "");
  423. state.state = BraceExpressionKindToParserState(
  424. kind, ParserState::BraceExpressionParameterFinishAsType(),
  425. ParserState::BraceExpressionParameterFinishAsValue(),
  426. ParserState::BraceExpressionParameterFinishAsUnknown());
  427. state.has_error = true;
  428. PushState(state);
  429. }
  430. auto Parser::HandleBraceExpressionParameter(BraceExpressionKind kind) -> void {
  431. auto state = PopState();
  432. if (!PositionIs(TokenKind::Period())) {
  433. HandleBraceExpressionParameterError(state, kind);
  434. return;
  435. }
  436. state.state = BraceExpressionKindToParserState(
  437. kind, ParserState::BraceExpressionParameterAfterDesignatorAsType(),
  438. ParserState::BraceExpressionParameterAfterDesignatorAsValue(),
  439. ParserState::BraceExpressionParameterAfterDesignatorAsUnknown());
  440. PushState(state);
  441. PushState(ParserState::DesignatorAsStruct());
  442. }
  443. auto Parser::HandleBraceExpressionParameterAsTypeState() -> void {
  444. HandleBraceExpressionParameter(BraceExpressionKind::Type);
  445. }
  446. auto Parser::HandleBraceExpressionParameterAsValueState() -> void {
  447. HandleBraceExpressionParameter(BraceExpressionKind::Value);
  448. }
  449. auto Parser::HandleBraceExpressionParameterAsUnknownState() -> void {
  450. HandleBraceExpressionParameter(BraceExpressionKind::Unknown);
  451. }
  452. auto Parser::HandleBraceExpressionParameterAfterDesignator(
  453. BraceExpressionKind kind) -> void {
  454. auto state = PopState();
  455. if (state.has_error) {
  456. auto recovery_pos = FindNextOf(
  457. {TokenKind::Equal(), TokenKind::Colon(), TokenKind::Comma()});
  458. if (!recovery_pos ||
  459. tokens_->GetKind(*recovery_pos) == TokenKind::Comma()) {
  460. state.state = BraceExpressionKindToParserState(
  461. kind, ParserState::BraceExpressionParameterFinishAsType(),
  462. ParserState::BraceExpressionParameterFinishAsValue(),
  463. ParserState::BraceExpressionParameterFinishAsUnknown());
  464. PushState(state);
  465. return;
  466. }
  467. SkipTo(*recovery_pos);
  468. }
  469. // Work out the kind of this element.
  470. auto elem_kind = BraceExpressionKind::Unknown;
  471. if (PositionIs(TokenKind::Colon())) {
  472. elem_kind = BraceExpressionKind::Type;
  473. } else if (PositionIs(TokenKind::Equal())) {
  474. elem_kind = BraceExpressionKind::Value;
  475. }
  476. // Unknown kinds and changes between type and value are errors.
  477. if (elem_kind == BraceExpressionKind::Unknown ||
  478. (kind != BraceExpressionKind::Unknown && elem_kind != kind)) {
  479. HandleBraceExpressionParameterError(state, kind);
  480. return;
  481. }
  482. // If we're setting the kind, update the BraceExpressionFinish state.
  483. if (kind == BraceExpressionKind::Unknown) {
  484. kind = elem_kind;
  485. auto finish_state = PopState();
  486. CARBON_CHECK(finish_state.state ==
  487. ParserState::BraceExpressionFinishAsUnknown());
  488. finish_state.state = BraceExpressionKindToParserState(
  489. kind, ParserState::BraceExpressionFinishAsType(),
  490. ParserState::BraceExpressionFinishAsValue(),
  491. ParserState::BraceExpressionFinishAsUnknown());
  492. PushState(finish_state);
  493. }
  494. state.state = BraceExpressionKindToParserState(
  495. kind, ParserState::BraceExpressionParameterFinishAsType(),
  496. ParserState::BraceExpressionParameterFinishAsValue(),
  497. ParserState::BraceExpressionParameterFinishAsUnknown());
  498. state.token = Consume();
  499. // Struct type fields and value fields use the same grammar except
  500. // that one has a `:` separator and the other has an `=` separator.
  501. PushState(state);
  502. PushState(ParserState::Expression());
  503. }
  504. auto Parser::HandleBraceExpressionParameterAfterDesignatorAsTypeState()
  505. -> void {
  506. HandleBraceExpressionParameterAfterDesignator(BraceExpressionKind::Type);
  507. }
  508. auto Parser::HandleBraceExpressionParameterAfterDesignatorAsValueState()
  509. -> void {
  510. HandleBraceExpressionParameterAfterDesignator(BraceExpressionKind::Value);
  511. }
  512. auto Parser::HandleBraceExpressionParameterAfterDesignatorAsUnknownState()
  513. -> void {
  514. HandleBraceExpressionParameterAfterDesignator(BraceExpressionKind::Unknown);
  515. }
  516. auto Parser::HandleBraceExpressionParameterFinish(BraceExpressionKind kind)
  517. -> void {
  518. auto state = PopState();
  519. if (state.has_error) {
  520. AddLeafNode(ParseNodeKind::StructFieldUnknown(), state.token,
  521. /*has_error=*/true);
  522. } else {
  523. AddNode(kind == BraceExpressionKind::Type
  524. ? ParseNodeKind::StructFieldType()
  525. : ParseNodeKind::StructFieldValue(),
  526. state.token, state.subtree_start, /*has_error=*/false);
  527. }
  528. if (ConsumeListToken(ParseNodeKind::StructComma(),
  529. TokenKind::CloseCurlyBrace(),
  530. state.has_error) == ListTokenKind::Comma) {
  531. PushState(BraceExpressionKindToParserState(
  532. kind, ParserState::BraceExpressionParameterAsType(),
  533. ParserState::BraceExpressionParameterAsValue(),
  534. ParserState::BraceExpressionParameterAsUnknown()));
  535. }
  536. }
  537. auto Parser::HandleBraceExpressionParameterFinishAsTypeState() -> void {
  538. HandleBraceExpressionParameterFinish(BraceExpressionKind::Type);
  539. }
  540. auto Parser::HandleBraceExpressionParameterFinishAsValueState() -> void {
  541. HandleBraceExpressionParameterFinish(BraceExpressionKind::Value);
  542. }
  543. auto Parser::HandleBraceExpressionParameterFinishAsUnknownState() -> void {
  544. HandleBraceExpressionParameterFinish(BraceExpressionKind::Unknown);
  545. }
  546. auto Parser::HandleBraceExpressionFinish(BraceExpressionKind kind) -> void {
  547. auto state = PopState();
  548. AddNode(kind == BraceExpressionKind::Type ? ParseNodeKind::StructTypeLiteral()
  549. : ParseNodeKind::StructLiteral(),
  550. Consume(), state.subtree_start, state.has_error);
  551. }
  552. auto Parser::HandleBraceExpressionFinishAsTypeState() -> void {
  553. HandleBraceExpressionFinish(BraceExpressionKind::Type);
  554. }
  555. auto Parser::HandleBraceExpressionFinishAsValueState() -> void {
  556. HandleBraceExpressionFinish(BraceExpressionKind::Value);
  557. }
  558. auto Parser::HandleBraceExpressionFinishAsUnknownState() -> void {
  559. HandleBraceExpressionFinish(BraceExpressionKind::Unknown);
  560. }
  561. auto Parser::HandleCallExpressionState() -> void {
  562. auto state = PopState();
  563. state.state = ParserState::CallExpressionFinish();
  564. PushState(state);
  565. AddNode(ParseNodeKind::CallExpressionStart(), Consume(), state.subtree_start,
  566. state.has_error);
  567. if (!PositionIs(TokenKind::CloseParen())) {
  568. PushState(ParserState::CallExpressionParameterFinish());
  569. PushState(ParserState::Expression());
  570. }
  571. }
  572. auto Parser::HandleCallExpressionParameterFinishState() -> void {
  573. auto state = PopState();
  574. if (state.has_error) {
  575. ReturnErrorOnState();
  576. }
  577. if (ConsumeListToken(ParseNodeKind::CallExpressionComma(),
  578. TokenKind::CloseParen(),
  579. state.has_error) == ListTokenKind::Comma) {
  580. PushState(ParserState::CallExpressionParameterFinish());
  581. PushState(ParserState::Expression());
  582. }
  583. }
  584. auto Parser::HandleCallExpressionFinishState() -> void {
  585. auto state = PopState();
  586. AddNode(ParseNodeKind::CallExpression(), Consume(), state.subtree_start,
  587. state.has_error);
  588. }
  589. auto Parser::HandleCodeBlockFinishState() -> void {
  590. auto state = PopState();
  591. // If the block started with an open curly, this is a close curly.
  592. if (tokens_->GetKind(state.token) == TokenKind::OpenCurlyBrace()) {
  593. AddNode(ParseNodeKind::CodeBlock(), Consume(), state.subtree_start,
  594. state.has_error);
  595. } else {
  596. AddNode(ParseNodeKind::CodeBlock(), state.token, state.subtree_start,
  597. /*has_error=*/true);
  598. }
  599. }
  600. auto Parser::HandleDeclarationLoopState() -> void {
  601. // This maintains the current state unless we're at the end of the file.
  602. switch (PositionKind()) {
  603. case TokenKind::EndOfFile(): {
  604. PopAndDiscardState();
  605. break;
  606. }
  607. case TokenKind::Fn(): {
  608. PushState(ParserState::FunctionIntroducer());
  609. AddLeafNode(ParseNodeKind::FunctionIntroducer(), Consume());
  610. break;
  611. }
  612. case TokenKind::Package(): {
  613. PushState(ParserState::Package());
  614. break;
  615. }
  616. case TokenKind::Semi(): {
  617. AddLeafNode(ParseNodeKind::EmptyDeclaration(), Consume());
  618. break;
  619. }
  620. case TokenKind::Var(): {
  621. PushState(ParserState::VarAsSemicolon());
  622. break;
  623. }
  624. case TokenKind::Interface(): {
  625. PushState(ParserState::InterfaceIntroducer());
  626. ++position_;
  627. break;
  628. }
  629. default: {
  630. CARBON_DIAGNOSTIC(UnrecognizedDeclaration, Error,
  631. "Unrecognized declaration introducer.");
  632. emitter_->Emit(*position_, UnrecognizedDeclaration);
  633. auto cursor = *position_;
  634. auto semi = SkipPastLikelyEnd(cursor);
  635. // Locate the EmptyDeclaration at the semi when found, but use the
  636. // original cursor location for an error when not.
  637. AddLeafNode(ParseNodeKind::EmptyDeclaration(), semi ? *semi : cursor,
  638. /*has_error=*/true);
  639. break;
  640. }
  641. }
  642. }
  643. auto Parser::HandleDesignator(bool as_struct) -> void {
  644. auto state = PopState();
  645. // `.` identifier
  646. auto dot = ConsumeChecked(TokenKind::Period());
  647. if (!ConsumeAndAddLeafNodeIf(TokenKind::Identifier(),
  648. ParseNodeKind::DesignatedName())) {
  649. CARBON_DIAGNOSTIC(ExpectedIdentifierAfterDot, Error,
  650. "Expected identifier after `.`.");
  651. emitter_->Emit(*position_, ExpectedIdentifierAfterDot);
  652. // If we see a keyword, assume it was intended to be the designated name.
  653. // TODO: Should keywords be valid in designators?
  654. if (PositionKind().IsKeyword()) {
  655. AddLeafNode(ParseNodeKind::DesignatedName(), Consume(),
  656. /*has_error=*/true);
  657. } else {
  658. AddLeafNode(ParseNodeKind::DesignatedName(), *position_,
  659. /*has_error=*/true);
  660. // Indicate the error to the parent state so that it can avoid producing
  661. // more errors.
  662. ReturnErrorOnState();
  663. }
  664. }
  665. AddNode(as_struct ? ParseNodeKind::StructFieldDesignator()
  666. : ParseNodeKind::DesignatorExpression(),
  667. dot, state.subtree_start, state.has_error);
  668. }
  669. auto Parser::HandleDesignatorAsExpressionState() -> void {
  670. HandleDesignator(/*as_struct=*/false);
  671. }
  672. auto Parser::HandleDesignatorAsStructState() -> void {
  673. HandleDesignator(/*as_struct=*/true);
  674. }
  675. auto Parser::HandleExpressionState() -> void {
  676. auto state = PopState();
  677. // Check for a prefix operator.
  678. if (auto operator_precedence = PrecedenceGroup::ForLeading(PositionKind())) {
  679. if (PrecedenceGroup::GetPriority(state.ambient_precedence,
  680. *operator_precedence) !=
  681. OperatorPriority::RightFirst) {
  682. // The precedence rules don't permit this prefix operator in this
  683. // context. Diagnose this, but carry on and parse it anyway.
  684. emitter_->Emit(*position_, OperatorRequiresParentheses);
  685. } else {
  686. // Check that this operator follows the proper whitespace rules.
  687. DiagnoseOperatorFixity(OperatorFixity::Prefix);
  688. }
  689. PushStateForExpressionLoop(ParserState::ExpressionLoopForPrefix(),
  690. state.ambient_precedence, *operator_precedence);
  691. ++position_;
  692. PushStateForExpression(*operator_precedence);
  693. } else {
  694. PushStateForExpressionLoop(ParserState::ExpressionLoop(),
  695. state.ambient_precedence,
  696. PrecedenceGroup::ForPostfixExpression());
  697. PushState(ParserState::ExpressionInPostfix());
  698. }
  699. }
  700. auto Parser::HandleExpressionInPostfixState() -> void {
  701. auto state = PopState();
  702. // Continue to the loop state.
  703. state.state = ParserState::ExpressionInPostfixLoop();
  704. // Parses a primary expression, which is either a terminal portion of an
  705. // expression tree, such as an identifier or literal, or a parenthesized
  706. // expression.
  707. switch (PositionKind()) {
  708. case TokenKind::Identifier(): {
  709. AddLeafNode(ParseNodeKind::NameReference(), Consume());
  710. PushState(state);
  711. break;
  712. }
  713. case TokenKind::IntegerLiteral():
  714. case TokenKind::RealLiteral():
  715. case TokenKind::StringLiteral():
  716. case TokenKind::IntegerTypeLiteral():
  717. case TokenKind::UnsignedIntegerTypeLiteral():
  718. case TokenKind::FloatingPointTypeLiteral(): {
  719. AddLeafNode(ParseNodeKind::Literal(), Consume());
  720. PushState(state);
  721. break;
  722. }
  723. case TokenKind::OpenCurlyBrace(): {
  724. PushState(state);
  725. PushState(ParserState::BraceExpression());
  726. break;
  727. }
  728. case TokenKind::OpenParen(): {
  729. PushState(state);
  730. PushState(ParserState::ParenExpression());
  731. break;
  732. }
  733. default: {
  734. CARBON_DIAGNOSTIC(ExpectedExpression, Error, "Expected expression.");
  735. emitter_->Emit(*position_, ExpectedExpression);
  736. ReturnErrorOnState();
  737. break;
  738. }
  739. }
  740. }
  741. auto Parser::HandleExpressionInPostfixLoopState() -> void {
  742. // This is a cyclic state that repeats, so this state is typically pushed back
  743. // on.
  744. auto state = PopState();
  745. state.token = *position_;
  746. switch (PositionKind()) {
  747. case TokenKind::Period(): {
  748. PushState(state);
  749. state.state = ParserState::DesignatorAsExpression();
  750. PushState(state);
  751. break;
  752. }
  753. case TokenKind::OpenParen(): {
  754. PushState(state);
  755. state.state = ParserState::CallExpression();
  756. PushState(state);
  757. break;
  758. }
  759. default: {
  760. if (state.has_error) {
  761. ReturnErrorOnState();
  762. }
  763. break;
  764. }
  765. }
  766. }
  767. auto Parser::HandleExpressionLoopState() -> void {
  768. auto state = PopState();
  769. auto trailing_operator =
  770. PrecedenceGroup::ForTrailing(PositionKind(), IsTrailingOperatorInfix());
  771. if (!trailing_operator) {
  772. if (state.has_error) {
  773. ReturnErrorOnState();
  774. }
  775. return;
  776. }
  777. auto [operator_precedence, is_binary] = *trailing_operator;
  778. // TODO: If this operator is ambiguous with either the ambient precedence
  779. // or the LHS precedence, and there's a variant with a different fixity
  780. // that would work, use that one instead for error recovery.
  781. if (PrecedenceGroup::GetPriority(state.ambient_precedence,
  782. operator_precedence) !=
  783. OperatorPriority::RightFirst) {
  784. // The precedence rules don't permit this operator in this context. Try
  785. // again in the enclosing expression context.
  786. if (state.has_error) {
  787. ReturnErrorOnState();
  788. }
  789. return;
  790. }
  791. if (PrecedenceGroup::GetPriority(state.lhs_precedence, operator_precedence) !=
  792. OperatorPriority::LeftFirst) {
  793. // Either the LHS operator and this operator are ambiguous, or the
  794. // LHS operator is a unary operator that can't be nested within
  795. // this operator. Either way, parentheses are required.
  796. emitter_->Emit(*position_, OperatorRequiresParentheses);
  797. state.has_error = true;
  798. } else {
  799. DiagnoseOperatorFixity(is_binary ? OperatorFixity::Infix
  800. : OperatorFixity::Postfix);
  801. }
  802. state.token = Consume();
  803. state.lhs_precedence = operator_precedence;
  804. if (is_binary) {
  805. state.state = ParserState::ExpressionLoopForBinary();
  806. PushState(state);
  807. PushStateForExpression(operator_precedence);
  808. } else {
  809. AddNode(ParseNodeKind::PostfixOperator(), state.token, state.subtree_start,
  810. state.has_error);
  811. state.has_error = false;
  812. PushState(state);
  813. }
  814. }
  815. auto Parser::HandleExpressionLoopForBinaryState() -> void {
  816. auto state = PopState();
  817. AddNode(ParseNodeKind::InfixOperator(), state.token, state.subtree_start,
  818. state.has_error);
  819. state.state = ParserState::ExpressionLoop();
  820. state.has_error = false;
  821. PushState(state);
  822. }
  823. auto Parser::HandleExpressionLoopForPrefixState() -> void {
  824. auto state = PopState();
  825. AddNode(ParseNodeKind::PrefixOperator(), state.token, state.subtree_start,
  826. state.has_error);
  827. state.state = ParserState::ExpressionLoop();
  828. state.has_error = false;
  829. PushState(state);
  830. }
  831. auto Parser::HandleExpressionStatementFinishState() -> void {
  832. auto state = PopState();
  833. if (auto semi = ConsumeIf(TokenKind::Semi())) {
  834. AddNode(ParseNodeKind::ExpressionStatement(), *semi, state.subtree_start,
  835. state.has_error);
  836. return;
  837. }
  838. if (!state.has_error) {
  839. emitter_->Emit(*position_, ExpectedSemiAfterExpression);
  840. }
  841. if (auto semi_token = SkipPastLikelyEnd(state.token)) {
  842. AddNode(ParseNodeKind::ExpressionStatement(), *semi_token,
  843. state.subtree_start,
  844. /*has_error=*/true);
  845. return;
  846. }
  847. // Found junk not even followed by a `;`, no node to add.
  848. ReturnErrorOnState();
  849. }
  850. auto Parser::HandleFunctionError(StateStackEntry state,
  851. bool skip_past_likely_end) -> void {
  852. auto token = state.token;
  853. if (skip_past_likely_end) {
  854. if (auto semi = SkipPastLikelyEnd(token)) {
  855. token = *semi;
  856. }
  857. }
  858. AddNode(ParseNodeKind::FunctionDeclaration(), token, state.subtree_start,
  859. /*has_error=*/true);
  860. }
  861. auto Parser::HandleFunctionIntroducerState() -> void {
  862. auto state = PopState();
  863. if (!ConsumeAndAddLeafNodeIf(TokenKind::Identifier(),
  864. ParseNodeKind::DeclaredName())) {
  865. CARBON_DIAGNOSTIC(ExpectedFunctionName, Error,
  866. "Expected function name after `fn` keyword.");
  867. emitter_->Emit(*position_, ExpectedFunctionName);
  868. // TODO: We could change the lexer to allow us to synthesize certain
  869. // kinds of tokens and try to "recover" here, but unclear that this is
  870. // really useful.
  871. HandleFunctionError(state, true);
  872. return;
  873. }
  874. if (!PositionIs(TokenKind::OpenParen())) {
  875. CARBON_DIAGNOSTIC(ExpectedFunctionParams, Error,
  876. "Expected `(` after function name.");
  877. emitter_->Emit(*position_, ExpectedFunctionParams);
  878. HandleFunctionError(state, true);
  879. return;
  880. }
  881. // Parse the parameter list as its own subtree; once that pops, resume
  882. // function parsing.
  883. state.state = ParserState::FunctionAfterParameterList();
  884. PushState(state);
  885. PushState(ParserState::FunctionParameterListFinish());
  886. AddLeafNode(ParseNodeKind::ParameterListStart(), Consume());
  887. if (!PositionIs(TokenKind::CloseParen())) {
  888. PushState(ParserState::FunctionParameter());
  889. }
  890. }
  891. auto Parser::HandleFunctionParameterState() -> void {
  892. PopAndDiscardState();
  893. PushState(ParserState::FunctionParameterFinish());
  894. PushState(ParserState::PatternAsFunctionParameter());
  895. }
  896. auto Parser::HandleFunctionParameterFinishState() -> void {
  897. auto state = PopState();
  898. if (state.has_error) {
  899. ReturnErrorOnState();
  900. }
  901. if (ConsumeListToken(ParseNodeKind::ParameterListComma(),
  902. TokenKind::CloseParen(),
  903. state.has_error) == ListTokenKind::Comma) {
  904. PushState(ParserState::PatternAsFunctionParameter());
  905. }
  906. }
  907. auto Parser::HandleFunctionParameterListFinishState() -> void {
  908. auto state = PopState();
  909. AddNode(ParseNodeKind::ParameterList(),
  910. ConsumeChecked(TokenKind::CloseParen()), state.subtree_start,
  911. state.has_error);
  912. }
  913. auto Parser::HandleFunctionAfterParameterListState() -> void {
  914. auto state = PopState();
  915. // Regardless of whether there's a return type, we'll finish the signature.
  916. state.state = ParserState::FunctionSignatureFinish();
  917. PushState(state);
  918. // If there is a return type, parse the expression before adding the return
  919. // type nod.e
  920. if (PositionIs(TokenKind::MinusGreater())) {
  921. PushState(ParserState::FunctionReturnTypeFinish());
  922. ++position_;
  923. PushStateForExpression(PrecedenceGroup::ForType());
  924. }
  925. }
  926. auto Parser::HandleFunctionReturnTypeFinishState() -> void {
  927. auto state = PopState();
  928. AddNode(ParseNodeKind::ReturnType(), state.token, state.subtree_start,
  929. state.has_error);
  930. }
  931. auto Parser::HandleFunctionSignatureFinishState() -> void {
  932. auto state = PopState();
  933. switch (PositionKind()) {
  934. case TokenKind::Semi(): {
  935. AddNode(ParseNodeKind::FunctionDeclaration(), Consume(),
  936. state.subtree_start, state.has_error);
  937. break;
  938. }
  939. case TokenKind::OpenCurlyBrace(): {
  940. AddNode(ParseNodeKind::FunctionDefinitionStart(), Consume(),
  941. state.subtree_start, state.has_error);
  942. // Any error is recorded on the FunctionDefinitionStart.
  943. state.has_error = false;
  944. state.state = ParserState::FunctionDefinitionFinish();
  945. PushState(state);
  946. PushState(ParserState::StatementScopeLoop());
  947. break;
  948. }
  949. default: {
  950. CARBON_DIAGNOSTIC(
  951. ExpectedFunctionBodyOrSemi, Error,
  952. "Expected function definition or `;` after function declaration.");
  953. emitter_->Emit(*position_, ExpectedFunctionBodyOrSemi);
  954. // Only need to skip if we've not already found a new line.
  955. bool skip_past_likely_end =
  956. tokens_->GetLine(*position_) == tokens_->GetLine(state.token);
  957. HandleFunctionError(state, skip_past_likely_end);
  958. break;
  959. }
  960. }
  961. }
  962. auto Parser::HandleFunctionDefinitionFinishState() -> void {
  963. auto state = PopState();
  964. AddNode(ParseNodeKind::FunctionDefinition(), Consume(), state.subtree_start,
  965. state.has_error);
  966. }
  967. auto Parser::HandlePackageState() -> void {
  968. auto state = PopState();
  969. AddLeafNode(ParseNodeKind::PackageIntroducer(), Consume());
  970. auto exit_on_parse_error = [&]() {
  971. auto semi_token = SkipPastLikelyEnd(state.token);
  972. return AddNode(ParseNodeKind::PackageDirective(),
  973. semi_token ? *semi_token : state.token, state.subtree_start,
  974. /*has_error=*/true);
  975. };
  976. if (!ConsumeAndAddLeafNodeIf(TokenKind::Identifier(),
  977. ParseNodeKind::DeclaredName())) {
  978. CARBON_DIAGNOSTIC(ExpectedIdentifierAfterPackage, Error,
  979. "Expected identifier after `package`.");
  980. emitter_->Emit(*position_, ExpectedIdentifierAfterPackage);
  981. exit_on_parse_error();
  982. return;
  983. }
  984. bool library_parsed = false;
  985. if (auto library_token = ConsumeIf(TokenKind::Library())) {
  986. auto library_start = tree_->size();
  987. if (!ConsumeAndAddLeafNodeIf(TokenKind::StringLiteral(),
  988. ParseNodeKind::Literal())) {
  989. CARBON_DIAGNOSTIC(
  990. ExpectedLibraryName, Error,
  991. "Expected a string literal to specify the library name.");
  992. emitter_->Emit(*position_, ExpectedLibraryName);
  993. exit_on_parse_error();
  994. return;
  995. }
  996. AddNode(ParseNodeKind::PackageLibrary(), *library_token, library_start,
  997. /*has_error=*/false);
  998. library_parsed = true;
  999. }
  1000. switch (auto api_or_impl_token = tokens_->GetKind(*(position_))) {
  1001. case TokenKind::Api(): {
  1002. AddLeafNode(ParseNodeKind::PackageApi(), Consume());
  1003. break;
  1004. }
  1005. case TokenKind::Impl(): {
  1006. AddLeafNode(ParseNodeKind::PackageImpl(), Consume());
  1007. break;
  1008. }
  1009. default: {
  1010. if (!library_parsed && api_or_impl_token == TokenKind::StringLiteral()) {
  1011. // If we come acroess a string literal and we didn't parse `library
  1012. // "..."` yet, then most probably the user forgot to add `library`
  1013. // before the library name.
  1014. CARBON_DIAGNOSTIC(MissingLibraryKeyword, Error,
  1015. "Missing `library` keyword.");
  1016. emitter_->Emit(*position_, MissingLibraryKeyword);
  1017. } else {
  1018. CARBON_DIAGNOSTIC(ExpectedApiOrImpl, Error,
  1019. "Expected a `api` or `impl`.");
  1020. emitter_->Emit(*position_, ExpectedApiOrImpl);
  1021. }
  1022. exit_on_parse_error();
  1023. return;
  1024. }
  1025. }
  1026. if (!PositionIs(TokenKind::Semi())) {
  1027. CARBON_DIAGNOSTIC(ExpectedSemiToEndPackageDirective, Error,
  1028. "Expected `;` to end package directive.");
  1029. emitter_->Emit(*position_, ExpectedSemiToEndPackageDirective);
  1030. exit_on_parse_error();
  1031. return;
  1032. }
  1033. AddNode(ParseNodeKind::PackageDirective(), Consume(), state.subtree_start,
  1034. /*has_error=*/false);
  1035. }
  1036. auto Parser::HandleParenCondition(ParseNodeKind start_kind,
  1037. ParserState finish_state) -> void {
  1038. auto state = PopState();
  1039. ConsumeAndAddOpenParen(state.token, start_kind);
  1040. state.state = finish_state;
  1041. PushState(state);
  1042. PushState(ParserState::Expression());
  1043. }
  1044. auto Parser::HandleParenConditionAsIfState() -> void {
  1045. HandleParenCondition(ParseNodeKind::IfConditionStart(),
  1046. ParserState::ParenConditionFinishAsIf());
  1047. }
  1048. auto Parser::HandleParenConditionAsWhileState() -> void {
  1049. HandleParenCondition(ParseNodeKind::WhileConditionStart(),
  1050. ParserState::ParenConditionFinishAsWhile());
  1051. }
  1052. auto Parser::HandleParenConditionFinishAsIfState() -> void {
  1053. auto state = PopState();
  1054. ConsumeAndAddCloseParen(state, ParseNodeKind::IfCondition());
  1055. }
  1056. auto Parser::HandleParenConditionFinishAsWhileState() -> void {
  1057. auto state = PopState();
  1058. ConsumeAndAddCloseParen(state, ParseNodeKind::WhileCondition());
  1059. }
  1060. auto Parser::HandleParenExpressionState() -> void {
  1061. auto state = PopState();
  1062. // Advance past the open paren.
  1063. AddLeafNode(ParseNodeKind::ParenExpressionOrTupleLiteralStart(),
  1064. ConsumeChecked(TokenKind::OpenParen()));
  1065. if (PositionIs(TokenKind::CloseParen())) {
  1066. state.state = ParserState::ParenExpressionFinishAsTuple();
  1067. PushState(state);
  1068. } else {
  1069. state.state = ParserState::ParenExpressionFinish();
  1070. PushState(state);
  1071. PushState(ParserState::ParenExpressionParameterFinishAsUnknown());
  1072. PushState(ParserState::Expression());
  1073. }
  1074. }
  1075. auto Parser::HandleParenExpressionParameterFinish(bool as_tuple) -> void {
  1076. auto state = PopState();
  1077. auto list_token_kind =
  1078. ConsumeListToken(ParseNodeKind::TupleLiteralComma(),
  1079. TokenKind::CloseParen(), state.has_error);
  1080. if (list_token_kind == ListTokenKind::Close) {
  1081. return;
  1082. }
  1083. // If this is the first item and a comma was found, switch to tuple handling.
  1084. // Note this could be `(expr,)` so we may not reuse the current state, but
  1085. // it's still necessary to switch the parent.
  1086. if (!as_tuple) {
  1087. state.state = ParserState::ParenExpressionParameterFinishAsTuple();
  1088. auto finish_state = PopState();
  1089. CARBON_CHECK(finish_state.state == ParserState::ParenExpressionFinish())
  1090. << "Unexpected parent state, found: " << finish_state.state;
  1091. finish_state.state = ParserState::ParenExpressionFinishAsTuple();
  1092. PushState(finish_state);
  1093. }
  1094. // On a comma, push another expression handler.
  1095. if (list_token_kind == ListTokenKind::Comma) {
  1096. PushState(state);
  1097. PushState(ParserState::Expression());
  1098. }
  1099. }
  1100. auto Parser::HandleParenExpressionParameterFinishAsUnknownState() -> void {
  1101. HandleParenExpressionParameterFinish(/*as_tuple=*/false);
  1102. }
  1103. auto Parser::HandleParenExpressionParameterFinishAsTupleState() -> void {
  1104. HandleParenExpressionParameterFinish(/*as_tuple=*/true);
  1105. }
  1106. auto Parser::HandleParenExpressionFinishState() -> void {
  1107. auto state = PopState();
  1108. AddNode(ParseNodeKind::ParenExpression(), Consume(), state.subtree_start,
  1109. state.has_error);
  1110. }
  1111. auto Parser::HandleParenExpressionFinishAsTupleState() -> void {
  1112. auto state = PopState();
  1113. AddNode(ParseNodeKind::TupleLiteral(), Consume(), state.subtree_start,
  1114. state.has_error);
  1115. }
  1116. auto Parser::HandlePattern(PatternKind pattern_kind) -> void {
  1117. auto state = PopState();
  1118. // Ensure the finish state always follows.
  1119. state.state = ParserState::PatternFinish();
  1120. // Handle an invalid pattern introducer.
  1121. if (!PositionIs(TokenKind::Identifier()) ||
  1122. tokens_->GetKind(*(position_ + 1)) != TokenKind::Colon()) {
  1123. switch (pattern_kind) {
  1124. case PatternKind::Parameter: {
  1125. CARBON_DIAGNOSTIC(ExpectedParameterName, Error,
  1126. "Expected parameter declaration.");
  1127. emitter_->Emit(*position_, ExpectedParameterName);
  1128. break;
  1129. }
  1130. case PatternKind::Variable: {
  1131. CARBON_DIAGNOSTIC(ExpectedVariableName, Error,
  1132. "Expected pattern in `var` declaration.");
  1133. emitter_->Emit(*position_, ExpectedVariableName);
  1134. break;
  1135. }
  1136. }
  1137. state.has_error = true;
  1138. PushState(state);
  1139. return;
  1140. }
  1141. // Switch the context token to the colon, so that it'll be used for the root
  1142. // node.
  1143. state.token = *(position_ + 1);
  1144. PushState(state);
  1145. PushStateForExpression(PrecedenceGroup::ForType());
  1146. AddLeafNode(ParseNodeKind::DeclaredName(), *position_);
  1147. position_ += 2;
  1148. }
  1149. auto Parser::HandlePatternAsFunctionParameterState() -> void {
  1150. HandlePattern(PatternKind::Parameter);
  1151. }
  1152. auto Parser::HandlePatternAsVariableState() -> void {
  1153. HandlePattern(PatternKind::Variable);
  1154. }
  1155. auto Parser::HandlePatternFinishState() -> void {
  1156. auto state = PopState();
  1157. // If an error was encountered, propagate it without adding a node.
  1158. if (state.has_error) {
  1159. ReturnErrorOnState();
  1160. return;
  1161. }
  1162. // TODO: may need to mark has_error if !type.
  1163. AddNode(ParseNodeKind::PatternBinding(), state.token, state.subtree_start,
  1164. /*has_error=*/false);
  1165. }
  1166. auto Parser::HandleStatementState() -> void {
  1167. PopAndDiscardState();
  1168. switch (PositionKind()) {
  1169. case TokenKind::Break(): {
  1170. PushState(ParserState::StatementBreakFinish());
  1171. AddLeafNode(ParseNodeKind::BreakStatementStart(), Consume());
  1172. break;
  1173. }
  1174. case TokenKind::Continue(): {
  1175. PushState(ParserState::StatementContinueFinish());
  1176. AddLeafNode(ParseNodeKind::ContinueStatementStart(), Consume());
  1177. break;
  1178. }
  1179. case TokenKind::For(): {
  1180. PushState(ParserState::StatementForFinish());
  1181. PushState(ParserState::StatementForHeader());
  1182. ++position_;
  1183. break;
  1184. }
  1185. case TokenKind::If(): {
  1186. PushState(ParserState::StatementIf());
  1187. break;
  1188. }
  1189. case TokenKind::Return(): {
  1190. PushState(ParserState::StatementReturn());
  1191. break;
  1192. }
  1193. case TokenKind::Var(): {
  1194. PushState(ParserState::VarAsSemicolon());
  1195. break;
  1196. }
  1197. case TokenKind::While(): {
  1198. PushState(ParserState::StatementWhile());
  1199. break;
  1200. }
  1201. default: {
  1202. PushState(ParserState::ExpressionStatementFinish());
  1203. PushState(ParserState::Expression());
  1204. break;
  1205. }
  1206. }
  1207. }
  1208. auto Parser::HandleStatementBreakFinishState() -> void {
  1209. HandleStatementKeywordFinish(ParseNodeKind::BreakStatement());
  1210. }
  1211. auto Parser::HandleStatementContinueFinishState() -> void {
  1212. HandleStatementKeywordFinish(ParseNodeKind::ContinueStatement());
  1213. }
  1214. auto Parser::HandleStatementForHeaderState() -> void {
  1215. auto state = PopState();
  1216. ConsumeAndAddOpenParen(state.token, ParseNodeKind::ForHeaderStart());
  1217. state.state = ParserState::StatementForHeaderIn();
  1218. if (PositionIs(TokenKind::Var())) {
  1219. PushState(state);
  1220. PushState(ParserState::VarAsFor());
  1221. } else {
  1222. CARBON_DIAGNOSTIC(ExpectedVariableDeclaration, Error,
  1223. "Expected `var` declaration.");
  1224. emitter_->Emit(*position_, ExpectedVariableDeclaration);
  1225. if (auto next_in = FindNextOf({TokenKind::In()})) {
  1226. SkipTo(*next_in);
  1227. ++position_;
  1228. }
  1229. state.has_error = true;
  1230. PushState(state);
  1231. }
  1232. }
  1233. auto Parser::HandleStatementForHeaderInState() -> void {
  1234. auto state = PopState();
  1235. state.state = ParserState::StatementForHeaderFinish();
  1236. PushState(state);
  1237. PushState(ParserState::Expression());
  1238. }
  1239. auto Parser::HandleStatementForHeaderFinishState() -> void {
  1240. auto state = PopState();
  1241. ConsumeAndAddCloseParen(state, ParseNodeKind::ForHeader());
  1242. PushState(ParserState::CodeBlock());
  1243. }
  1244. auto Parser::HandleStatementForFinishState() -> void {
  1245. auto state = PopState();
  1246. AddNode(ParseNodeKind::ForStatement(), state.token, state.subtree_start,
  1247. state.has_error);
  1248. }
  1249. auto Parser::HandleStatementIfState() -> void {
  1250. PopAndDiscardState();
  1251. PushState(ParserState::StatementIfConditionFinish());
  1252. PushState(ParserState::ParenConditionAsIf());
  1253. ++position_;
  1254. }
  1255. auto Parser::HandleStatementIfConditionFinishState() -> void {
  1256. auto state = PopState();
  1257. state.state = ParserState::StatementIfThenBlockFinish();
  1258. PushState(state);
  1259. PushState(ParserState::CodeBlock());
  1260. }
  1261. auto Parser::HandleStatementIfThenBlockFinishState() -> void {
  1262. auto state = PopState();
  1263. if (ConsumeAndAddLeafNodeIf(TokenKind::Else(),
  1264. ParseNodeKind::IfStatementElse())) {
  1265. state.state = ParserState::StatementIfElseBlockFinish();
  1266. PushState(state);
  1267. // `else if` is permitted as a special case.
  1268. PushState(PositionIs(TokenKind::If()) ? ParserState::StatementIf()
  1269. : ParserState::CodeBlock());
  1270. } else {
  1271. AddNode(ParseNodeKind::IfStatement(), state.token, state.subtree_start,
  1272. state.has_error);
  1273. }
  1274. }
  1275. auto Parser::HandleStatementIfElseBlockFinishState() -> void {
  1276. auto state = PopState();
  1277. AddNode(ParseNodeKind::IfStatement(), state.token, state.subtree_start,
  1278. state.has_error);
  1279. }
  1280. auto Parser::HandleStatementKeywordFinish(ParseNodeKind node_kind) -> void {
  1281. auto state = PopState();
  1282. auto semi = ConsumeIf(TokenKind::Semi());
  1283. if (!semi) {
  1284. CARBON_DIAGNOSTIC(ExpectedSemiAfter, Error, "Expected `;` after `{0}`.",
  1285. TokenKind);
  1286. emitter_->Emit(*position_, ExpectedSemiAfter,
  1287. tokens_->GetKind(state.token));
  1288. state.has_error = true;
  1289. // Recover to the next semicolon if possible, otherwise indicate the
  1290. // keyword for the error.
  1291. semi = SkipPastLikelyEnd(state.token);
  1292. if (!semi) {
  1293. semi = state.token;
  1294. }
  1295. }
  1296. AddNode(node_kind, *semi, state.subtree_start, state.has_error);
  1297. }
  1298. auto Parser::HandleStatementReturnState() -> void {
  1299. auto state = PopState();
  1300. state.state = ParserState::StatementReturnFinish();
  1301. PushState(state);
  1302. AddLeafNode(ParseNodeKind::ReturnStatementStart(), Consume());
  1303. if (!PositionIs(TokenKind::Semi())) {
  1304. PushState(ParserState::Expression());
  1305. }
  1306. }
  1307. auto Parser::HandleStatementReturnFinishState() -> void {
  1308. HandleStatementKeywordFinish(ParseNodeKind::ReturnStatement());
  1309. }
  1310. auto Parser::HandleStatementScopeLoopState() -> void {
  1311. // This maintains the current state until we're at the end of the scope.
  1312. auto token_kind = PositionKind();
  1313. if (token_kind == TokenKind::CloseCurlyBrace()) {
  1314. auto state = PopState();
  1315. if (state.has_error) {
  1316. ReturnErrorOnState();
  1317. }
  1318. } else {
  1319. PushState(ParserState::Statement());
  1320. }
  1321. }
  1322. auto Parser::HandleStatementWhileState() -> void {
  1323. PopAndDiscardState();
  1324. PushState(ParserState::StatementWhileConditionFinish());
  1325. PushState(ParserState::ParenConditionAsWhile());
  1326. ++position_;
  1327. }
  1328. auto Parser::HandleStatementWhileConditionFinishState() -> void {
  1329. auto state = PopState();
  1330. state.state = ParserState::StatementWhileBlockFinish();
  1331. PushState(state);
  1332. PushState(ParserState::CodeBlock());
  1333. }
  1334. auto Parser::HandleStatementWhileBlockFinishState() -> void {
  1335. auto state = PopState();
  1336. AddNode(ParseNodeKind::WhileStatement(), state.token, state.subtree_start,
  1337. state.has_error);
  1338. }
  1339. auto Parser::HandleVar(ParserState finish_state) -> void {
  1340. PopAndDiscardState();
  1341. // These will start at the `var`.
  1342. PushState(finish_state);
  1343. PushState(ParserState::VarAfterPattern());
  1344. AddLeafNode(ParseNodeKind::VariableIntroducer(), Consume());
  1345. // This will start at the pattern.
  1346. PushState(ParserState::PatternAsVariable());
  1347. }
  1348. auto Parser::HandleVarAsSemicolonState() -> void {
  1349. HandleVar(ParserState::VarFinishAsSemicolon());
  1350. }
  1351. auto Parser::HandleVarAsForState() -> void {
  1352. HandleVar(ParserState::VarFinishAsFor());
  1353. }
  1354. auto Parser::HandleVarAfterPatternState() -> void {
  1355. auto state = PopState();
  1356. if (state.has_error) {
  1357. if (auto after_pattern =
  1358. FindNextOf({TokenKind::Equal(), TokenKind::Semi()})) {
  1359. SkipTo(*after_pattern);
  1360. }
  1361. }
  1362. if (PositionIs(TokenKind::Equal())) {
  1363. PushState(ParserState::VarAfterInitializer());
  1364. ++position_;
  1365. PushState(ParserState::Expression());
  1366. return;
  1367. }
  1368. }
  1369. auto Parser::HandleVarAfterInitializerState() -> void {
  1370. auto state = PopState();
  1371. AddNode(ParseNodeKind::VariableInitializer(), state.token,
  1372. state.subtree_start, state.has_error);
  1373. }
  1374. auto Parser::HandleVarFinishAsSemicolonState() -> void {
  1375. auto state = PopState();
  1376. auto end_token = state.token;
  1377. if (PositionIs(TokenKind::Semi())) {
  1378. end_token = Consume();
  1379. } else {
  1380. emitter_->Emit(*position_, ExpectedSemiAfterExpression);
  1381. state.has_error = true;
  1382. if (auto semi_token = SkipPastLikelyEnd(state.token)) {
  1383. end_token = *semi_token;
  1384. }
  1385. }
  1386. AddNode(ParseNodeKind::VariableDeclaration(), end_token, state.subtree_start,
  1387. state.has_error);
  1388. }
  1389. auto Parser::HandleVarFinishAsForState() -> void {
  1390. auto state = PopState();
  1391. auto end_token = state.token;
  1392. if (PositionIs(TokenKind::In())) {
  1393. end_token = Consume();
  1394. } else if (PositionIs(TokenKind::Colon())) {
  1395. CARBON_DIAGNOSTIC(ExpectedIn, Error, "`:` should be replaced by `in`.");
  1396. emitter_->Emit(*position_, ExpectedIn);
  1397. state.has_error = true;
  1398. end_token = Consume();
  1399. } else {
  1400. CARBON_DIAGNOSTIC(ExpectedIn, Error,
  1401. "Expected `in` after loop `var` declaration.");
  1402. emitter_->Emit(*position_, ExpectedIn);
  1403. state.has_error = true;
  1404. }
  1405. AddNode(ParseNodeKind::ForIn(), end_token, state.subtree_start,
  1406. state.has_error);
  1407. }
  1408. auto Parser::HandleInterfaceIntroducerState() -> void {
  1409. auto state = PopState();
  1410. if (!ConsumeAndAddLeafNodeIf(TokenKind::Identifier(),
  1411. ParseNodeKind::DeclaredName())) {
  1412. CARBON_DIAGNOSTIC(ExpectedInterfaceName, Error,
  1413. "Expected interface name after `interface` keyword.");
  1414. emitter_->Emit(*position_, ExpectedInterfaceName);
  1415. state.has_error = true;
  1416. // Add a name node even when it's not present because it's used for subtree
  1417. // bracketing on interfaces.
  1418. // TODO: Either fix this or normalize it, still deciding on the right
  1419. // approach.
  1420. AddLeafNode(ParseNodeKind::DeclaredName(), state.token, /*has_error=*/true);
  1421. }
  1422. bool parse_body = true;
  1423. if (!PositionIs(TokenKind::OpenCurlyBrace())) {
  1424. CARBON_DIAGNOSTIC(ExpectedInterfaceOpenCurlyBrace, Error,
  1425. "Expected `{{` to start interface definition.");
  1426. emitter_->Emit(*position_, ExpectedInterfaceOpenCurlyBrace);
  1427. state.has_error = true;
  1428. SkipPastLikelyEnd(state.token);
  1429. parse_body = false;
  1430. }
  1431. state.state = ParserState::InterfaceDefinitionFinish();
  1432. PushState(state);
  1433. if (parse_body) {
  1434. PushState(ParserState::InterfaceDefinitionLoop());
  1435. AddLeafNode(ParseNodeKind::InterfaceBodyStart(), Consume());
  1436. }
  1437. }
  1438. auto Parser::HandleInterfaceDefinitionLoopState() -> void {
  1439. // This maintains the current state unless we're at the end of the interface
  1440. // definition.
  1441. switch (PositionKind()) {
  1442. case TokenKind::CloseCurlyBrace(): {
  1443. auto state = PopState();
  1444. AddNode(ParseNodeKind::InterfaceBody(), Consume(), state.subtree_start,
  1445. state.has_error);
  1446. break;
  1447. }
  1448. // TODO: Handle possible declarations inside interface body.
  1449. default: {
  1450. CARBON_DIAGNOSTIC(UnrecognizedDeclaration, Error,
  1451. "Unrecognized declaration introducer.");
  1452. emitter_->Emit(*position_, UnrecognizedDeclaration);
  1453. if (auto semi = SkipPastLikelyEnd(*position_)) {
  1454. AddLeafNode(ParseNodeKind::EmptyDeclaration(), *semi,
  1455. /*has_error=*/true);
  1456. } else {
  1457. ReturnErrorOnState();
  1458. }
  1459. break;
  1460. }
  1461. }
  1462. }
  1463. auto Parser::HandleInterfaceDefinitionFinishState() -> void {
  1464. auto state = PopState();
  1465. AddNode(ParseNodeKind::InterfaceDefinition(), state.token,
  1466. state.subtree_start, state.has_error);
  1467. }
  1468. } // namespace Carbon