parser.cpp 56 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
37047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126112711281129113011311132113311341135113611371138113911401141114211431144114511461147114811491150115111521153115411551156115711581159116011611162116311641165116611671168116911701171117211731174117511761177117811791180118111821183118411851186118711881189119011911192119311941195119611971198119912001201120212031204120512061207120812091210121112121213121412151216121712181219122012211222122312241225122612271228122912301231123212331234123512361237123812391240124112421243124412451246124712481249125012511252125312541255125612571258125912601261126212631264126512661267126812691270127112721273127412751276127
7127812791280128112821283128412851286128712881289129012911292129312941295129612971298129913001301130213031304130513061307130813091310131113121313131413151316131713181319132013211322132313241325132613271328132913301331133213331334133513361337133813391340134113421343134413451346134713481349135013511352135313541355135613571358135913601361136213631364136513661367136813691370137113721373137413751376137713781379138013811382138313841385138613871388138913901391139213931394139513961397139813991400140114021403140414051406140714081409141014111412141314141415141614171418141914201421142214231424142514261427142814291430143114321433143414351436143714381439144014411442144314441445144614471448144914501451145214531454145514561457145814591460146114621463146414651466146714681469147014711472147314741475147614771478147914801481148214831484148514861487148814891490149114921493149414951496149714981499150015011502150315041505150615071508150915101511151215131514151515161517151815191520152115221523152415251526152715281529153015311532153315341535153615371538153915401541154215431544154515461547154815491550155115521553155415551556155715581559156015611562156315641565156615671568156915701571157215731574157515761577157815791580158115821583158415851586158715881589159015911592159315941595159615971598159916001601160216031604160516061607160816091610161116121613161416151616161716181619162016211622162316241625162616271628162916301631163216331634163516361637163816391640164116421643164416451646164716481649165016511652165316541655165616571658165916601661166216631664166516661667166816691670167116721673167416751676167716781679168016811682168316841685168616871688168916901691169216931694169516961697169816991700170117021703170417051706170717081709171017111712171317141715171617171718171917201721172217231724172517261727172817291730173117321733
  1. // Part of the Carbon Language project, under the Apache License v2.0 with LLVM
  2. // Exceptions. See /LICENSE for license information.
  3. // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
#include "toolchain/parser/parser.h"

#include <cstdint>
#include <cstdlib>
#include <memory>

#include "common/check.h"
#include "llvm/ADT/Optional.h"
#include "llvm/Support/PrettyStackTrace.h"
#include "toolchain/lexer/token_kind.h"
#include "toolchain/lexer/tokenized_buffer.h"
#include "toolchain/parser/parse_node_kind.h"
#include "toolchain/parser/parse_tree.h"
  14. namespace Carbon {
  15. // May be emitted a couple different ways as part of operator parsing.
  16. CARBON_DIAGNOSTIC(
  17. OperatorRequiresParentheses, Error,
  18. "Parentheses are required to disambiguate operator precedence.");
  19. CARBON_DIAGNOSTIC(ExpectedSemiAfterExpression, Error,
  20. "Expected `;` after expression.");
  21. // A relative location for characters in errors.
  22. enum class RelativeLocation : int8_t {
  23. Around,
  24. After,
  25. Before,
  26. };
  27. // Adapts RelativeLocation for use with formatv.
  28. static auto operator<<(llvm::raw_ostream& out, RelativeLocation loc)
  29. -> llvm::raw_ostream& {
  30. switch (loc) {
  31. case RelativeLocation::Around:
  32. out << "around";
  33. break;
  34. case RelativeLocation::After:
  35. out << "after";
  36. break;
  37. case RelativeLocation::Before:
  38. out << "before";
  39. break;
  40. }
  41. return out;
  42. }
  43. class Parser::PrettyStackTraceParseState : public llvm::PrettyStackTraceEntry {
  44. public:
  45. explicit PrettyStackTraceParseState(const Parser* parser) : parser_(parser) {}
  46. ~PrettyStackTraceParseState() override = default;
  47. auto print(llvm::raw_ostream& output) const -> void override {
  48. output << "Parser stack:\n";
  49. for (int i = 0; i < static_cast<int>(parser_->state_stack_.size()); ++i) {
  50. const auto& entry = parser_->state_stack_[i];
  51. output << "\t" << i << ".\t" << entry.state;
  52. Print(output, entry.token);
  53. }
  54. output << "\tcursor\tposition_";
  55. Print(output, *parser_->position_);
  56. }
  57. private:
  58. auto Print(llvm::raw_ostream& output, TokenizedBuffer::Token token) const
  59. -> void {
  60. auto line = parser_->tokens_->GetLine(token);
  61. output << " @ " << parser_->tokens_->GetLineNumber(line) << ":"
  62. << parser_->tokens_->GetColumnNumber(token) << ":"
  63. << " token " << token << " : "
  64. << parser_->tokens_->GetKind(token).Name() << "\n";
  65. }
  66. const Parser* parser_;
  67. };
  68. Parser::Parser(ParseTree& tree, TokenizedBuffer& tokens,
  69. TokenDiagnosticEmitter& emitter)
  70. : tree_(&tree),
  71. tokens_(&tokens),
  72. emitter_(&emitter),
  73. position_(tokens_->tokens().begin()),
  74. end_(tokens_->tokens().end()) {
  75. CARBON_CHECK(position_ != end_) << "Empty TokenizedBuffer";
  76. --end_;
  77. CARBON_CHECK(tokens_->GetKind(*end_) == TokenKind::EndOfFile())
  78. << "TokenizedBuffer should end with EndOfFile, ended with "
  79. << tokens_->GetKind(*end_).Name();
  80. }
  81. auto Parser::AddLeafNode(ParseNodeKind kind, TokenizedBuffer::Token token,
  82. bool has_error) -> void {
  83. tree_->node_impls_.push_back(
  84. ParseTree::NodeImpl(kind, has_error, token, /*subtree_size=*/1));
  85. if (has_error) {
  86. tree_->has_errors_ = true;
  87. }
  88. }
  89. auto Parser::AddNode(ParseNodeKind kind, TokenizedBuffer::Token token,
  90. int subtree_start, bool has_error) -> void {
  91. int subtree_size = tree_->size() - subtree_start + 1;
  92. tree_->node_impls_.push_back(
  93. ParseTree::NodeImpl(kind, has_error, token, subtree_size));
  94. if (has_error) {
  95. tree_->has_errors_ = true;
  96. }
  97. }
  98. auto Parser::ConsumeAndAddCloseParen(TokenizedBuffer::Token open_paren,
  99. ParseNodeKind close_kind) -> bool {
  100. if (ConsumeAndAddLeafNodeIf(TokenKind::CloseParen(), close_kind)) {
  101. return true;
  102. }
  103. // TODO: Include the location of the matching open_paren in the diagnostic.
  104. CARBON_DIAGNOSTIC(ExpectedCloseParen, Error, "Unexpected tokens before `)`.");
  105. emitter_->Emit(*position_, ExpectedCloseParen);
  106. SkipTo(tokens_->GetMatchedClosingToken(open_paren));
  107. AddLeafNode(close_kind, Consume());
  108. return false;
  109. }
  110. auto Parser::ConsumeAndAddLeafNodeIf(TokenKind token_kind,
  111. ParseNodeKind node_kind) -> bool {
  112. auto token = ConsumeIf(token_kind);
  113. if (!token) {
  114. return false;
  115. }
  116. AddLeafNode(node_kind, *token);
  117. return true;
  118. }
  119. auto Parser::ConsumeIf(TokenKind kind)
  120. -> llvm::Optional<TokenizedBuffer::Token> {
  121. if (!PositionIs(kind)) {
  122. return llvm::None;
  123. }
  124. return Consume();
  125. }
  126. auto Parser::FindNextOf(std::initializer_list<TokenKind> desired_kinds)
  127. -> llvm::Optional<TokenizedBuffer::Token> {
  128. auto new_position = position_;
  129. while (true) {
  130. TokenizedBuffer::Token token = *new_position;
  131. TokenKind kind = tokens_->GetKind(token);
  132. if (kind.IsOneOf(desired_kinds)) {
  133. return token;
  134. }
  135. // Step to the next token at the current bracketing level.
  136. if (kind.IsClosingSymbol() || kind == TokenKind::EndOfFile()) {
  137. // There are no more tokens at this level.
  138. return llvm::None;
  139. } else if (kind.IsOpeningSymbol()) {
  140. new_position = TokenizedBuffer::TokenIterator(
  141. tokens_->GetMatchedClosingToken(token));
  142. // Advance past the closing token.
  143. ++new_position;
  144. } else {
  145. ++new_position;
  146. }
  147. }
  148. }
  149. auto Parser::SkipMatchingGroup() -> bool {
  150. if (!PositionKind().IsOpeningSymbol()) {
  151. return false;
  152. }
  153. SkipTo(tokens_->GetMatchedClosingToken(*position_));
  154. ++position_;
  155. return true;
  156. }
  157. auto Parser::SkipPastLikelyEnd(TokenizedBuffer::Token skip_root)
  158. -> llvm::Optional<TokenizedBuffer::Token> {
  159. if (position_ == end_) {
  160. return llvm::None;
  161. }
  162. TokenizedBuffer::Line root_line = tokens_->GetLine(skip_root);
  163. int root_line_indent = tokens_->GetIndentColumnNumber(root_line);
  164. // We will keep scanning through tokens on the same line as the root or
  165. // lines with greater indentation than root's line.
  166. auto is_same_line_or_indent_greater_than_root =
  167. [&](TokenizedBuffer::Token t) {
  168. TokenizedBuffer::Line l = tokens_->GetLine(t);
  169. if (l == root_line) {
  170. return true;
  171. }
  172. return tokens_->GetIndentColumnNumber(l) > root_line_indent;
  173. };
  174. do {
  175. if (PositionIs(TokenKind::CloseCurlyBrace())) {
  176. // Immediately bail out if we hit an unmatched close curly, this will
  177. // pop us up a level of the syntax grouping.
  178. return llvm::None;
  179. }
  180. // We assume that a semicolon is always intended to be the end of the
  181. // current construct.
  182. if (auto semi = ConsumeIf(TokenKind::Semi())) {
  183. return semi;
  184. }
  185. // Skip over any matching group of tokens_->
  186. if (SkipMatchingGroup()) {
  187. continue;
  188. }
  189. // Otherwise just step forward one token.
  190. ++position_;
  191. } while (position_ != end_ &&
  192. is_same_line_or_indent_greater_than_root(*position_));
  193. return llvm::None;
  194. }
  195. auto Parser::SkipTo(TokenizedBuffer::Token t) -> void {
  196. CARBON_CHECK(t >= *position_) << "Tried to skip backwards from " << position_
  197. << " to " << TokenizedBuffer::TokenIterator(t);
  198. position_ = TokenizedBuffer::TokenIterator(t);
  199. CARBON_CHECK(position_ != end_) << "Skipped past EOF.";
  200. }
  201. auto Parser::HandleCodeBlockState() -> void {
  202. PopAndDiscardState();
  203. PushState(ParserState::CodeBlockFinish());
  204. if (ConsumeAndAddLeafNodeIf(TokenKind::OpenCurlyBrace(),
  205. ParseNodeKind::CodeBlockStart())) {
  206. PushState(ParserState::StatementScopeLoop());
  207. } else {
  208. AddLeafNode(ParseNodeKind::CodeBlockStart(), *position_,
  209. /*has_error=*/true);
  210. // Recover by parsing a single statement.
  211. CARBON_DIAGNOSTIC(ExpectedCodeBlock, Error, "Expected braced code block.");
  212. emitter_->Emit(*position_, ExpectedCodeBlock);
  213. PushState(ParserState::Statement());
  214. }
  215. }
  216. // Determines whether the given token is considered to be the start of an
  217. // operand according to the rules for infix operator parsing.
  218. static auto IsAssumedStartOfOperand(TokenKind kind) -> bool {
  219. return kind.IsOneOf({TokenKind::OpenParen(), TokenKind::Identifier(),
  220. TokenKind::IntegerLiteral(), TokenKind::RealLiteral(),
  221. TokenKind::StringLiteral()});
  222. }
  223. // Determines whether the given token is considered to be the end of an
  224. // operand according to the rules for infix operator parsing.
  225. static auto IsAssumedEndOfOperand(TokenKind kind) -> bool {
  226. return kind.IsOneOf({TokenKind::CloseParen(), TokenKind::CloseCurlyBrace(),
  227. TokenKind::CloseSquareBracket(), TokenKind::Identifier(),
  228. TokenKind::IntegerLiteral(), TokenKind::RealLiteral(),
  229. TokenKind::StringLiteral()});
  230. }
  231. // Determines whether the given token could possibly be the start of an
  232. // operand. This is conservatively correct, and will never incorrectly return
  233. // `false`, but can incorrectly return `true`.
  234. static auto IsPossibleStartOfOperand(TokenKind kind) -> bool {
  235. return !kind.IsOneOf({TokenKind::CloseParen(), TokenKind::CloseCurlyBrace(),
  236. TokenKind::CloseSquareBracket(), TokenKind::Comma(),
  237. TokenKind::Semi(), TokenKind::Colon()});
  238. }
  239. auto Parser::IsLexicallyValidInfixOperator() -> bool {
  240. CARBON_CHECK(position_ != end_) << "Expected an operator token.";
  241. bool leading_space = tokens_->HasLeadingWhitespace(*position_);
  242. bool trailing_space = tokens_->HasTrailingWhitespace(*position_);
  243. // If there's whitespace on both sides, it's an infix operator.
  244. if (leading_space && trailing_space) {
  245. return true;
  246. }
  247. // If there's whitespace on exactly one side, it's not an infix operator.
  248. if (leading_space || trailing_space) {
  249. return false;
  250. }
  251. // Otherwise, for an infix operator, the preceding token must be any close
  252. // bracket, identifier, or literal and the next token must be an open paren,
  253. // identifier, or literal.
  254. if (position_ == tokens_->tokens().begin() ||
  255. !IsAssumedEndOfOperand(tokens_->GetKind(*(position_ - 1))) ||
  256. !IsAssumedStartOfOperand(tokens_->GetKind(*(position_ + 1)))) {
  257. return false;
  258. }
  259. return true;
  260. }
  261. auto Parser::IsTrailingOperatorInfix() -> bool {
  262. if (position_ == end_) {
  263. return false;
  264. }
  265. // An operator that follows the infix operator rules is parsed as
  266. // infix, unless the next token means that it can't possibly be.
  267. if (IsLexicallyValidInfixOperator() &&
  268. IsPossibleStartOfOperand(tokens_->GetKind(*(position_ + 1)))) {
  269. return true;
  270. }
  271. // A trailing operator with leading whitespace that's not valid as infix is
  272. // not valid at all. If the next token looks like the start of an operand,
  273. // then parse as infix, otherwise as postfix. Either way we'll produce a
  274. // diagnostic later on.
  275. if (tokens_->HasLeadingWhitespace(*position_) &&
  276. IsAssumedStartOfOperand(tokens_->GetKind(*(position_ + 1)))) {
  277. return true;
  278. }
  279. return false;
  280. }
  281. auto Parser::DiagnoseOperatorFixity(OperatorFixity fixity) -> void {
  282. if (fixity == OperatorFixity::Infix) {
  283. // Infix operators must satisfy the infix operator rules.
  284. if (!IsLexicallyValidInfixOperator()) {
  285. CARBON_DIAGNOSTIC(BinaryOperatorRequiresWhitespace, Error,
  286. "Whitespace missing {0} binary operator.",
  287. RelativeLocation);
  288. emitter_->Emit(*position_, BinaryOperatorRequiresWhitespace,
  289. tokens_->HasLeadingWhitespace(*position_)
  290. ? RelativeLocation::After
  291. : (tokens_->HasTrailingWhitespace(*position_)
  292. ? RelativeLocation::Before
  293. : RelativeLocation::Around));
  294. }
  295. } else {
  296. bool prefix = fixity == OperatorFixity::Prefix;
  297. // Whitespace is not permitted between a symbolic pre/postfix operator and
  298. // its operand.
  299. if (PositionKind().IsSymbol() &&
  300. (prefix ? tokens_->HasTrailingWhitespace(*position_)
  301. : tokens_->HasLeadingWhitespace(*position_))) {
  302. CARBON_DIAGNOSTIC(UnaryOperatorHasWhitespace, Error,
  303. "Whitespace is not allowed {0} this unary operator.",
  304. RelativeLocation);
  305. emitter_->Emit(
  306. *position_, UnaryOperatorHasWhitespace,
  307. prefix ? RelativeLocation::After : RelativeLocation::Before);
  308. }
  309. // Pre/postfix operators must not satisfy the infix operator rules.
  310. if (IsLexicallyValidInfixOperator()) {
  311. CARBON_DIAGNOSTIC(UnaryOperatorRequiresWhitespace, Error,
  312. "Whitespace is required {0} this unary operator.",
  313. RelativeLocation);
  314. emitter_->Emit(
  315. *position_, UnaryOperatorRequiresWhitespace,
  316. prefix ? RelativeLocation::Before : RelativeLocation::After);
  317. }
  318. }
  319. }
  320. auto Parser::ConsumeListToken(ParseNodeKind comma_kind, TokenKind close_kind,
  321. bool already_has_error) -> ListTokenKind {
  322. if (!PositionIs(TokenKind::Comma()) && !PositionIs(close_kind)) {
  323. // Don't error a second time on the same element.
  324. if (!already_has_error) {
  325. CARBON_DIAGNOSTIC(UnexpectedTokenAfterListElement, Error,
  326. "Expected `,` or `{0}`.", TokenKind);
  327. emitter_->Emit(*position_, UnexpectedTokenAfterListElement, close_kind);
  328. ReturnErrorOnState();
  329. }
  330. // Recover from the invalid token.
  331. auto end_of_element = FindNextOf({TokenKind::Comma(), close_kind});
  332. // The lexer guarantees that parentheses are balanced.
  333. CARBON_CHECK(end_of_element)
  334. << "missing matching `" << close_kind.GetOpeningSymbol() << "` for `"
  335. << close_kind << "`";
  336. SkipTo(*end_of_element);
  337. }
  338. if (PositionIs(close_kind)) {
  339. return ListTokenKind::Close;
  340. } else {
  341. AddLeafNode(comma_kind, Consume());
  342. return PositionIs(close_kind) ? ListTokenKind::CommaClose
  343. : ListTokenKind::Comma;
  344. }
  345. }
  346. auto Parser::Parse() -> void {
  347. // Traces state_stack_. This runs even in opt because it's low overhead.
  348. PrettyStackTraceParseState pretty_stack(this);
  349. PushState(ParserState::DeclarationLoop());
  350. while (!state_stack_.empty()) {
  351. switch (state_stack_.back().state) {
  352. #define CARBON_PARSER_STATE(Name) \
  353. case ParserState::Name(): \
  354. Handle##Name##State(); \
  355. break;
  356. #include "toolchain/parser/parser_state.def"
  357. }
  358. }
  359. AddLeafNode(ParseNodeKind::FileEnd(), *position_);
  360. }
  361. auto Parser::HandleBraceExpressionState() -> void {
  362. auto state = PopState();
  363. state.state = ParserState::BraceExpressionFinishAsUnknown();
  364. PushState(state);
  365. CARBON_CHECK(ConsumeAndAddLeafNodeIf(
  366. TokenKind::OpenCurlyBrace(),
  367. ParseNodeKind::StructLiteralOrStructTypeLiteralStart()));
  368. if (!PositionIs(TokenKind::CloseCurlyBrace())) {
  369. PushState(ParserState::BraceExpressionParameterAsUnknown());
  370. }
  371. }
  372. auto Parser::BraceExpressionKindToParserState(BraceExpressionKind kind,
  373. ParserState type,
  374. ParserState value,
  375. ParserState unknown)
  376. -> ParserState {
  377. switch (kind) {
  378. case BraceExpressionKind::Type: {
  379. return type;
  380. }
  381. case BraceExpressionKind::Value: {
  382. return value;
  383. }
  384. case BraceExpressionKind::Unknown: {
  385. return unknown;
  386. }
  387. }
  388. }
  389. auto Parser::HandleBraceExpressionParameterError(StateStackEntry state,
  390. BraceExpressionKind kind)
  391. -> void {
  392. CARBON_DIAGNOSTIC(ExpectedStructLiteralField, Error, "Expected {0}{1}{2}.",
  393. llvm::StringRef, llvm::StringRef, llvm::StringRef);
  394. bool can_be_type = kind != BraceExpressionKind::Value;
  395. bool can_be_value = kind != BraceExpressionKind::Type;
  396. emitter_->Emit(*position_, ExpectedStructLiteralField,
  397. can_be_type ? "`.field: type`" : "",
  398. (can_be_type && can_be_value) ? " or " : "",
  399. can_be_value ? "`.field = value`" : "");
  400. state.state = BraceExpressionKindToParserState(
  401. kind, ParserState::BraceExpressionParameterFinishAsType(),
  402. ParserState::BraceExpressionParameterFinishAsValue(),
  403. ParserState::BraceExpressionParameterFinishAsUnknown());
  404. state.has_error = true;
  405. PushState(state);
  406. }
  407. auto Parser::HandleBraceExpressionParameter(BraceExpressionKind kind) -> void {
  408. auto state = PopState();
  409. if (!PositionIs(TokenKind::Period())) {
  410. HandleBraceExpressionParameterError(state, kind);
  411. return;
  412. }
  413. state.state = BraceExpressionKindToParserState(
  414. kind, ParserState::BraceExpressionParameterAfterDesignatorAsType(),
  415. ParserState::BraceExpressionParameterAfterDesignatorAsValue(),
  416. ParserState::BraceExpressionParameterAfterDesignatorAsUnknown());
  417. PushState(state);
  418. PushState(ParserState::DesignatorAsStruct());
  419. }
  420. auto Parser::HandleBraceExpressionParameterAsTypeState() -> void {
  421. HandleBraceExpressionParameter(BraceExpressionKind::Type);
  422. }
  423. auto Parser::HandleBraceExpressionParameterAsValueState() -> void {
  424. HandleBraceExpressionParameter(BraceExpressionKind::Value);
  425. }
  426. auto Parser::HandleBraceExpressionParameterAsUnknownState() -> void {
  427. HandleBraceExpressionParameter(BraceExpressionKind::Unknown);
  428. }
  429. auto Parser::HandleBraceExpressionParameterAfterDesignator(
  430. BraceExpressionKind kind) -> void {
  431. auto state = PopState();
  432. if (state.has_error) {
  433. auto recovery_pos = FindNextOf(
  434. {TokenKind::Equal(), TokenKind::Colon(), TokenKind::Comma()});
  435. if (!recovery_pos ||
  436. tokens_->GetKind(*recovery_pos) == TokenKind::Comma()) {
  437. state.state = BraceExpressionKindToParserState(
  438. kind, ParserState::BraceExpressionParameterFinishAsType(),
  439. ParserState::BraceExpressionParameterFinishAsValue(),
  440. ParserState::BraceExpressionParameterFinishAsUnknown());
  441. PushState(state);
  442. return;
  443. }
  444. SkipTo(*recovery_pos);
  445. }
  446. // Work out the kind of this element.
  447. auto elem_kind = BraceExpressionKind::Unknown;
  448. if (PositionIs(TokenKind::Colon())) {
  449. elem_kind = BraceExpressionKind::Type;
  450. } else if (PositionIs(TokenKind::Equal())) {
  451. elem_kind = BraceExpressionKind::Value;
  452. }
  453. // Unknown kinds and changes between type and value are errors.
  454. if (elem_kind == BraceExpressionKind::Unknown ||
  455. (kind != BraceExpressionKind::Unknown && elem_kind != kind)) {
  456. HandleBraceExpressionParameterError(state, kind);
  457. return;
  458. }
  459. // If we're setting the kind, update the BraceExpressionFinish state.
  460. if (kind == BraceExpressionKind::Unknown) {
  461. kind = elem_kind;
  462. auto finish_state = PopState();
  463. CARBON_CHECK(finish_state.state ==
  464. ParserState::BraceExpressionFinishAsUnknown());
  465. finish_state.state = BraceExpressionKindToParserState(
  466. kind, ParserState::BraceExpressionFinishAsType(),
  467. ParserState::BraceExpressionFinishAsValue(),
  468. ParserState::BraceExpressionFinishAsUnknown());
  469. PushState(finish_state);
  470. }
  471. state.state = BraceExpressionKindToParserState(
  472. kind, ParserState::BraceExpressionParameterFinishAsType(),
  473. ParserState::BraceExpressionParameterFinishAsValue(),
  474. ParserState::BraceExpressionParameterFinishAsUnknown());
  475. state.token = Consume();
  476. // Struct type fields and value fields use the same grammar except
  477. // that one has a `:` separator and the other has an `=` separator.
  478. PushState(state);
  479. PushState(ParserState::Expression());
  480. }
  481. auto Parser::HandleBraceExpressionParameterAfterDesignatorAsTypeState()
  482. -> void {
  483. HandleBraceExpressionParameterAfterDesignator(BraceExpressionKind::Type);
  484. }
  485. auto Parser::HandleBraceExpressionParameterAfterDesignatorAsValueState()
  486. -> void {
  487. HandleBraceExpressionParameterAfterDesignator(BraceExpressionKind::Value);
  488. }
  489. auto Parser::HandleBraceExpressionParameterAfterDesignatorAsUnknownState()
  490. -> void {
  491. HandleBraceExpressionParameterAfterDesignator(BraceExpressionKind::Unknown);
  492. }
  493. auto Parser::HandleBraceExpressionParameterFinish(BraceExpressionKind kind)
  494. -> void {
  495. auto state = PopState();
  496. AddNode(kind == BraceExpressionKind::Type ? ParseNodeKind::StructFieldType()
  497. : ParseNodeKind::StructFieldValue(),
  498. state.token, state.subtree_start, state.has_error);
  499. if (ConsumeListToken(ParseNodeKind::StructComma(),
  500. TokenKind::CloseCurlyBrace(),
  501. state.has_error) == ListTokenKind::Comma) {
  502. PushState(BraceExpressionKindToParserState(
  503. kind, ParserState::BraceExpressionParameterAsType(),
  504. ParserState::BraceExpressionParameterAsValue(),
  505. ParserState::BraceExpressionParameterAsUnknown()));
  506. }
  507. }
  508. auto Parser::HandleBraceExpressionParameterFinishAsTypeState() -> void {
  509. HandleBraceExpressionParameterFinish(BraceExpressionKind::Type);
  510. }
  511. auto Parser::HandleBraceExpressionParameterFinishAsValueState() -> void {
  512. HandleBraceExpressionParameterFinish(BraceExpressionKind::Value);
  513. }
  514. auto Parser::HandleBraceExpressionParameterFinishAsUnknownState() -> void {
  515. HandleBraceExpressionParameterFinish(BraceExpressionKind::Unknown);
  516. }
  517. auto Parser::HandleBraceExpressionFinish(BraceExpressionKind kind) -> void {
  518. auto state = PopState();
  519. AddNode(kind == BraceExpressionKind::Type ? ParseNodeKind::StructTypeLiteral()
  520. : ParseNodeKind::StructLiteral(),
  521. Consume(), state.subtree_start, state.has_error);
  522. }
  523. auto Parser::HandleBraceExpressionFinishAsTypeState() -> void {
  524. HandleBraceExpressionFinish(BraceExpressionKind::Type);
  525. }
  526. auto Parser::HandleBraceExpressionFinishAsValueState() -> void {
  527. HandleBraceExpressionFinish(BraceExpressionKind::Value);
  528. }
  529. auto Parser::HandleBraceExpressionFinishAsUnknownState() -> void {
  530. HandleBraceExpressionFinish(BraceExpressionKind::Unknown);
  531. }
  532. auto Parser::HandleCallExpressionState() -> void {
  533. auto state = PopState();
  534. // TODO: When swapping () start/end, this should AddLeafNode the open before
  535. // continuing.
  536. state.state = ParserState::CallExpressionFinish();
  537. PushState(state);
  538. // Advance past the open paren.
  539. ++position_;
  540. if (!PositionIs(TokenKind::CloseParen())) {
  541. PushState(ParserState::CallExpressionParameterFinish());
  542. PushState(ParserState::Expression());
  543. }
  544. }
  545. auto Parser::HandleCallExpressionParameterFinishState() -> void {
  546. auto state = PopState();
  547. if (state.has_error) {
  548. ReturnErrorOnState();
  549. }
  550. if (ConsumeListToken(ParseNodeKind::CallExpressionComma(),
  551. TokenKind::CloseParen(),
  552. state.has_error) == ListTokenKind::Comma) {
  553. PushState(ParserState::CallExpressionParameterFinish());
  554. PushState(ParserState::Expression());
  555. }
  556. }
  557. auto Parser::HandleCallExpressionFinishState() -> void {
  558. auto state = PopState();
  559. AddLeafNode(ParseNodeKind::CallExpressionEnd(), Consume());
  560. AddNode(ParseNodeKind::CallExpression(), state.token, state.subtree_start,
  561. state.has_error);
  562. }
  563. auto Parser::HandleCodeBlockFinishState() -> void {
  564. auto state = PopState();
  565. // If the block started with an open curly, this is a close curly.
  566. if (tokens_->GetKind(state.token) == TokenKind::OpenCurlyBrace()) {
  567. AddNode(ParseNodeKind::CodeBlock(), Consume(), state.subtree_start,
  568. state.has_error);
  569. } else {
  570. AddNode(ParseNodeKind::CodeBlock(), state.token, state.subtree_start,
  571. /*has_error=*/true);
  572. }
  573. }
  574. auto Parser::HandleDeclarationLoopState() -> void {
  575. // This maintains the current state unless we're at the end of the file.
  576. switch (PositionKind()) {
  577. case TokenKind::EndOfFile(): {
  578. PopAndDiscardState();
  579. break;
  580. }
  581. case TokenKind::Fn(): {
  582. PushState(ParserState::FunctionIntroducer());
  583. AddLeafNode(ParseNodeKind::FunctionIntroducer(), Consume());
  584. break;
  585. }
  586. case TokenKind::Package(): {
  587. PushState(ParserState::Package());
  588. ++position_;
  589. break;
  590. }
  591. case TokenKind::Semi(): {
  592. AddLeafNode(ParseNodeKind::EmptyDeclaration(), Consume());
  593. break;
  594. }
  595. case TokenKind::Var(): {
  596. PushState(ParserState::VarAsRequireSemicolon());
  597. break;
  598. }
  599. case TokenKind::Interface(): {
  600. PushState(ParserState::InterfaceIntroducer());
  601. ++position_;
  602. break;
  603. }
  604. default: {
  605. CARBON_DIAGNOSTIC(UnrecognizedDeclaration, Error,
  606. "Unrecognized declaration introducer.");
  607. emitter_->Emit(*position_, UnrecognizedDeclaration);
  608. auto cursor = *position_;
  609. auto semi = SkipPastLikelyEnd(cursor);
  610. // Locate the EmptyDeclaration at the semi when found, but use the
  611. // original cursor location for an error when not.
  612. AddLeafNode(ParseNodeKind::EmptyDeclaration(), semi ? *semi : cursor,
  613. /*has_error=*/true);
  614. break;
  615. }
  616. }
  617. }
  618. auto Parser::HandleDesignator(bool as_struct) -> void {
  619. auto state = PopState();
  620. // `.` identifier
  621. auto dot = ConsumeIf(TokenKind::Period());
  622. CARBON_CHECK(dot);
  623. if (!ConsumeAndAddLeafNodeIf(TokenKind::Identifier(),
  624. ParseNodeKind::DesignatedName())) {
  625. CARBON_DIAGNOSTIC(ExpectedIdentifierAfterDot, Error,
  626. "Expected identifier after `.`.");
  627. emitter_->Emit(*position_, ExpectedIdentifierAfterDot);
  628. // If we see a keyword, assume it was intended to be the designated name.
  629. // TODO: Should keywords be valid in designators?
  630. if (PositionKind().IsKeyword()) {
  631. AddLeafNode(ParseNodeKind::DesignatedName(), Consume(),
  632. /*has_error=*/true);
  633. } else {
  634. state.has_error = true;
  635. ReturnErrorOnState();
  636. }
  637. }
  638. AddNode(as_struct ? ParseNodeKind::StructFieldDesignator()
  639. : ParseNodeKind::DesignatorExpression(),
  640. *dot, state.subtree_start, state.has_error);
  641. }
  642. auto Parser::HandleDesignatorAsExpressionState() -> void {
  643. HandleDesignator(/*as_struct=*/false);
  644. }
  645. auto Parser::HandleDesignatorAsStructState() -> void {
  646. HandleDesignator(/*as_struct=*/true);
  647. }
  648. auto Parser::HandleExpressionState() -> void {
  649. auto state = PopState();
  650. // Check for a prefix operator.
  651. if (auto operator_precedence = PrecedenceGroup::ForLeading(PositionKind())) {
  652. if (PrecedenceGroup::GetPriority(state.ambient_precedence,
  653. *operator_precedence) !=
  654. OperatorPriority::RightFirst) {
  655. // The precedence rules don't permit this prefix operator in this
  656. // context. Diagnose this, but carry on and parse it anyway.
  657. emitter_->Emit(*position_, OperatorRequiresParentheses);
  658. } else {
  659. // Check that this operator follows the proper whitespace rules.
  660. DiagnoseOperatorFixity(OperatorFixity::Prefix);
  661. }
  662. PushStateForExpressionLoop(ParserState::ExpressionLoopForPrefix(),
  663. state.ambient_precedence, *operator_precedence);
  664. ++position_;
  665. PushStateForExpression(*operator_precedence);
  666. } else {
  667. PushStateForExpressionLoop(ParserState::ExpressionLoop(),
  668. state.ambient_precedence,
  669. PrecedenceGroup::ForPostfixExpression());
  670. PushState(ParserState::ExpressionInPostfix());
  671. }
  672. }
  673. auto Parser::HandleExpressionInPostfixState() -> void {
  674. auto state = PopState();
  675. // Continue to the loop state.
  676. state.state = ParserState::ExpressionInPostfixLoop();
  677. // Parses a primary expression, which is either a terminal portion of an
  678. // expression tree, such as an identifier or literal, or a parenthesized
  679. // expression.
  680. switch (PositionKind()) {
  681. case TokenKind::Identifier(): {
  682. AddLeafNode(ParseNodeKind::NameReference(), Consume());
  683. PushState(state);
  684. break;
  685. }
  686. case TokenKind::IntegerLiteral():
  687. case TokenKind::RealLiteral():
  688. case TokenKind::StringLiteral():
  689. case TokenKind::IntegerTypeLiteral():
  690. case TokenKind::UnsignedIntegerTypeLiteral():
  691. case TokenKind::FloatingPointTypeLiteral(): {
  692. AddLeafNode(ParseNodeKind::Literal(), Consume());
  693. PushState(state);
  694. break;
  695. }
  696. case TokenKind::OpenCurlyBrace(): {
  697. PushState(state);
  698. PushState(ParserState::BraceExpression());
  699. break;
  700. }
  701. case TokenKind::OpenParen(): {
  702. PushState(state);
  703. PushState(ParserState::ParenExpression());
  704. break;
  705. }
  706. default: {
  707. CARBON_DIAGNOSTIC(ExpectedExpression, Error, "Expected expression.");
  708. emitter_->Emit(*position_, ExpectedExpression);
  709. ReturnErrorOnState();
  710. break;
  711. }
  712. }
  713. }
  714. auto Parser::HandleExpressionInPostfixLoopState() -> void {
  715. // This is a cyclic state that repeats, so this state is typically pushed back
  716. // on.
  717. auto state = PopState();
  718. state.token = *position_;
  719. switch (PositionKind()) {
  720. case TokenKind::Period(): {
  721. PushState(state);
  722. state.state = ParserState::DesignatorAsExpression();
  723. PushState(state);
  724. break;
  725. }
  726. case TokenKind::OpenParen(): {
  727. PushState(state);
  728. state.state = ParserState::CallExpression();
  729. PushState(state);
  730. break;
  731. }
  732. default: {
  733. if (state.has_error) {
  734. ReturnErrorOnState();
  735. }
  736. break;
  737. }
  738. }
  739. }
  740. auto Parser::HandleExpressionLoopState() -> void {
  741. auto state = PopState();
  742. auto trailing_operator =
  743. PrecedenceGroup::ForTrailing(PositionKind(), IsTrailingOperatorInfix());
  744. if (!trailing_operator) {
  745. if (state.has_error) {
  746. ReturnErrorOnState();
  747. }
  748. return;
  749. }
  750. auto [operator_precedence, is_binary] = *trailing_operator;
  751. // TODO: If this operator is ambiguous with either the ambient precedence
  752. // or the LHS precedence, and there's a variant with a different fixity
  753. // that would work, use that one instead for error recovery.
  754. if (PrecedenceGroup::GetPriority(state.ambient_precedence,
  755. operator_precedence) !=
  756. OperatorPriority::RightFirst) {
  757. // The precedence rules don't permit this operator in this context. Try
  758. // again in the enclosing expression context.
  759. if (state.has_error) {
  760. ReturnErrorOnState();
  761. }
  762. return;
  763. }
  764. if (PrecedenceGroup::GetPriority(state.lhs_precedence, operator_precedence) !=
  765. OperatorPriority::LeftFirst) {
  766. // Either the LHS operator and this operator are ambiguous, or the
  767. // LHS operator is a unary operator that can't be nested within
  768. // this operator. Either way, parentheses are required.
  769. emitter_->Emit(*position_, OperatorRequiresParentheses);
  770. state.has_error = true;
  771. } else {
  772. DiagnoseOperatorFixity(is_binary ? OperatorFixity::Infix
  773. : OperatorFixity::Postfix);
  774. }
  775. state.token = Consume();
  776. state.lhs_precedence = operator_precedence;
  777. if (is_binary) {
  778. state.state = ParserState::ExpressionLoopForBinary();
  779. PushState(state);
  780. PushStateForExpression(operator_precedence);
  781. } else {
  782. AddNode(ParseNodeKind::PostfixOperator(), state.token, state.subtree_start,
  783. state.has_error);
  784. state.has_error = false;
  785. PushState(state);
  786. }
  787. }
  788. auto Parser::HandleExpressionLoopForBinaryState() -> void {
  789. auto state = PopState();
  790. AddNode(ParseNodeKind::InfixOperator(), state.token, state.subtree_start,
  791. state.has_error);
  792. state.state = ParserState::ExpressionLoop();
  793. state.has_error = false;
  794. PushState(state);
  795. }
  796. auto Parser::HandleExpressionLoopForPrefixState() -> void {
  797. auto state = PopState();
  798. AddNode(ParseNodeKind::PrefixOperator(), state.token, state.subtree_start,
  799. state.has_error);
  800. state.state = ParserState::ExpressionLoop();
  801. state.has_error = false;
  802. PushState(state);
  803. }
  804. auto Parser::HandleExpressionStatementFinishState() -> void {
  805. auto state = PopState();
  806. if (auto semi = ConsumeIf(TokenKind::Semi())) {
  807. AddNode(ParseNodeKind::ExpressionStatement(), *semi, state.subtree_start,
  808. state.has_error);
  809. return;
  810. }
  811. if (!state.has_error) {
  812. emitter_->Emit(*position_, ExpectedSemiAfterExpression);
  813. }
  814. if (auto semi_token = SkipPastLikelyEnd(state.token)) {
  815. AddNode(ParseNodeKind::ExpressionStatement(), *semi_token,
  816. state.subtree_start,
  817. /*has_error=*/true);
  818. return;
  819. }
  820. // Found junk not even followed by a `;`, no node to add.
  821. ReturnErrorOnState();
  822. }
  823. auto Parser::HandleFunctionError(StateStackEntry state,
  824. bool skip_past_likely_end) -> void {
  825. auto token = state.token;
  826. if (skip_past_likely_end) {
  827. if (auto semi = SkipPastLikelyEnd(token)) {
  828. token = *semi;
  829. }
  830. }
  831. AddNode(ParseNodeKind::FunctionDeclaration(), token, state.subtree_start,
  832. /*has_error=*/true);
  833. }
  834. auto Parser::HandleFunctionIntroducerState() -> void {
  835. auto state = PopState();
  836. if (!ConsumeAndAddLeafNodeIf(TokenKind::Identifier(),
  837. ParseNodeKind::DeclaredName())) {
  838. CARBON_DIAGNOSTIC(ExpectedFunctionName, Error,
  839. "Expected function name after `fn` keyword.");
  840. emitter_->Emit(*position_, ExpectedFunctionName);
  841. // TODO: We could change the lexer to allow us to synthesize certain
  842. // kinds of tokens and try to "recover" here, but unclear that this is
  843. // really useful.
  844. HandleFunctionError(state, true);
  845. return;
  846. }
  847. if (!PositionIs(TokenKind::OpenParen())) {
  848. CARBON_DIAGNOSTIC(ExpectedFunctionParams, Error,
  849. "Expected `(` after function name.");
  850. emitter_->Emit(*position_, ExpectedFunctionParams);
  851. HandleFunctionError(state, true);
  852. return;
  853. }
  854. // Parse the parameter list as its own subtree; once that pops, resume
  855. // function parsing.
  856. state.state = ParserState::FunctionAfterParameterList();
  857. PushState(state);
  858. PushState(ParserState::FunctionParameterListFinish());
  859. AddLeafNode(ParseNodeKind::ParameterListStart(), Consume());
  860. if (!PositionIs(TokenKind::CloseParen())) {
  861. PushState(ParserState::FunctionParameter());
  862. }
  863. }
  864. auto Parser::HandleFunctionParameterState() -> void {
  865. PopAndDiscardState();
  866. PushState(ParserState::FunctionParameterFinish());
  867. PushState(ParserState::PatternAsFunctionParameter());
  868. }
  869. auto Parser::HandleFunctionParameterFinishState() -> void {
  870. auto state = PopState();
  871. if (state.has_error) {
  872. ReturnErrorOnState();
  873. }
  874. if (ConsumeListToken(ParseNodeKind::ParameterListComma(),
  875. TokenKind::CloseParen(),
  876. state.has_error) == ListTokenKind::Comma) {
  877. PushState(ParserState::PatternAsFunctionParameter());
  878. }
  879. }
  880. auto Parser::HandleFunctionParameterListFinishState() -> void {
  881. auto state = PopState();
  882. CARBON_CHECK(PositionIs(TokenKind::CloseParen())) << PositionKind().Name();
  883. AddNode(ParseNodeKind::ParameterList(), Consume(), state.subtree_start,
  884. state.has_error);
  885. }
  886. auto Parser::HandleFunctionAfterParameterListState() -> void {
  887. auto state = PopState();
  888. // Regardless of whether there's a return type, we'll finish the signature.
  889. state.state = ParserState::FunctionSignatureFinish();
  890. PushState(state);
  891. // If there is a return type, parse the expression before adding the return
  892. // type nod.e
  893. if (PositionIs(TokenKind::MinusGreater())) {
  894. PushState(ParserState::FunctionReturnTypeFinish());
  895. ++position_;
  896. PushStateForExpression(PrecedenceGroup::ForType());
  897. }
  898. }
  899. auto Parser::HandleFunctionReturnTypeFinishState() -> void {
  900. auto state = PopState();
  901. AddNode(ParseNodeKind::ReturnType(), state.token, state.subtree_start,
  902. state.has_error);
  903. }
  904. auto Parser::HandleFunctionSignatureFinishState() -> void {
  905. auto state = PopState();
  906. switch (PositionKind()) {
  907. case TokenKind::Semi(): {
  908. AddNode(ParseNodeKind::FunctionDeclaration(), Consume(),
  909. state.subtree_start, state.has_error);
  910. break;
  911. }
  912. case TokenKind::OpenCurlyBrace(): {
  913. AddNode(ParseNodeKind::FunctionDefinitionStart(), Consume(),
  914. state.subtree_start, state.has_error);
  915. // Any error is recorded on the FunctionDefinitionStart.
  916. state.has_error = false;
  917. state.state = ParserState::FunctionDefinitionFinish();
  918. PushState(state);
  919. PushState(ParserState::StatementScopeLoop());
  920. break;
  921. }
  922. default: {
  923. CARBON_DIAGNOSTIC(
  924. ExpectedFunctionBodyOrSemi, Error,
  925. "Expected function definition or `;` after function declaration.");
  926. emitter_->Emit(*position_, ExpectedFunctionBodyOrSemi);
  927. // Only need to skip if we've not already found a new line.
  928. bool skip_past_likely_end =
  929. tokens_->GetLine(*position_) == tokens_->GetLine(state.token);
  930. HandleFunctionError(state, skip_past_likely_end);
  931. break;
  932. }
  933. }
  934. }
  935. auto Parser::HandleFunctionDefinitionFinishState() -> void {
  936. auto state = PopState();
  937. AddNode(ParseNodeKind::FunctionDefinition(), Consume(), state.subtree_start,
  938. state.has_error);
  939. }
  940. auto Parser::HandlePackageState() -> void {
  941. auto state = PopState();
  942. auto exit_on_parse_error = [&]() {
  943. if (auto semi_token = SkipPastLikelyEnd(state.token)) {
  944. AddLeafNode(ParseNodeKind::PackageEnd(), *semi_token);
  945. }
  946. return AddNode(ParseNodeKind::PackageDirective(), state.token,
  947. state.subtree_start, /*has_error=*/true);
  948. };
  949. if (!ConsumeAndAddLeafNodeIf(TokenKind::Identifier(),
  950. ParseNodeKind::DeclaredName())) {
  951. CARBON_DIAGNOSTIC(ExpectedIdentifierAfterPackage, Error,
  952. "Expected identifier after `package`.");
  953. emitter_->Emit(*position_, ExpectedIdentifierAfterPackage);
  954. exit_on_parse_error();
  955. return;
  956. }
  957. bool library_parsed = false;
  958. if (auto library_token = ConsumeIf(TokenKind::Library())) {
  959. auto library_start = tree_->size();
  960. if (!ConsumeAndAddLeafNodeIf(TokenKind::StringLiteral(),
  961. ParseNodeKind::Literal())) {
  962. CARBON_DIAGNOSTIC(
  963. ExpectedLibraryName, Error,
  964. "Expected a string literal to specify the library name.");
  965. emitter_->Emit(*position_, ExpectedLibraryName);
  966. exit_on_parse_error();
  967. return;
  968. }
  969. AddNode(ParseNodeKind::PackageLibrary(), *library_token, library_start,
  970. /*has_error=*/false);
  971. library_parsed = true;
  972. }
  973. switch (auto api_or_impl_token = tokens_->GetKind(*(position_))) {
  974. case TokenKind::Api(): {
  975. AddLeafNode(ParseNodeKind::PackageApi(), Consume());
  976. break;
  977. }
  978. case TokenKind::Impl(): {
  979. AddLeafNode(ParseNodeKind::PackageImpl(), Consume());
  980. break;
  981. }
  982. default: {
  983. if (!library_parsed && api_or_impl_token == TokenKind::StringLiteral()) {
  984. // If we come acroess a string literal and we didn't parse `library
  985. // "..."` yet, then most probably the user forgot to add `library`
  986. // before the library name.
  987. CARBON_DIAGNOSTIC(MissingLibraryKeyword, Error,
  988. "Missing `library` keyword.");
  989. emitter_->Emit(*position_, MissingLibraryKeyword);
  990. } else {
  991. CARBON_DIAGNOSTIC(ExpectedApiOrImpl, Error,
  992. "Expected a `api` or `impl`.");
  993. emitter_->Emit(*position_, ExpectedApiOrImpl);
  994. }
  995. exit_on_parse_error();
  996. return;
  997. }
  998. }
  999. if (!ConsumeAndAddLeafNodeIf(TokenKind::Semi(),
  1000. ParseNodeKind::PackageEnd())) {
  1001. CARBON_DIAGNOSTIC(ExpectedSemiToEndPackageDirective, Error,
  1002. "Expected `;` to end package directive.");
  1003. emitter_->Emit(*position_, ExpectedSemiToEndPackageDirective);
  1004. exit_on_parse_error();
  1005. return;
  1006. }
  1007. AddNode(ParseNodeKind::PackageDirective(), state.token, state.subtree_start,
  1008. /*has_error=*/false);
  1009. }
  1010. auto Parser::HandleParenConditionState() -> void {
  1011. auto state = PopState();
  1012. auto open_paren = ConsumeIf(TokenKind::OpenParen());
  1013. if (open_paren) {
  1014. state.token = *open_paren;
  1015. } else {
  1016. CARBON_DIAGNOSTIC(ExpectedParenAfter, Error, "Expected `(` after `{0}`.",
  1017. TokenKind);
  1018. emitter_->Emit(*position_, ExpectedParenAfter,
  1019. tokens_->GetKind(state.token));
  1020. }
  1021. // TODO: This should be adding a ConditionStart here instead of ConditionEnd
  1022. // later, so this does state modification instead of a simpler push.
  1023. state.state = ParserState::ParenConditionFinish();
  1024. PushState(state);
  1025. PushState(ParserState::Expression());
  1026. }
  1027. auto Parser::HandleParenConditionFinishState() -> void {
  1028. auto state = PopState();
  1029. if (tokens_->GetKind(state.token) != TokenKind::OpenParen()) {
  1030. // Don't expect a matching closing paren if there wasn't an opening paren.
  1031. // TODO: Should probably push nodes on this state in order to have the
  1032. // condition wrapped, but it wasn't before, so not doing it for consistency.
  1033. ReturnErrorOnState();
  1034. return;
  1035. }
  1036. bool close_paren =
  1037. ConsumeAndAddCloseParen(state.token, ParseNodeKind::ConditionEnd());
  1038. return AddNode(ParseNodeKind::Condition(), state.token, state.subtree_start,
  1039. /*has_error=*/state.has_error || !close_paren);
  1040. }
  1041. auto Parser::HandleParenExpressionState() -> void {
  1042. auto state = PopState();
  1043. // TODO: When swapping () start/end, this should AddLeafNode the open before
  1044. // continuing.
  1045. // Advance past the open paren.
  1046. CARBON_CHECK(PositionIs(TokenKind::OpenParen()));
  1047. ++position_;
  1048. if (PositionIs(TokenKind::CloseParen())) {
  1049. state.state = ParserState::ParenExpressionFinishAsTuple();
  1050. PushState(state);
  1051. } else {
  1052. state.state = ParserState::ParenExpressionFinish();
  1053. PushState(state);
  1054. PushState(ParserState::ParenExpressionParameterFinishAsUnknown());
  1055. PushState(ParserState::Expression());
  1056. }
  1057. }
  1058. auto Parser::HandleParenExpressionParameterFinish(bool as_tuple) -> void {
  1059. auto state = PopState();
  1060. auto list_token_kind =
  1061. ConsumeListToken(ParseNodeKind::TupleLiteralComma(),
  1062. TokenKind::CloseParen(), state.has_error);
  1063. if (list_token_kind == ListTokenKind::Close) {
  1064. return;
  1065. }
  1066. // If this is the first item and a comma was found, switch to tuple handling.
  1067. // Note this could be `(expr,)` so we may not reuse the current state, but
  1068. // it's still necessary to switch the parent.
  1069. if (!as_tuple) {
  1070. state.state = ParserState::ParenExpressionParameterFinishAsTuple();
  1071. auto finish_state = PopState();
  1072. CARBON_CHECK(finish_state.state == ParserState::ParenExpressionFinish())
  1073. << "Unexpected parent state, found: " << finish_state.state;
  1074. finish_state.state = ParserState::ParenExpressionFinishAsTuple();
  1075. PushState(finish_state);
  1076. }
  1077. // On a comma, push another expression handler.
  1078. if (list_token_kind == ListTokenKind::Comma) {
  1079. PushState(state);
  1080. PushState(ParserState::Expression());
  1081. }
  1082. }
  1083. auto Parser::HandleParenExpressionParameterFinishAsUnknownState() -> void {
  1084. HandleParenExpressionParameterFinish(/*as_tuple=*/false);
  1085. }
  1086. auto Parser::HandleParenExpressionParameterFinishAsTupleState() -> void {
  1087. HandleParenExpressionParameterFinish(/*as_tuple=*/true);
  1088. }
  1089. auto Parser::HandleParenExpressionFinishState() -> void {
  1090. auto state = PopState();
  1091. AddLeafNode(ParseNodeKind::ParenExpressionEnd(), Consume());
  1092. AddNode(ParseNodeKind::ParenExpression(), state.token, state.subtree_start,
  1093. state.has_error);
  1094. }
  1095. auto Parser::HandleParenExpressionFinishAsTupleState() -> void {
  1096. auto state = PopState();
  1097. AddLeafNode(ParseNodeKind::TupleLiteralEnd(), Consume());
  1098. AddNode(ParseNodeKind::TupleLiteral(), state.token, state.subtree_start,
  1099. state.has_error);
  1100. }
  1101. auto Parser::HandlePattern(PatternKind pattern_kind) -> void {
  1102. auto state = PopState();
  1103. // Ensure the finish state always follows.
  1104. state.state = ParserState::PatternFinish();
  1105. // Handle an invalid pattern introducer.
  1106. if (!PositionIs(TokenKind::Identifier()) ||
  1107. tokens_->GetKind(*(position_ + 1)) != TokenKind::Colon()) {
  1108. switch (pattern_kind) {
  1109. case PatternKind::Parameter: {
  1110. CARBON_DIAGNOSTIC(ExpectedParameterName, Error,
  1111. "Expected parameter declaration.");
  1112. emitter_->Emit(*position_, ExpectedParameterName);
  1113. break;
  1114. }
  1115. case PatternKind::Variable: {
  1116. CARBON_DIAGNOSTIC(ExpectedVariableName, Error,
  1117. "Expected pattern in `var` declaration.");
  1118. emitter_->Emit(*position_, ExpectedVariableName);
  1119. break;
  1120. }
  1121. }
  1122. state.has_error = true;
  1123. PushState(state);
  1124. return;
  1125. }
  1126. // Switch the context token to the colon, so that it'll be used for the root
  1127. // node.
  1128. state.token = *(position_ + 1);
  1129. PushState(state);
  1130. PushStateForExpression(PrecedenceGroup::ForType());
  1131. AddLeafNode(ParseNodeKind::DeclaredName(), *position_);
  1132. position_ += 2;
  1133. }
  1134. auto Parser::HandlePatternAsFunctionParameterState() -> void {
  1135. HandlePattern(PatternKind::Parameter);
  1136. }
  1137. auto Parser::HandlePatternAsVariableState() -> void {
  1138. HandlePattern(PatternKind::Variable);
  1139. }
  1140. auto Parser::HandlePatternFinishState() -> void {
  1141. auto state = PopState();
  1142. // If an error was encountered, propagate it without adding a node.
  1143. if (state.has_error) {
  1144. ReturnErrorOnState();
  1145. return;
  1146. }
  1147. // TODO: may need to mark has_error if !type.
  1148. AddNode(ParseNodeKind::PatternBinding(), state.token, state.subtree_start,
  1149. /*has_error=*/false);
  1150. }
  1151. auto Parser::HandleStatementState() -> void {
  1152. PopAndDiscardState();
  1153. switch (PositionKind()) {
  1154. case TokenKind::Break(): {
  1155. PushState(ParserState::StatementBreakFinish());
  1156. AddLeafNode(ParseNodeKind::BreakStatementStart(), Consume());
  1157. break;
  1158. }
  1159. case TokenKind::Continue(): {
  1160. PushState(ParserState::StatementContinueFinish());
  1161. AddLeafNode(ParseNodeKind::ContinueStatementStart(), Consume());
  1162. break;
  1163. }
  1164. case TokenKind::For(): {
  1165. // Process the header as a child of the for so that we can get consistent
  1166. // starts.
  1167. // TODO: When reorganizing components, we can probably make this flatter.
  1168. PushState(ParserState::StatementForFinish());
  1169. ++position_;
  1170. PushState(ParserState::StatementForHeader());
  1171. break;
  1172. }
  1173. case TokenKind::If(): {
  1174. PushState(ParserState::StatementIf());
  1175. break;
  1176. }
  1177. case TokenKind::Return(): {
  1178. PushState(ParserState::StatementReturn());
  1179. break;
  1180. }
  1181. case TokenKind::Var(): {
  1182. PushState(ParserState::VarAsRequireSemicolon());
  1183. break;
  1184. }
  1185. case TokenKind::While(): {
  1186. PushState(ParserState::StatementWhile());
  1187. break;
  1188. }
  1189. default: {
  1190. PushState(ParserState::ExpressionStatementFinish());
  1191. PushState(ParserState::Expression());
  1192. break;
  1193. }
  1194. }
  1195. }
  1196. auto Parser::HandleStatementBreakFinishState() -> void {
  1197. HandleStatementKeywordFinish(ParseNodeKind::BreakStatement());
  1198. }
  1199. auto Parser::HandleStatementContinueFinishState() -> void {
  1200. HandleStatementKeywordFinish(ParseNodeKind::ContinueStatement());
  1201. }
  1202. auto Parser::HandleStatementForHeaderState() -> void {
  1203. auto state = PopState();
  1204. auto open_paren = ConsumeIf(TokenKind::OpenParen());
  1205. if (!open_paren) {
  1206. CARBON_DIAGNOSTIC(ExpectedParenAfter, Error,
  1207. "Expected `(` after `{0}`. Recovering from missing `(` "
  1208. "not implemented yet!",
  1209. TokenKind);
  1210. emitter_->Emit(*position_, ExpectedParenAfter, TokenKind::For());
  1211. // TODO: A proper recovery strategy is needed here. For now, I assume
  1212. // that all brackets are properly balanced (i.e. each open bracket has a
  1213. // closing one).
  1214. // This is temporary until we come to a conclusion regarding the
  1215. // recovery tokens strategy.
  1216. ReturnErrorOnState();
  1217. PushState(ParserState::CodeBlock());
  1218. return;
  1219. }
  1220. state.state = ParserState::StatementForHeaderIn();
  1221. if (PositionIs(TokenKind::Var())) {
  1222. PushState(state);
  1223. PushState(ParserState::VarAsNoSemicolon());
  1224. } else {
  1225. CARBON_DIAGNOSTIC(ExpectedVariableDeclaration, Error,
  1226. "Expected `var` declaration.");
  1227. emitter_->Emit(*position_, ExpectedVariableDeclaration);
  1228. if (auto next_in = FindNextOf({TokenKind::In()})) {
  1229. SkipTo(*next_in);
  1230. }
  1231. state.has_error = true;
  1232. PushState(state);
  1233. }
  1234. }
  1235. auto Parser::HandleStatementForHeaderInState() -> void {
  1236. auto state = PopState();
  1237. state.state = ParserState::StatementForHeaderFinish();
  1238. if (!ConsumeAndAddLeafNodeIf(TokenKind::In(), ParseNodeKind::ForIn())) {
  1239. if (auto colon = ConsumeIf(TokenKind::Colon())) {
  1240. CARBON_DIAGNOSTIC(ExpectedIn, Error, "`:` should be replaced by `in`.");
  1241. emitter_->Emit(*colon, ExpectedIn);
  1242. AddLeafNode(ParseNodeKind::ForIn(), *colon, /*has_error=*/true);
  1243. } else {
  1244. CARBON_DIAGNOSTIC(ExpectedIn, Error,
  1245. "Expected `in` after loop `var` declaration.");
  1246. emitter_->Emit(*position_, ExpectedIn);
  1247. SkipTo(tokens_->GetMatchedClosingToken(state.token));
  1248. state.has_error = true;
  1249. PushState(state);
  1250. return;
  1251. }
  1252. }
  1253. PushState(state);
  1254. PushState(ParserState::Expression());
  1255. }
  1256. auto Parser::HandleStatementForHeaderFinishState() -> void {
  1257. auto state = PopState();
  1258. if (!ConsumeAndAddCloseParen(state.token, ParseNodeKind::ForHeaderEnd())) {
  1259. state.has_error = true;
  1260. }
  1261. AddNode(ParseNodeKind::ForHeader(), state.token, state.subtree_start,
  1262. state.has_error);
  1263. PushState(ParserState::CodeBlock());
  1264. }
  1265. auto Parser::HandleStatementForFinishState() -> void {
  1266. auto state = PopState();
  1267. AddNode(ParseNodeKind::ForStatement(), state.token, state.subtree_start,
  1268. state.has_error);
  1269. }
  1270. auto Parser::HandleStatementIfState() -> void {
  1271. PopAndDiscardState();
  1272. PushState(ParserState::StatementIfConditionFinish());
  1273. PushState(ParserState::ParenCondition());
  1274. ++position_;
  1275. }
  1276. auto Parser::HandleStatementIfConditionFinishState() -> void {
  1277. auto state = PopState();
  1278. state.state = ParserState::StatementIfThenBlockFinish();
  1279. PushState(state);
  1280. PushState(ParserState::CodeBlock());
  1281. }
  1282. auto Parser::HandleStatementIfThenBlockFinishState() -> void {
  1283. auto state = PopState();
  1284. if (ConsumeAndAddLeafNodeIf(TokenKind::Else(),
  1285. ParseNodeKind::IfStatementElse())) {
  1286. state.state = ParserState::StatementIfElseBlockFinish();
  1287. PushState(state);
  1288. // `else if` is permitted as a special case.
  1289. PushState(PositionIs(TokenKind::If()) ? ParserState::StatementIf()
  1290. : ParserState::CodeBlock());
  1291. } else {
  1292. AddNode(ParseNodeKind::IfStatement(), state.token, state.subtree_start,
  1293. state.has_error);
  1294. }
  1295. }
  1296. auto Parser::HandleStatementIfElseBlockFinishState() -> void {
  1297. auto state = PopState();
  1298. AddNode(ParseNodeKind::IfStatement(), state.token, state.subtree_start,
  1299. state.has_error);
  1300. }
  1301. auto Parser::HandleStatementKeywordFinish(ParseNodeKind node_kind) -> void {
  1302. auto state = PopState();
  1303. auto semi = ConsumeIf(TokenKind::Semi());
  1304. if (!semi) {
  1305. CARBON_DIAGNOSTIC(ExpectedSemiAfter, Error, "Expected `;` after `{0}`.",
  1306. TokenKind);
  1307. emitter_->Emit(*position_, ExpectedSemiAfter,
  1308. tokens_->GetKind(state.token));
  1309. state.has_error = true;
  1310. // Recover to the next semicolon if possible, otherwise indicate the
  1311. // keyword for the error.
  1312. semi = SkipPastLikelyEnd(state.token);
  1313. if (!semi) {
  1314. semi = state.token;
  1315. }
  1316. }
  1317. AddNode(node_kind, *semi, state.subtree_start, state.has_error);
  1318. }
  1319. auto Parser::HandleStatementReturnState() -> void {
  1320. auto state = PopState();
  1321. state.state = ParserState::StatementReturnFinish();
  1322. PushState(state);
  1323. AddLeafNode(ParseNodeKind::ReturnStatementStart(), Consume());
  1324. if (!PositionIs(TokenKind::Semi())) {
  1325. PushState(ParserState::Expression());
  1326. }
  1327. }
  1328. auto Parser::HandleStatementReturnFinishState() -> void {
  1329. HandleStatementKeywordFinish(ParseNodeKind::ReturnStatement());
  1330. }
  1331. auto Parser::HandleStatementScopeLoopState() -> void {
  1332. // This maintains the current state until we're at the end of the scope.
  1333. auto token_kind = PositionKind();
  1334. if (token_kind == TokenKind::CloseCurlyBrace()) {
  1335. auto state = PopState();
  1336. if (state.has_error) {
  1337. ReturnErrorOnState();
  1338. }
  1339. } else {
  1340. PushState(ParserState::Statement());
  1341. }
  1342. }
  1343. auto Parser::HandleStatementWhileState() -> void {
  1344. PopAndDiscardState();
  1345. PushState(ParserState::StatementWhileConditionFinish());
  1346. PushState(ParserState::ParenCondition());
  1347. ++position_;
  1348. }
  1349. auto Parser::HandleStatementWhileConditionFinishState() -> void {
  1350. auto state = PopState();
  1351. state.state = ParserState::StatementWhileBlockFinish();
  1352. PushState(state);
  1353. PushState(ParserState::CodeBlock());
  1354. }
  1355. auto Parser::HandleStatementWhileBlockFinishState() -> void {
  1356. auto state = PopState();
  1357. AddNode(ParseNodeKind::WhileStatement(), state.token, state.subtree_start,
  1358. state.has_error);
  1359. }
  1360. auto Parser::HandleVar(bool require_semicolon) -> void {
  1361. PopAndDiscardState();
  1362. PushState(require_semicolon ? ParserState::VarFinishAsRequireSemicolon()
  1363. : ParserState::VarFinishAsNoSemicolon());
  1364. PushState(ParserState::VarAfterPattern());
  1365. ++position_;
  1366. PushState(ParserState::PatternAsVariable());
  1367. }
  1368. auto Parser::HandleVarAsRequireSemicolonState() -> void {
  1369. HandleVar(/*require_semicolon=*/true);
  1370. }
  1371. auto Parser::HandleVarAsNoSemicolonState() -> void {
  1372. HandleVar(/*require_semicolon=*/false);
  1373. }
  1374. auto Parser::HandleVarAfterPatternState() -> void {
  1375. auto state = PopState();
  1376. if (state.has_error) {
  1377. if (auto after_pattern =
  1378. FindNextOf({TokenKind::Equal(), TokenKind::Semi()})) {
  1379. SkipTo(*after_pattern);
  1380. }
  1381. }
  1382. if (PositionIs(TokenKind::Equal())) {
  1383. PushState(ParserState::VarAfterInitializer());
  1384. ++position_;
  1385. PushState(ParserState::Expression());
  1386. return;
  1387. }
  1388. }
  1389. auto Parser::HandleVarAfterInitializerState() -> void {
  1390. auto state = PopState();
  1391. AddNode(ParseNodeKind::VariableInitializer(), state.token,
  1392. state.subtree_start, state.has_error);
  1393. }
  1394. auto Parser::HandleVarFinish(bool require_semicolon) -> void {
  1395. auto state = PopState();
  1396. if (require_semicolon) {
  1397. auto semi = ConsumeAndAddLeafNodeIf(TokenKind::Semi(),
  1398. ParseNodeKind::DeclarationEnd());
  1399. if (!semi) {
  1400. emitter_->Emit(*position_, ExpectedSemiAfterExpression);
  1401. if (auto semi_token = SkipPastLikelyEnd(state.token)) {
  1402. AddLeafNode(ParseNodeKind::DeclarationEnd(), *semi_token,
  1403. /*has_error=*/true);
  1404. } else {
  1405. state.has_error = true;
  1406. }
  1407. }
  1408. }
  1409. return AddNode(ParseNodeKind::VariableDeclaration(), state.token,
  1410. state.subtree_start, state.has_error);
  1411. }
  1412. auto Parser::HandleVarFinishAsRequireSemicolonState() -> void {
  1413. HandleVarFinish(/*require_semicolon=*/true);
  1414. }
  1415. auto Parser::HandleVarFinishAsNoSemicolonState() -> void {
  1416. HandleVarFinish(/*require_semicolon=*/false);
  1417. }
  1418. auto Parser::HandleInterfaceIntroducerState() -> void {
  1419. auto state = PopState();
  1420. if (!ConsumeAndAddLeafNodeIf(TokenKind::Identifier(),
  1421. ParseNodeKind::DeclaredName())) {
  1422. CARBON_DIAGNOSTIC(ExpectedInterfaceName, Error,
  1423. "Expected interface name after `interface` keyword.");
  1424. emitter_->Emit(*position_, ExpectedInterfaceName);
  1425. state.has_error = true;
  1426. }
  1427. bool parse_body = true;
  1428. if (!PositionIs(TokenKind::OpenCurlyBrace())) {
  1429. CARBON_DIAGNOSTIC(ExpectedInterfaceOpenCurlyBrace, Error,
  1430. "Expected `{{` to start interface definition.");
  1431. emitter_->Emit(*position_, ExpectedInterfaceOpenCurlyBrace);
  1432. state.has_error = true;
  1433. SkipPastLikelyEnd(state.token);
  1434. parse_body = false;
  1435. }
  1436. state.state = ParserState::InterfaceDefinitionFinish();
  1437. PushState(state);
  1438. if (parse_body) {
  1439. PushState(ParserState::InterfaceDefinitionLoop());
  1440. AddLeafNode(ParseNodeKind::InterfaceBodyStart(), Consume());
  1441. }
  1442. }
  1443. auto Parser::HandleInterfaceDefinitionLoopState() -> void {
  1444. // This maintains the current state unless we're at the end of the interface
  1445. // definition.
  1446. switch (PositionKind()) {
  1447. case TokenKind::CloseCurlyBrace(): {
  1448. auto state = PopState();
  1449. AddNode(ParseNodeKind::InterfaceBody(), Consume(), state.subtree_start,
  1450. state.has_error);
  1451. break;
  1452. }
  1453. // TODO: Handle possible declarations inside interface body.
  1454. default: {
  1455. CARBON_DIAGNOSTIC(UnrecognizedDeclaration, Error,
  1456. "Unrecognized declaration introducer.");
  1457. emitter_->Emit(*position_, UnrecognizedDeclaration);
  1458. if (auto semi = SkipPastLikelyEnd(*position_)) {
  1459. AddLeafNode(ParseNodeKind::EmptyDeclaration(), *semi,
  1460. /*has_error=*/true);
  1461. } else {
  1462. ReturnErrorOnState();
  1463. }
  1464. break;
  1465. }
  1466. }
  1467. }
  1468. auto Parser::HandleInterfaceDefinitionFinishState() -> void {
  1469. auto state = PopState();
  1470. AddNode(ParseNodeKind::InterfaceDefinition(), state.token,
  1471. state.subtree_start, state.has_error);
  1472. }
  1473. } // namespace Carbon