| 123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508 |
- // Part of the Carbon Language project, under the Apache License v2.0 with LLVM
- // Exceptions. See /LICENSE for license information.
- // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
- #include "toolchain/lex/token_kind.h"
- #include "toolchain/parse/context.h"
- #include "toolchain/parse/handle.h"
- namespace Carbon::Parse {
- static auto DiagnoseStatementOperatorAsSubExpr(Context& context) -> void {
- CARBON_DIAGNOSTIC(StatementOperatorAsSubExpr, Error,
- "operator `{0}` can only be used as a complete statement",
- Lex::TokenKind);
- context.emitter().Emit(*context.position(), StatementOperatorAsSubExpr,
- context.PositionKind());
- }
- auto HandleExpr(Context& context) -> void {
- auto state = context.PopState();
- // Check for a prefix operator.
- if (auto operator_precedence =
- PrecedenceGroup::ForLeading(context.PositionKind())) {
- if (PrecedenceGroup::GetPriority(state.ambient_precedence,
- *operator_precedence) !=
- OperatorPriority::RightFirst) {
- // The precedence rules don't permit this prefix operator in this
- // context. Diagnose this, but carry on and parse it anyway.
- if (PrecedenceGroup::GetPriority(PrecedenceGroup::ForTopLevelExpr(),
- *operator_precedence) ==
- OperatorPriority::RightFirst) {
- CARBON_DIAGNOSTIC(
- UnaryOperatorRequiresParentheses, Error,
- "parentheses are required around this unary `{0}` operator",
- Lex::TokenKind);
- context.emitter().Emit(*context.position(),
- UnaryOperatorRequiresParentheses,
- context.PositionKind());
- } else {
- // This operator wouldn't be allowed even if parenthesized.
- DiagnoseStatementOperatorAsSubExpr(context);
- }
- } else {
- // Check that this operator follows the proper whitespace rules.
- context.DiagnoseOperatorFixity(Context::OperatorFixity::Prefix);
- }
- if (context.PositionIs(Lex::TokenKind::If)) {
- context.PushState(StateKind::IfExprFinish);
- context.PushState(StateKind::IfExprFinishCondition);
- } else {
- context.PushStateForExprLoop(StateKind::ExprLoopForPrefixOperator,
- state.ambient_precedence,
- *operator_precedence);
- }
- context.ConsumeAndDiscard();
- context.PushStateForExpr(*operator_precedence);
- } else {
- context.PushStateForExprLoop(StateKind::ExprLoop, state.ambient_precedence,
- PrecedenceGroup::ForPostfixExpr());
- context.PushState(StateKind::ExprInPostfix);
- }
- }
- auto HandleExprInPostfix(Context& context) -> void {
- auto state = context.PopState();
- // Continue to the loop state.
- state.kind = StateKind::ExprInPostfixLoop;
- // Parses a primary expression, which is either a terminal portion of an
- // expression tree, such as an identifier or literal, or a parenthesized
- // expression.
- switch (auto token_kind = context.PositionKind()) {
- case Lex::TokenKind::Identifier: {
- context.AddLeafNode(NodeKind::IdentifierNameExpr, context.Consume());
- context.PushState(state);
- break;
- }
- case Lex::TokenKind::Fn: {
- context.PushState(state);
- context.PushState(StateKind::LambdaIntroducer);
- break;
- }
- case Lex::TokenKind::False: {
- context.AddLeafNode(NodeKind::BoolLiteralFalse, context.Consume());
- context.PushState(state);
- break;
- }
- case Lex::TokenKind::True: {
- context.AddLeafNode(NodeKind::BoolLiteralTrue, context.Consume());
- context.PushState(state);
- break;
- }
- case Lex::TokenKind::CharLiteral: {
- context.AddLeafNode(NodeKind::CharLiteral, context.Consume());
- context.PushState(state);
- break;
- }
- case Lex::TokenKind::IntLiteral: {
- context.AddLeafNode(NodeKind::IntLiteral, context.Consume());
- context.PushState(state);
- break;
- }
- case Lex::TokenKind::RealLiteral: {
- context.AddLeafNode(NodeKind::RealLiteral, context.Consume());
- context.PushState(state);
- break;
- }
- case Lex::TokenKind::StringLiteral: {
- context.AddLeafNode(NodeKind::StringLiteral, context.Consume());
- context.PushState(state);
- break;
- }
- case Lex::TokenKind::Bool: {
- context.AddLeafNode(NodeKind::BoolTypeLiteral, context.Consume());
- context.PushState(state);
- break;
- }
- case Lex::TokenKind::Char: {
- context.AddLeafNode(NodeKind::CharTypeLiteral, context.Consume());
- context.PushState(state);
- break;
- }
- case Lex::TokenKind::IntTypeLiteral: {
- context.AddLeafNode(NodeKind::IntTypeLiteral, context.Consume());
- context.PushState(state);
- break;
- }
- case Lex::TokenKind::UnsignedIntTypeLiteral: {
- context.AddLeafNode(NodeKind::UnsignedIntTypeLiteral, context.Consume());
- context.PushState(state);
- break;
- }
- case Lex::TokenKind::FloatTypeLiteral: {
- context.AddLeafNode(NodeKind::FloatTypeLiteral, context.Consume());
- context.PushState(state);
- break;
- }
- case Lex::TokenKind::Str: {
- context.AddLeafNode(NodeKind::StringTypeLiteral, context.Consume());
- context.PushState(state);
- break;
- }
- case Lex::TokenKind::Type: {
- context.AddLeafNode(NodeKind::TypeTypeLiteral, context.Consume());
- context.PushState(state);
- break;
- }
- case Lex::TokenKind::Auto: {
- context.AddLeafNode(NodeKind::AutoTypeLiteral, context.Consume());
- context.PushState(state);
- break;
- }
- case Lex::TokenKind::OpenCurlyBrace: {
- context.PushState(state);
- context.PushState(StateKind::BraceExpr);
- break;
- }
- case Lex::TokenKind::OpenParen: {
- context.PushState(state);
- context.PushState(StateKind::ParenExpr);
- break;
- }
- case Lex::TokenKind::Array: {
- context.PushState(state);
- context.PushState(StateKind::ArrayExpr);
- break;
- }
- case Lex::TokenKind::Form: {
- context.PushState(state);
- context.PushState(StateKind::FormLiteral);
- break;
- }
- case Lex::TokenKind::Package: {
- context.AddLeafNode(NodeKind::PackageExpr, context.Consume());
- if (context.PositionKind() != Lex::TokenKind::Period) {
- CARBON_DIAGNOSTIC(ExpectedPeriodAfterPackage, Error,
- "expected `.` after `package` expression");
- context.emitter().Emit(*context.position(), ExpectedPeriodAfterPackage);
- state.has_error = true;
- }
- context.PushState(state);
- break;
- }
- case Lex::TokenKind::Core: {
- context.AddLeafNode(NodeKind::CoreNameExpr, context.Consume());
- context.PushState(state);
- break;
- }
- case Lex::TokenKind::Cpp: {
- context.AddLeafNode(NodeKind::CppNameExpr, context.Consume());
- context.PushState(state);
- break;
- }
- case Lex::TokenKind::SelfValueIdentifier: {
- context.AddLeafNode(NodeKind::SelfValueNameExpr, context.Consume());
- context.PushState(state);
- break;
- }
- case Lex::TokenKind::SelfTypeIdentifier: {
- context.AddLeafNode(NodeKind::SelfTypeNameExpr, context.Consume());
- context.PushState(state);
- break;
- }
- case Lex::TokenKind::Period: {
- // For periods, we look at the next token to form a designator like
- // `.Member` or `.Self`.
- auto period = context.Consume();
- if (context.ConsumeAndAddLeafNodeIf(
- Lex::TokenKind::Identifier,
- NodeKind::IdentifierNameNotBeforeSignature)) {
- // OK, `.` identifier.
- } else if (context.ConsumeAndAddLeafNodeIf(
- Lex::TokenKind::SelfTypeIdentifier,
- NodeKind::SelfTypeName)) {
- // OK, `.Self`.
- } else {
- CARBON_DIAGNOSTIC(ExpectedIdentifierOrSelfAfterPeriod, Error,
- "expected identifier or `Self` after `.`");
- context.emitter().Emit(*context.position(),
- ExpectedIdentifierOrSelfAfterPeriod);
- // Only consume if it is a number or word.
- if (context.PositionKind().is_keyword()) {
- context.AddLeafNode(NodeKind::IdentifierNameNotBeforeSignature,
- context.Consume(), /*has_error=*/true);
- } else if (context.PositionIs(Lex::TokenKind::IntLiteral)) {
- context.AddInvalidParse(context.Consume());
- } else {
- context.AddInvalidParse(*context.position());
- // Indicate the error to the parent state so that it can avoid
- // producing more errors. We only do this on this path where we don't
- // consume the token after the period, where we expect further errors
- // since we likely haven't recovered.
- context.ReturnErrorOnState();
- }
- state.has_error = true;
- }
- context.AddNode(NodeKind::DesignatorExpr, period, state.has_error);
- context.PushState(state);
- break;
- }
- default: {
- // If not already diagnosed in the lexer, diagnose it here.
- if (token_kind != Lex::TokenKind::Error) {
- CARBON_DIAGNOSTIC(ExpectedExpr, Error, "expected expression");
- CARBON_DIAGNOSTIC(ExpectedPattern, Error, "expected pattern");
- llvm::SmallVector<StateKind, 2> state_kinds(
- llvm::map_range(llvm::ArrayRef(context.state_stack()).take_back(2),
- [&](const Context::State& s) { return s.kind; }));
- bool in_pattern = state_kinds == llvm::ArrayRef{StateKind::ExprPattern,
- StateKind::ExprLoop};
- context.emitter().Emit(*context.position(),
- in_pattern ? ExpectedPattern : ExpectedExpr);
- }
- // Add a node to keep the parse tree balanced.
- context.AddInvalidParse(*context.position());
- context.ReturnErrorOnState();
- break;
- }
- }
- }
- auto HandleExprInPostfixLoop(Context& context) -> void {
- // This is a cyclic state that repeats, so this state is typically pushed back
- // on.
- auto state = context.PopState();
- state.token = *context.position();
- switch (context.PositionKind()) {
- case Lex::TokenKind::Period: {
- context.PushState(state);
- context.PushState(state, StateKind::PeriodAsExpr);
- break;
- }
- case Lex::TokenKind::MinusGreater: {
- context.PushState(state);
- context.PushState(state, StateKind::ArrowExpr);
- break;
- }
- case Lex::TokenKind::OpenParen: {
- context.PushState(state);
- context.PushState(state, StateKind::CallExpr);
- break;
- }
- case Lex::TokenKind::OpenSquareBracket: {
- context.PushState(state);
- context.PushState(state, StateKind::IndexExpr);
- break;
- }
- default: {
- if (state.has_error) {
- context.ReturnErrorOnState();
- }
- break;
- }
- }
- }
- auto HandleExprLoop(Context& context) -> void {
- auto state = context.PopState();
- auto operator_kind = context.PositionKind();
- auto trailing_operator = PrecedenceGroup::ForTrailing(
- operator_kind, context.IsTrailingOperatorInfix());
- if (!trailing_operator) {
- // TODO: Generalize this to handle a sequence of operator modifiers once we
- // have more than one.
- if (context.PositionIs(Lex::TokenKind::Unsafe)) {
- operator_kind = context.PositionKind(Lookahead::NextToken);
- trailing_operator = PrecedenceGroup::ForTrailing(
- operator_kind, context.IsTrailingOperatorInfix());
- }
- if (!trailing_operator) {
- if (state.has_error) {
- context.ReturnErrorOnState();
- }
- return;
- }
- }
- auto [operator_precedence, is_binary] = *trailing_operator;
- // TODO: If this operator is ambiguous with either the ambient precedence
- // or the LHS precedence, and there's a variant with a different fixity
- // that would work, use that one instead for error recovery.
- if (PrecedenceGroup::GetPriority(state.ambient_precedence,
- operator_precedence) !=
- OperatorPriority::RightFirst) {
- // The precedence rules don't permit this operator in this context. Try
- // again in the enclosing expression context.
- if (state.has_error) {
- context.ReturnErrorOnState();
- }
- return;
- }
- if (PrecedenceGroup::GetPriority(state.lhs_precedence, operator_precedence) !=
- OperatorPriority::LeftFirst) {
- // Either the LHS operator and this operator are ambiguous, or the
- // LHS operator is a unary operator that can't be nested within
- // this operator. Either way, parentheses are required.
- if (PrecedenceGroup::GetPriority(PrecedenceGroup::ForTopLevelExpr(),
- operator_precedence) ==
- OperatorPriority::RightFirst) {
- CARBON_DIAGNOSTIC(
- OperatorRequiresParentheses, Error,
- "parentheses are required to disambiguate operator precedence");
- context.emitter().Emit(*context.position(), OperatorRequiresParentheses);
- } else {
- // This operator wouldn't be allowed even if parenthesized.
- DiagnoseStatementOperatorAsSubExpr(context);
- }
- state.has_error = true;
- } else {
- context.DiagnoseOperatorFixity(is_binary
- ? Context::OperatorFixity::Infix
- : Context::OperatorFixity::Postfix);
- }
- // For operator modifiers, wrap the first operand in the modifier.
- if (context.PositionIs(Lex::TokenKind::Unsafe)) {
- if (context.PositionIs(Lex::TokenKind::As, Lookahead::NextToken)) {
- context.AddNode<NodeKind::UnsafeModifier>(context.Consume(),
- state.has_error);
- } else {
- CARBON_DIAGNOSTIC(ModifierNotAllowedOnOperator, Error,
- "`{0}` not allowed on operator `{1}`", Lex::TokenKind,
- Lex::TokenKind);
- context.emitter().Emit(*context.position(), ModifierNotAllowedOnOperator,
- context.PositionKind(),
- context.PositionKind(Lookahead::NextToken));
- context.Consume();
- state.has_error = true;
- }
- }
- state.token = context.Consume();
- state.lhs_precedence = operator_precedence;
- if (is_binary) {
- switch (operator_kind) {
- // For `and` and `or`, wrap the first operand in a virtual parse tree
- // node so that checking can insert control flow here.
- case Lex::TokenKind::And:
- context.AddNode(NodeKind::ShortCircuitOperandAnd, state.token,
- state.has_error);
- state.kind = StateKind::ExprLoopForShortCircuitOperatorAsAnd;
- break;
- case Lex::TokenKind::Or:
- context.AddNode(NodeKind::ShortCircuitOperandOr, state.token,
- state.has_error);
- state.kind = StateKind::ExprLoopForShortCircuitOperatorAsOr;
- break;
- // `where` also needs a virtual parse tree node, and parses its right
- // argument in a mode where it can handle requirement operators like
- // `impls` and `=`.
- case Lex::TokenKind::Where:
- context.AddNode(NodeKind::WhereOperand, state.token, state.has_error);
- context.PushState(state, StateKind::WhereFinish);
- context.PushState(StateKind::RequirementBegin);
- return;
- default:
- state.kind = StateKind::ExprLoopForInfixOperator;
- break;
- }
- context.PushState(state);
- context.PushStateForExpr(operator_precedence);
- } else {
- NodeKind node_kind;
- switch (operator_kind) {
- #define CARBON_PARSE_NODE_KIND(Name)
- #define CARBON_PARSE_NODE_KIND_POSTFIX_OPERATOR(Name) \
- case Lex::TokenKind::Name: \
- node_kind = NodeKind::PostfixOperator##Name; \
- break;
- #include "toolchain/parse/node_kind.def"
- default:
- CARBON_FATAL("Unexpected token kind for postfix operator: {0}",
- operator_kind);
- }
- context.AddNode(node_kind, state.token, state.has_error);
- state.has_error = false;
- context.PushState(state);
- }
- }
- // Adds the operator node and returns the main expression loop.
- static auto HandleExprLoopForOperator(Context& context, Context::State state,
- NodeKind node_kind) -> void {
- context.AddNode(node_kind, state.token, state.has_error);
- state.has_error = false;
- context.PushState(state, StateKind::ExprLoop);
- }
- auto HandleExprLoopForInfixOperator(Context& context) -> void {
- auto state = context.PopState();
- switch (auto token_kind = context.tokens().GetKind(state.token)) {
- #define CARBON_PARSE_NODE_KIND(Name)
- #define CARBON_PARSE_NODE_KIND_INFIX_OPERATOR(Name) \
- case Lex::TokenKind::Name: \
- HandleExprLoopForOperator(context, state, NodeKind::InfixOperator##Name); \
- break;
- #include "toolchain/parse/node_kind.def"
- default:
- CARBON_FATAL("Unexpected token kind for infix operator: {0}", token_kind);
- }
- }
- auto HandleExprLoopForPrefixOperator(Context& context) -> void {
- auto state = context.PopState();
- switch (auto token_kind = context.tokens().GetKind(state.token)) {
- #define CARBON_PARSE_NODE_KIND(Name)
- #define CARBON_PARSE_NODE_KIND_PREFIX_OPERATOR(Name) \
- case Lex::TokenKind::Name: \
- HandleExprLoopForOperator(context, state, NodeKind::PrefixOperator##Name); \
- break;
- #include "toolchain/parse/node_kind.def"
- default:
- CARBON_FATAL("Unexpected token kind for prefix operator: {0}",
- token_kind);
- }
- }
- auto HandleExprLoopForShortCircuitOperatorAsAnd(Context& context) -> void {
- auto state = context.PopState();
- HandleExprLoopForOperator(context, state, NodeKind::ShortCircuitOperatorAnd);
- }
- auto HandleExprLoopForShortCircuitOperatorAsOr(Context& context) -> void {
- auto state = context.PopState();
- HandleExprLoopForOperator(context, state, NodeKind::ShortCircuitOperatorOr);
- }
- auto HandleExprStatementFinish(Context& context) -> void {
- auto state = context.PopState();
- if (auto semi = context.ConsumeIf(Lex::TokenKind::Semi)) {
- context.AddNode(NodeKind::ExprStatement, *semi, state.has_error);
- return;
- }
- if (!state.has_error) {
- CARBON_DIAGNOSTIC(ExpectedExprSemi, Error,
- "expected `;` after expression statement");
- context.emitter().Emit(*context.position(), ExpectedExprSemi);
- }
- context.AddNode(NodeKind::ExprStatement,
- context.SkipPastLikelyEnd(state.token), /*has_error=*/true);
- }
- } // namespace Carbon::Parse
|