| 123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595 |
- // Part of the Carbon Language project, under the Apache License v2.0 with LLVM
- // Exceptions. See /LICENSE for license information.
- // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
- // -----------------------------------------------------------------------------
- // Bison Configuration
- // -----------------------------------------------------------------------------
- %require "3.2"
- %language "c++"
- // We don't need a separate header for Bison locations.
- %define api.location.file none
- // Use a type-safe C++ variant for semantic values
- %define api.value.type variant
- // Have Bison generate a `make_<NAME>` function for each token declared in this
- // file (for example `make_identifier`), including the end-of-input token.
- %define api.token.constructor
- // Generate the parser as `::Carbon::Parser`.
- %define api.namespace { Carbon }
- %define api.parser.class { Parser }
- // Make parse error messages more detailed
- %define parse.error verbose
- // Enable support for parser debugging
- %define parse.trace true
- //
- // Parameters to the parser and lexer
- //
- // Parameters to the parser are stored therein as protected data members, and
- // thus available to its methods.
- // "out" parameter passed to the parser, where the AST is written.
- %parse-param {std::optional<AST>& parsed_program}
- // "inout" parameter passed to both the parser and the lexer.
- %param {ParseAndLexContext& context}
- // No shift-reduce conflicts are expected; Bison reports an error if the
- // number of conflicts differs from the count given here.
- %expect 0
- // -----------------------------------------------------------------------------
- %code top {
- #include <algorithm>
- #include <cstdarg>
- #include <cstdio>
- #include <cstdlib>
- #include <list>
- #include <vector>
- #include "common/check.h"
- #include "executable_semantics/syntax/syntax_helpers.h"
- #include "executable_semantics/syntax/parse_and_lex_context.h"
- #include "llvm/ADT/StringExtras.h"
- } // %code top
- %code requires {
- #include <optional>
- #include "executable_semantics/ast/abstract_syntax_tree.h"
- #include "executable_semantics/ast/declaration.h"
- #include "executable_semantics/ast/expression.h"
- #include "executable_semantics/ast/function_definition.h"
- #include "executable_semantics/ast/pattern.h"
- #include "executable_semantics/common/arena.h"
- #include "executable_semantics/common/ptr.h"
- #include "executable_semantics/ast/paren_contents.h"
- namespace Carbon {
- class ParseAndLexContext;
- } // namespace Carbon
- } // %code requires
- %code {
- // Line counter defined outside this file; the actions below read it whenever
- // they need a source line number.
- extern int yylineno;
- // Bison's error-reporting hook. The location argument is ignored; the message
- // is handed to the parse context together with the current `yylineno`.
- void Carbon::Parser::error(const location_type& /*unused*/,
-                            const std::string& message) {
-   const int line = yylineno;
-   context.PrintDiagnostic(message, line);
- }
- }  // %code
- %token <int> integer_literal  // Tokens that carry a semantic value.
- %token <std::string> identifier
- %token <std::string> sized_type_literal  // The expression rule only accepts the spelling for i32.
- %token <std::string> string_literal
- %type <std::string> designator  // From here on: semantic value types of the nonterminals.
- %type <const Declaration*> declaration
- %type <const FunctionDefinition*> function_declaration
- %type <const FunctionDefinition*> function_definition
- %type <std::list<Ptr<const Declaration>>> declaration_list
- %type <const Statement*> statement
- %type <const Statement*> if_statement
- %type <const Statement*> optional_else
- %type <std::pair<const Expression*, bool>> return_expression  // bool is true when the expression was omitted.
- %type <const Statement*> block
- %type <const Statement*> statement_list
- %type <const Expression*> expression
- %type <GenericBinding> generic_binding
- %type <std::vector<GenericBinding>> deduced_params
- %type <std::vector<GenericBinding>> deduced_param_list
- %type <const Pattern*> pattern
- %type <const Pattern*> non_expression_pattern
- %type <std::pair<const Expression*, bool>> return_type  // bool is true when no `->` clause was written.
- %type <const Expression*> paren_expression
- %type <const Expression*> tuple
- %type <std::optional<std::string>> binding_lhs  // std::nullopt for the UNDERSCORE form.
- %type <const BindingPattern*> variable_declaration
- %type <Member*> member
- %type <std::list<Member*>> member_list
- %type <ParenContents<Expression>::Element> paren_expression_element
- %type <ParenContents<Expression>> paren_expression_base
- %type <ParenContents<Expression>> paren_expression_contents
- %type <const Pattern*> paren_pattern
- %type <const TuplePattern*> tuple_pattern
- %type <const TuplePattern*> maybe_empty_tuple_pattern
- %type <ParenContents<Pattern>> paren_pattern_base
- %type <ParenContents<Pattern>::Element> paren_pattern_element
- %type <ParenContents<Pattern>> paren_pattern_contents
- %type <std::pair<std::string, const Expression*>> alternative
- %type <std::list<std::pair<std::string, const Expression*>>> alternative_list
- %type <std::pair<const Pattern*, const Statement*>*> clause  // Arena-allocated pair, passed by pointer.
- %type <std::list<std::pair<const Pattern*, const Statement*>>*> clause_list  // Arena-allocated list, passed by pointer.
- %token END_OF_FILE 0  // Token number 0 is Bison's end-of-input marker.
- %token AND  // Keyword and operator tokens without a semantic value.
- %token OR
- %token NOT
- %token STRING
- %token BOOL
- %token TYPE
- %token FN
- %token FNTY
- %token ARROW "->"
- %token FNARROW "-> in return type"  // Only referenced as a precedence tag (see return_type).
- %token VAR
- %token EQUAL_EQUAL
- %token IF
- %token ELSE
- %token WHILE
- %token CONTINUATION_TYPE
- %token CONTINUATION
- %token RUN
- %token AWAIT
- %token BREAK
- %token CONTINUE
- %token RETURN
- %token TRUE
- %token FALSE
- %token CLASS
- %token CHOICE
- %token MATCH
- %token CASE
- %token DBLARROW "=>"
- %token DEFAULT
- %token AUTO
- %token UNDERSCORE
- %token  // Punctuation tokens; the quoted alias is how the rules refer to each one.
- EQUAL "="
- MINUS "-"
- PLUS "+"
- // The lexer determines the arity and fixity of each `*` based on whitespace
- // and adjacent tokens. UNARY_STAR indicates that the operator is unary but
- // could be either prefix or postfix.
- UNARY_STAR "unary *"
- PREFIX_STAR "prefix *"
- POSTFIX_STAR "postfix *"
- BINARY_STAR "binary *"
- SLASH "/"
- LEFT_PARENTHESIS "("
- RIGHT_PARENTHESIS ")"
- LEFT_CURLY_BRACE "{"
- RIGHT_CURLY_BRACE "}"
- LEFT_SQUARE_BRACKET "["
- RIGHT_SQUARE_BRACKET "]"
- PERIOD "."
- COMMA ","
- SEMICOLON ";"
- COLON_BANG ":!"
- COLON ":"
- ;
- %precedence FNARROW  // Lowest precedence; each following declaration binds tighter.
- %precedence "{" "}"
- %precedence ":!" ":" "," DBLARROW
- %left OR AND  // OR and AND share one precedence level.
- %nonassoc EQUAL_EQUAL  // Non-associative: chained comparisons such as a == b == c are rejected.
- %left "+" "-"
- %left BINARY_STAR
- %precedence NOT UNARY_MINUS PREFIX_STAR  // UNARY_MINUS is used only as a %prec tag for unary "-".
- // We need to give the `UNARY_STAR` token a precedence, rather than overriding
- // the precedence of the `expression UNARY_STAR` rule below, because bison
- // compares the precedence of the final token (for a shift) to the precedence
- // of the other rule (for a reduce) when attempting to resolve a shift-reduce
- // conflict. See https://stackoverflow.com/a/26188429/1041090. When UNARY_STAR
- // is the final token of a rule, it must be a postfix usage, so we give it the
- // same precedence as POSTFIX_STAR.
- %precedence POSTFIX_STAR UNARY_STAR
- %left "." ARROW
- %precedence "(" ")" "[" "]"
- %start input  // Parsing begins at the `input` rule.
- %locations
- %%
- // Start symbol: the whole input is one declaration list, which is stored into
- // the `parsed_program` out-parameter.
- input:
-   declaration_list
-     { parsed_program = $1; }
- ;
- // Expressions. Operator precedence and associativity come from the %left /
- // %nonassoc / %precedence declarations in the prologue, not from the shape of
- // this rule. Nodes are allocated from `global_arena` and tagged with the
- // current `yylineno`.
- expression:
-   // Names, member access and indexing.
-   identifier
-     { $$ = global_arena->RawNew<IdentifierExpression>(yylineno, $1); }
- | expression designator
-     { $$ = global_arena->RawNew<FieldAccessExpression>(yylineno, $1, $2); }
- | expression "[" expression "]"
-     { $$ = global_arena->RawNew<IndexExpression>(yylineno, $1, $3); }
-   // Value literals.
- | integer_literal
-     { $$ = global_arena->RawNew<IntLiteral>(yylineno, $1); }
- | string_literal
-     { $$ = global_arena->RawNew<StringLiteral>(yylineno, $1); }
- | TRUE
-     { $$ = global_arena->RawNew<BoolLiteral>(yylineno, true); }
- | FALSE
-     { $$ = global_arena->RawNew<BoolLiteral>(yylineno, false); }
-   // Type literals.
- | sized_type_literal
-     {
-       // The digits after the first character must parse as an integer, and
-       // the only accepted spelling is an `i` followed by 32.
-       int bit_width;
-       CHECK(llvm::to_integer(llvm::StringRef($1).substr(1), bit_width));
-       CHECK($1[0] == 'i' && bit_width == 32)
-           << "Only i32 is supported for now: " << $1;
-       $$ = global_arena->RawNew<IntTypeLiteral>(yylineno);
-     }
- | STRING
-     { $$ = global_arena->RawNew<StringTypeLiteral>(yylineno); }
- | BOOL
-     { $$ = global_arena->RawNew<BoolTypeLiteral>(yylineno); }
- | TYPE
-     { $$ = global_arena->RawNew<TypeTypeLiteral>(yylineno); }
- | CONTINUATION_TYPE
-     { $$ = global_arena->RawNew<ContinuationTypeLiteral>(yylineno); }
- | paren_expression
-     { $$ = $1; }
-   // Binary operators.
- | expression EQUAL_EQUAL expression
-     {
-       $$ = global_arena->RawNew<PrimitiveOperatorExpression>(
-           yylineno, Operator::Eq, std::vector<const Expression*>{$1, $3});
-     }
- | expression "+" expression
-     {
-       $$ = global_arena->RawNew<PrimitiveOperatorExpression>(
-           yylineno, Operator::Add, std::vector<const Expression*>{$1, $3});
-     }
- | expression "-" expression
-     {
-       $$ = global_arena->RawNew<PrimitiveOperatorExpression>(
-           yylineno, Operator::Sub, std::vector<const Expression*>{$1, $3});
-     }
- | expression BINARY_STAR expression
-     {
-       $$ = global_arena->RawNew<PrimitiveOperatorExpression>(
-           yylineno, Operator::Mul, std::vector<const Expression*>{$1, $3});
-     }
- | expression AND expression
-     {
-       $$ = global_arena->RawNew<PrimitiveOperatorExpression>(
-           yylineno, Operator::And, std::vector<const Expression*>{$1, $3});
-     }
- | expression OR expression
-     {
-       $$ = global_arena->RawNew<PrimitiveOperatorExpression>(
-           yylineno, Operator::Or, std::vector<const Expression*>{$1, $3});
-     }
-   // Prefix operators.
- | NOT expression
-     {
-       $$ = global_arena->RawNew<PrimitiveOperatorExpression>(
-           yylineno, Operator::Not, std::vector<const Expression*>{$2});
-     }
- | "-" expression %prec UNARY_MINUS
-     {
-       $$ = global_arena->RawNew<PrimitiveOperatorExpression>(
-           yylineno, Operator::Neg, std::vector<const Expression*>{$2});
-     }
- | PREFIX_STAR expression
-     {
-       $$ = global_arena->RawNew<PrimitiveOperatorExpression>(
-           yylineno, Operator::Deref, std::vector<const Expression*>{$2});
-     }
-   // A unary `*` of undetermined fixity that precedes its operand is treated
-   // like PREFIX_STAR.
- | UNARY_STAR expression %prec PREFIX_STAR
-     {
-       $$ = global_arena->RawNew<PrimitiveOperatorExpression>(
-           yylineno, Operator::Deref, std::vector<const Expression*>{$2});
-     }
-   // Calls and postfix operators.
- | expression tuple
-     { $$ = global_arena->RawNew<CallExpression>(yylineno, $1, $2); }
- | expression POSTFIX_STAR
-     {
-       $$ = global_arena->RawNew<PrimitiveOperatorExpression>(
-           yylineno, Operator::Ptr, std::vector<const Expression*>{$1});
-     }
-   // A unary `*` of undetermined fixity that follows its operand is treated
-   // like POSTFIX_STAR.
- | expression UNARY_STAR
-     {
-       $$ = global_arena->RawNew<PrimitiveOperatorExpression>(
-           yylineno, Operator::Ptr, std::vector<const Expression*>{$1});
-     }
-   // Function type: parameter tuple plus a return type that may be omitted.
- | FNTY tuple return_type
-     {
-       $$ = global_arena->RawNew<FunctionTypeLiteral>(
-           yylineno, $2, $3.first, $3.second);
-     }
- ;
- // A member name written as `.` followed by an identifier; the value is the
- // identifier text alone.
- designator:
-   "." identifier
-     { $$ = $2; }
- ;
- // A parenthesized group in ordinary expression position; the helper
- // `ExpressionFromParenContents` turns the contents into an expression.
- paren_expression:
-   paren_expression_base
-     { $$ = ExpressionFromParenContents(yylineno, $1); }
- ;
- // A parenthesized group converted with `TupleExpressionFromParenContents`;
- // used in this grammar for call arguments, function-type parameters and
- // choice alternatives.
- tuple:
-   paren_expression_base
-     { $$ = TupleExpressionFromParenContents(yylineno, $1); }
- ;
- // One element of a parenthesized expression list: either a bare expression
- // (no name) or `.name = expression`.
- paren_expression_element:
-   expression
-     {
-       $$ = {.name = std::nullopt, .term = $1};
-     }
- | designator "=" expression
-     {
-       $$ = {.name = $1, .term = $3};
-     }
- ;
- // The parenthesized forms shared by `paren_expression` and `tuple`: empty,
- // a list, or a list followed by a trailing comma (recorded in the result).
- paren_expression_base:
-   "(" ")"
-     {
-       $$ = {.elements = {}, .has_trailing_comma = false};
-     }
- | "(" paren_expression_contents ")"
-     {
-       $$ = $2;
-     }
- | "(" paren_expression_contents "," ")"
-     {
-       $$ = $2;
-       $$.has_trailing_comma = true;
-     }
- ;
- // A non-empty, comma-separated list of expression elements, kept in source
- // order. The rule is left-recursive, so each reduction appends one element.
- paren_expression_contents:
-   paren_expression_element
-     { $$ = {.elements = {$1}, .has_trailing_comma = false}; }
- | paren_expression_contents "," paren_expression_element
-     {
-       // Take over the list built so far instead of copying it; a copy on
-       // every reduction would cost quadratic time in the list length.
-       $$ = std::move($1);
-       $$.elements.push_back($3);
-     }
- ;
- // In many cases, using `pattern` recursively will result in ambiguities.
- // When that happens, it's necessary to factor out two separate productions,
- // one for when the sub-pattern is an expression, and one for when it is not.
- // To facilitate this, non-terminals besides `pattern` whose names contain
- // `pattern` are structured to be disjoint from `expression`, unless otherwise
- // specified.
- pattern:
-   // A pattern that cannot also be read as an expression.
-   non_expression_pattern
-     { $$ = $1; }
-   // Any expression is usable as a pattern once wrapped in ExpressionPattern.
- | expression
-     { $$ = global_arena->RawNew<ExpressionPattern>($1); }
- ;
- // Patterns that are not also expressions: `auto`, a binding (`name: pattern`),
- // a parenthesized pattern, or an expression followed by a tuple pattern
- // (built as an AlternativePattern).
- non_expression_pattern:
-   AUTO
-     { $$ = global_arena->RawNew<AutoPattern>(yylineno); }
- | binding_lhs ":" pattern
-     { $$ = global_arena->RawNew<BindingPattern>(yylineno, $1, $3); }
- | paren_pattern
-     { $$ = $1; }
- | expression tuple_pattern
-     { $$ = global_arena->RawNew<AlternativePattern>(yylineno, $1, $2); }
- ;
- // Left-hand side of a binding: an identifier gives the binding its name, the
- // UNDERSCORE token gives it none (std::nullopt).
- binding_lhs:
-   identifier
-     { $$ = $1; }
- | UNDERSCORE
-     { $$ = std::nullopt; }
- ;
- // A parenthesized pattern in ordinary pattern position; the helper
- // `PatternFromParenContents` turns the contents into a pattern.
- paren_pattern:
-   paren_pattern_base
-     { $$ = PatternFromParenContents(yylineno, $1); }
- ;
- // Parenthesized pattern list, with or without a trailing comma. There is no
- // empty form here; `"(" ")"` is handled by maybe_empty_tuple_pattern.
- paren_pattern_base:
-   "(" paren_pattern_contents ")"
-     {
-       $$ = $2;
-     }
- | "(" paren_pattern_contents "," ")"
-     {
-       $$ = $2;
-       $$.has_trailing_comma = true;
-     }
- ;
- // paren_pattern is analogous to paren_expression, but in order to avoid
- // ambiguities, it must be disjoint from paren_expression, meaning it must
- // contain at least one non_expression_pattern. The structure of this rule
- // is very different from the corresponding expression rule because it has to
- // enforce that requirement.
- // A comma-separated list containing at least one non-expression pattern
- // element. Expression elements may appear before it (second alternative) or
- // after it (third alternative); they are converted to patterns so the result
- // is a uniform list in source order.
- paren_pattern_contents:
-   paren_pattern_element
-     { $$ = {.elements = {$1}, .has_trailing_comma = false }; }
- | paren_expression_contents "," paren_pattern_element
-     {
-       // Everything so far was an expression; convert the whole prefix.
-       $$ = ParenExpressionToParenPattern($1);
-       $$.elements.push_back($3);
-     }
- | paren_pattern_contents "," paren_expression_element
-     {
-       // Take over the list built so far instead of copying it on every
-       // reduction, then wrap the expression so it can sit among patterns.
-       $$ = std::move($1);
-       $$.elements.push_back({.name = $3.name, .term = global_arena->RawNew<ExpressionPattern>($3.term)});
-     }
- | paren_pattern_contents "," paren_pattern_element
-     {
-       $$ = std::move($1);
-       $$.elements.push_back($3);
-     }
- ;
- // One non-expression element of a parenthesized pattern list: either a bare
- // pattern (no name) or `.name = pattern`.
- paren_pattern_element:
-   non_expression_pattern
-     {
-       $$ = {.name = std::nullopt, .term = $1};
-     }
- | designator "=" non_expression_pattern
-     {
-       $$ = {.name = $1, .term = $3};
-     }
- ;
- // A parenthesized pattern list converted with
- // `TuplePatternFromParenContents`.
- tuple_pattern:
-   paren_pattern_base
-     { $$ = TuplePatternFromParenContents(yylineno, $1); }
- ;
- // Unlike most `pattern` nonterminals, this one overlaps with `expression`,
- // so it should be used only when prior context (such as an introducer)
- // rules out the possibility of an `expression` at this point.
- maybe_empty_tuple_pattern:
-   // `()` becomes a tuple pattern with no fields.
-   "(" ")"
-     {
-       $$ = global_arena->RawNew<TuplePattern>(
-           yylineno, std::vector<TuplePattern::Field>());
-     }
- | tuple_pattern
-     { $$ = $1; }
- ;
- // One arm of a `match`: a (pattern, statement) pair allocated in the arena.
- clause:
-   CASE pattern DBLARROW statement
-     {
-       $$ = global_arena->RawNew<std::pair<const Pattern*, const Statement*>>(
-           $2, $4);
-     }
- | DEFAULT DBLARROW statement
-     {
-       // The default arm is stored as an unnamed binding over an auto pattern.
-       auto default_pattern = global_arena->RawNew<BindingPattern>(
-           yylineno, std::nullopt, global_arena->RawNew<AutoPattern>(yylineno));
-       $$ = global_arena->RawNew<std::pair<const Pattern*, const Statement*>>(
-           default_pattern, $3);
-     }
- ;
- // Zero or more match clauses. The rule is right-recursive, so the tail list
- // exists first and each clause is pushed onto its front, which keeps source
- // order. The list itself lives in the arena and is passed by pointer.
- clause_list:
-   // Empty
-     {
-       $$ = global_arena->RawNew<
-           std::list<std::pair<const Pattern*, const Statement*>>>();
-     }
- | clause clause_list
-     {
-       $$ = $2;
-       $$->push_front(*$1);
-     }
- ;
- // Statements. Each alternative builds one arena-allocated node tagged with
- // the current `yylineno`, or forwards the node of a sub-rule.
- statement:
-   // Assignment, variable definition and expression statements.
-   expression "=" expression ";"
-     { $$ = global_arena->RawNew<Assign>(yylineno, $1, $3); }
- | VAR pattern "=" expression ";"
-     { $$ = global_arena->RawNew<VariableDefinition>(yylineno, $2, $4); }
- | expression ";"
-     { $$ = global_arena->RawNew<ExpressionStatement>(yylineno, $1); }
-   // Control flow.
- | if_statement
-     { $$ = $1; }
- | WHILE "(" expression ")" block
-     { $$ = global_arena->RawNew<While>(yylineno, $3, $5); }
- | BREAK ";"
-     { $$ = global_arena->RawNew<Break>(yylineno); }
- | CONTINUE ";"
-     { $$ = global_arena->RawNew<Continue>(yylineno); }
- | RETURN return_expression ";"
-     { $$ = global_arena->RawNew<Return>(yylineno, $2.first, $2.second); }
- | block
-     { $$ = $1; }
- | MATCH "(" expression ")" "{" clause_list "}"
-     { $$ = global_arena->RawNew<Match>(yylineno, $3, $6); }
-   // Continuations.
- | CONTINUATION identifier statement
-     { $$ = global_arena->RawNew<Continuation>(yylineno, $2, $3); }
- | RUN expression ";"
-     { $$ = global_arena->RawNew<Run>(yylineno, $2); }
- | AWAIT ";"
-     { $$ = global_arena->RawNew<Await>(yylineno); }
- ;
- // `if (condition) block` followed by an optional else part; the else part is
- // whatever optional_else produced.
- if_statement:
-   IF "(" expression ")" block optional_else
-     {
-       $$ = global_arena->RawNew<If>(yylineno, $3, $5, $6);
-     }
- ;
- // The else part of an `if`: absent (null statement pointer), another
- // if_statement for an `else if` chain, or a block.
- optional_else:
-   // Empty
-     { $$ = nullptr; }
- | ELSE if_statement
-     { $$ = $2; }
- | ELSE block
-     { $$ = $2; }
- ;
- // Operand of `return`, as a pair of the expression and a flag. With no
- // operand the expression is a fresh TupleLiteral and the flag is true;
- // otherwise the flag is false.
- return_expression:
-   // Empty
-     {
-       $$ = {global_arena->RawNew<TupleLiteral>(yylineno), true};
-     }
- | expression
-     {
-       $$ = {$1, false};
-     }
- ;
- // Zero or more statements, built as a chain of Sequence nodes: each node
- // holds one statement and the rest of the list, and the empty list is a
- // null pointer.
- statement_list:
-   // Empty
-     { $$ = nullptr; }
- | statement statement_list
-     { $$ = global_arena->RawNew<Sequence>(yylineno, $1, $2); }
- ;
- // A brace-delimited statement list wrapped in a Block node.
- block:
-   "{" statement_list "}"
-     {
-       $$ = global_arena->RawNew<Block>(yylineno, $2);
-     }
- ;
- // Return-type clause, as a pair of the type expression and a flag. With no
- // clause the expression is a fresh TupleLiteral and the flag is true;
- // with `-> expression` the flag is false.
- return_type:
-   // Empty
-     {
-       $$ = {global_arena->RawNew<TupleLiteral>(yylineno), true};
-     }
- | ARROW expression %prec FNARROW
-     {
-       $$ = {$2, false};
-     }
- ;
- // A single `name :! type` binding, as used inside a deduced-parameter list.
- generic_binding:
-   identifier ":!" expression
-     { $$ = GenericBinding({.name = std::move($1), .type = $3}); }
- ;
- // The bindings inside `[` ... `]`: possibly empty, comma-separated, and a
- // trailing comma is accepted because the tail may be empty. The result lists
- // the bindings in source order.
- deduced_param_list:
-   // Empty
-     { $$ = std::vector<GenericBinding>(); }
- | generic_binding
-     {
-       $$ = std::vector<GenericBinding>();
-       $$.push_back($1);
-     }
- | generic_binding "," deduced_param_list
-     {
-       // The rule is right-recursive, so the tail is complete before this
-       // action runs. The head binding therefore goes at the front; appending
-       // it at the back would store the bindings in reverse source order.
-       $$ = std::move($3);
-       $$.insert($$.begin(), $1);
-     }
- ;
- // Optional bracketed deduced-parameter list; when the brackets are absent the
- // result is an empty vector.
- deduced_params:
-   // Empty
-     {
-       $$ = std::vector<GenericBinding>();
-     }
- | "[" deduced_param_list "]"
-     {
-       $$ = $2;
-     }
- ;
- // A function with a body, in one of two forms: a block body with an optional
- // return-type clause, or `=> expression ;`.
- function_definition:
-   FN identifier deduced_params maybe_empty_tuple_pattern return_type block
-     {
-       // The return type expression is wrapped as a pattern; the flag from
-       // return_type is passed through unchanged.
-       $$ = global_arena->RawNew<FunctionDefinition>(
-           yylineno, $2, $3, $4,
-           global_arena->RawNew<ExpressionPattern>($5.first), $5.second, $6);
-     }
- | FN identifier deduced_params maybe_empty_tuple_pattern DBLARROW expression ";"
-     {
-       // The return type is not considered "omitted" because it's automatic
-       // from the expression.
-       // NOTE(review): the flag passed after the AutoPattern is `true`; confirm
-       // against the FunctionDefinition constructor that this matches the
-       // sentence above.
-       // The body is a single Return of the expression.
-       $$ = global_arena->RawNew<FunctionDefinition>(
-           yylineno, $2, $3, $4, global_arena->RawNew<AutoPattern>(yylineno),
-           true, global_arena->RawNew<Return>(yylineno, $6, true));
-     }
- ;
- // A function signature terminated by `;`. It is built as a
- // FunctionDefinition whose body argument is null.
- function_declaration:
-   FN identifier deduced_params maybe_empty_tuple_pattern return_type ";"
-     {
-       $$ = global_arena->RawNew<FunctionDefinition>(
-           yylineno, $2, $3, $4,
-           global_arena->RawNew<ExpressionPattern>($5.first), $5.second,
-           nullptr);
-     }
- ;
- // `name : pattern`, built as a BindingPattern. Unlike binding_lhs, the name
- // here must be an identifier.
- variable_declaration:
-   identifier ":" pattern
-     { $$ = global_arena->RawNew<BindingPattern>(yylineno, $1, $3); }
- ;
- // A class member: `var` followed by a variable declaration and `;`, built as
- // a FieldMember.
- member:
-   VAR variable_declaration ";"
-     { $$ = global_arena->RawNew<FieldMember>(yylineno, $2); }
- ;
- // Zero or more class members in source order. The rule is right-recursive,
- // so the tail list exists first and each member is pushed onto its front.
- member_list:
-   // Empty
-     { $$ = std::list<Member*>(); }
- | member member_list
-     {
-       // Take over the tail instead of copying it; copying on every reduction
-       // would cost quadratic time in the number of members.
-       $$ = std::move($2);
-       $$.push_front($1);
-     }
- ;
- // One alternative of a choice: a name paired with its parameter tuple. When
- // no tuple is written, a fresh TupleLiteral takes its place.
- alternative:
-   identifier tuple
-     {
-       $$ = {$1, $2};
-     }
- | identifier
-     {
-       $$ = {$1, global_arena->RawNew<TupleLiteral>(yylineno)};
-     }
- ;
- // The alternatives of a choice, in source order: possibly empty,
- // comma-separated, and a trailing comma is accepted because the tail may be
- // empty. The rule is right-recursive, so each alternative is pushed onto the
- // front of the tail.
- alternative_list:
-   // Empty
-     {
-       $$ = std::list<std::pair<std::string, const Expression*>>();
-     }
- | alternative
-     {
-       $$ = std::list<std::pair<std::string, const Expression*>>{$1};
-     }
- | alternative "," alternative_list
-     {
-       $$ = std::move($3);
-       $$.push_front($1);
-     }
- ;
- // Top-level declarations: functions (with or without a body), classes,
- // choices and global variables.
- declaration:
-   // Both function forms are wrapped in a FunctionDeclaration node.
-   function_definition
-     { $$ = global_arena->RawNew<FunctionDeclaration>($1); }
- | function_declaration
-     { $$ = global_arena->RawNew<FunctionDeclaration>($1); }
- | CLASS identifier "{" member_list "}"
-     { $$ = global_arena->RawNew<ClassDeclaration>(yylineno, $2, $4); }
- | CHOICE identifier "{" alternative_list "}"
-     { $$ = global_arena->RawNew<ChoiceDeclaration>(yylineno, $2, $4); }
- | VAR variable_declaration "=" expression ";"
-     { $$ = global_arena->RawNew<VariableDeclaration>(yylineno, $2, $4); }
- ;
- // Zero or more declarations in source order. The rule is right-recursive, so
- // the tail list exists first and each declaration is pushed onto its front.
- declaration_list:
-   // Empty
-     { $$ = std::list<Ptr<const Declaration>>(); }
- | declaration declaration_list
-     {
-       // Take over the tail instead of copying it; copying on every reduction
-       // would cost quadratic time in the number of declarations.
-       $$ = std::move($2);
-       $$.push_front(Ptr<const Declaration>($1));
-     }
- ;
- %%
|