parser.ypp 14 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450
  1. // Part of the Carbon Language project, under the Apache License v2.0 with LLVM
  2. // Exceptions. See /LICENSE for license information.
  3. // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
  4. // -----------------------------------------------------------------------------
  5. // Bison Configuration
  6. // -----------------------------------------------------------------------------
  7. %require "3.2"
  8. %language "c++"
  9. // We don't need a separate header for Bison locations.
  10. %define api.location.file none
  11. // Use a type-safe C++ variant for semantic values
  12. %define api.value.type variant
  // Have Bison generate a `make_<TOKEN>` constructor function for every token
  // declared below, including the end-of-input token.
  15. %define api.token.constructor
  16. // Make parse error messages more detailed
  17. %define parse.error verbose
  18. // Enable support for parser debugging
  19. %define parse.trace true
  20. //
  21. // Parameters to the parser and lexer
  22. //
  23. // Parameters to the parser are stored therein as protected data members, and
  24. // thus available to its methods.
  25. // "out" parameter passed to the parser, where the AST is written.
  26. %parse-param {std::optional<Carbon::AST>& parsed_program}
  27. // "inout" parameter passed to both the parser and the lexer.
  28. %param {Carbon::ParseAndLexContext& context}
  29. // The following shift-reduce conflicts are expected; any others should be
  30. // treated as errors:
  31. // - The "dangling else" ambiguity: `if (b) if (c) x = 1; else x = 2;`
  32. // could parse as either `if (b) { if (c) x = 1; else x = 2;}` or
  33. // `if (b) { if (c) x = 1; } else x = 2;`. Following C++, we want Carbon
  34. // to choose the first option. Resolving this by restructuring the grammar
  35. // would make it harder to read, and resolving it by assigning precedence to
  36. // `if` and `else` could mask other ambiguities, especially if we allow
  37. // `if`/`else` in expressions, so we allow Bison to resolve it through its
  38. // default behavior of preferring to shift rather than reduce.
  39. %expect 1
  40. // -----------------------------------------------------------------------------
  41. %code top {
  42. #include <algorithm>
  43. #include <cstdarg>
  44. #include <cstdio>
  45. #include <cstdlib>
  46. #include <iostream>
  47. #include <list>
  48. #include "executable_semantics/syntax/syntax_helpers.h"
  49. #include "executable_semantics/syntax/parse_and_lex_context.h"
  50. } // %code top
  51. %code requires {
  52. #include <optional>
  53. #include "executable_semantics/ast/abstract_syntax_tree.h"
  54. #include "executable_semantics/ast/declaration.h"
  55. #include "executable_semantics/ast/function_definition.h"
  56. #include "executable_semantics/syntax/paren_contents.h"
  57. namespace Carbon {
  58. class ParseAndLexContext;
  59. } // namespace Carbon
  60. } // %code requires
  %code {
  // Line counter defined outside this file (presumably maintained by the
  // lexer -- confirm against the lexer source).
  extern int yylineno;

  // Error hook called by the generated parser. The Bison-supplied location is
  // ignored; the diagnostic is reported through the shared context together
  // with the current value of `yylineno`.
  void yy::parser::error(const location_type& /*location*/,
                         const std::string& message) {
    context.PrintDiagnostic(message, yylineno);
  }
  }  // %code
  67. %token <int> integer_literal
  68. %token <char*> identifier
  69. %type <char*> designator
  70. %type <Carbon::Declaration> declaration
  71. %type <Carbon::FunctionDefinition> function_declaration
  72. %type <Carbon::FunctionDefinition> function_definition
  73. %type <std::list<Carbon::Declaration>> declaration_list
  74. %type <const Carbon::Statement*> statement
  75. %type <const Carbon::Statement*> optional_else
  76. %type <const Carbon::Statement*> statement_list
  77. %type <const Carbon::Expression*> expression
  78. %type <const Carbon::Expression*> pattern
  79. %type <const Carbon::Expression*> return_type
  80. %type <const Carbon::Expression*> paren_expression
  81. %type <const Carbon::Expression*> tuple
  82. %type <std::optional<std::string>> binding_lhs
  83. %type <Carbon::Member*> variable_declaration
  84. %type <Carbon::Member*> member
  85. %type <std::list<Carbon::Member*>> member_list
  86. %type <Carbon::FieldInitializer> field_initializer
  87. %type <Carbon::ParenContents> paren_contents
  88. %type <std::vector<Carbon::FieldInitializer>> paren_contents_without_trailing_comma
  89. %type <std::pair<std::string, const Carbon::Expression*>> alternative
  90. %type <std::list<std::pair<std::string, const Carbon::Expression*>>> alternative_list
  91. %type <std::pair<const Carbon::Expression*, const Carbon::Statement*>*> clause
  92. %type <std::list<std::pair<const Carbon::Expression*, const Carbon::Statement*>>*> clause_list
  93. %token END_OF_FILE 0
  94. %token AND
  95. %token OR
  96. %token NOT
  97. %token INT
  98. %token BOOL
  99. %token TYPE
  100. %token FN
  101. %token FNTY
  102. %token ARROW "->"
  103. %token FNARROW "-> in return type"
  104. %token VAR
  105. %token EQUAL_EQUAL
  106. %token IF
  107. %token ELSE
  108. %token WHILE
  109. %token CONTINUATION_TYPE
  110. %token CONTINUATION
  111. %token RUN
  112. %token AWAIT
  113. %token BREAK
  114. %token CONTINUE
  115. %token RETURN
  116. %token TRUE
  117. %token FALSE
  118. %token STRUCT
  119. %token CHOICE
  120. %token MATCH
  121. %token CASE
  122. %token DBLARROW "=>"
  123. %token DEFAULT
  124. %token AUTO
  125. %token UNDERSCORE
  126. %token
  127. EQUAL "="
  128. MINUS "-"
  129. PLUS "+"
  130. // The lexer determines the arity and fixity of each `*` based on whitespace
  131. // and adjacent tokens. UNARY_STAR indicates that the operator is unary but
  132. // could be either prefix or postfix.
  133. UNARY_STAR "unary *"
  134. PREFIX_STAR "prefix *"
  135. POSTFIX_STAR "postfix *"
  136. BINARY_STAR "binary *"
  137. SLASH "/"
  138. LEFT_PARENTHESIS "("
  139. RIGHT_PARENTHESIS ")"
  140. LEFT_CURLY_BRACE "{"
  141. RIGHT_CURLY_BRACE "}"
  142. LEFT_SQUARE_BRACKET "["
  143. RIGHT_SQUARE_BRACKET "]"
  144. PERIOD "."
  145. COMMA ","
  146. SEMICOLON ";"
  147. COLON ":"
  148. ;
  149. %precedence FNARROW
  150. %precedence "{" "}"
  151. %precedence ":" "," DBLARROW
  152. %left OR AND
  153. %nonassoc EQUAL_EQUAL
  154. %left "+" "-"
  155. %left BINARY_STAR
  156. %precedence NOT UNARY_MINUS PREFIX_STAR
  157. // We need to give the `UNARY_STAR` token a precedence, rather than overriding
  158. // the precedence of the `expression UNARY_STAR` rule below, because bison
  159. // compares the precedence of the final token (for a shift) to the precedence
  160. // of the other rule (for a reduce) when attempting to resolve a shift-reduce
  161. // conflict. See https://stackoverflow.com/a/26188429/1041090. When UNARY_STAR
  162. // is the final token of a rule, it must be a postfix usage, so we give it the
  163. // same precedence as POSTFIX_STAR.
  164. %precedence POSTFIX_STAR UNARY_STAR
  165. %left "." ARROW
  166. %precedence "(" ")" "[" "]"
  167. %start input
  168. %locations
  169. %%
  // Start symbol: a whole program is a list of declarations. The result is
  // handed to the caller through the `parsed_program` out-parameter.
  input:
    declaration_list[declarations]
      {
        // The semantic value is destroyed right after this action, so move
        // the list out instead of deep-copying every declaration.
        parsed_program = std::move($[declarations]);
      }
  ;
  // A pattern has exactly the same syntax as an expression; the expression
  // node is passed through unchanged.
  pattern:
    expression[inner]
      { $$ = $[inner]; }
  ;
  // Left-hand side of a binding: either a name, or `_`, which yields an empty
  // optional instead of a name.
  binding_lhs:
    identifier[name]
      { $$ = $[name]; }
  | UNDERSCORE
      { $$ = std::nullopt; }
  ;
  // Expressions. Every action passes `yylineno` to the factory function that
  // builds the node.
  expression:
    identifier[name]
      { $$ = Carbon::Expression::MakeIdentifierExpression(yylineno, $[name]); }
  | expression[object] designator[field]
      {
        $$ = Carbon::Expression::MakeFieldAccessExpression(
            yylineno, $[object], $[field]);
      }
  | expression[aggregate] "[" expression[offset] "]"
      {
        $$ = Carbon::Expression::MakeIndexExpression(
            yylineno, $[aggregate], $[offset]);
      }
  | binding_lhs[name] ":" expression[type]
      {
        $$ = Carbon::Expression::MakeBindingExpression(
            yylineno, $[name], $[type]);
      }
  // Literals and built-in type keywords.
  | integer_literal[value]
      { $$ = Carbon::Expression::MakeIntLiteral(yylineno, $[value]); }
  | TRUE
      { $$ = Carbon::Expression::MakeBoolLiteral(yylineno, true); }
  | FALSE
      { $$ = Carbon::Expression::MakeBoolLiteral(yylineno, false); }
  | INT
      { $$ = Carbon::Expression::MakeIntTypeLiteral(yylineno); }
  | BOOL
      { $$ = Carbon::Expression::MakeBoolTypeLiteral(yylineno); }
  | TYPE
      { $$ = Carbon::Expression::MakeTypeTypeLiteral(yylineno); }
  | AUTO
      { $$ = Carbon::Expression::MakeAutoTypeLiteral(yylineno); }
  | CONTINUATION_TYPE
      { $$ = Carbon::Expression::MakeContinuationTypeLiteral(yylineno); }
  | paren_expression[inner]
      { $$ = $[inner]; }
  // Binary operators.
  | expression[lhs] EQUAL_EQUAL expression[rhs]
      {
        $$ = Carbon::Expression::MakePrimitiveOperatorExpression(
            yylineno, Carbon::Operator::Eq, {$[lhs], $[rhs]});
      }
  | expression[lhs] "+" expression[rhs]
      {
        $$ = Carbon::Expression::MakePrimitiveOperatorExpression(
            yylineno, Carbon::Operator::Add, {$[lhs], $[rhs]});
      }
  | expression[lhs] "-" expression[rhs]
      {
        $$ = Carbon::Expression::MakePrimitiveOperatorExpression(
            yylineno, Carbon::Operator::Sub, {$[lhs], $[rhs]});
      }
  | expression[lhs] BINARY_STAR expression[rhs]
      {
        $$ = Carbon::Expression::MakePrimitiveOperatorExpression(
            yylineno, Carbon::Operator::Mul, {$[lhs], $[rhs]});
      }
  | expression[lhs] AND expression[rhs]
      {
        $$ = Carbon::Expression::MakePrimitiveOperatorExpression(
            yylineno, Carbon::Operator::And, {$[lhs], $[rhs]});
      }
  | expression[lhs] OR expression[rhs]
      {
        $$ = Carbon::Expression::MakePrimitiveOperatorExpression(
            yylineno, Carbon::Operator::Or, {$[lhs], $[rhs]});
      }
  // Prefix operators.
  | NOT expression[operand]
      {
        $$ = Carbon::Expression::MakePrimitiveOperatorExpression(
            yylineno, Carbon::Operator::Not, {$[operand]});
      }
  | "-" expression[operand] %prec UNARY_MINUS
      {
        $$ = Carbon::Expression::MakePrimitiveOperatorExpression(
            yylineno, Carbon::Operator::Neg, {$[operand]});
      }
  | PREFIX_STAR expression[operand]
      {
        $$ = Carbon::Expression::MakePrimitiveOperatorExpression(
            yylineno, Carbon::Operator::Deref, {$[operand]});
      }
  // A UNARY_STAR in prefix position is treated like PREFIX_STAR, including
  // its precedence.
  | UNARY_STAR expression[operand] %prec PREFIX_STAR
      {
        $$ = Carbon::Expression::MakePrimitiveOperatorExpression(
            yylineno, Carbon::Operator::Deref, {$[operand]});
      }
  // Call: an expression followed by a parenthesized argument tuple.
  | expression[callee] tuple[arguments]
      {
        $$ = Carbon::Expression::MakeCallExpression(
            yylineno, $[callee], $[arguments]);
      }
  // Postfix `*`; a UNARY_STAR in postfix position is treated like
  // POSTFIX_STAR.
  | expression[operand] POSTFIX_STAR
      {
        $$ = Carbon::Expression::MakePrimitiveOperatorExpression(
            yylineno, Carbon::Operator::Ptr, {$[operand]});
      }
  | expression[operand] UNARY_STAR
      {
        $$ = Carbon::Expression::MakePrimitiveOperatorExpression(
            yylineno, Carbon::Operator::Ptr, {$[operand]});
      }
  // Function type literal: FNTY, a parameter tuple, and an optional return
  // type.
  | FNTY tuple[parameters] return_type[result]
      {
        $$ = Carbon::Expression::MakeFunctionTypeLiteral(
            yylineno, $[parameters], $[result]);
      }
  ;
  // A member designator: `.` followed by a name. Yields the name.
  designator:
    "." identifier[name]
      { $$ = $[name]; }
  ;
  // Parenthesized contents used as an expression; the conversion is delegated
  // to ParenContents::AsExpression.
  paren_expression:
    "(" paren_contents[contents] ")"
      { $$ = $[contents].AsExpression(yylineno); }
  ;
  // Parenthesized contents that are always treated as a tuple; the conversion
  // is delegated to ParenContents::AsTuple.
  tuple:
    "(" paren_contents[contents] ")"
      { $$ = $[contents].AsTuple(yylineno); }
  ;
  // One element inside parentheses: either a bare pattern, recorded with an
  // empty field name, or `.name = pattern`.
  field_initializer:
    pattern[value]
      { $$ = Carbon::FieldInitializer({"", $[value]}); }
  | designator[name] "=" pattern[value]
      { $$ = Carbon::FieldInitializer({$[name], $[value]}); }
  ;
  // Everything between a pair of parentheses: nothing at all, or a
  // comma-separated list of field initializers with an optional trailing
  // comma. Whether a trailing comma was present is recorded in the result.
  paren_contents:
    // Empty
      { $$ = Carbon::ParenContents(); }
  | paren_contents_without_trailing_comma[fields]
      {
        $$ = Carbon::ParenContents(
            $[fields], Carbon::ParenContents::HasTrailingComma::No);
      }
  | paren_contents_without_trailing_comma[fields] ","
      {
        $$ = Carbon::ParenContents(
            $[fields], Carbon::ParenContents::HasTrailingComma::Yes);
      }
  ;
  // A non-empty, comma-separated list of field initializers, collected into a
  // vector in source order.
  paren_contents_without_trailing_comma:
    field_initializer[first]
      { $$ = {$[first]}; }
  | paren_contents_without_trailing_comma[init] "," field_initializer[next]
      {
        // Move rather than copy: the right-hand-side values are destroyed
        // after this action, and copying the accumulated vector for every
        // element would make parsing a list quadratic in its length.
        $$ = std::move($[init]);
        $$.push_back(std::move($[next]));
      }
  ;
  // One arm of a `match` statement, produced as a heap-allocated
  // (pattern, body) pair.
  clause:
    CASE pattern[pat] DBLARROW statement[body]
      {
        $$ = new std::pair<const Carbon::Expression*,
                           const Carbon::Statement*>($[pat], $[body]);
      }
  // `default` is represented as a binding named "_" with an `auto` type.
  | DEFAULT DBLARROW statement[body]
      {
        auto wildcard = Carbon::Expression::MakeBindingExpression(
            yylineno, "_", Carbon::Expression::MakeAutoTypeLiteral(yylineno));
        $$ = new std::pair<const Carbon::Expression*,
                           const Carbon::Statement*>(wildcard, $[body]);
      }
  ;
  // Zero or more `match` clauses, collected in source order into a
  // heap-allocated list.
  clause_list:
    // Empty
      {
        $$ = new std::list<
            std::pair<const Carbon::Expression*, const Carbon::Statement*>>();
      }
  | clause[head] clause_list[tail]
      {
        $$ = $[tail];
        $$->push_front(*$[head]);
        // The list now holds its own copy of the pair, so free the temporary
        // allocated by the `clause` rule; previously it was leaked.
        delete $[head];
      }
  ;
  // Statements. Every action passes `yylineno` to the factory function that
  // builds the node.
  statement:
    expression[target] "=" expression[value] ";"
      { $$ = Carbon::Statement::MakeAssign(yylineno, $[target], $[value]); }
  | VAR pattern[binding] "=" expression[init] ";"
      {
        $$ = Carbon::Statement::MakeVariableDefinition(
            yylineno, $[binding], $[init]);
      }
  | expression[value] ";"
      { $$ = Carbon::Statement::MakeExpressionStatement(yylineno, $[value]); }
  // The optional `else` is the source of the single expected shift-reduce
  // conflict (dangling else), resolved by Bison's default shift.
  | IF "(" expression[condition] ")" statement[then_branch]
    optional_else[else_branch]
      {
        $$ = Carbon::Statement::MakeIf(
            yylineno, $[condition], $[then_branch], $[else_branch]);
      }
  | WHILE "(" expression[condition] ")" statement[body]
      { $$ = Carbon::Statement::MakeWhile(yylineno, $[condition], $[body]); }
  | BREAK ";"
      { $$ = Carbon::Statement::MakeBreak(yylineno); }
  | CONTINUE ";"
      { $$ = Carbon::Statement::MakeContinue(yylineno); }
  | RETURN expression[value] ";"
      { $$ = Carbon::Statement::MakeReturn(yylineno, $[value]); }
  | "{" statement_list[body] "}"
      { $$ = Carbon::Statement::MakeBlock(yylineno, $[body]); }
  | MATCH "(" expression[subject] ")" "{" clause_list[clauses] "}"
      { $$ = Carbon::Statement::MakeMatch(yylineno, $[subject], $[clauses]); }
  | CONTINUATION identifier[name] statement[body]
      { $$ = Carbon::Statement::MakeContinuation(yylineno, $[name], $[body]); }
  | RUN expression[target] ";"
      { $$ = Carbon::Statement::MakeRun(yylineno, $[target]); }
  | AWAIT ";"
      { $$ = Carbon::Statement::MakeAwait(yylineno); }
  ;
  // Optional `else` branch of an `if`; a null statement pointer when absent.
  optional_else:
    // Empty
      { $$ = nullptr; }
  | ELSE statement[body]
      { $$ = $[body]; }
  ;
  // Zero or more statements, built as a chain of sequence nodes. The empty
  // list, and therefore the end of every chain, is a null statement pointer.
  statement_list:
    // Empty
      { $$ = nullptr; }
  | statement[first] statement_list[rest]
      { $$ = Carbon::Statement::MakeSequence(yylineno, $[first], $[rest]); }
  ;
  // Optional `-> type` suffix. When omitted, the result is a tuple literal
  // built from an empty element list.
  return_type:
    // Empty
      { $$ = Carbon::Expression::MakeTupleLiteral(yylineno, {}); }
  | ARROW expression[type] %prec FNARROW
      { $$ = $[type]; }
  ;
  // A function with a body, in one of two forms:
  //   fn name(params) [-> type] { statements }
  //   fn name(params) => expression;
  // The second form gets an `auto` return type and a body made of a single
  // `return` of the expression.
  function_definition:
    FN identifier[name] tuple[params] return_type[ret]
    "{" statement_list[body] "}"
      {
        $$ = Carbon::FunctionDefinition(
            yylineno, $[name], $[params], $[ret], $[body]);
      }
  | FN identifier[name] tuple[params] DBLARROW expression[result] ";"
      {
        $$ = Carbon::FunctionDefinition(
            yylineno, $[name], $[params],
            Carbon::Expression::MakeAutoTypeLiteral(yylineno),
            Carbon::Statement::MakeReturn(yylineno, $[result]));
      }
  ;
  // A function signature terminated by `;`. It is represented as a
  // FunctionDefinition whose body is a null pointer.
  function_declaration:
    FN identifier[name] tuple[params] return_type[ret] ";"
      {
        $$ = Carbon::FunctionDefinition(
            yylineno, $[name], $[params], $[ret], nullptr);
      }
  ;
  // `name: expression`, built as a field member.
  variable_declaration:
    identifier[name] ":" expression[type]
      { $$ = Carbon::Member::MakeFieldMember(yylineno, $[name], $[type]); }
  ;
  // A struct member: `var name: expression;`.
  member:
    VAR variable_declaration[field] ";"
      { $$ = $[field]; }
  ;
  // Zero or more struct members, collected in source order.
  member_list:
    // Empty
      { $$ = std::list<Carbon::Member*>(); }
  | member[head] member_list[tail]
      {
        // Move the tail instead of copying it once per member; the
        // `alternative_list` rule already builds its list this way.
        $$ = std::move($[tail]);
        $$.push_front($[head]);
      }
  ;
  // One alternative of a `choice`: a name with an optional parameter tuple.
  // A bare name is paired with a tuple literal built from an empty list.
  alternative:
    identifier[name] tuple[params]
      {
        $$ = std::pair<std::string, const Carbon::Expression*>(
            $[name], $[params]);
      }
  | identifier[name]
      {
        $$ = std::pair<std::string, const Carbon::Expression*>(
            $[name], Carbon::Expression::MakeTupleLiteral(yylineno, {}));
      }
  ;
  // Comma-separated alternatives of a `choice`, collected in source order.
  // Because the list after a comma may be empty, a trailing comma is accepted.
  alternative_list:
    // Empty
      { $$ = std::list<std::pair<std::string, const Carbon::Expression*>>(); }
  | alternative[only]
      {
        $$ = std::list<std::pair<std::string, const Carbon::Expression*>>();
        $$.push_front($[only]);
      }
  | alternative[head] "," alternative_list[tail]
      {
        $$ = std::move($[tail]);
        $$.push_front($[head]);
      }
  ;
  // Top-level declarations: functions (with or without a body), structs,
  // choices, and initialized variables.
  declaration:
    function_definition[fn]
      { $$ = Carbon::Declaration::MakeFunctionDeclaration(std::move($[fn])); }
  | function_declaration[fn]
      { $$ = Carbon::Declaration::MakeFunctionDeclaration(std::move($[fn])); }
  | STRUCT identifier[name] "{" member_list[members] "}"
      {
        $$ = Carbon::Declaration::MakeStructDeclaration(
            yylineno, $[name], $[members]);
      }
  | CHOICE identifier[name] "{" alternative_list[alternatives] "}"
      {
        $$ = Carbon::Declaration::MakeChoiceDeclaration(
            yylineno, $[name], $[alternatives]);
      }
  // The `name: type` part is parsed as a field member; only its name and
  // type are forwarded to the variable declaration.
  | VAR variable_declaration[field] "=" expression[init] ";"
      {
        $$ = Carbon::Declaration::MakeVariableDeclaration(
            yylineno, $[field]->GetFieldMember().name,
            $[field]->GetFieldMember().type, $[init]);
      }
  ;
  // Zero or more top-level declarations, collected in source order.
  declaration_list:
    // Empty
      { $$ = std::list<Carbon::Declaration>(); }
  | declaration[head] declaration_list[tail]
      {
        // Move instead of copy: copying the accumulated list for every
        // declaration made parsing quadratic in the number of declarations.
        // The right-hand-side values are destroyed after this action.
        $$ = std::move($[tail]);
        $$.push_front(std::move($[head]));
      }
  ;
  425. %%