parser.ypp 14 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452
  1. // Part of the Carbon Language project, under the Apache License v2.0 with LLVM
  2. // Exceptions. See /LICENSE for license information.
  3. // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
  4. // -----------------------------------------------------------------------------
  5. // Bison Configuration
  6. // -----------------------------------------------------------------------------
  7. %require "3.2"
  8. %language "c++"
  9. // We don't need a separate header for Bison locations.
  10. %define api.location.file none
  11. // Use a type-safe C++ variant for semantic values
  12. %define api.value.type variant
// Have Bison generate a type-safe `make_<TOKEN>` constructor for every token
// declared below (for example `make_identifier`), including
// `make_END_OF_FILE` for the end of input.
  15. %define api.token.constructor
  16. // Make parse error messages more detailed
  17. %define parse.error verbose
  18. // Enable support for parser debugging
  19. %define parse.trace true
  20. //
  21. // Parameters to the parser and lexer
  22. //
  23. // Parameters to the parser are stored therein as protected data members, and
  24. // thus available to its methods.
  25. // "out" parameter passed to the parser, where the AST is written.
  26. %parse-param {std::optional<Carbon::AST>& parsed_program}
  27. // "inout" parameter passed to both the parser and the lexer.
  28. %param {Carbon::ParseAndLexContext& context}
  29. // The following shift-reduce conflicts are expected; any others should be
  30. // treated as errors:
  31. // - The "dangling else" ambiguity: `if (b) if (c) x = 1; else x = 2;`
  32. // could parse as either `if (b) { if (c) x = 1; else x = 2;}` or
  33. // `if (b) { if (c) x = 1; } else x = 2;`. Following C++, we want Carbon
  34. // to choose the first option. Resolving this by restructuring the grammar
  35. // would make it harder to read, and resolving it by assigning precedence to
  36. // `if` and `else` could mask other ambiguities, especially if we allow
  37. // `if`/`else` in expressions, so we allow Bison to resolve it through its
  38. // default behavior of preferring to shift rather than reduce.
  39. %expect 1
  40. // -----------------------------------------------------------------------------
  41. %code top {
  42. #include <algorithm>
  43. #include <cstdarg>
  44. #include <cstdio>
  45. #include <cstdlib>
  46. #include <iostream>
  47. #include <list>
  48. #include "executable_semantics/syntax/syntax_helpers.h"
  49. #include "executable_semantics/syntax/parse_and_lex_context.h"
  50. }
  51. %code requires {
  52. #include <optional>
  53. #include "executable_semantics/ast/abstract_syntax_tree.h"
  54. #include "executable_semantics/ast/declaration.h"
  55. #include "executable_semantics/ast/function_definition.h"
  56. #include "executable_semantics/syntax/paren_contents.h"
  57. namespace Carbon {
  58. class ParseAndLexContext;
  59. }
  60. }
  61. %code {
  62. extern int yylineno;
  63. void yy::parser::error(
  64. const location_type&, const std::string& message)
  65. {
  66. context.PrintDiagnostic(message, yylineno);
  67. }
  68. }
  69. %token <int> integer_literal
  70. %token <char*> identifier
  71. %type <char*> designator
  72. %type <Carbon::Declaration> declaration
  73. %type <Carbon::FunctionDefinition> function_declaration
  74. %type <Carbon::FunctionDefinition> function_definition
  75. %type <std::list<Carbon::Declaration>> declaration_list
  76. %type <const Carbon::Statement*> statement
  77. %type <const Carbon::Statement*> optional_else
  78. %type <const Carbon::Statement*> statement_list
  79. %type <const Carbon::Expression*> expression
  80. %type <const Carbon::Expression*> pattern
  81. %type <const Carbon::Expression*> return_type
  82. %type <const Carbon::Expression*> paren_expression
  83. %type <const Carbon::Expression*> tuple
  84. %type <std::optional<std::string>> binding_lhs
  85. %type <Carbon::Member*> variable_declaration
  86. %type <Carbon::Member*> member
  87. %type <std::list<Carbon::Member*>> member_list
  88. %type <Carbon::FieldInitializer> field_initializer
  89. %type <Carbon::ParenContents> paren_contents
  90. %type <std::vector<Carbon::FieldInitializer>> paren_contents_without_trailing_comma
  91. %type <std::pair<std::string, const Carbon::Expression*>> alternative
  92. %type <std::list<std::pair<std::string, const Carbon::Expression*>>> alternative_list
  93. %type <std::pair<const Carbon::Expression*, const Carbon::Statement*>*> clause
  94. %type <std::list<std::pair<const Carbon::Expression*, const Carbon::Statement*>>*> clause_list
  95. %token END_OF_FILE 0
  96. %token AND
  97. %token OR
  98. %token NOT
  99. %token INT
  100. %token BOOL
  101. %token TYPE
  102. %token FN
  103. %token FNTY
  104. %token ARROW "->"
  105. %token FNARROW "-> in return type"
  106. %token VAR
  107. %token EQUAL_EQUAL
  108. %token IF
  109. %token ELSE
  110. %token WHILE
  111. %token CONTINUATION_TYPE
  112. %token CONTINUATION
  113. %token RUN
  114. %token AWAIT
  115. %token BREAK
  116. %token CONTINUE
  117. %token RETURN
  118. %token TRUE
  119. %token FALSE
  120. %token STRUCT
  121. %token CHOICE
  122. %token MATCH
  123. %token CASE
  124. %token DBLARROW "=>"
  125. %token DEFAULT
  126. %token AUTO
  127. %token UNDERSCORE
  128. %token
  129. EQUAL "="
  130. MINUS "-"
  131. PLUS "+"
  132. // The lexer determines the arity and fixity of each `*` based on whitespace
  133. // and adjacent tokens. UNARY_STAR indicates that the operator is unary but
  134. // could be either prefix or postfix.
  135. UNARY_STAR "unary *"
  136. PREFIX_STAR "prefix *"
  137. POSTFIX_STAR "postfix *"
  138. BINARY_STAR "binary *"
  139. SLASH "/"
  140. LEFT_PARENTHESIS "("
  141. RIGHT_PARENTHESIS ")"
  142. LEFT_CURLY_BRACE "{"
  143. RIGHT_CURLY_BRACE "}"
  144. LEFT_SQUARE_BRACKET "["
  145. RIGHT_SQUARE_BRACKET "]"
  146. PERIOD "."
  147. COMMA ","
  148. SEMICOLON ";"
  149. COLON ":"
  150. ;
  151. %precedence FNARROW
  152. %precedence "{" "}"
  153. %precedence ":" "," DBLARROW
  154. %left OR AND
  155. %nonassoc EQUAL_EQUAL
  156. %left "+" "-"
  157. %left BINARY_STAR
  158. %precedence NOT UNARY_MINUS PREFIX_STAR
  159. // We need to give the `UNARY_STAR` token a precedence, rather than overriding
  160. // the precedence of the `expression UNARY_STAR` rule below, because bison
  161. // compares the precedence of the final token (for a shift) to the precedence
  162. // of the other rule (for a reduce) when attempting to resolve a shift-reduce
  163. // conflict. See https://stackoverflow.com/a/26188429/1041090. When UNARY_STAR
  164. // is the final token of a rule, it must be a postfix usage, so we give it the
  165. // same precedence as POSTFIX_STAR.
  166. %precedence POSTFIX_STAR UNARY_STAR
  167. %left "." ARROW
  168. %precedence "(" ")" "[" "]"
  169. %start input
  170. %locations
  171. %%
  172. input: declaration_list
  173. { parsed_program = $1; }
  174. ;
  175. pattern:
  176. expression
  177. { $$ = $1; }
  178. ;
  179. binding_lhs:
  180. identifier { $$ = $1; }
  181. | UNDERSCORE { $$ = std::nullopt; }
  182. ;
  183. expression:
  184. identifier
  185. { $$ = Carbon::Expression::MakeIdentifierExpression(yylineno, $1); }
  186. | expression designator
  187. { $$ = Carbon::Expression::MakeFieldAccessExpression(yylineno, $1, $2); }
  188. | expression "[" expression "]"
  189. { $$ = Carbon::Expression::MakeIndexExpression(yylineno, $1, $3); }
  190. | binding_lhs ":" expression
  191. {
  192. $$ = Carbon::Expression::MakeBindingExpression(yylineno, $1, $3);
  193. }
  194. | integer_literal
  195. { $$ = Carbon::Expression::MakeIntLiteral(yylineno, $1); }
  196. | TRUE
  197. { $$ = Carbon::Expression::MakeBoolLiteral(yylineno, true); }
  198. | FALSE
  199. { $$ = Carbon::Expression::MakeBoolLiteral(yylineno, false); }
  200. | INT
  201. { $$ = Carbon::Expression::MakeIntTypeLiteral(yylineno); }
  202. | BOOL
  203. { $$ = Carbon::Expression::MakeBoolTypeLiteral(yylineno); }
  204. | TYPE
  205. { $$ = Carbon::Expression::MakeTypeTypeLiteral(yylineno); }
  206. | AUTO
  207. { $$ = Carbon::Expression::MakeAutoTypeLiteral(yylineno); }
  208. | CONTINUATION_TYPE
  209. { $$ = Carbon::Expression::MakeContinuationTypeLiteral(yylineno); }
  210. | paren_expression { $$ = $1; }
  211. | expression EQUAL_EQUAL expression
  212. { $$ = Carbon::Expression::MakePrimitiveOperatorExpression(
  213. yylineno, Carbon::Operator::Eq, {$1, $3}); }
  214. | expression "+" expression
  215. { $$ = Carbon::Expression::MakePrimitiveOperatorExpression(
  216. yylineno, Carbon::Operator::Add, {$1, $3}); }
  217. | expression "-" expression
  218. { $$ = Carbon::Expression::MakePrimitiveOperatorExpression(
  219. yylineno, Carbon::Operator::Sub, {$1, $3}); }
  220. | expression BINARY_STAR expression
  221. { $$ = Carbon::Expression::MakePrimitiveOperatorExpression(
  222. yylineno, Carbon::Operator::Mul, {$1, $3}); }
  223. | expression AND expression
  224. { $$ = Carbon::Expression::MakePrimitiveOperatorExpression(
  225. yylineno, Carbon::Operator::And, {$1, $3}); }
  226. | expression OR expression
  227. { $$ = Carbon::Expression::MakePrimitiveOperatorExpression(
  228. yylineno, Carbon::Operator::Or, {$1, $3}); }
  229. | NOT expression
  230. { $$ = Carbon::Expression::MakePrimitiveOperatorExpression(
  231. yylineno, Carbon::Operator::Not, {$2}); }
  232. | "-" expression %prec UNARY_MINUS
  233. { $$ = Carbon::Expression::MakePrimitiveOperatorExpression(
  234. yylineno, Carbon::Operator::Neg, {$2}); }
  235. | PREFIX_STAR expression
  236. { $$ = Carbon::Expression::MakePrimitiveOperatorExpression(
  237. yylineno, Carbon::Operator::Deref, {$2}); }
  238. | UNARY_STAR expression %prec PREFIX_STAR
  239. { $$ = Carbon::Expression::MakePrimitiveOperatorExpression(
  240. yylineno, Carbon::Operator::Deref, {$2}); }
  241. | expression tuple
  242. { $$ = Carbon::Expression::MakeCallExpression(yylineno, $1, $2); }
  243. | expression POSTFIX_STAR
  244. { $$ = Carbon::Expression::MakePrimitiveOperatorExpression(
  245. yylineno, Carbon::Operator::Ptr, {$1}); }
  246. | expression UNARY_STAR
  247. { $$ = Carbon::Expression::MakePrimitiveOperatorExpression(
  248. yylineno, Carbon::Operator::Ptr, {$1}); }
  249. | FNTY tuple return_type
  250. { $$ = Carbon::Expression::MakeFunctionTypeLiteral(yylineno, $2, $3); }
  251. ;
  252. designator: "." identifier { $$ = $2; }
  253. ;
  254. paren_expression: "(" paren_contents ")"
  255. { $$ = $2.AsExpression(yylineno); }
  256. ;
  257. tuple: "(" paren_contents ")"
  258. { $$ = $2.AsTuple(yylineno); }
  259. ;
  260. field_initializer:
  261. pattern
  262. { $$ = Carbon::FieldInitializer({"", $1}); }
  263. | designator "=" pattern
  264. { $$ = Carbon::FieldInitializer({$1, $3}); }
  265. ;
  266. paren_contents:
  267. // Empty
  268. { $$ = Carbon::ParenContents(); }
  269. | paren_contents_without_trailing_comma
  270. {
  271. $$ = Carbon::ParenContents($1,
  272. Carbon::ParenContents::HasTrailingComma::No);
  273. }
  274. | paren_contents_without_trailing_comma ","
  275. {
  276. $$ = Carbon::ParenContents($1,
  277. Carbon::ParenContents::HasTrailingComma::Yes);
  278. }
  279. ;
  280. paren_contents_without_trailing_comma:
  281. field_initializer
  282. { $$ = {$1}; }
  283. | paren_contents_without_trailing_comma "," field_initializer
  284. {
  285. $$ = $1;
  286. $$.push_back($3);
  287. }
  288. ;
  289. clause:
  290. CASE pattern DBLARROW statement
  291. { $$ = new std::pair<const Carbon::Expression*, const Carbon::Statement*>($2, $4); }
  292. | DEFAULT DBLARROW statement
  293. {
  294. auto vp = Carbon::Expression::MakeBindingExpression(
  295. yylineno, "_", Carbon::Expression::MakeAutoTypeLiteral(yylineno));
  296. $$ = new std::pair<const Carbon::Expression*, const Carbon::Statement*>(vp, $3);
  297. }
  298. ;
  299. clause_list:
  300. // Empty
  301. {
  302. $$ = new std::list<std::pair<const Carbon::Expression*, const Carbon::Statement*>>();
  303. }
  304. | clause clause_list
  305. { $$ = $2; $$->push_front(*$1); }
  306. ;
  307. statement:
  308. expression "=" expression ";"
  309. { $$ = Carbon::Statement::MakeAssign(yylineno, $1, $3); }
  310. | VAR pattern "=" expression ";"
  311. { $$ = Carbon::Statement::MakeVariableDefinition(yylineno, $2, $4); }
  312. | expression ";"
  313. { $$ = Carbon::Statement::MakeExpressionStatement(yylineno, $1); }
  314. | IF "(" expression ")" statement optional_else
  315. { $$ = Carbon::Statement::MakeIf(yylineno, $3, $5, $6); }
  316. | WHILE "(" expression ")" statement
  317. { $$ = Carbon::Statement::MakeWhile(yylineno, $3, $5); }
  318. | BREAK ";"
  319. { $$ = Carbon::Statement::MakeBreak(yylineno); }
  320. | CONTINUE ";"
  321. { $$ = Carbon::Statement::MakeContinue(yylineno); }
  322. | RETURN expression ";"
  323. { $$ = Carbon::Statement::MakeReturn(yylineno, $2); }
  324. | "{" statement_list "}"
  325. { $$ = Carbon::Statement::MakeBlock(yylineno, $2); }
  326. | MATCH "(" expression ")" "{" clause_list "}"
  327. { $$ = Carbon::Statement::MakeMatch(yylineno, $3, $6); }
  328. | CONTINUATION identifier statement
  329. { $$ = Carbon::Statement::MakeContinuation(yylineno, $2, $3); }
  330. | RUN expression ";"
  331. { $$ = Carbon::Statement::MakeRun(yylineno, $2); }
  332. | AWAIT ";"
  333. { $$ = Carbon::Statement::MakeAwait(yylineno); }
  334. ;
  335. optional_else:
  336. // Empty
  337. { $$ = 0; }
  338. | ELSE statement { $$ = $2; }
  339. ;
  340. statement_list:
  341. // Empty
  342. { $$ = 0; }
  343. | statement statement_list
  344. { $$ = Carbon::Statement::MakeSequence(yylineno, $1, $2); }
  345. ;
  346. return_type:
  347. // Empty
  348. { $$ = Carbon::Expression::MakeTupleLiteral(yylineno, {}); }
  349. | ARROW expression %prec FNARROW
  350. { $$ = $2; }
  351. ;
  352. function_definition:
  353. FN identifier tuple return_type "{" statement_list "}"
  354. { $$ = Carbon::FunctionDefinition(yylineno, $2, $3, $4, $6); }
  355. | FN identifier tuple DBLARROW expression ";"
  356. {
  357. $$ = Carbon::FunctionDefinition(
  358. yylineno, $2, $3,
  359. Carbon::Expression::MakeAutoTypeLiteral(yylineno),
  360. Carbon::Statement::MakeReturn(yylineno, $5));
  361. }
  362. ;
  363. function_declaration:
  364. FN identifier tuple return_type ";"
  365. { $$ = Carbon::FunctionDefinition(yylineno, $2, $3, $4, 0); }
  366. ;
  367. variable_declaration: identifier ":" expression
  368. { $$ = Carbon::Member::MakeFieldMember(yylineno, $1, $3); }
  369. ;
  370. member: VAR variable_declaration ";"
  371. { $$ = $2; }
  372. ;
  373. member_list:
  374. // Empty
  375. { $$ = std::list<Carbon::Member*>(); }
  376. | member member_list
  377. { $$ = $2; $$.push_front($1); }
  378. ;
  379. alternative:
  380. identifier tuple
  381. { $$ = std::pair<std::string, const Carbon::Expression*>($1, $2); }
  382. | identifier
  383. {
  384. $$ = std::pair<std::string, const Carbon::Expression*>(
  385. $1, Carbon::Expression::MakeTupleLiteral(yylineno, {}));
  386. }
  387. ;
  388. alternative_list:
  389. // Empty
  390. { $$ = std::list<std::pair<std::string, const Carbon::Expression*>>(); }
  391. | alternative
  392. {
  393. $$ = std::list<std::pair<std::string, const Carbon::Expression*>>();
  394. $$.push_front($1);
  395. }
  396. | alternative "," alternative_list
  397. { $$ = std::move($3); $$.push_front($1); }
  398. ;
  399. declaration:
  400. function_definition
  401. { $$ = Carbon::Declaration::MakeFunctionDeclaration(std::move($1)); }
  402. | function_declaration
  403. { $$ = Carbon::Declaration::MakeFunctionDeclaration(std::move($1)); }
  404. | STRUCT identifier "{" member_list "}"
  405. {
  406. $$ = Carbon::Declaration::MakeStructDeclaration(yylineno, $2, $4);
  407. }
  408. | CHOICE identifier "{" alternative_list "}"
  409. {
  410. $$ = Carbon::Declaration::MakeChoiceDeclaration(yylineno, $2, $4);
  411. }
  412. | VAR variable_declaration "=" expression ";"
  413. {
  414. $$ = Carbon::Declaration::MakeVariableDeclaration(
  415. yylineno, $2->GetFieldMember().name, $2->GetFieldMember().type, $4);
  416. }
  417. ;
  418. declaration_list:
  419. // Empty
  420. { $$ = std::list<Carbon::Declaration>(); }
  421. | declaration declaration_list
  422. {
  423. $$ = $2;
  424. $$.push_front($1);
  425. }
  426. ;
  427. %%