| 123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158 |
- // Part of the Carbon Language project, under the Apache License v2.0 with LLVM
- // Exceptions. See /LICENSE for license information.
- // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
- #ifndef CARBON_TOOLCHAIN_LEX_TOKEN_KIND_H_
- #define CARBON_TOOLCHAIN_LEX_TOKEN_KIND_H_
- #include <cstdint>
- #include "common/check.h"
- #include "common/enum_base.h"
- #include "llvm/ADT/ArrayRef.h"
- #include "llvm/ADT/StringRef.h"
- #include "llvm/Support/FormatVariadicDetails.h"
- namespace Carbon::Lex {
- CARBON_DEFINE_RAW_ENUM_CLASS(TokenKind, uint8_t) {
- #define CARBON_TOKEN(TokenName) CARBON_RAW_ENUM_ENUMERATOR(TokenName)
- #include "toolchain/lex/token_kind.def"
- };
- class TokenKind : public CARBON_ENUM_BASE(TokenKind) {
- public:
- #define CARBON_TOKEN(TokenName) CARBON_ENUM_CONSTANT_DECL(TokenName)
- #include "toolchain/lex/token_kind.def"
- // An array of all the keyword tokens.
- static const llvm::ArrayRef<TokenKind> KeywordTokens;
- using EnumBase::EnumBase;
- // Permit creation from RawEnumType for templates.
- using EnumBase::Make;
- // Permit conversion to integer for use as an array index.
- using EnumBase::AsInt;
- // Test whether this kind of token is a simple symbol sequence (punctuation,
- // not letters) that appears directly in the source text and can be
- // unambiguously lexed with `starts_with` logic. While these may appear
- // inside of other tokens, outside of the contents of other tokens they
- // don't require any specific characters before or after to distinguish them
- // in the source. Returns false otherwise.
- auto is_symbol() const -> bool { return IsSymbol[AsInt()]; }
- // Test whether this kind of token is a grouping symbol (part of an opening
- // and closing pair that must always be matched in the token stream).
- auto is_grouping_symbol() const -> bool { return IsGroupingSymbol[AsInt()]; }
- // Test whether this kind of token is an opening symbol for a group.
- auto is_opening_symbol() const -> bool { return IsOpeningSymbol[AsInt()]; }
- // Returns the associated closing symbol for an opening symbol.
- //
- // The token kind must be an opening symbol.
- auto closing_symbol() const -> TokenKind {
- auto result = ClosingSymbol[AsInt()];
- CARBON_DCHECK(result != Error, "Only opening symbols are valid!");
- return result;
- }
- // Test whether this kind of token is a closing symbol for a group.
- auto is_closing_symbol() const -> bool { return IsClosingSymbol[AsInt()]; }
- // Returns the associated opening symbol for a closing symbol.
- //
- // The token kind must be a closing symbol.
- auto opening_symbol() const -> TokenKind {
- auto result = OpeningSymbol[AsInt()];
- CARBON_DCHECK(result != Error, "Only closing symbols are valid!");
- return result;
- }
- // Test whether this kind of token is a one-character symbol whose character
- // is not part of any other symbol.
- auto is_one_char_symbol() const -> bool { return IsOneCharSymbol[AsInt()]; }
- // Test whether this kind of token is a keyword.
- auto is_keyword() const -> bool { return IsKeyword[AsInt()]; }
- // Test whether this kind of token is a sized type literal.
- auto is_sized_type_literal() const -> bool {
- return *this == TokenKind::IntTypeLiteral ||
- *this == TokenKind::UnsignedIntTypeLiteral ||
- *this == TokenKind::FloatTypeLiteral;
- }
- // If this token kind has a fixed spelling when in source code, returns it.
- // Otherwise returns an empty string.
- auto fixed_spelling() const -> llvm::StringLiteral {
- return FixedSpelling[AsInt()];
- }
- // Get the expected number of parse tree nodes that will be created for this
- // token.
- auto expected_max_parse_tree_size() const -> int {
- return ExpectedParseTreeSize[AsInt()];
- }
- // Test whether this token kind is in the provided list.
- auto IsOneOf(std::initializer_list<TokenKind> kinds) const -> bool {
- for (TokenKind kind : kinds) {
- if (*this == kind) {
- return true;
- }
- }
- return false;
- }
- private:
- static const TokenKind KeywordTokensStorage[];
- static const bool IsSymbol[];
- static const bool IsGroupingSymbol[];
- static const bool IsOpeningSymbol[];
- static const TokenKind ClosingSymbol[];
- static const bool IsClosingSymbol[];
- static const TokenKind OpeningSymbol[];
- static const bool IsOneCharSymbol[];
- static const bool IsKeyword[];
- static const llvm::StringLiteral FixedSpelling[];
- static const int8_t ExpectedParseTreeSize[];
- };
- #define CARBON_TOKEN(TokenName) \
- CARBON_ENUM_CONSTANT_DEFINITION(TokenKind, TokenName)
- #include "toolchain/lex/token_kind.def"
- inline constexpr TokenKind TokenKind::KeywordTokensStorage[] = {
- #define CARBON_KEYWORD_TOKEN(TokenName, Spelling) TokenKind::TokenName,
- #include "toolchain/lex/token_kind.def"
- };
- inline constexpr llvm::ArrayRef<TokenKind> TokenKind::KeywordTokens =
- KeywordTokensStorage;
- } // namespace Carbon::Lex
- // We use formatv primarily for diagnostics. In these cases, it's expected that
- // the spelling in source code should be used.
- template <>
- struct llvm::format_provider<Carbon::Lex::TokenKind> {
- static void format(const Carbon::Lex::TokenKind& kind, raw_ostream& out,
- StringRef /*style*/) {
- auto spelling = kind.fixed_spelling();
- if (!spelling.empty()) {
- out << spelling;
- } else {
- // Default to the name if there's no fixed spelling.
- out << kind;
- }
- }
- };
- #endif // CARBON_TOOLCHAIN_LEX_TOKEN_KIND_H_
|