Files
swift-mirror/include/swift/Parse/Token.h
Anthony Latsis 06a5670c8f Basic: Untie swift::SourceLoc from llvm::SMLoc
Storing a `llvm::SMLoc` is a superfluous indirection, and getting rid of
it enables us to unconditionally import `SourceLoc` into Swift.
2025-07-11 18:48:42 +01:00

353 lines
10 KiB
C++

//===--- Token.h - Token interface ------------------------------*- C++ -*-===//
//
// This source file is part of the Swift.org open source project
//
// Copyright (c) 2014 - 2025 Apple Inc. and the Swift project authors
// Licensed under Apache License v2.0 with Runtime Library Exception
//
// See https://swift.org/LICENSE.txt for license information
// See https://swift.org/CONTRIBUTORS.txt for the list of Swift project authors
//
//===----------------------------------------------------------------------===//
//
// This file defines the Token interface.
//
//===----------------------------------------------------------------------===//
#ifndef SWIFT_TOKEN_H
#define SWIFT_TOKEN_H
#include "swift/Basic/SourceLoc.h"
#include "swift/Basic/LLVM.h"
#include "swift/Config.h"
#include "llvm/ADT/StringRef.h"
#include "llvm/ADT/StringSwitch.h"
namespace swift {
/// Enumerates the kinds of token, using a one-byte (uint8_t) underlying type.
///
/// The enumerators are not spelled out here: TOKEN(X) is defined to expand to
/// `X,` and "swift/AST/TokenKinds.def" is then included inside the enum body,
/// so the list of kinds is whatever that file produces through TOKEN.
// NOTE(review): presumably TokenKinds.def invokes TOKEN once per kind and
// #undefs the macro when it is done -- confirm against that file.
enum class tok : uint8_t {
#define TOKEN(X) X,
#include "swift/AST/TokenKinds.def"
// Trailing enumerator placed after everything the .def file generates.
// Presumably its value equals the number of generated kinds (true as long as
// the .def assigns no explicit values) -- TODO confirm.
NUM_TOKENS
};
/// If a token kind has determined text, return the text; otherwise assert.
///
/// \param kind The token kind whose text is requested.
///
/// This header only declares the function; its definition is not visible
/// here.
StringRef getTokenText(tok kind);
/// Token - This structure provides full information about a lexed token.
/// It is not intended to be space efficient, it is intended to return as much
/// information as possible about each returned token.  This is expected to be
/// compressed into a smaller form if memory footprint is important.
///
class Token {
  /// Kind - The actual flavor of token this is.
  ///
  tok Kind;

  /// Whether this token is the first token on the line.
  unsigned AtStartOfLine : 1;

  /// Whether this token is an escaped `identifier` token.
  unsigned EscapedIdentifier : 1;

  /// Modifiers for string literals
  unsigned MultilineString : 1;

  /// Length of custom delimiter of "raw" string literals.
  /// Only 8 bits wide, so values above 255 cannot be represented.
  unsigned CustomDelimiterLen : 8;

  // Padding bits == 32 - 11;

  /// The length of the comment that precedes the token.
  unsigned CommentLength;

  /// Text - The actual string covered by the token in the source buffer.
  StringRef Text;

  /// Return the CommentLength characters that immediately precede Text in the
  /// buffer, passed through StringRef::trim(). Requires hasComment().
  StringRef trimComment() const {
    assert(hasComment() && "Has no comment to trim.");
    StringRef Raw(Text.begin() - CommentLength, CommentLength);
    return Raw.trim();
  }

public:
  /// Construct a token of the given kind covering \p Text, preceded by a
  /// comment of \p CommentLength characters. All flag bits start cleared and
  /// the custom delimiter length starts at zero.
  Token(tok Kind, StringRef Text, unsigned CommentLength = 0)
      : Kind(Kind), AtStartOfLine(false), EscapedIdentifier(false),
        MultilineString(false), CustomDelimiterLen(0),
        CommentLength(CommentLength), Text(Text) {}

  /// Construct a token of kind tok::NUM_TOKENS with empty text and no comment.
  Token() : Token(tok::NUM_TOKENS, {}, 0) {}

  /// Return the kind of this token.
  tok getKind() const { return Kind; }

  /// Overwrite the kind of this token; no other field is touched.
  void setKind(tok K) { Kind = K; }

  /// Forget the preceding comment by resetting its length to zero.
  void clearCommentLength() { CommentLength = 0; }

  /// is/isNot - Predicates to check if this token is a specific kind, as in
  /// "if (Tok.is(tok::l_brace)) {...}".
  bool is(tok K) const { return Kind == K; }
  bool isNot(tok K) const { return Kind != K; }

  // Predicates to check to see if the token is any of a list of tokens.

  /// Base case of the variadic isAny: a single candidate kind.
  bool isAny(tok K1) const { return is(K1); }

  /// True if the token's kind equals at least one of the listed kinds.
  template <typename... T>
  bool isAny(tok K1, tok K2, T... K) const {
    if (is(K1))
      return true;
    return isAny(K2, K...);
  }

  // Predicates to check to see if the token is not the same as any of a list.
  template <typename... T>
  bool isNot(tok K1, T... K) const {
    return !isAny(K1, K...);
  }

  /// True if the token is a spaced or unspaced binary operator.
  bool isBinaryOperator() const {
    return Kind == tok::oper_binary_spaced || Kind == tok::oper_binary_unspaced;
  }

  /// Checks whether the token is either a binary operator, or is a token that
  /// acts like a binary operator (e.g. infix '=', '?', '->').
  bool isBinaryOperatorLike() const {
    return isBinaryOperator() ||
           isAny(tok::equal, tok::arrow, tok::question_infix);
  }

  /// Checks whether the token is either a postfix operator, or is a token that
  /// acts like a postfix operator (e.g. postfix '!' and '?').
  bool isPostfixOperatorLike() const {
    return isAny(tok::oper_postfix, tok::exclaim_postfix,
                 tok::question_postfix);
  }

  /// True if the token is a binary, postfix, or prefix operator.
  bool isAnyOperator() const {
    return isBinaryOperator() || Kind == tok::oper_postfix ||
           Kind == tok::oper_prefix;
  }

  /// Negation of isAnyOperator().
  bool isNotAnyOperator() const { return !isAnyOperator(); }

  /// True if the token is an operator whose raw text is "...".
  bool isEllipsis() const { return isAnyOperator() && Text == "..."; }

  /// Negation of isEllipsis().
  bool isNotEllipsis() const { return !isEllipsis(); }

  /// True if the token is an operator whose raw text is "~".
  bool isTilde() const { return isAnyOperator() && Text == "~"; }

  /// True if the token is an operator whose raw text is "-".
  bool isMinus() const { return isAnyOperator() && Text == "-"; }

  /// Determine whether this token occurred at the start of a line.
  bool isAtStartOfLine() const { return AtStartOfLine; }

  /// Set whether this token occurred at the start of a line.
  void setAtStartOfLine(bool value) { AtStartOfLine = value; }

  /// True if this token is an escaped identifier token.
  bool isEscapedIdentifier() const { return EscapedIdentifier; }

  /// Set whether this token is an escaped identifier token.
  /// Setting the flag is only valid on tok::identifier tokens.
  void setEscapedIdentifier(bool value) {
    assert((!value || Kind == tok::identifier) &&
           "only identifiers can be escaped identifiers");
    EscapedIdentifier = value;
  }

  /// True if this is an unescaped identifier or contextual-keyword token whose
  /// raw text equals \p ContextKW.
  bool isContextualKeyword(StringRef ContextKW) const {
    return isAny(tok::identifier, tok::contextual_keyword) &&
           !isEscapedIdentifier() && Text == ContextKW;
  }

  /// Return true if this is a contextual keyword that could be the start of a
  /// decl.
  ///
  /// Only unescaped tok::identifier tokens with non-empty text qualify. The
  /// text is matched against the names supplied by the CONTEXTUAL_* entries of
  /// DeclAttr.def, plus "macro" and "using".
  bool isContextualDeclKeyword() const {
    if (isNot(tok::identifier) || isEscapedIdentifier() || Text.empty())
      return false;

    return llvm::StringSwitch<bool>(Text)
#define CONTEXTUAL_CASE(KW) .Case(#KW, true)
#define CONTEXTUAL_DECL_ATTR(KW, ...) CONTEXTUAL_CASE(KW)
#define CONTEXTUAL_DECL_ATTR_ALIAS(KW, ...) CONTEXTUAL_CASE(KW)
#define CONTEXTUAL_SIMPLE_DECL_ATTR(KW, ...) CONTEXTUAL_CASE(KW)
#include "swift/AST/DeclAttr.def"
#undef CONTEXTUAL_CASE
        .Case("macro", true)
        .Case("using", true)
        .Default(false);
  }

  /// True if the token is an operator whose raw text equals \p ContextPunc.
  bool isContextualPunctuator(StringRef ContextPunc) const {
    return isAnyOperator() && Text == ContextPunc;
  }

  /// Determine whether the token can be an argument label.
  ///
  /// This covers all identifiers (including escaped ones), '_', and every
  /// keyword except 'inout'.
  bool canBeArgumentLabel() const {
    // Identifiers, escaped identifiers, and '_' can be argument labels.
    if (is(tok::identifier) || isEscapedIdentifier() || is(tok::kw__)) {
      return true;
    }

    // inout cannot be used as an argument label.
    if (is(tok::kw_inout))
      return false;

    // All other keywords can be argument labels.
    return isKeyword();
  }

  /// True if the token is an identifier or '_'.
  bool isIdentifierOrUnderscore() const {
    return isAny(tok::identifier, tok::kw__);
  }

  /// True if the token is an l_paren token that does not start a new line.
  bool isFollowingLParen() const {
    return !isAtStartOfLine() && Kind == tok::l_paren;
  }

  /// True if the token is an l_square token that does not start a new line.
  bool isFollowingLSquare() const {
    return !isAtStartOfLine() && Kind == tok::l_square;
  }

  /// True if the token is any keyword.
  bool isKeyword() const {
    switch (Kind) {
#define KEYWORD(X) case tok::kw_##X: return true;
#include "swift/AST/TokenKinds.def"
    default: return false;
    }
  }

  /// True if the token is any literal (integer, floating-point, or string).
  bool isLiteral() const {
    return isAny(tok::integer_literal, tok::floating_literal,
                 tok::string_literal);
  }

  /// True if the token's kind is one of the PUNCTUATOR entries of
  /// TokenKinds.def.
  bool isPunctuation() const {
    switch (Kind) {
#define PUNCTUATOR(Name, Str) case tok::Name: return true;
#include "swift/AST/TokenKinds.def"
    default: return false;
    }
  }

  /// True if the token is an editor placeholder.
  bool isEditorPlaceholder() const;

  /// True if the string literal token is multiline.
  bool isMultilineString() const { return MultilineString; }

  /// Count of extending escaping '#'.
  unsigned getCustomDelimiterLen() const { return CustomDelimiterLen; }

  /// Set characteristics of string literal token.
  ///
  /// May only be called on tok::string_literal tokens. \p CustomDelimiterLen
  /// must fit the 8-bit field, i.e. be at most 255.
  void setStringLiteral(bool IsMultilineString, unsigned CustomDelimiterLen) {
    assert(Kind == tok::string_literal);
    this->MultilineString = IsMultilineString;
    this->CustomDelimiterLen = CustomDelimiterLen;
    // Reading the bit-field back detects a value that was silently truncated
    // on assignment.
    assert(this->CustomDelimiterLen == CustomDelimiterLen &&
           "custom string delimiter length > 255");
  }

  /// getLoc - Return the source location of the first character of the
  /// token's text.
  SourceLoc getLoc() const { return SourceLoc::getFromPointer(Text.begin()); }

  /// Return the number of characters in the token's raw text.
  unsigned getLength() const { return Text.size(); }

  /// Return the character range starting at getLoc() and spanning getLength()
  /// characters.
  CharSourceRange getRange() const {
    return CharSourceRange(getLoc(), getLength());
  }

  /// True if a comment of non-zero length precedes the token.
  bool hasComment() const { return CommentLength != 0; }

  /// Return the range of the trimmed comment preceding the token, or an empty
  /// range located at the token's start when there is no comment.
  CharSourceRange getCommentRange() const {
    if (!hasComment())
      return CharSourceRange(SourceLoc::getFromPointer(Text.begin()), 0);

    StringRef TrimmedComment = trimComment();
    return CharSourceRange(SourceLoc::getFromPointer(TrimmedComment.begin()),
                           TrimmedComment.size());
  }

  /// Return the location where the trimmed comment begins, or a
  /// default-constructed SourceLoc when there is no comment.
  SourceLoc getCommentStart() const {
    if (!hasComment())
      return SourceLoc();
    return SourceLoc::getFromPointer(trimComment().begin());
  }

  /// Return the token text exactly as stored, including any backticks.
  StringRef getRawText() const { return Text; }

  /// Return the token text; for an escaped identifier the surrounding
  /// backticks are removed.
  StringRef getText() const {
    if (EscapedIdentifier) {
      // Strip off the backticks on either side.
      assert(Text.front() == '`' && Text.back() == '`');
      return Text.slice(1, Text.size() - 1);
    }
    return Text;
  }

  /// Replace the token text; no other field is touched.
  void setText(StringRef T) { Text = T; }

  /// Set the token to the specified kind and source range.
  ///
  /// Also records the comment length and clears the escaped-identifier and
  /// string-literal state. AtStartOfLine is left unchanged.
  void setToken(tok K, StringRef T, unsigned CommentLength = 0) {
    Kind = K;
    Text = T;
    this->CommentLength = CommentLength;
    EscapedIdentifier = false;
    this->MultilineString = false;
    this->CustomDelimiterLen = 0;
  }
};
} // end namespace swift
namespace llvm {
// Declares the primary trait template so that the explicit specialization
// below is well-formed.
template <typename T> struct isPodLike;
// Explicit specialization reporting value == true for swift::Token.
// NOTE(review): recent LLVM releases appear to have dropped isPodLike in
// favor of trivially-copyable checks; confirm whether anything still reads
// this specialization.
template <>
struct isPodLike<swift::Token> { static const bool value = true; };
} // end namespace llvm
#endif