use std::borrow::Cow; use std::fmt; pub use LitKind::*; pub use NtExprKind::*; pub use NtPatKind::*; pub use TokenKind::*; use rustc_macros::{Decodable, Encodable, HashStable_Generic}; use rustc_span::edition::Edition; use rustc_span::{DUMMY_SP, ErrorGuaranteed, Span, kw, sym}; #[allow(clippy::useless_attribute)] // FIXME: following use of `hidden_glob_reexports` incorrectly triggers `useless_attribute` lint. #[allow(hidden_glob_reexports)] use rustc_span::{Ident, Symbol}; use crate::ast; use crate::util::case::Case; #[derive(Clone, Copy, PartialEq, Encodable, Decodable, Debug, HashStable_Generic)] pub enum CommentKind { Line, Block, } // This type must not implement `Hash` due to the unusual `PartialEq` impl below. #[derive(Copy, Clone, Debug, Encodable, Decodable, HashStable_Generic)] pub enum InvisibleOrigin { // From the expansion of a metavariable in a declarative macro. MetaVar(MetaVarKind), // Converted from `proc_macro::Delimiter` in // `proc_macro::Delimiter::to_internal`, i.e. returned by a proc macro. ProcMacro, } impl InvisibleOrigin { // Should the parser skip these invisible delimiters? Ideally this function // will eventually disappear and no invisible delimiters will be skipped. #[inline] pub fn skip(&self) -> bool { match self { InvisibleOrigin::MetaVar(_) => false, InvisibleOrigin::ProcMacro => true, } } } impl PartialEq for InvisibleOrigin { #[inline] fn eq(&self, _other: &InvisibleOrigin) -> bool { // When we had AST-based nonterminals we couldn't compare them, and the // old `Nonterminal` type had an `eq` that always returned false, // resulting in this restriction: // https://doc.rust-lang.org/nightly/reference/macros-by-example.html#forwarding-a-matched-fragment // This `eq` emulates that behaviour. We could consider lifting this // restriction now but there are still cases involving invisible // delimiters that make it harder than it first appears. 
false } } /// Annoyingly similar to `NonterminalKind`, but the slight differences are important. #[derive(Debug, Copy, Clone, PartialEq, Eq, Encodable, Decodable, Hash, HashStable_Generic)] pub enum MetaVarKind { Item, Block, Stmt, Pat(NtPatKind), Expr { kind: NtExprKind, // This field is needed for `Token::can_begin_literal_maybe_minus`. can_begin_literal_maybe_minus: bool, // This field is needed for `Token::can_begin_string_literal`. can_begin_string_literal: bool, }, Ty { is_path: bool, }, Ident, Lifetime, Literal, Meta { /// Will `AttrItem::meta` succeed on this, if reparsed? has_meta_form: bool, }, Path, Vis, TT, } impl fmt::Display for MetaVarKind { fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result { let sym = match self { MetaVarKind::Item => sym::item, MetaVarKind::Block => sym::block, MetaVarKind::Stmt => sym::stmt, MetaVarKind::Pat(PatParam { inferred: true } | PatWithOr) => sym::pat, MetaVarKind::Pat(PatParam { inferred: false }) => sym::pat_param, MetaVarKind::Expr { kind: Expr2021 { inferred: true } | Expr, .. } => sym::expr, MetaVarKind::Expr { kind: Expr2021 { inferred: false }, .. } => sym::expr_2021, MetaVarKind::Ty { .. } => sym::ty, MetaVarKind::Ident => sym::ident, MetaVarKind::Lifetime => sym::lifetime, MetaVarKind::Literal => sym::literal, MetaVarKind::Meta { .. } => sym::meta, MetaVarKind::Path => sym::path, MetaVarKind::Vis => sym::vis, MetaVarKind::TT => sym::tt, }; write!(f, "{sym}") } } /// Describes how a sequence of token trees is delimited. /// Cannot use `proc_macro::Delimiter` directly because this /// structure should implement some additional traits. #[derive(Copy, Clone, Debug, PartialEq, Encodable, Decodable, HashStable_Generic)] pub enum Delimiter { /// `( ... )` Parenthesis, /// `{ ... }` Brace, /// `[ ... ]` Bracket, /// `∅ ... ∅` /// An invisible delimiter, that may, for example, appear around tokens coming from a /// "macro variable" `$var`. 
It is important to preserve operator priorities in cases like /// `$var * 3` where `$var` is `1 + 2`. /// Invisible delimiters might not survive roundtrip of a token stream through a string. Invisible(InvisibleOrigin), } impl Delimiter { // Should the parser skip these delimiters? Only happens for certain kinds // of invisible delimiters. Ideally this function will eventually disappear // and no invisible delimiters will be skipped. #[inline] pub fn skip(&self) -> bool { match self { Delimiter::Parenthesis | Delimiter::Bracket | Delimiter::Brace => false, Delimiter::Invisible(origin) => origin.skip(), } } // This exists because `InvisibleOrigin`s should be compared. It is only used for assertions. pub fn eq_ignoring_invisible_origin(&self, other: &Delimiter) -> bool { match (self, other) { (Delimiter::Parenthesis, Delimiter::Parenthesis) => true, (Delimiter::Brace, Delimiter::Brace) => true, (Delimiter::Bracket, Delimiter::Bracket) => true, (Delimiter::Invisible(_), Delimiter::Invisible(_)) => true, _ => false, } } pub fn as_open_token_kind(&self) -> TokenKind { match *self { Delimiter::Parenthesis => OpenParen, Delimiter::Brace => OpenBrace, Delimiter::Bracket => OpenBracket, Delimiter::Invisible(origin) => OpenInvisible(origin), } } pub fn as_close_token_kind(&self) -> TokenKind { match *self { Delimiter::Parenthesis => CloseParen, Delimiter::Brace => CloseBrace, Delimiter::Bracket => CloseBracket, Delimiter::Invisible(origin) => CloseInvisible(origin), } } } // Note that the suffix is *not* considered when deciding the `LitKind` in this // type. This means that float literals like `1f32` are classified by this type // as `Int`. Only upon conversion to `ast::LitKind` will such a literal be // given the `Float` kind. #[derive(Clone, Copy, PartialEq, Encodable, Decodable, Debug, HashStable_Generic)] pub enum LitKind { Bool, // AST only, must never appear in a `Token` Byte, Char, Integer, // e.g. `1`, `1u8`, `1f32` Float, // e.g. 
`1.`, `1.0`, `1e3f32` Str, StrRaw(u8), // raw string delimited by `n` hash symbols ByteStr, ByteStrRaw(u8), // raw byte string delimited by `n` hash symbols CStr, CStrRaw(u8), Err(ErrorGuaranteed), } /// A literal token. #[derive(Clone, Copy, PartialEq, Encodable, Decodable, Debug, HashStable_Generic)] pub struct Lit { pub kind: LitKind, pub symbol: Symbol, pub suffix: Option, } impl Lit { pub fn new(kind: LitKind, symbol: Symbol, suffix: Option) -> Lit { Lit { kind, symbol, suffix } } /// Returns `true` if this is semantically a float literal. This includes /// ones like `1f32` that have an `Integer` kind but a float suffix. pub fn is_semantic_float(&self) -> bool { match self.kind { LitKind::Float => true, LitKind::Integer => match self.suffix { Some(sym) => sym == sym::f32 || sym == sym::f64, None => false, }, _ => false, } } /// Keep this in sync with `Token::can_begin_literal_maybe_minus` and /// `Parser::eat_token_lit` (excluding unary negation). pub fn from_token(token: &Token) -> Option { match token.uninterpolate().kind { Ident(name, IdentIsRaw::No) if name.is_bool_lit() => Some(Lit::new(Bool, name, None)), Literal(token_lit) => Some(token_lit), OpenInvisible(InvisibleOrigin::MetaVar( MetaVarKind::Literal | MetaVarKind::Expr { .. }, )) => { // Unreachable with the current test suite. panic!("from_token metavar"); } _ => None, } } } impl fmt::Display for Lit { fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result { let Lit { kind, symbol, suffix } = *self; match kind { Byte => write!(f, "b'{symbol}'")?, Char => write!(f, "'{symbol}'")?, Str => write!(f, "\"{symbol}\"")?, StrRaw(n) => write!( f, "r{delim}\"{string}\"{delim}", delim = "#".repeat(n as usize), string = symbol )?, ByteStr => write!(f, "b\"{symbol}\"")?, ByteStrRaw(n) => write!( f, "br{delim}\"{string}\"{delim}", delim = "#".repeat(n as usize), string = symbol )?, CStr => write!(f, "c\"{symbol}\"")?, CStrRaw(n) => { write!(f, "cr{delim}\"{symbol}\"{delim}", delim = "#".repeat(n as usize))? 
} Integer | Float | Bool | Err(_) => write!(f, "{symbol}")?, } if let Some(suffix) = suffix { write!(f, "{suffix}")?; } Ok(()) } } impl LitKind { /// An English article for the literal token kind. pub fn article(self) -> &'static str { match self { Integer | Err(_) => "an", _ => "a", } } pub fn descr(self) -> &'static str { match self { Bool => "boolean", Byte => "byte", Char => "char", Integer => "integer", Float => "float", Str | StrRaw(..) => "string", ByteStr | ByteStrRaw(..) => "byte string", CStr | CStrRaw(..) => "C string", Err(_) => "error", } } pub(crate) fn may_have_suffix(self) -> bool { matches!(self, Integer | Float | Err(_)) } } pub fn ident_can_begin_expr(name: Symbol, span: Span, is_raw: IdentIsRaw) -> bool { let ident_token = Token::new(Ident(name, is_raw), span); !ident_token.is_reserved_ident() || ident_token.is_path_segment_keyword() || [ kw::Async, kw::Do, kw::Box, kw::Break, kw::Const, kw::Continue, kw::False, kw::For, kw::Gen, kw::If, kw::Let, kw::Loop, kw::Match, kw::Move, kw::Return, kw::True, kw::Try, kw::Unsafe, kw::While, kw::Yield, kw::Safe, kw::Static, ] .contains(&name) } fn ident_can_begin_type(name: Symbol, span: Span, is_raw: IdentIsRaw) -> bool { let ident_token = Token::new(Ident(name, is_raw), span); !ident_token.is_reserved_ident() || ident_token.is_path_segment_keyword() || [kw::Underscore, kw::For, kw::Impl, kw::Fn, kw::Unsafe, kw::Extern, kw::Typeof, kw::Dyn] .contains(&name) } #[derive(PartialEq, Encodable, Decodable, Debug, Copy, Clone, HashStable_Generic)] pub enum IdentIsRaw { No, Yes, } impl From for IdentIsRaw { fn from(b: bool) -> Self { if b { Self::Yes } else { Self::No } } } impl From for bool { fn from(is_raw: IdentIsRaw) -> bool { matches!(is_raw, IdentIsRaw::Yes) } } #[derive(Clone, Copy, PartialEq, Encodable, Decodable, Debug, HashStable_Generic)] pub enum TokenKind { /* Expression-operator symbols. 
*/ /// `=` Eq, /// `<` Lt, /// `<=` Le, /// `==` EqEq, /// `!=` Ne, /// `>=` Ge, /// `>` Gt, /// `&&` AndAnd, /// `||` OrOr, /// `!` Bang, /// `~` Tilde, // `+` Plus, // `-` Minus, // `*` Star, // `/` Slash, // `%` Percent, // `^` Caret, // `&` And, // `|` Or, // `<<` Shl, // `>>` Shr, // `+=` PlusEq, // `-=` MinusEq, // `*=` StarEq, // `/=` SlashEq, // `%=` PercentEq, // `^=` CaretEq, // `&=` AndEq, // `|=` OrEq, // `<<=` ShlEq, // `>>=` ShrEq, /* Structural symbols */ /// `@` At, /// `.` Dot, /// `..` DotDot, /// `...` DotDotDot, /// `..=` DotDotEq, /// `,` Comma, /// `;` Semi, /// `:` Colon, /// `::` PathSep, /// `->` RArrow, /// `<-` LArrow, /// `=>` FatArrow, /// `#` Pound, /// `$` Dollar, /// `?` Question, /// Used by proc macros for representing lifetimes, not generated by lexer right now. SingleQuote, /// `(` OpenParen, /// `)` CloseParen, /// `{` OpenBrace, /// `}` CloseBrace, /// `[` OpenBracket, /// `]` CloseBracket, /// Invisible opening delimiter, produced by a macro. OpenInvisible(InvisibleOrigin), /// Invisible closing delimiter, produced by a macro. CloseInvisible(InvisibleOrigin), /* Literals */ Literal(Lit), /// Identifier token. /// Do not forget about `NtIdent` when you want to match on identifiers. /// It's recommended to use `Token::{ident,uninterpolate}` and /// `Parser::token_uninterpolated_span` to treat regular and interpolated /// identifiers in the same way. Ident(Symbol, IdentIsRaw), /// This identifier (and its span) is the identifier passed to the /// declarative macro. The span in the surrounding `Token` is the span of /// the `ident` metavariable in the macro's RHS. NtIdent(Ident, IdentIsRaw), /// Lifetime identifier token. /// Do not forget about `NtLifetime` when you want to match on lifetime identifiers. /// It's recommended to use `Token::{ident,uninterpolate}` and /// `Parser::token_uninterpolated_span` to treat regular and interpolated /// identifiers in the same way. 
Lifetime(Symbol, IdentIsRaw), /// This identifier (and its span) is the lifetime passed to the /// declarative macro. The span in the surrounding `Token` is the span of /// the `lifetime` metavariable in the macro's RHS. NtLifetime(Ident, IdentIsRaw), /// A doc comment token. /// `Symbol` is the doc comment's data excluding its "quotes" (`///`, `/**`, etc) /// similarly to symbols in string literal tokens. DocComment(CommentKind, ast::AttrStyle, Symbol), /// End Of File Eof, } #[derive(Clone, Copy, PartialEq, Encodable, Decodable, Debug, HashStable_Generic)] pub struct Token { pub kind: TokenKind, pub span: Span, } impl TokenKind { pub fn lit(kind: LitKind, symbol: Symbol, suffix: Option) -> TokenKind { Literal(Lit::new(kind, symbol, suffix)) } /// An approximation to proc-macro-style single-character operators used by /// rustc parser. If the operator token can be broken into two tokens, the /// first of which has `n` (1 or 2) chars, then this function performs that /// operation, otherwise it returns `None`. 
pub fn break_two_token_op(&self, n: u32) -> Option<(TokenKind, TokenKind)> { assert!(n == 1 || n == 2); Some(match (self, n) { (Le, 1) => (Lt, Eq), (EqEq, 1) => (Eq, Eq), (Ne, 1) => (Bang, Eq), (Ge, 1) => (Gt, Eq), (AndAnd, 1) => (And, And), (OrOr, 1) => (Or, Or), (Shl, 1) => (Lt, Lt), (Shr, 1) => (Gt, Gt), (PlusEq, 1) => (Plus, Eq), (MinusEq, 1) => (Minus, Eq), (StarEq, 1) => (Star, Eq), (SlashEq, 1) => (Slash, Eq), (PercentEq, 1) => (Percent, Eq), (CaretEq, 1) => (Caret, Eq), (AndEq, 1) => (And, Eq), (OrEq, 1) => (Or, Eq), (ShlEq, 1) => (Lt, Le), // `<` + `<=` (ShlEq, 2) => (Shl, Eq), // `<<` + `=` (ShrEq, 1) => (Gt, Ge), // `>` + `>=` (ShrEq, 2) => (Shr, Eq), // `>>` + `=` (DotDot, 1) => (Dot, Dot), (DotDotDot, 1) => (Dot, DotDot), // `.` + `..` (DotDotDot, 2) => (DotDot, Dot), // `..` + `.` (DotDotEq, 2) => (DotDot, Eq), (PathSep, 1) => (Colon, Colon), (RArrow, 1) => (Minus, Gt), (LArrow, 1) => (Lt, Minus), (FatArrow, 1) => (Eq, Gt), _ => return None, }) } /// Returns tokens that are likely to be typed accidentally instead of the current token. /// Enables better error recovery when the wrong token is found. 
pub fn similar_tokens(&self) -> &[TokenKind] {
        match self {
            Comma => &[Dot, Lt, Semi],
            Semi => &[Colon, Comma],
            Colon => &[Semi],
            FatArrow => &[Eq, RArrow, Ge, Gt],
            _ => &[],
        }
    }

    /// Returns `true` for the tokens `>`, `>=`, `>>` and `>>=`.
    pub fn should_end_const_arg(&self) -> bool {
        matches!(self, Gt | Ge | Shr | ShrEq)
    }

    /// Returns `true` if this is an opening or closing delimiter of any kind,
    /// including invisible ones.
    pub fn is_delim(&self) -> bool {
        self.open_delim().is_some() || self.close_delim().is_some()
    }

    /// Returns the delimiter this token opens, or `None` if it is not an
    /// opening delimiter.
    pub fn open_delim(&self) -> Option<Delimiter> {
        match *self {
            OpenParen => Some(Delimiter::Parenthesis),
            OpenBrace => Some(Delimiter::Brace),
            OpenBracket => Some(Delimiter::Bracket),
            OpenInvisible(origin) => Some(Delimiter::Invisible(origin)),
            _ => None,
        }
    }

    /// Returns the delimiter this token closes, or `None` if it is not a
    /// closing delimiter.
    pub fn close_delim(&self) -> Option<Delimiter> {
        match *self {
            CloseParen => Some(Delimiter::Parenthesis),
            CloseBrace => Some(Delimiter::Brace),
            CloseBracket => Some(Delimiter::Bracket),
            CloseInvisible(origin) => Some(Delimiter::Invisible(origin)),
            _ => None,
        }
    }

    /// Returns `true` if this is a closing delimiter (visible or invisible)
    /// or `Eof`.
    pub fn is_close_delim_or_eof(&self) -> bool {
        matches!(self, CloseParen | CloseBrace | CloseBracket | CloseInvisible(_) | Eof)
    }
}

impl Token {
    /// Creates a token from its kind and span.
    pub fn new(kind: TokenKind, span: Span) -> Self {
        Token { kind, span }
    }

    /// Some token that will be thrown away later.
    pub fn dummy() -> Self {
        Token::new(TokenKind::Question, DUMMY_SP)
    }

    /// Recovers a `Token` from an `Ident`. This creates a raw identifier if necessary.
pub fn from_ast_ident(ident: Ident) -> Self { Token::new(Ident(ident.name, ident.is_raw_guess().into()), ident.span) } pub fn is_range_separator(&self) -> bool { [DotDot, DotDotDot, DotDotEq].contains(&self.kind) } pub fn is_punct(&self) -> bool { match self.kind { Eq | Lt | Le | EqEq | Ne | Ge | Gt | AndAnd | OrOr | Bang | Tilde | Plus | Minus | Star | Slash | Percent | Caret | And | Or | Shl | Shr | PlusEq | MinusEq | StarEq | SlashEq | PercentEq | CaretEq | AndEq | OrEq | ShlEq | ShrEq | At | Dot | DotDot | DotDotDot | DotDotEq | Comma | Semi | Colon | PathSep | RArrow | LArrow | FatArrow | Pound | Dollar | Question | SingleQuote => true, OpenParen | CloseParen | OpenBrace | CloseBrace | OpenBracket | CloseBracket | OpenInvisible(_) | CloseInvisible(_) | Literal(..) | DocComment(..) | Ident(..) | NtIdent(..) | Lifetime(..) | NtLifetime(..) | Eof => false, } } pub fn is_like_plus(&self) -> bool { matches!(self.kind, Plus | PlusEq) } /// Returns `true` if the token can appear at the start of an expression. /// /// **NB**: Take care when modifying this function, since it will change /// the stable set of tokens that are allowed to match an expr nonterminal. pub fn can_begin_expr(&self) -> bool { match self.uninterpolate().kind { Ident(name, is_raw) => ident_can_begin_expr(name, self.span, is_raw), // value name or keyword OpenParen | // tuple OpenBrace | // block OpenBracket | // array Literal(..) | // literal Bang | // operator not Minus | // unary minus Star | // dereference Or | OrOr | // closure And | // reference AndAnd | // double reference // DotDotDot is no longer supported, but we need some way to display the error DotDot | DotDotDot | DotDotEq | // range notation Lt | Shl | // associated path PathSep | // global path Lifetime(..) | // labeled loop Pound => true, // expression attributes OpenInvisible(InvisibleOrigin::MetaVar( MetaVarKind::Block | MetaVarKind::Expr { .. 
} | MetaVarKind::Literal | MetaVarKind::Path )) => true, _ => false, } } /// Returns `true` if the token can appear at the start of a pattern. /// /// Shamelessly borrowed from `can_begin_expr`, only used for diagnostics right now. pub fn can_begin_pattern(&self, pat_kind: NtPatKind) -> bool { match &self.uninterpolate().kind { // box, ref, mut, and other identifiers (can stricten) Ident(..) | NtIdent(..) | OpenParen | // tuple pattern OpenBracket | // slice pattern And | // reference Minus | // negative literal AndAnd | // double reference Literal(_) | // literal DotDot | // range pattern (future compat) DotDotDot | // range pattern (future compat) PathSep | // path Lt | // path (UFCS constant) Shl => true, // path (double UFCS) Or => matches!(pat_kind, PatWithOr), // leading vert `|` or-pattern OpenInvisible(InvisibleOrigin::MetaVar( MetaVarKind::Expr { .. } | MetaVarKind::Literal | MetaVarKind::Meta { .. } | MetaVarKind::Pat(_) | MetaVarKind::Path | MetaVarKind::Ty { .. } )) => true, _ => false, } } /// Returns `true` if the token can appear at the start of a type. pub fn can_begin_type(&self) -> bool { match self.uninterpolate().kind { Ident(name, is_raw) => ident_can_begin_type(name, self.span, is_raw), // type name or keyword OpenParen | // tuple OpenBracket | // array Bang | // never Star | // raw pointer And | // reference AndAnd | // double reference Question | // maybe bound in trait object Lifetime(..) | // lifetime bound in trait object Lt | Shl | // associated path PathSep => true, // global path OpenInvisible(InvisibleOrigin::MetaVar( MetaVarKind::Ty { .. } | MetaVarKind::Path )) => true, // For anonymous structs or unions, which only appear in specific positions // (type of struct fields or union fields), we don't consider them as regular types _ => false, } } /// Returns `true` if the token can appear at the start of a const param. pub fn can_begin_const_arg(&self) -> bool { match self.kind { OpenBrace | Literal(..) 
| Minus => true, Ident(name, IdentIsRaw::No) if name.is_bool_lit() => true, OpenInvisible(InvisibleOrigin::MetaVar( MetaVarKind::Expr { .. } | MetaVarKind::Block | MetaVarKind::Literal, )) => true, _ => false, } } /// Returns `true` if the token can appear at the start of an item. pub fn can_begin_item(&self) -> bool { match self.kind { Ident(name, _) => [ kw::Fn, kw::Use, kw::Struct, kw::Enum, kw::Pub, kw::Trait, kw::Extern, kw::Impl, kw::Unsafe, kw::Const, kw::Safe, kw::Static, kw::Union, kw::Macro, kw::Mod, kw::Type, ] .contains(&name), _ => false, } } /// Returns `true` if the token is any literal. pub fn is_lit(&self) -> bool { matches!(self.kind, Literal(..)) } /// Returns `true` if the token is any literal, a minus (which can prefix a literal, /// for example a '-42', or one of the boolean idents). /// /// In other words, would this token be a valid start of `parse_literal_maybe_minus`? /// /// Keep this in sync with `Lit::from_token` and `Parser::eat_token_lit` /// (excluding unary negation). pub fn can_begin_literal_maybe_minus(&self) -> bool { match self.uninterpolate().kind { Literal(..) | Minus => true, Ident(name, IdentIsRaw::No) if name.is_bool_lit() => true, OpenInvisible(InvisibleOrigin::MetaVar(mv_kind)) => match mv_kind { MetaVarKind::Literal => true, MetaVarKind::Expr { can_begin_literal_maybe_minus, .. } => { can_begin_literal_maybe_minus } _ => false, }, _ => false, } } pub fn can_begin_string_literal(&self) -> bool { match self.uninterpolate().kind { Literal(..) => true, OpenInvisible(InvisibleOrigin::MetaVar(mv_kind)) => match mv_kind { MetaVarKind::Literal => true, MetaVarKind::Expr { can_begin_string_literal, .. } => can_begin_string_literal, _ => false, }, _ => false, } } /// A convenience function for matching on identifiers during parsing. /// Turns interpolated identifier (`$i: ident`) or lifetime (`$l: lifetime`) token /// into the regular identifier or lifetime token it refers to, /// otherwise returns the original token. 
pub fn uninterpolate(&self) -> Cow<'_, Token> {
        // Interpolated tokens are rebuilt from the carried identifier (name
        // and span); everything else is handed back by reference.
        let (kind, span) = match self.kind {
            NtIdent(ident, is_raw) => (Ident(ident.name, is_raw), ident.span),
            NtLifetime(ident, is_raw) => (Lifetime(ident.name, is_raw), ident.span),
            _ => return Cow::Borrowed(self),
        };
        Cow::Owned(Token::new(kind, span))
    }

    /// Returns an identifier if this token is an identifier.
    #[inline]
    pub fn ident(&self) -> Option<(Ident, IdentIsRaw)> {
        // We avoid using `Token::uninterpolate` here because it's slow.
        let found = match self.kind {
            // A plain identifier takes its span from the token itself.
            Ident(name, is_raw) => (Ident::new(name, self.span), is_raw),
            // An interpolated identifier already carries its own span.
            NtIdent(ident, is_raw) => (ident, is_raw),
            _ => return None,
        };
        Some(found)
    }

    /// Returns a lifetime identifier if this token is a lifetime.
    #[inline]
    pub fn lifetime(&self) -> Option<(Ident, IdentIsRaw)> {
        // We avoid using `Token::uninterpolate` here because it's slow.
        let found = match self.kind {
            Lifetime(name, is_raw) => (Ident::new(name, self.span), is_raw),
            NtLifetime(ident, is_raw) => (ident, is_raw),
            _ => return None,
        };
        Some(found)
    }

    /// Returns `true` if the token is an identifier.
    pub fn is_ident(&self) -> bool {
        matches!(self.kind, Ident(..) | NtIdent(..))
    }

    /// Returns `true` if the token is a lifetime.
    pub fn is_lifetime(&self) -> bool {
        matches!(self.kind, Lifetime(..) | NtLifetime(..))
    }

    /// Returns `true` if the token is an identifier whose name is the given
    /// string slice.
    pub fn is_ident_named(&self, name: Symbol) -> bool {
        match self.ident() {
            Some((ident, _)) => ident.name == name,
            None => false,
        }
    }

    /// Is this a pre-parsed expression dropped into the token stream
    /// (which happens while parsing the result of macro expansion)?
    pub fn is_metavar_expr(&self) -> bool {
        match self.is_metavar_seq() {
            Some(
                MetaVarKind::Expr { .. }
                | MetaVarKind::Literal
                | MetaVarKind::Path
                | MetaVarKind::Block,
            ) => true,
            _ => false,
        }
    }

    /// Are we at a block from a metavar (`$b:block`)?
    pub fn is_metavar_block(&self) -> bool {
        matches!(self.kind, OpenInvisible(InvisibleOrigin::MetaVar(MetaVarKind::Block)))
    }

    /// Returns `true` if the token is either the `mut` or `const` keyword.
pub fn is_mutability(&self) -> bool {
        self.is_non_raw_ident_where(|id| id.name == kw::Mut || id.name == kw::Const)
    }

    /// Returns `true` if the token is `<` or `<<`.
    pub fn is_qpath_start(&self) -> bool {
        matches!(self.kind, Lt | Shl)
    }

    /// Returns `true` if the token is `::`, a qualified-path start, the start
    /// of a `path` metavariable sequence, a path-segment keyword, or a
    /// non-reserved identifier.
    pub fn is_path_start(&self) -> bool {
        if self.kind == PathSep || self.is_qpath_start() {
            return true;
        }
        if let Some(MetaVarKind::Path) = self.is_metavar_seq() {
            return true;
        }
        self.is_path_segment_keyword() || self.is_non_reserved_ident()
    }

    /// Returns `true` if the token is a given keyword, `kw`.
    pub fn is_keyword(&self, kw: Symbol) -> bool {
        self.is_non_raw_ident_where(|ident| kw == ident.name)
    }

    /// Returns `true` if the token is a given keyword, `kw` or if `case` is `Insensitive` and this
    /// token is an identifier equal to `kw` ignoring the case.
    pub fn is_keyword_case(&self, kw: Symbol, case: Case) -> bool {
        if self.is_keyword(kw) {
            return true;
        }
        case == Case::Insensitive
            && self.is_non_raw_ident_where(|ident| {
                // Do an ASCII case-insensitive match, because all keywords are ASCII.
                ident.name.as_str().eq_ignore_ascii_case(kw.as_str())
            })
    }

    /// Returns `true` if the token is a non-raw identifier that is a
    /// path-segment keyword.
    pub fn is_path_segment_keyword(&self) -> bool {
        self.is_non_raw_ident_where(|ident| ident.is_path_segment_keyword())
    }

    /// Returns true for reserved identifiers used internally for elided lifetimes,
    /// unnamed method parameters, crate root module, error recovery etc.
    pub fn is_special_ident(&self) -> bool {
        self.is_non_raw_ident_where(|ident| ident.is_special())
    }

    /// Returns `true` if the token is a keyword used in the language.
    pub fn is_used_keyword(&self) -> bool {
        self.is_non_raw_ident_where(|ident| ident.is_used_keyword())
    }

    /// Returns `true` if the token is a keyword reserved for possible future use.
    pub fn is_unused_keyword(&self) -> bool {
        self.is_non_raw_ident_where(|ident| ident.is_unused_keyword())
    }

    /// Returns `true` if the token is either a special identifier or a keyword.
pub fn is_reserved_ident(&self) -> bool {
        self.is_non_raw_ident_where(|ident| ident.is_reserved())
    }

    /// Returns `true` if the token is an identifier that is either raw or not
    /// reserved.
    pub fn is_non_reserved_ident(&self) -> bool {
        match self.ident() {
            // A raw identifier is accepted without consulting the reserved check.
            Some((_, IdentIsRaw::Yes)) => true,
            Some((ident, IdentIsRaw::No)) => !ident.is_reserved(),
            None => false,
        }
    }

    /// Returns `true` if the token is the identifier `true` or `false`.
    pub fn is_bool_lit(&self) -> bool {
        self.is_non_raw_ident_where(|ident| ident.name.is_bool_lit())
    }

    /// Returns `true` if the token is a literal of kind `Integer` or `Float`.
    pub fn is_numeric_lit(&self) -> bool {
        matches!(self.kind, Literal(Lit { kind: LitKind::Integer | LitKind::Float, .. }))
    }

    /// Returns `true` if the token is the integer literal.
    pub fn is_integer_lit(&self) -> bool {
        match self.kind {
            Literal(Lit { kind: LitKind::Integer, .. }) => true,
            _ => false,
        }
    }

    /// Returns `true` if the token is a non-raw identifier for which `pred` holds.
    pub fn is_non_raw_ident_where(&self, pred: impl FnOnce(Ident) -> bool) -> bool {
        // Raw identifiers and non-identifier tokens never reach `pred`.
        let Some((ident, IdentIsRaw::No)) = self.ident() else {
            return false;
        };
        pred(ident)
    }

    /// Is this an invisible open delimiter at the start of a token sequence
    /// from an expanded metavar?
pub fn is_metavar_seq(&self) -> Option<MetaVarKind> {
        match self.kind {
            OpenInvisible(InvisibleOrigin::MetaVar(kind)) => Some(kind),
            _ => None,
        }
    }

    /// Tries to combine `self` and the token `joint` into a single
    /// multi-character token (e.g. `<` and `=` into `<=`).
    ///
    /// Returns `None` if the pair does not form a token. On success the new
    /// token's span is `self.span.to(joint.span)`.
    pub fn glue(&self, joint: &Token) -> Option<Token> {
        // Every left-hand kind is listed explicitly (no top-level `_` arm) so
        // that adding a `TokenKind` forces a decision here.
        let kind = match (&self.kind, &joint.kind) {
            (Eq, Eq) => EqEq,
            (Eq, Gt) => FatArrow,
            (Eq, _) => return None,

            (Lt, Eq) => Le,
            (Lt, Lt) => Shl,
            (Lt, Le) => ShlEq,
            (Lt, Minus) => LArrow,
            (Lt, _) => return None,

            (Gt, Eq) => Ge,
            (Gt, Gt) => Shr,
            (Gt, Ge) => ShrEq,
            (Gt, _) => return None,

            (Bang, Eq) => Ne,
            (Bang, _) => return None,

            (Plus, Eq) => PlusEq,
            (Plus, _) => return None,

            (Minus, Eq) => MinusEq,
            (Minus, Gt) => RArrow,
            (Minus, _) => return None,

            (Star, Eq) => StarEq,
            (Star, _) => return None,

            (Slash, Eq) => SlashEq,
            (Slash, _) => return None,

            (Percent, Eq) => PercentEq,
            (Percent, _) => return None,

            (Caret, Eq) => CaretEq,
            (Caret, _) => return None,

            (And, Eq) => AndEq,
            (And, And) => AndAnd,
            (And, _) => return None,

            (Or, Eq) => OrEq,
            (Or, Or) => OrOr,
            (Or, _) => return None,

            (Shl, Eq) => ShlEq,
            (Shl, _) => return None,

            (Shr, Eq) => ShrEq,
            (Shr, _) => return None,

            (Dot, Dot) => DotDot,
            (Dot, DotDot) => DotDotDot,
            (Dot, _) => return None,

            (DotDot, Dot) => DotDotDot,
            (DotDot, Eq) => DotDotEq,
            (DotDot, _) => return None,

            (Colon, Colon) => PathSep,
            (Colon, _) => return None,

            // `'` followed by an identifier becomes a lifetime named `'ident`.
            (SingleQuote, Ident(name, is_raw)) => {
                Lifetime(Symbol::intern(&format!("'{name}")), *is_raw)
            }
            (SingleQuote, _) => return None,

            (
                Le | EqEq | Ne | Ge | AndAnd | OrOr | Tilde | PlusEq | MinusEq | StarEq | SlashEq
                | PercentEq | CaretEq | AndEq | OrEq | ShlEq | ShrEq | At | DotDotDot | DotDotEq
                | Comma | Semi | PathSep | RArrow | LArrow | FatArrow | Pound | Dollar | Question
                | OpenParen | CloseParen | OpenBrace | CloseBrace | OpenBracket | CloseBracket
                | OpenInvisible(_) | CloseInvisible(_) | Literal(..) | Ident(..) | NtIdent(..)
                | Lifetime(..) | NtLifetime(..) | DocComment(..) | Eof,
                _,
            ) => {
                return None;
            }
        };

        Some(Token::new(kind, self.span.to(joint.span)))
    }
}

impl PartialEq<TokenKind> for Token {
    /// Compares only the token's kind against `rhs`; the span is ignored.
    #[inline]
    fn eq(&self, rhs: &TokenKind) -> bool {
        self.kind == *rhs
    }
}

#[derive(Debug, Copy, Clone, PartialEq, Eq, Encodable, Decodable, Hash, HashStable_Generic)]
pub enum NtPatKind {
    // Matches or-patterns. Was written using `pat` in edition 2021 or later.
    PatWithOr,
    // Doesn't match or-patterns.
    // - `inferred`: was written using `pat` in edition 2015 or 2018.
    // - `!inferred`: was written using `pat_param`.
    PatParam { inferred: bool },
}

#[derive(Debug, Copy, Clone, PartialEq, Eq, Encodable, Decodable, Hash, HashStable_Generic)]
pub enum NtExprKind {
    // Matches expressions using the post-edition 2024 rules. Was written using
    // `expr` in edition 2024 or later.
    Expr,
    // Matches expressions using the pre-edition 2024 rules.
    // - `inferred`: was written using `expr` in edition 2021 or earlier.
    // - `!inferred`: was written using `expr_2021`.
    Expr2021 { inferred: bool },
}

/// A macro nonterminal, known in documentation as a fragment specifier.
#[derive(Debug, Copy, Clone, PartialEq, Eq, Encodable, Decodable, Hash, HashStable_Generic)]
pub enum NonterminalKind {
    Item,
    Block,
    Stmt,
    Pat(NtPatKind),
    Expr(NtExprKind),
    Ty,
    Ident,
    Lifetime,
    Literal,
    Meta,
    Path,
    Vis,
    TT,
}

impl NonterminalKind {
    /// The `edition` closure is used to get the edition for the given symbol. Doing
    /// `span.edition()` is expensive, so we do it lazily.
pub fn from_symbol(
        symbol: Symbol,
        edition: impl FnOnce() -> Edition,
    ) -> Option<NonterminalKind> {
        Some(match symbol {
            sym::item => NonterminalKind::Item,
            sym::block => NonterminalKind::Block,
            sym::stmt => NonterminalKind::Stmt,
            // `pat` means "with or-patterns" only from edition 2021 onwards.
            sym::pat => {
                if edition().at_least_rust_2021() {
                    NonterminalKind::Pat(PatWithOr)
                } else {
                    NonterminalKind::Pat(PatParam { inferred: true })
                }
            }
            sym::pat_param => NonterminalKind::Pat(PatParam { inferred: false }),
            // `expr` uses the newer rules only from edition 2024 onwards.
            sym::expr => {
                if edition().at_least_rust_2024() {
                    NonterminalKind::Expr(Expr)
                } else {
                    NonterminalKind::Expr(Expr2021 { inferred: true })
                }
            }
            sym::expr_2021 => NonterminalKind::Expr(Expr2021 { inferred: false }),
            sym::ty => NonterminalKind::Ty,
            sym::ident => NonterminalKind::Ident,
            sym::lifetime => NonterminalKind::Lifetime,
            sym::literal => NonterminalKind::Literal,
            sym::meta => NonterminalKind::Meta,
            sym::path => NonterminalKind::Path,
            sym::vis => NonterminalKind::Vis,
            sym::tt => NonterminalKind::TT,
            // Not a known fragment specifier.
            _ => return None,
        })
    }

    /// Returns the fragment-specifier symbol this kind was written as; the
    /// `inferred` variants map back to the plain `pat` / `expr` spelling.
    fn symbol(self) -> Symbol {
        match self {
            NonterminalKind::Item => sym::item,
            NonterminalKind::Block => sym::block,
            NonterminalKind::Stmt => sym::stmt,
            NonterminalKind::Pat(PatParam { inferred: true } | PatWithOr) => sym::pat,
            NonterminalKind::Pat(PatParam { inferred: false }) => sym::pat_param,
            NonterminalKind::Expr(Expr2021 { inferred: true } | Expr) => sym::expr,
            NonterminalKind::Expr(Expr2021 { inferred: false }) => sym::expr_2021,
            NonterminalKind::Ty => sym::ty,
            NonterminalKind::Ident => sym::ident,
            NonterminalKind::Lifetime => sym::lifetime,
            NonterminalKind::Literal => sym::literal,
            NonterminalKind::Meta => sym::meta,
            NonterminalKind::Path => sym::path,
            NonterminalKind::Vis => sym::vis,
            NonterminalKind::TT => sym::tt,
        }
    }
}

impl fmt::Display for NonterminalKind {
    /// Writes the fragment-specifier symbol returned by `symbol`.
    fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
        write!(f, "{}", self.symbol())
    }
}

// Some types are used a lot. Make sure they don't unintentionally get bigger.
#[cfg(target_pointer_width = "64")] mod size_asserts { use rustc_data_structures::static_assert_size; use super::*; // tidy-alphabetical-start static_assert_size!(Lit, 12); static_assert_size!(LitKind, 2); static_assert_size!(Token, 24); static_assert_size!(TokenKind, 16); // tidy-alphabetical-end }