Move functions to librustc_parse

2020-05-20 00:00:33 -04:00 · 2020-05-20 00:00:33 -04:00 · 7a4c1865fb
commit 7a4c1865fb
parent a9ca1ec928
3 changed files with 123 additions and 179 deletions
--- a/src/librustc_ast/token.rs
+++ b/src/librustc_ast/token.rs
@ -673,62 +673,6 @@ impl Token {
        Some(Token::new(kind, self.span.to(joint.span)))
    }
    // See comments in `Nonterminal::to_tokenstream` for why we care about
    // *probably* equal here rather than actual equality
    crate fn probably_equal_for_proc_macro(&self, other: &Token) -> bool {
        if mem::discriminant(&self.kind) != mem::discriminant(&other.kind) {
            return false;
        }
        match (&self.kind, &other.kind) {
            (&Eq, &Eq)
            | (&Lt, &Lt)
            | (&Le, &Le)
            | (&EqEq, &EqEq)
            | (&Ne, &Ne)
            | (&Ge, &Ge)
            | (&Gt, &Gt)
            | (&AndAnd, &AndAnd)
            | (&OrOr, &OrOr)
            | (&Not, &Not)
            | (&Tilde, &Tilde)
            | (&At, &At)
            | (&Dot, &Dot)
            | (&DotDot, &DotDot)
            | (&DotDotDot, &DotDotDot)
            | (&DotDotEq, &DotDotEq)
            | (&Comma, &Comma)
            | (&Semi, &Semi)
            | (&Colon, &Colon)
            | (&ModSep, &ModSep)
            | (&RArrow, &RArrow)
            | (&LArrow, &LArrow)
            | (&FatArrow, &FatArrow)
            | (&Pound, &Pound)
            | (&Dollar, &Dollar)
            | (&Question, &Question)
            | (&Whitespace, &Whitespace)
            | (&Comment, &Comment)
            | (&Eof, &Eof) => true,
            (&BinOp(a), &BinOp(b)) | (&BinOpEq(a), &BinOpEq(b)) => a == b,
            (&OpenDelim(a), &OpenDelim(b)) | (&CloseDelim(a), &CloseDelim(b)) => a == b,
            (&DocComment(a), &DocComment(b)) | (&Shebang(a), &Shebang(b)) => a == b,
            (&Literal(a), &Literal(b)) => a == b,
            (&Lifetime(a), &Lifetime(b)) => a == b,
            (&Ident(a, b), &Ident(c, d)) => {
                b == d && (a == c || a == kw::DollarCrate || c == kw::DollarCrate)
            }
            (&Interpolated(_), &Interpolated(_)) => false,
            _ => panic!("forgot to add a token?"),
        }
    }
 }
 impl PartialEq<TokenKind> for Token {
--- a/src/librustc_ast/tokenstream.rs
+++ b/src/librustc_ast/tokenstream.rs
@ -68,23 +68,6 @@ impl TokenTree {
        }
    }
    // See comments in `Nonterminal::to_tokenstream` for why we care about
    // *probably* equal here rather than actual equality
    //
    // This is otherwise the same as `eq_unspanned`, only recursing with a
    // different method.
    pub fn probably_equal_for_proc_macro(&self, other: &TokenTree) -> bool {
        match (self, other) {
            (TokenTree::Token(token), TokenTree::Token(token2)) => {
                token.probably_equal_for_proc_macro(token2)
            }
            (TokenTree::Delimited(_, delim, tts), TokenTree::Delimited(_, delim2, tts2)) => {
                delim == delim2 && tts.probably_equal_for_proc_macro(&tts2)
            }
            _ => false,
        }
    }
    /// Retrieves the TokenTree's span.
    pub fn span(&self) -> Span {
        match self {
@ -307,111 +290,7 @@ impl TokenStream {
        t1.next().is_none() && t2.next().is_none()
    }
    // See comments in `Nonterminal::to_tokenstream` for why we care about
    // *probably* equal here rather than actual equality
    //
    // This is otherwise the same as `eq_unspanned`, only recursing with a
    // different method.
    pub fn probably_equal_for_proc_macro(&self, other: &TokenStream) -> bool {
        // When checking for `probably_eq`, we ignore certain tokens that aren't
        // preserved in the AST. Because they are not preserved, the pretty
        // printer arbitrarily adds or removes them when printing as token
        // streams, making a comparison between a token stream generated from an
        // AST and a token stream which was parsed into an AST more reliable.
        fn semantic_tree(tree: &TokenTree) -> bool {
            if let TokenTree::Token(token) = tree {
                if let
                    // The pretty printer tends to add trailing commas to
                    // everything, and in particular, after struct fields.
                    | token::Comma
                    // The pretty printer emits `NoDelim` as whitespace.
                    | token::OpenDelim(DelimToken::NoDelim)
                    | token::CloseDelim(DelimToken::NoDelim)
                    // The pretty printer collapses many semicolons into one.
                    | token::Semi
                    // The pretty printer collapses whitespace arbitrarily and can
                    // introduce whitespace from `NoDelim`.
                    | token::Whitespace
                    // The pretty printer can turn `$crate` into `::crate_name`
                    | token::ModSep = token.kind {
                    return false;
                }
            }
            true
        }
        // When comparing two `TokenStream`s, we ignore the `IsJoint` information.
        //
        // However, `rustc_parse::lexer::tokentrees::TokenStreamBuilder` will
        // use `Token.glue` on adjacent tokens with the proper `IsJoint`.
        // Since we are ignoreing `IsJoint`, a 'glued' token (e.g. `BinOp(Shr)`)
        // and its 'split'/'unglued' compoenents (e.g. `Gt, Gt`) are equivalent
        // when determining if two `TokenStream`s are 'probably equal'.
        //
        // Therefore, we use `break_two_token_op` to convert all tokens
        // to the 'unglued' form (if it exists). This ensures that two
        // `TokenStream`s which differ only in how their tokens are glued
        // will be considered 'probably equal', which allows us to keep spans.
        //
        // This is important when the original `TokenStream` contained
        // extra spaces (e.g. `f :: < Vec < _ > > ( ) ;'). These extra spaces
        // will be omitted when we pretty-print, which can cause the original
        // and reparsed `TokenStream`s to differ in the assignment of `IsJoint`,
        // leading to some tokens being 'glued' together in one stream but not
        // the other. See #68489 for more details.
        fn break_tokens(tree: TokenTree) -> impl Iterator<Item = TokenTree> {
            // In almost all cases, we should have either zero or one levels
            // of 'unglueing'. However, in some unusual cases, we may need
            // to iterate breaking tokens mutliple times. For example:
            // '[BinOpEq(Shr)] => [Gt, Ge] -> [Gt, Gt, Eq]'
            let mut token_trees: SmallVec<[_; 2]>;
            if let TokenTree::Token(token) = &tree {
                let mut out = SmallVec::<[_; 2]>::new();
                out.push(token.clone());
                // Iterate to fixpoint:
                // * We start off with 'out' containing our initial token, and `temp` empty
                // * If we are able to break any tokens in `out`, then `out` will have
                //   at least one more element than 'temp', so we will try to break tokens
                //   again.
                // * If we cannot break any tokens in 'out', we are done
                loop {
                    let mut temp = SmallVec::<[_; 2]>::new();
                    let mut changed = false;
                    for token in out.into_iter() {
                        if let Some((first, second)) = token.kind.break_two_token_op() {
                            temp.push(Token::new(first, DUMMY_SP));
                            temp.push(Token::new(second, DUMMY_SP));
                            changed = true;
                        } else {
                            temp.push(token);
                        }
                    }
                    out = temp;
                    if !changed {
                        break;
                    }
                }
                token_trees = out.into_iter().map(|t| TokenTree::Token(t)).collect();
                if token_trees.len() != 1 {
                    debug!("break_tokens: broke {:?} to {:?}", tree, token_trees);
                }
            } else {
                token_trees = SmallVec::new();
                token_trees.push(tree);
            }
            token_trees.into_iter()
        }
        let mut t1 = self.trees().filter(semantic_tree).flat_map(break_tokens);
        let mut t2 = other.trees().filter(semantic_tree).flat_map(break_tokens);
        for (t1, t2) in t1.by_ref().zip(t2.by_ref()) {
            if !t1.probably_equal_for_proc_macro(&t2) {
                return false;
            }
        }
        t1.next().is_none() && t2.next().is_none()
    }
    pub fn map_enumerated<F: FnMut(usize, TokenTree) -> TokenTree>(self, mut f: F) -> TokenStream {
        TokenStream(Lrc::new(
--- a/src/librustc_parse/lib.rs
+++ b/src/librustc_parse/lib.rs
@ -7,16 +7,18 @@
 #![feature(or_patterns)]
 use rustc_ast::ast;
-use rustc_ast::token::{self, Nonterminal};
+use rustc_ast::token::{self, Nonterminal, Token, TokenKind, DelimToken};
 use rustc_ast::tokenstream::{self, TokenStream, TokenTree};
 use rustc_ast_pretty::pprust;
 use rustc_data_structures::sync::Lrc;
 use rustc_errors::{Diagnostic, FatalError, Level, PResult};
 use rustc_session::parse::ParseSess;
 use rustc_span::{FileName, SourceFile, Span};
 use rustc_span::symbol::kw;
 use std::path::Path;
 use std::str;
 use std::mem;
 use log::info;
@ -300,7 +302,7 @@ pub fn nt_to_tokenstream(nt: &Nonterminal, sess: &ParseSess, span: Span) -> Toke
    // modifications, including adding/removing typically non-semantic
    // tokens such as extra braces and commas, don't happen.
    if let Some(tokens) = tokens {
-        if tokens.probably_equal_for_proc_macro(&tokens_for_real) {
+        if tokenstream_probably_equal_for_proc_macro(&tokens, &tokens_for_real) {
            return tokens;
        }
        info!(
@ -373,3 +375,122 @@ fn prepend_attrs(
    builder.push(tokens.clone());
    Some(builder.build())
 }
 // See comments in `Nonterminal::to_tokenstream` for why we care about
 // *probably* equal here rather than actual equality
 //
 // This is otherwise the same as `eq_unspanned`, only recursing with a
 // different method.
 pub fn tokenstream_probably_equal_for_proc_macro(first: &TokenStream, other: &TokenStream) -> bool {
    // When checking for `probably_eq`, we ignore certain tokens that aren't
    // preserved in the AST. Because they are not preserved, the pretty
    // printer arbitrarily adds or removes them when printing as token
    // streams, making a comparison between a token stream generated from an
    // AST and a token stream which was parsed into an AST more reliable.
    fn semantic_tree(tree: &TokenTree) -> bool {
        if let TokenTree::Token(token) = tree {
            if let
                // The pretty printer tends to add trailing commas to
                // everything, and in particular, after struct fields.
                | token::Comma
                // The pretty printer emits `NoDelim` as whitespace.
                | token::OpenDelim(DelimToken::NoDelim)
                | token::CloseDelim(DelimToken::NoDelim)
                // The pretty printer collapses many semicolons into one.
                | token::Semi
                // The pretty printer collapses whitespace arbitrarily and can
                // introduce whitespace from `NoDelim`.
                | token::Whitespace
                // The pretty printer can turn `$crate` into `::crate_name`
                | token::ModSep = token.kind {
                return false;
            }
        }
        true
    }
    let mut t1 = first.trees().filter(semantic_tree);
    let mut t2 = other.trees().filter(semantic_tree);
    for (t1, t2) in t1.by_ref().zip(t2.by_ref()) {
        if !tokentree_probably_equal_for_proc_macro(&t1, &t2) {
            return false;
        }
    }
    t1.next().is_none() && t2.next().is_none()
 }
 // See comments in `Nonterminal::to_tokenstream` for why we care about
 // *probably* equal here rather than actual equality
 crate fn token_probably_equal_for_proc_macro(first: &Token, other: &Token) -> bool {
    use TokenKind::*;
    if mem::discriminant(&first.kind) != mem::discriminant(&other.kind) {
        return false;
    }
    match (&first.kind, &other.kind) {
        (&Eq, &Eq)
        | (&Lt, &Lt)
        | (&Le, &Le)
        | (&EqEq, &EqEq)
        | (&Ne, &Ne)
        | (&Ge, &Ge)
        | (&Gt, &Gt)
        | (&AndAnd, &AndAnd)
        | (&OrOr, &OrOr)
        | (&Not, &Not)
        | (&Tilde, &Tilde)
        | (&At, &At)
        | (&Dot, &Dot)
        | (&DotDot, &DotDot)
        | (&DotDotDot, &DotDotDot)
        | (&DotDotEq, &DotDotEq)
        | (&Comma, &Comma)
        | (&Semi, &Semi)
        | (&Colon, &Colon)
        | (&ModSep, &ModSep)
        | (&RArrow, &RArrow)
        | (&LArrow, &LArrow)
        | (&FatArrow, &FatArrow)
        | (&Pound, &Pound)
        | (&Dollar, &Dollar)
        | (&Question, &Question)
        | (&Whitespace, &Whitespace)
        | (&Comment, &Comment)
        | (&Eof, &Eof) => true,
        (&BinOp(a), &BinOp(b)) | (&BinOpEq(a), &BinOpEq(b)) => a == b,
        (&OpenDelim(a), &OpenDelim(b)) | (&CloseDelim(a), &CloseDelim(b)) => a == b,
        (&DocComment(a), &DocComment(b)) | (&Shebang(a), &Shebang(b)) => a == b,
        (&Literal(a), &Literal(b)) => a == b,
        (&Lifetime(a), &Lifetime(b)) => a == b,
        (&Ident(a, b), &Ident(c, d)) => {
            b == d && (a == c || a == kw::DollarCrate || c == kw::DollarCrate)
        }
        (&Interpolated(_), &Interpolated(_)) => false,
        _ => panic!("forgot to add a token?"),
    }
 }
 // See comments in `Nonterminal::to_tokenstream` for why we care about
 // *probably* equal here rather than actual equality
 //
 // This is otherwise the same as `eq_unspanned`, only recursing with a
 // different method.
 pub fn tokentree_probably_equal_for_proc_macro(first: &TokenTree, other: &TokenTree) -> bool {
    match (first, other) {
        (TokenTree::Token(token), TokenTree::Token(token2)) => {
            token_probably_equal_for_proc_macro(token, token2)
        }
        (TokenTree::Delimited(_, delim, tts), TokenTree::Delimited(_, delim2, tts2)) => {
            delim == delim2 && tokenstream_probably_equal_for_proc_macro(&tts, &tts2)
        }
        _ => false,
    }
 }