Shrink Token
.
From 72 bytes to 12 bytes (on x86-64). There are two parts to this: - Changing various source code offsets from 64-bit to 32-bit. This is not a problem because the rest of rustc also uses 32-bit source code offsets. This means `Token` is no longer `Copy` but this causes no problems. - Removing the `RawStrError` from `LiteralKind`. Raw string literal invalidity is now indicated by a `None` value within `RawStr`/`RawByteStr`, and the new `validate_raw_str` function can be used to re-lex an invalid raw string literal to get the `RawStrError`. There is one very small change in behaviour. Previously, if a raw string literal matched both the `InvalidStarter` and `TooManyHashes` cases, the latter would override the former. This has now changed, because `raw_double_quoted_string` now uses `?` and so returns immediately upon detecting the `InvalidStarter` case. I think this is a slight improvement to report the earlier-detected error, and it explains the change in the `test_too_many_hashes` test. The commit also removes a couple of comments that refer to #77629 and say that the size of these types don't affect performance. These comments are wrong, though the performance effect is small.
This commit is contained in:
parent
e6b9fccfb1
commit
99f5c79d64
9 changed files with 111 additions and 103 deletions
|
@ -27,7 +27,7 @@ use unescape_error_reporting::{emit_unescape_error, escaped_char};
|
|||
// This assertion is in this crate, rather than in `rustc_lexer`, because that
|
||||
// crate cannot depend on `rustc_data_structures`.
|
||||
#[cfg(all(target_arch = "x86_64", target_pointer_width = "64"))]
|
||||
rustc_data_structures::static_assert_size!(rustc_lexer::Token, 72);
|
||||
rustc_data_structures::static_assert_size!(rustc_lexer::Token, 12);
|
||||
|
||||
#[derive(Clone, Debug)]
|
||||
pub struct UnmatchedBrace {
|
||||
|
@ -88,7 +88,7 @@ impl<'a> StringReader<'a> {
|
|||
let token = rustc_lexer::first_token(text);
|
||||
|
||||
let start = self.pos;
|
||||
self.pos = self.pos + BytePos::from_usize(token.len);
|
||||
self.pos = self.pos + BytePos(token.len);
|
||||
|
||||
debug!("next_token: {:?}({:?})", token.kind, self.str_from(start));
|
||||
|
||||
|
@ -240,7 +240,7 @@ impl<'a> StringReader<'a> {
|
|||
token::Ident(sym, false)
|
||||
}
|
||||
rustc_lexer::TokenKind::Literal { kind, suffix_start } => {
|
||||
let suffix_start = start + BytePos(suffix_start as u32);
|
||||
let suffix_start = start + BytePos(suffix_start);
|
||||
let (kind, symbol) = self.cook_lexer_literal(start, suffix_start, kind);
|
||||
let suffix = if suffix_start < self.pos {
|
||||
let string = self.str_from(suffix_start);
|
||||
|
@ -405,15 +405,21 @@ impl<'a> StringReader<'a> {
|
|||
}
|
||||
(token::ByteStr, Mode::ByteStr, 2, 1) // b" "
|
||||
}
|
||||
rustc_lexer::LiteralKind::RawStr { n_hashes, err } => {
|
||||
self.report_raw_str_error(start, err);
|
||||
let n = u32::from(n_hashes);
|
||||
(token::StrRaw(n_hashes), Mode::RawStr, 2 + n, 1 + n) // r##" "##
|
||||
rustc_lexer::LiteralKind::RawStr { n_hashes } => {
|
||||
if let Some(n_hashes) = n_hashes {
|
||||
let n = u32::from(n_hashes);
|
||||
(token::StrRaw(n_hashes), Mode::RawStr, 2 + n, 1 + n) // r##" "##
|
||||
} else {
|
||||
self.report_raw_str_error(start, 1);
|
||||
}
|
||||
}
|
||||
rustc_lexer::LiteralKind::RawByteStr { n_hashes, err } => {
|
||||
self.report_raw_str_error(start, err);
|
||||
let n = u32::from(n_hashes);
|
||||
(token::ByteStrRaw(n_hashes), Mode::RawByteStr, 3 + n, 1 + n) // br##" "##
|
||||
rustc_lexer::LiteralKind::RawByteStr { n_hashes } => {
|
||||
if let Some(n_hashes) = n_hashes {
|
||||
let n = u32::from(n_hashes);
|
||||
(token::ByteStrRaw(n_hashes), Mode::RawByteStr, 3 + n, 1 + n) // br##" "##
|
||||
} else {
|
||||
self.report_raw_str_error(start, 2);
|
||||
}
|
||||
}
|
||||
rustc_lexer::LiteralKind::Int { base, empty_int } => {
|
||||
return if empty_int {
|
||||
|
@ -484,17 +490,17 @@ impl<'a> StringReader<'a> {
|
|||
&self.src[self.src_index(start)..self.src_index(end)]
|
||||
}
|
||||
|
||||
fn report_raw_str_error(&self, start: BytePos, opt_err: Option<RawStrError>) {
|
||||
match opt_err {
|
||||
Some(RawStrError::InvalidStarter { bad_char }) => {
|
||||
fn report_raw_str_error(&self, start: BytePos, prefix_len: u32) -> ! {
|
||||
match rustc_lexer::validate_raw_str(self.str_from(start), prefix_len) {
|
||||
Err(RawStrError::InvalidStarter { bad_char }) => {
|
||||
self.report_non_started_raw_string(start, bad_char)
|
||||
}
|
||||
Some(RawStrError::NoTerminator { expected, found, possible_terminator_offset }) => self
|
||||
Err(RawStrError::NoTerminator { expected, found, possible_terminator_offset }) => self
|
||||
.report_unterminated_raw_string(start, expected, possible_terminator_offset, found),
|
||||
Some(RawStrError::TooManyDelimiters { found }) => {
|
||||
Err(RawStrError::TooManyDelimiters { found }) => {
|
||||
self.report_too_many_hashes(start, found)
|
||||
}
|
||||
None => (),
|
||||
Ok(()) => panic!("no error found for supposedly invalid raw string literal"),
|
||||
}
|
||||
}
|
||||
|
||||
|
@ -511,9 +517,9 @@ impl<'a> StringReader<'a> {
|
|||
fn report_unterminated_raw_string(
|
||||
&self,
|
||||
start: BytePos,
|
||||
n_hashes: usize,
|
||||
possible_offset: Option<usize>,
|
||||
found_terminators: usize,
|
||||
n_hashes: u32,
|
||||
possible_offset: Option<u32>,
|
||||
found_terminators: u32,
|
||||
) -> ! {
|
||||
let mut err = self.sess.span_diagnostic.struct_span_fatal_with_code(
|
||||
self.mk_sp(start, start),
|
||||
|
@ -526,7 +532,7 @@ impl<'a> StringReader<'a> {
|
|||
if n_hashes > 0 {
|
||||
err.note(&format!(
|
||||
"this raw string should be terminated with `\"{}`",
|
||||
"#".repeat(n_hashes)
|
||||
"#".repeat(n_hashes as usize)
|
||||
));
|
||||
}
|
||||
|
||||
|
@ -537,7 +543,7 @@ impl<'a> StringReader<'a> {
|
|||
err.span_suggestion(
|
||||
span,
|
||||
"consider terminating the string here",
|
||||
"#".repeat(n_hashes),
|
||||
"#".repeat(n_hashes as usize),
|
||||
Applicability::MaybeIncorrect,
|
||||
);
|
||||
}
|
||||
|
@ -638,7 +644,7 @@ impl<'a> StringReader<'a> {
|
|||
}
|
||||
}
|
||||
|
||||
fn report_too_many_hashes(&self, start: BytePos, found: usize) -> ! {
|
||||
fn report_too_many_hashes(&self, start: BytePos, found: u32) -> ! {
|
||||
self.fatal_span_(
|
||||
start,
|
||||
self.pos,
|
||||
|
|
Loading…
Add table
Add a link
Reference in a new issue