Auto merge of #103185 - chenyukang:yukang/fix-span-next-point, r=davidtwco
Fix the bug of next_point in source_map. There is a bug in `next_point`: the new span does not move to the next position the first time it is called. Because of this, our current code works like this: 1. When we really want to move to the next position, we call `next_point` twice. 2. Some code that uses `next_point` actually does the same thing as `shrink_to_hi`. This fix makes sure that when `next_point` is called, the span moves forward by a width of at least 1, and that it also works correctly with multi-byte characters. Ref: https://github.com/rust-lang/rust/pull/103140#discussion_r997710998 r? `@davidtwco`
This commit is contained in:
commit
53728ff751
9 changed files with 71 additions and 20 deletions
|
@ -853,20 +853,27 @@ impl SourceMap {
|
|||
}
|
||||
|
||||
/// Returns a new span representing the next character after the end-point of this span.
|
||||
/// Special cases:
|
||||
/// - if span is a dummy one, returns the same span
|
||||
/// - if next_point reached the end of source, return span with lo = hi
|
||||
/// - respect multi-byte characters
|
||||
pub fn next_point(&self, sp: Span) -> Span {
|
||||
if sp.is_dummy() {
|
||||
return sp;
|
||||
}
|
||||
let start_of_next_point = sp.hi().0;
|
||||
|
||||
let width = self.find_width_of_character_at_span(sp.shrink_to_hi(), true);
|
||||
// If the width is 1, then the next span should point to the same `lo` and `hi`. However,
|
||||
// in the case of a multibyte character, where the width != 1, the next span should
|
||||
let width = self.find_width_of_character_at_span(sp, true);
|
||||
if width == 0 {
|
||||
return Span::new(sp.hi(), sp.hi(), sp.ctxt(), None);
|
||||
}
|
||||
// If the width is 1, then the next span should only contain the next char besides current ending.
|
||||
// However, in the case of a multibyte character, where the width != 1, the next span should
|
||||
// span multiple bytes to include the whole character.
|
||||
let end_of_next_point =
|
||||
start_of_next_point.checked_add(width - 1).unwrap_or(start_of_next_point);
|
||||
start_of_next_point.checked_add(width).unwrap_or(start_of_next_point);
|
||||
|
||||
let end_of_next_point = BytePos(cmp::max(sp.lo().0 + 1, end_of_next_point));
|
||||
let end_of_next_point = BytePos(cmp::max(start_of_next_point + 1, end_of_next_point));
|
||||
Span::new(BytePos(start_of_next_point), end_of_next_point, sp.ctxt(), None)
|
||||
}
|
||||
|
||||
|
@ -874,7 +881,8 @@ impl SourceMap {
|
|||
/// depending on the `forwards` parameter.
|
||||
fn find_width_of_character_at_span(&self, sp: Span, forwards: bool) -> u32 {
|
||||
let sp = sp.data();
|
||||
if sp.lo == sp.hi {
|
||||
|
||||
if sp.lo == sp.hi && !forwards {
|
||||
debug!("find_width_of_character_at_span: early return empty span");
|
||||
return 1;
|
||||
}
|
||||
|
@ -908,9 +916,9 @@ impl SourceMap {
|
|||
let source_len = (local_begin.sf.end_pos - local_begin.sf.start_pos).to_usize();
|
||||
debug!("find_width_of_character_at_span: source_len=`{:?}`", source_len);
|
||||
// Ensure indexes are also not malformed.
|
||||
if start_index > end_index || end_index > source_len {
|
||||
if start_index > end_index || end_index > source_len - 1 {
|
||||
debug!("find_width_of_character_at_span: source indexes are malformed");
|
||||
return 1;
|
||||
return 0;
|
||||
}
|
||||
|
||||
let src = local_begin.sf.external_src.borrow();
|
||||
|
|
|
@ -479,3 +479,48 @@ fn path_prefix_remapping_expand_to_absolute() {
|
|||
RealFileName::Remapped { local_path: None, virtual_name: path("XYZ/src/main.rs") }
|
||||
);
|
||||
}
|
||||
|
||||
#[test]
|
||||
fn test_next_point() {
|
||||
let sm = SourceMap::new(FilePathMapping::empty());
|
||||
sm.new_source_file(PathBuf::from("example.rs").into(), "a…b".to_string());
|
||||
|
||||
// Dummy spans don't advance.
|
||||
let span = DUMMY_SP;
|
||||
let span = sm.next_point(span);
|
||||
assert_eq!(span.lo().0, 0);
|
||||
assert_eq!(span.hi().0, 0);
|
||||
|
||||
// Span advance respect multi-byte character
|
||||
let span = Span::with_root_ctxt(BytePos(0), BytePos(1));
|
||||
assert_eq!(sm.span_to_snippet(span), Ok("a".to_string()));
|
||||
let span = sm.next_point(span);
|
||||
assert_eq!(sm.span_to_snippet(span), Ok("…".to_string()));
|
||||
assert_eq!(span.lo().0, 1);
|
||||
assert_eq!(span.hi().0, 4);
|
||||
|
||||
// An empty span pointing just before a multi-byte character should
|
||||
// advance to contain the multi-byte character.
|
||||
let span = Span::with_root_ctxt(BytePos(1), BytePos(1));
|
||||
let span = sm.next_point(span);
|
||||
assert_eq!(span.lo().0, 1);
|
||||
assert_eq!(span.hi().0, 4);
|
||||
|
||||
let span = Span::with_root_ctxt(BytePos(1), BytePos(4));
|
||||
let span = sm.next_point(span);
|
||||
assert_eq!(span.lo().0, 4);
|
||||
assert_eq!(span.hi().0, 5);
|
||||
|
||||
// A non-empty span at the last byte should advance to create an empty
|
||||
// span pointing at the end of the file.
|
||||
let span = Span::with_root_ctxt(BytePos(4), BytePos(5));
|
||||
let span = sm.next_point(span);
|
||||
assert_eq!(span.lo().0, 5);
|
||||
assert_eq!(span.hi().0, 5);
|
||||
|
||||
// Empty span pointing just past the last byte.
|
||||
let span = Span::with_root_ctxt(BytePos(5), BytePos(5));
|
||||
let span = sm.next_point(span);
|
||||
assert_eq!(span.lo().0, 5);
|
||||
assert_eq!(span.hi().0, 5);
|
||||
}
|
||||
|
|
Loading…
Add table
Add a link
Reference in a new issue