Fix large block comments

This commit is contained in:
Marcus Klaas 2015-10-19 21:41:47 +02:00
parent 3970748f59
commit e8447a8210
13 changed files with 314 additions and 68 deletions

4
Cargo.lock generated
View file

@ -7,7 +7,7 @@ dependencies = [
"rustc-serialize 0.3.16 (registry+https://github.com/rust-lang/crates.io-index)", "rustc-serialize 0.3.16 (registry+https://github.com/rust-lang/crates.io-index)",
"strings 0.0.1 (git+https://github.com/nrc/strings.rs.git)", "strings 0.0.1 (git+https://github.com/nrc/strings.rs.git)",
"term 0.2.12 (registry+https://github.com/rust-lang/crates.io-index)", "term 0.2.12 (registry+https://github.com/rust-lang/crates.io-index)",
"toml 0.1.22 (registry+https://github.com/rust-lang/crates.io-index)", "toml 0.1.23 (registry+https://github.com/rust-lang/crates.io-index)",
"unicode-segmentation 0.1.2 (registry+https://github.com/rust-lang/crates.io-index)", "unicode-segmentation 0.1.2 (registry+https://github.com/rust-lang/crates.io-index)",
] ]
@ -93,7 +93,7 @@ dependencies = [
[[package]] [[package]]
name = "toml" name = "toml"
version = "0.1.22" version = "0.1.23"
source = "registry+https://github.com/rust-lang/crates.io-index" source = "registry+https://github.com/rust-lang/crates.io-index"
dependencies = [ dependencies = [
"rustc-serialize 0.3.16 (registry+https://github.com/rust-lang/crates.io-index)", "rustc-serialize 0.3.16 (registry+https://github.com/rust-lang/crates.io-index)",

View file

@ -81,11 +81,11 @@ pub fn rewrite_comment(orig: &str,
let rewrite = try_opt!(rewrite_string(line, &fmt)); let rewrite = try_opt!(rewrite_string(line, &fmt));
result.push_str(&rewrite); result.push_str(&rewrite);
} else { } else {
if line.len() == 0 { if line.len() == 0 || line.starts_with('!') {
result.pop(); // Remove space if this is an empty comment. // Remove space if this is an empty comment or a doc comment.
} else { result.pop();
result.push_str(line);
} }
result.push_str(line);
} }
first = false; first = false;
@ -162,7 +162,7 @@ pub fn contains_comment(text: &str) -> bool {
CharClasses::new(text.chars()).any(|(kind, _)| kind == CodeCharKind::Comment) CharClasses::new(text.chars()).any(|(kind, _)| kind == CodeCharKind::Comment)
} }
pub struct CharClasses<T> struct CharClasses<T>
where T: Iterator, where T: Iterator,
T::Item: RichChar T::Item: RichChar
{ {
@ -170,7 +170,7 @@ pub struct CharClasses<T>
status: CharClassesStatus, status: CharClassesStatus,
} }
pub trait RichChar { trait RichChar {
fn get_char(&self) -> char; fn get_char(&self) -> char;
} }
@ -211,7 +211,7 @@ pub enum CodeCharKind {
} }
impl<T> CharClasses<T> where T: Iterator, T::Item: RichChar { impl<T> CharClasses<T> where T: Iterator, T::Item: RichChar {
pub fn new(base: T) -> CharClasses<T> { fn new(base: T) -> CharClasses<T> {
CharClasses { CharClasses {
base: base.peekable(), base: base.peekable(),
status: CharClassesStatus::Normal, status: CharClassesStatus::Normal,
@ -291,10 +291,6 @@ impl<T> Iterator for CharClasses<T> where T: Iterator, T::Item: RichChar {
'\n' => CharClassesStatus::Normal, '\n' => CharClassesStatus::Normal,
_ => CharClassesStatus::LineComment, _ => CharClassesStatus::LineComment,
}; };
// let code_char_kind = match chr {
// '\n' => CodeCharKind::Normal,
// _ => CodeCharKind::Comment,
// };
return Some((CodeCharKind::Comment, item)); return Some((CodeCharKind::Comment, item));
} }
}; };
@ -302,9 +298,12 @@ impl<T> Iterator for CharClasses<T> where T: Iterator, T::Item: RichChar {
} }
} }
/// Iterator over an alternating sequence of functional and commented parts of
/// a string. The first item is always a, possibly zero length, subslice of
/// functional text. Line style comments contain their ending newlines.
pub struct CommentCodeSlices<'a> { pub struct CommentCodeSlices<'a> {
slice: &'a str, slice: &'a str,
last_slice_type: CodeCharKind, last_slice_kind: CodeCharKind,
last_slice_end: usize, last_slice_end: usize,
} }
@ -312,7 +311,7 @@ impl<'a> CommentCodeSlices<'a> {
pub fn new(slice: &'a str) -> CommentCodeSlices<'a> { pub fn new(slice: &'a str) -> CommentCodeSlices<'a> {
CommentCodeSlices { CommentCodeSlices {
slice: slice, slice: slice,
last_slice_type: CodeCharKind::Comment, last_slice_kind: CodeCharKind::Comment,
last_slice_end: 0, last_slice_end: 0,
} }
} }
@ -327,32 +326,52 @@ impl<'a> Iterator for CommentCodeSlices<'a> {
} }
let mut sub_slice_end = self.last_slice_end; let mut sub_slice_end = self.last_slice_end;
for (kind, (i, _)) in CharClasses::new(self.slice[self.last_slice_end..].char_indices()) { let mut first_whitespace = None;
if kind == self.last_slice_type { let subslice = &self.slice[self.last_slice_end..];
sub_slice_end = self.last_slice_end + i; let mut iter = CharClasses::new(subslice.char_indices());
for (kind, (i, c)) in &mut iter {
let is_comment_connector = self.last_slice_kind == CodeCharKind::Normal &&
&subslice[..2] == "//" &&
[' ', '\t'].contains(&c);
if is_comment_connector && first_whitespace.is_none() {
first_whitespace = Some(i);
}
if kind == self.last_slice_kind && !is_comment_connector {
let last_index = match first_whitespace {
Some(j) => j,
None => i,
};
sub_slice_end = self.last_slice_end + last_index;
break; break;
} }
if !is_comment_connector {
first_whitespace = None;
}
} }
let kind = match self.last_slice_type { if let (None, true) = (iter.next(), sub_slice_end == self.last_slice_end) {
// This was the last subslice.
sub_slice_end = match first_whitespace {
Some(i) => self.last_slice_end + i,
None => self.slice.len(),
};
}
let kind = match self.last_slice_kind {
CodeCharKind::Comment => CodeCharKind::Normal, CodeCharKind::Comment => CodeCharKind::Normal,
CodeCharKind::Normal => CodeCharKind::Comment, CodeCharKind::Normal => CodeCharKind::Comment,
}; };
self.last_slice_type = kind; let res = (kind,
self.last_slice_end,
&self.slice[self.last_slice_end..sub_slice_end]);
self.last_slice_end = sub_slice_end;
self.last_slice_kind = kind;
// FIXME: be consistent in use of kind vs type. Some(res)
if sub_slice_end == self.last_slice_end {
// This was the last subslice.
self.last_slice_end = self.slice.len();
Some((kind, sub_slice_end, &self.slice[sub_slice_end..]))
} else {
let res = (kind,
self.last_slice_end,
&self.slice[self.last_slice_end..sub_slice_end]);
self.last_slice_end = sub_slice_end;
Some(res)
}
} }
} }
@ -362,10 +381,20 @@ mod test {
CommentCodeSlices}; CommentCodeSlices};
use Indent; use Indent;
#[test]
fn char_classes() {
let mut iter = CharClasses::new("//\n\n".chars());
assert_eq!((CodeCharKind::Comment, '/'), iter.next().unwrap());
assert_eq!((CodeCharKind::Comment, '/'), iter.next().unwrap());
assert_eq!((CodeCharKind::Comment, '\n'), iter.next().unwrap());
assert_eq!((CodeCharKind::Normal, '\n'), iter.next().unwrap());
assert_eq!(None, iter.next());
}
#[test] #[test]
fn comment_code_slices() { fn comment_code_slices() {
let input = "code(); /* test */ 1 + 1"; let input = "code(); /* test */ 1 + 1";
let mut iter = CommentCodeSlices::new(input); let mut iter = CommentCodeSlices::new(input);
assert_eq!((CodeCharKind::Normal, 0, "code(); "), iter.next().unwrap()); assert_eq!((CodeCharKind::Normal, 0, "code(); "), iter.next().unwrap());
@ -375,6 +404,31 @@ mod test {
assert_eq!(None, iter.next()); assert_eq!(None, iter.next());
} }
#[test]
fn comment_code_slices_two() {
let input = "// comment\n test();";
let mut iter = CommentCodeSlices::new(input);
assert_eq!((CodeCharKind::Normal, 0, ""), iter.next().unwrap());
assert_eq!((CodeCharKind::Comment, 0, "// comment\n"),
iter.next().unwrap());
assert_eq!((CodeCharKind::Normal, 11, " test();"),
iter.next().unwrap());
assert_eq!(None, iter.next());
}
#[test]
fn comment_code_slices_three() {
let input = "1 // comment\n // comment2\n\n";
let mut iter = CommentCodeSlices::new(input);
assert_eq!((CodeCharKind::Normal, 0, "1 "), iter.next().unwrap());
assert_eq!((CodeCharKind::Comment, 2, "// comment\n // comment2\n"),
iter.next().unwrap());
assert_eq!((CodeCharKind::Normal, 29, "\n"), iter.next().unwrap());
assert_eq!(None, iter.next());
}
#[test] #[test]
#[rustfmt_skip] #[rustfmt_skip]
fn format_comments() { fn format_comments() {
@ -434,7 +488,6 @@ mod test {
#[test] #[test]
fn test_find_uncommented() { fn test_find_uncommented() {
fn check(haystack: &str, needle: &str, expected: Option<usize>) { fn check(haystack: &str, needle: &str, expected: Option<usize>) {
println!("haystack {:?}, needle: {:?}", haystack, needle);
assert_eq!(expected, haystack.find_uncommented(needle)); assert_eq!(expected, haystack.find_uncommented(needle));
} }

View file

@ -471,10 +471,6 @@ impl Rewrite for ast::Block {
visitor.visit_block(self); visitor.visit_block(self);
// Push text between last block item and end of block
let snippet = visitor.snippet(mk_sp(visitor.last_pos, self.span.hi));
visitor.buffer.push_str(&snippet);
Some(format!("{}{}", prefix, visitor.buffer)) Some(format!("{}{}", prefix, visitor.buffer))
} }
} }
@ -1534,8 +1530,8 @@ pub fn rewrite_assign_rhs<S: Into<String>>(context: &RewriteContext,
let new_offset = offset.block_indent(context.config); let new_offset = offset.block_indent(context.config);
result.push_str(&format!("\n{}", new_offset.to_string(context.config))); result.push_str(&format!("\n{}", new_offset.to_string(context.config)));
// FIXME: we probably should related max_width to width instead of config.max_width // FIXME: we probably should related max_width to width instead of
// where is the 1 coming from anyway? // config.max_width where is the 1 coming from anyway?
let max_width = try_opt!(context.config.max_width.checked_sub(new_offset.width() + 1)); let max_width = try_opt!(context.config.max_width.checked_sub(new_offset.width() + 1));
let inner_context = context.nested_context(); let inner_context = context.nested_context();
let rhs = ex.rewrite(&inner_context, max_width, new_offset); let rhs = ex.rewrite(&inner_context, max_width, new_offset);

View file

@ -287,8 +287,8 @@ impl<'a> FmtVisitor<'a> {
has_body: bool) has_body: bool)
-> Option<(String, bool)> { -> Option<(String, bool)> {
let mut force_new_line_for_brace = false; let mut force_new_line_for_brace = false;
// FIXME we'll lose any comments in between parts of the function decl, but anyone // FIXME we'll lose any comments in between parts of the function decl, but
// who comments there probably deserves what they get. // anyone who comments there probably deserves what they get.
let where_clause = &generics.where_clause; let where_clause = &generics.where_clause;
@ -1008,7 +1008,8 @@ impl<'a> FmtVisitor<'a> {
span_start, span_start,
span_end); span_end);
let item_vec = items.collect::<Vec<_>>(); let item_vec = items.collect::<Vec<_>>();
// FIXME: we don't need to collect here if the where_layout isnt horizontalVertical // FIXME: we don't need to collect here if the where_layout isnt
// HorizontalVertical.
let tactic = definitive_tactic(&item_vec, self.config.where_layout, budget); let tactic = definitive_tactic(&item_vec, self.config.where_layout, budget);
let fmt = ListFormatting { let fmt = ListFormatting {

View file

@ -10,7 +10,7 @@
use visitor::FmtVisitor; use visitor::FmtVisitor;
use syntax::codemap::{self, BytePos, Span}; use syntax::codemap::{self, BytePos, Span, Pos};
use comment::{CodeCharKind, CommentCodeSlices, rewrite_comment}; use comment::{CodeCharKind, CommentCodeSlices, rewrite_comment};
impl<'a> FmtVisitor<'a> { impl<'a> FmtVisitor<'a> {
@ -55,22 +55,116 @@ impl<'a> FmtVisitor<'a> {
self.last_pos = end; self.last_pos = end;
let span = codemap::mk_sp(start, end); let span = codemap::mk_sp(start, end);
self.write_snippet(&snippet, &process_last_snippet); self.write_snippet(span, &process_last_snippet);
} }
fn write_snippet<F: Fn(&mut FmtVisitor, &str, &str)>(&mut self, fn write_snippet<F>(&mut self, span: Span, process_last_snippet: F)
snippet: &str, where F: Fn(&mut FmtVisitor, &str, &str)
process_last_snippet: F) { {
let mut lines: Vec<&str> = snippet.lines().collect(); // Get a snippet from the file start to the span's hi without allocating.
let last_snippet = if snippet.ends_with("\n") { // We need it to determine what precedes the current comment. If the comment
"" // follows code on the same line, we won't touch it.
} else { let big_span_lo = self.codemap.lookup_char_pos(span.lo).file.start_pos;
lines.pop().unwrap() let local_begin = self.codemap.lookup_byte_offset(big_span_lo);
}; let local_end = self.codemap.lookup_byte_offset(span.hi);
for line in lines.iter() { let start_index = local_begin.pos.to_usize();
self.buffer.push_str(line.trim_right()); let end_index = local_end.pos.to_usize();
self.buffer.push_str("\n"); let big_snippet = &local_begin.fm.src.as_ref().unwrap()[start_index..end_index];
let big_diff = (span.lo - big_span_lo).to_usize();
let snippet = self.snippet(span);
self.write_snippet_inner(big_snippet, big_diff, &snippet, process_last_snippet);
}
fn write_snippet_inner<F>(&mut self,
big_snippet: &str,
big_diff: usize,
snippet: &str,
process_last_snippet: F)
where F: Fn(&mut FmtVisitor, &str, &str)
{
// Trim whitespace from the right hand side of each line.
// Annoyingly, the library functions for splitting by lines etc. are not
// quite right, so we must do it ourselves.
let mut line_start = 0;
let mut last_wspace = None;
let mut rewrite_next_comment = true;
for (kind, offset, subslice) in CommentCodeSlices::new(snippet) {
if let CodeCharKind::Comment = kind {
let last_char = big_snippet[..(offset + big_diff)]
.chars()
.rev()
.skip_while(|rev_c| [' ', '\t'].contains(&rev_c))
.next();
let fix_indent = last_char.map(|rev_c| ['{', '\n'].contains(&rev_c))
.unwrap_or(true);
if rewrite_next_comment && fix_indent {
if let Some('{') = last_char {
self.buffer.push_str("\n");
}
let comment_width = ::std::cmp::min(self.config.ideal_width,
self.config.max_width -
self.block_indent.width());
self.buffer.push_str(&self.block_indent.to_string(self.config));
self.buffer.push_str(&rewrite_comment(subslice,
false,
comment_width,
self.block_indent,
self.config)
.unwrap());
last_wspace = None;
line_start = offset + subslice.len();
if let Some('/') = subslice.chars().skip(1).next() {
self.buffer.push_str("\n");
} else if line_start < snippet.len() {
let x = (&snippet[line_start..]).chars().next().unwrap() != '\n';
if x {
self.buffer.push_str("\n");
}
}
continue;
} else {
rewrite_next_comment = false;
}
}
for (mut i, c) in subslice.char_indices() {
i += offset;
if c == '\n' {
if let Some(lw) = last_wspace {
self.buffer.push_str(&snippet[line_start..lw]);
self.buffer.push_str("\n");
} else {
self.buffer.push_str(&snippet[line_start..i + 1]);
}
line_start = i + 1;
last_wspace = None;
rewrite_next_comment = rewrite_next_comment || kind == CodeCharKind::Normal;
} else {
if c.is_whitespace() {
if last_wspace.is_none() {
last_wspace = Some(i);
}
} else {
rewrite_next_comment = rewrite_next_comment || kind == CodeCharKind::Normal;
last_wspace = None;
}
}
}
} }
process_last_snippet(self, &last_snippet, snippet);
process_last_snippet(self, &snippet[line_start..], &snippet);
} }
} }

View file

@ -101,11 +101,22 @@ impl<'a, 'v> visit::Visitor<'v> for FmtVisitor<'a> {
} }
} }
self.block_indent = self.block_indent.block_unindent(self.config);
// TODO: we should compress any newlines here to just one // TODO: we should compress any newlines here to just one
self.format_missing_with_indent(b.span.hi - brace_compensation); self.format_missing_with_indent(b.span.hi - brace_compensation);
// FIXME: this is a terrible hack to indent the comments between the last
// item in the block and the closing brace to the block's level.
// The closing brace itself, however, should be indented at a shallower
// level.
let total_len = self.buffer.len;
let chars_too_many = if self.config.hard_tabs {
1
} else {
self.config.tab_spaces
};
self.buffer.truncate(total_len - chars_too_many);
self.buffer.push_str("}"); self.buffer.push_str("}");
self.last_pos = b.span.hi; self.last_pos = b.span.hi;
self.block_indent = self.block_indent.block_unindent(self.config);
} }
// Note that this only gets called for function definitions. Required methods // Note that this only gets called for function definitions. Required methods
@ -177,6 +188,7 @@ impl<'a, 'v> visit::Visitor<'v> for FmtVisitor<'a> {
// FIXME(#78): format traits and impl definitions. // FIXME(#78): format traits and impl definitions.
ast::Item_::ItemImpl(..) | ast::Item_::ItemImpl(..) |
ast::Item_::ItemTrait(..) => { ast::Item_::ItemTrait(..) => {
self.format_missing_with_indent(item.span.lo);
self.block_indent = self.block_indent.block_indent(self.config); self.block_indent = self.block_indent.block_indent(self.config);
visit::walk_item(self, item); visit::walk_item(self, item);
self.block_indent = self.block_indent.block_unindent(self.config); self.block_indent = self.block_indent.block_unindent(self.config);
@ -215,6 +227,9 @@ impl<'a, 'v> visit::Visitor<'v> for FmtVisitor<'a> {
} }
ast::Item_::ItemMac(..) => { ast::Item_::ItemMac(..) => {
self.format_missing_with_indent(item.span.lo); self.format_missing_with_indent(item.span.lo);
let snippet = self.snippet(item.span);
self.buffer.push_str(&snippet);
self.last_pos = item.span.hi;
// FIXME: we cannot format these yet, because of a bad span. // FIXME: we cannot format these yet, because of a bad span.
// See rust lang issue #28424. // See rust lang issue #28424.
// visit::walk_item(self, item); // visit::walk_item(self, item);

39
tests/source/comment.rs Normal file
View file

@ -0,0 +1,39 @@
//! Doc comment
fn test() {
// comment
// comment2
code(); /* leave this comment alone!
* ok? */
/* Lorem ipsum dolor sit amet, consectetur adipiscing elit. Donec a
* diam lectus. Sed sit amet ipsum mauris. Maecenas congue ligula ac quam
* viverra nec consectetur ante hendrerit. Donec et mollis dolor.
* Praesent et diam eget libero egestas mattis sit amet vitae augue. Nam
* tincidunt congue enim, ut porta lorem lacinia consectetur. Donec ut
* libero sed arcu vehicula ultricies a non tortor. Lorem ipsum dolor sit
* amet, consectetur adipiscing elit. Aenean ut gravida lorem. Ut turpis
* felis, pulvinar a semper sed, adipiscing id dolor. */
// Very looooooooooooooooooooooooooooooooooooooooooooooooooooooooong comment that should be split
// println!("{:?}", rewrite_comment(subslice,
// false,
// comment_width,
// self.block_indent,
// self.config)
// .unwrap());
funk(); //dontchangeme
// or me
}
/// test123
fn doc_comment() {
}
fn chains() {
foo.bar(|| {
let x = 10;
/* comment */ x })
}

View file

@ -19,7 +19,7 @@ fn main() {
}; };
let loooooooooooooong_name = |field| { let loooooooooooooong_name = |field| {
// TODO(#27): format comments. // TODO(#27): format comments.
if field.node.attrs.len() > 0 { if field.node.attrs.len() > 0 {
field.node.attrs[0].span.lo field.node.attrs[0].span.lo
} else { } else {
@ -39,7 +39,8 @@ fn main() {
let empty = |arg| {}; let empty = |arg| {};
let simple = |arg| { /* TODO(#27): comment formatting */ let simple = |arg| {
// TODO(#27): comment formatting
foo(arg) foo(arg)
}; };

42
tests/target/comment.rs Normal file
View file

@ -0,0 +1,42 @@
//! Doc comment
fn test() {
// comment
// comment2
code(); /* leave this comment alone!
* ok? */
// Lorem ipsum dolor sit amet, consectetur adipiscing elit. Donec a
// diam lectus. Sed sit amet ipsum mauris. Maecenas congue ligula ac quam
// viverra nec consectetur ante hendrerit. Donec et mollis dolor.
// Praesent et diam eget libero egestas mattis sit amet vitae augue. Nam
// tincidunt congue enim, ut porta lorem lacinia consectetur. Donec ut
// libero sed arcu vehicula ultricies a non tortor. Lorem ipsum dolor sit
// amet, consectetur adipiscing elit. Aenean ut gravida lorem. Ut turpis
// felis, pulvinar a semper sed, adipiscing id dolor.
// Very looooooooooooooooooooooooooooooooooooooooooooooooooooooooong comment
// that should be split
// println!("{:?}", rewrite_comment(subslice,
// false,
// comment_width,
// self.block_indent,
// self.config)
// .unwrap());
funk(); //dontchangeme
// or me
}
/// test123
fn doc_comment() {
}
fn chains() {
foo.bar(|| {
let x = 10;
// comment
x
})
}

View file

@ -1,3 +1,3 @@
// sadfsdfa // sadfsdfa
//sdffsdfasdf // sdffsdfasdf

View file

@ -142,7 +142,8 @@ fn baz() {
fn qux() { fn qux() {
{} {}
// FIXME this one could be done better. // FIXME this one could be done better.
{ /* a block with a comment */ {
// a block with a comment
} }
{ {

View file

@ -6,7 +6,8 @@ fn foo() {
// Some comment. // Some comment.
a => foo(), a => foo(),
b if 0 < 42 => foo(), b if 0 < 42 => foo(),
c => { // Another comment. c => {
// Another comment.
// Comment. // Comment.
an_expression; an_expression;
foo() foo()
@ -112,7 +113,8 @@ fn issue339() {
// collapsing here exceeds line length // collapsing here exceeds line length
ffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffg => { ffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffffg => {
} }
h => { // comment above block h => {
// comment above block
} }
i => {} // comment below block i => {} // comment below block
j => { j => {
@ -133,7 +135,8 @@ fn issue339() {
m => {} m => {}
n => {} n => {}
o => {} o => {}
p => { // Dont collapse me p => {
// Dont collapse me
} }
q => {} q => {}
r => {} r => {}

View file

@ -22,7 +22,8 @@ mod doc;
mod other; mod other;
// sfdgfffffffffffffffffffffffffffffffffffffffffffffffffffffff ffffffffffffffffffffffffffffffffffffffffff // sfdgfffffffffffffffffffffffffffffffffffffffffffffffffffffff
// ffffffffffffffffffffffffffffffffffffffffff
fn foo(a: isize, b: u32 /* blah blah */, c: f64) { fn foo(a: isize, b: u32 /* blah blah */, c: f64) {