discard trailing blank comments

[rust.git] / src / comment.rs
diff --git a/src/comment.rs b/src/comment.rs

index 378fe40d569890a30aad1289f055f2a75e274daa..4f2f813166b09d1080cd03fa0635d1804d100316 100644 (file)
--- a/src/comment.rs
+++ b/src/comment.rs
@@ -20,6 +20,7 @@
  use shape::{Indent, Shape};
  use string::{rewrite_string, StringFormat};
  use utils::{count_newlines, first_line_width, last_line_width};
+use {ErrorKind, FormattingError};
  
  fn is_custom_comment(comment: &str) -> bool {
      if !comment.starts_with("//") {
@@ -95,21 +96,6 @@ pub fn line_start(&self) -> &'a str {
      pub fn to_str_tuplet(&self) -> (&'a str, &'a str, &'a str) {
          (self.opener(), self.closer(), self.line_start())
      }
-
-    pub fn line_with_same_comment_style(&self, line: &str, normalize_comments: bool) -> bool {
-        match *self {
-            CommentStyle::DoubleSlash | CommentStyle::TripleSlash | CommentStyle::Doc => {
-                line.trim_left().starts_with(self.line_start().trim_left())
-                    || comment_style(line, normalize_comments) == *self
-            }
-            CommentStyle::DoubleBullet | CommentStyle::SingleBullet | CommentStyle::Exclamation => {
-                line.trim_left().starts_with(self.closer().trim_left())
-                    || line.trim_left().starts_with(self.line_start().trim_left())
-                    || comment_style(line, normalize_comments) == *self
-            }
-            CommentStyle::Custom(opener) => line.trim_left().starts_with(opener.trim_right()),
-        }
-    }
  }
  
  fn comment_style(orig: &str, normalize_comments: bool) -> CommentStyle {
@@ -249,7 +235,8 @@ fn _rewrite_comment(
      // If there are lines without a starting sigil, we won't format them correctly
      // so in that case we won't even re-align (if !config.normalize_comments()) and
      // we should stop now.
-    let num_bare_lines = orig.lines()
+    let num_bare_lines = orig
+        .lines()
          .map(|line| line.trim())
          .filter(|l| !(l.starts_with('*') || l.starts_with("//") || l.starts_with("/*")))
          .count();
@@ -271,17 +258,56 @@ fn identify_comment(
      is_doc_comment: bool,
  ) -> Option<String> {
      let style = comment_style(orig, false);
-    let first_group = orig.lines()
-        .take_while(|l| style.line_with_same_comment_style(l, false))
-        .collect::<Vec<_>>()
-        .join("\n");
-    let rest = orig.lines()
-        .skip(first_group.lines().count())
-        .collect::<Vec<_>>()
-        .join("\n");
+    let mut first_group_ending = 0;
+
+    fn compute_len(orig: &str, line: &str) -> usize {
+        if orig.len() > line.len() {
+            if orig.as_bytes()[line.len()] == b'\r' {
+                line.len() + 2
+            } else {
+                line.len() + 1
+            }
+        } else {
+            line.len()
+        }
+    }
+
+    match style {
+        CommentStyle::DoubleSlash | CommentStyle::TripleSlash | CommentStyle::Doc => {
+            let line_start = style.line_start().trim_left();
+            for line in orig.lines() {
+                if line.trim_left().starts_with(line_start) || comment_style(line, false) == style {
+                    first_group_ending += compute_len(&orig[first_group_ending..], line);
+                } else {
+                    break;
+                }
+            }
+        }
+        CommentStyle::Custom(opener) => {
+            let trimmed_opener = opener.trim_right();
+            for line in orig.lines() {
+                if line.trim_left().starts_with(trimmed_opener) {
+                    first_group_ending += compute_len(&orig[first_group_ending..], line);
+                } else {
+                    break;
+                }
+            }
+        }
+        // for a block comment, search for the closing symbol
+        CommentStyle::DoubleBullet | CommentStyle::SingleBullet | CommentStyle::Exclamation => {
+            let closer = style.closer().trim_left();
+            for line in orig.lines() {
+                first_group_ending += compute_len(&orig[first_group_ending..], line);
+                if line.trim_left().ends_with(closer) {
+                    break;
+                }
+            }
+        }
+    }
  
+    let (first_group, rest) = orig.split_at(first_group_ending);
      let first_group_str = rewrite_comment_inner(
-        &first_group,
+        first_group,
          block_style,
          style,
          shape,
@@ -291,7 +317,7 @@ fn identify_comment(
      if rest.is_empty() {
          Some(first_group_str)
      } else {
-        identify_comment(&rest, block_style, shape, config, is_doc_comment).map(|rest_str| {
+        identify_comment(rest, block_style, shape, config, is_doc_comment).map(|rest_str| {
              format!(
                  "{}\n{}{}",
                  first_group_str,
@@ -333,7 +359,8 @@ fn rewrite_comment_inner(
      };
  
      let line_breaks = count_newlines(orig.trim_right());
-    let lines = orig.lines()
+    let lines = orig
+        .lines()
          .enumerate()
          .map(|(i, mut line)| {
              line = trim_right_unless_two_whitespaces(line.trim_left(), is_doc_comment);
@@ -343,8 +370,7 @@ fn rewrite_comment_inner(
              }
  
              line
-        })
-        .map(|s| left_trim_comment_line(s, &style))
+        }).map(|s| left_trim_comment_line(s, &style))
          .map(|(line, has_leading_whitespace)| {
              if orig.starts_with("/*") && line_breaks == 0 {
                  (
@@ -383,14 +409,20 @@ fn rewrite_comment_inner(
              if line.starts_with("```") {
                  inside_code_block = false;
                  result.push_str(&comment_line_separator);
-                let code_block = ::format_code_block(&code_block_buffer, config)
-                    .unwrap_or_else(|| code_block_buffer.to_owned());
+                let code_block = {
+                    let mut config = config.clone();
+                    config.set().wrap_comments(false);
+                    match ::format_code_block(&code_block_buffer, &config) {
+                        Some(ref s) => trim_custom_comment_prefix(s),
+                        None => trim_custom_comment_prefix(&code_block_buffer),
+                    }
+                };
                  result.push_str(&join_code_block_with_comment_line_separator(&code_block));
                  code_block_buffer.clear();
                  result.push_str(&comment_line_separator);
                  result.push_str(line);
              } else {
-                code_block_buffer.push_str(line);
+                code_block_buffer.push_str(&hide_sharp_behind_comment(line));
                  code_block_buffer.push('\n');
  
                  if is_last {
@@ -398,14 +430,14 @@ fn rewrite_comment_inner(
                      // We will leave them untouched.
                      result.push_str(&comment_line_separator);
                      result.push_str(&join_code_block_with_comment_line_separator(
-                        &code_block_buffer,
+                        &trim_custom_comment_prefix(&code_block_buffer),
                      ));
                  }
              }
  
              continue;
          } else {
-            inside_code_block = line.starts_with("```rust");
+            inside_code_block = line.starts_with("```");
  
              if result == opener {
                  let force_leading_whitespace = opener == "/* " && count_newlines(orig) == 0;
@@ -417,8 +449,12 @@ fn rewrite_comment_inner(
                  }
              } else if is_prev_line_multi_line && !line.is_empty() {
                  result.push(' ')
-            } else if is_last && !closer.is_empty() && line.is_empty() {
-                result.push_str(&indent_str);
+            } else if is_last && line.is_empty() {
+                // trailing blank lines are unwanted
+                if !closer.is_empty() {
+                    result.push_str(&indent_str);
+                }
+                break;
              } else {
                  result.push_str(&comment_line_separator);
                  if !has_leading_whitespace && result.ends_with(' ') {
@@ -428,7 +464,7 @@ fn rewrite_comment_inner(
          }
  
          if config.wrap_comments() && line.len() > fmt.shape.width && !has_url(line) {
-            match rewrite_string(line, &fmt, Some(max_chars)) {
+            match rewrite_string(line, &fmt) {
                  Some(ref s) => {
                      is_prev_line_multi_line = s.contains('\n');
                      result.push_str(s);
@@ -439,7 +475,7 @@ fn rewrite_comment_inner(
                      result.pop();
                      result.push_str(&comment_line_separator);
                      fmt.shape = Shape::legacy(max_chars, fmt_indent);
-                    match rewrite_string(line, &fmt, Some(max_chars)) {
+                    match rewrite_string(line, &fmt) {
                          Some(ref s) => {
                              is_prev_line_multi_line = s.contains('\n');
                              result.push_str(s);
@@ -460,7 +496,7 @@ fn rewrite_comment_inner(
                  // 1 = " "
                  let offset = 1 + last_line_width(&result) - line_start.len();
                  Shape {
-                    width: max_chars.checked_sub(offset).unwrap_or(0),
+                    width: max_chars.saturating_sub(offset),
                      indent: fmt_indent,
                      offset: fmt.shape.offset + offset,
                  }
@@ -487,6 +523,29 @@ fn rewrite_comment_inner(
      Some(result)
  }
  
+const RUSTFMT_CUSTOM_COMMENT_PREFIX: &str = "//#### ";
+
+fn hide_sharp_behind_comment<'a>(s: &'a str) -> Cow<'a, str> {
+    if s.trim_left().starts_with("# ") {
+        Cow::from(format!("{}{}", RUSTFMT_CUSTOM_COMMENT_PREFIX, s))
+    } else {
+        Cow::from(s)
+    }
+}
+
+fn trim_custom_comment_prefix(s: &str) -> String {
+    s.lines()
+        .map(|line| {
+            let left_trimmed = line.trim_left();
+            if left_trimmed.starts_with(RUSTFMT_CUSTOM_COMMENT_PREFIX) {
+                left_trimmed.trim_left_matches(RUSTFMT_CUSTOM_COMMENT_PREFIX)
+            } else {
+                line
+            }
+        }).collect::<Vec<_>>()
+        .join("\n")
+}
+
  /// Returns true if the given string MAY include URLs or alike.
  fn has_url(s: &str) -> bool {
      // This function may return false positive, but should get its job done in most cases.
@@ -553,7 +612,8 @@ fn light_rewrite_comment(
      config: &Config,
      is_doc_comment: bool,
  ) -> Option<String> {
-    let lines: Vec<&str> = orig.lines()
+    let lines: Vec<&str> = orig
+        .lines()
          .map(|l| {
              // This is basically just l.trim(), but in the case that a line starts
              // with `*` we want to leave one space before it, so it aligns with the
@@ -570,8 +630,7 @@ fn light_rewrite_comment(
              };
              // Preserve markdown's double-space line break syntax in doc comment.
              trim_right_unless_two_whitespaces(left_trimmed, is_doc_comment)
-        })
-        .collect();
+        }).collect();
      Some(lines.join(&format!("\n{}", offset.to_string(config))))
  }
  
@@ -579,7 +638,9 @@ fn light_rewrite_comment(
  /// Does not trim all whitespace. If a single space is trimmed from the left of the string,
  /// this function returns true.
  fn left_trim_comment_line<'a>(line: &'a str, style: &CommentStyle) -> (&'a str, bool) {
-    if line.starts_with("//! ") || line.starts_with("/// ") || line.starts_with("/*! ")
+    if line.starts_with("//! ")
+        || line.starts_with("/// ")
+        || line.starts_with("/*! ")
          || line.starts_with("/** ")
      {
          (&line[4..], true)
@@ -589,13 +650,18 @@ fn left_trim_comment_line<'a>(line: &'a str, style: &CommentStyle) -> (&'a str,
          } else {
              (&line[opener.trim_right().len()..], false)
          }
-    } else if line.starts_with("/* ") || line.starts_with("// ") || line.starts_with("//!")
-        || line.starts_with("///") || line.starts_with("** ")
+    } else if line.starts_with("/* ")
+        || line.starts_with("// ")
+        || line.starts_with("//!")
+        || line.starts_with("///")
+        || line.starts_with("** ")
          || line.starts_with("/*!")
          || (line.starts_with("/**") && !line.starts_with("/**/"))
      {
          (&line[3..], line.chars().nth(2).unwrap() == ' ')
-    } else if line.starts_with("/*") || line.starts_with("* ") || line.starts_with("//")
+    } else if line.starts_with("/*")
+        || line.starts_with("* ")
+        || line.starts_with("//")
          || line.starts_with("**")
      {
          (&line[2..], line.chars().nth(1).unwrap() == ' ')
@@ -1082,13 +1148,38 @@ pub fn recover_comment_removed(
  ) -> Option<String> {
      let snippet = context.snippet(span);
      if snippet != new && changed_comment_content(snippet, &new) {
-        // We missed some comments. Keep the original text.
+        // We missed some comments. Warn and keep the original text.
+        if context.config.error_on_unformatted() {
+            context.report.append(
+                context.codemap.span_to_filename(span).into(),
+                vec![FormattingError::from_span(
+                    &span,
+                    &context.codemap,
+                    ErrorKind::LostComment,
+                )],
+            );
+        }
          Some(snippet.to_owned())
      } else {
          Some(new)
      }
  }
  
+pub fn filter_normal_code(code: &str) -> String {
+    let mut buffer = String::with_capacity(code.len());
+    LineClasses::new(code).for_each(|(kind, line)| match kind {
+        FullCodeCharKind::Normal | FullCodeCharKind::InString => {
+            buffer.push_str(&line);
+            buffer.push('\n');
+        }
+        _ => (),
+    });
+    if !code.ends_with("\n") && buffer.ends_with("\n") {
+        buffer.pop();
+    }
+    buffer
+}
+
  /// Return true if the two strings of code have the same payload of comments.
  /// The payload of comments is everything in the string except:
  ///     - actual code (not comments)
@@ -1139,6 +1230,7 @@ fn new(comment: &'a str) -> CommentReducer<'a> {
  
  impl<'a> Iterator for CommentReducer<'a> {
      type Item = char;
+
      fn next(&mut self) -> Option<Self::Item> {
          loop {
              let mut c = self.iter.next()?;
@@ -1240,7 +1332,7 @@ fn comment_code_slices_three() {
      }
  
      #[test]
-    #[cfg_attr(rustfmt, rustfmt_skip)]
+    #[rustfmt::skip]
      fn format_comments() {
          let mut config: ::config::Config = Default::default();
          config.set().wrap_comments(true);
@@ -1287,8 +1379,7 @@ fn uncommented(text: &str) -> String {
              .filter_map(|(s, c)| match s {
                  FullCodeCharKind::Normal | FullCodeCharKind::InString => Some(c),
                  _ => None,
-            })
-            .collect()
+            }).collect()
      }
  
      #[test]
@@ -1342,4 +1433,21 @@ fn test_remove_trailing_white_spaces() {
          let s = format!("    r#\"\n        test\n    \"#");
          assert_eq!(remove_trailing_white_spaces(&s), s);
      }
+
+    #[test]
+    fn test_filter_normal_code() {
+        let s = r#"
+fn main() {
+    println!("hello, world");
+}
+"#;
+        assert_eq!(s, filter_normal_code(s));
+        let s_with_comment = r#"
+fn main() {
+    // hello, world
+    println!("hello, world");
+}
+"#;
+        assert_eq!(s, filter_normal_code(s_with_comment));
+    }
  }