auto merge of #15421 : catharsis/rust/doc-ffi-minor-fixes, r=alexcrichton

[rust.git] / src / librustdoc / html / highlight.rs
diff --git a/src/librustdoc/html/highlight.rs b/src/librustdoc/html/highlight.rs

index 7ac2db2184bf4be02ec2945c99d191cc74dfc7fb..3cb5cdc04396227677bc8cdfd9e09636e5f8f133 100644 (file)
--- a/src/librustdoc/html/highlight.rs
+++ b/src/librustdoc/html/highlight.rs
@@ -18,26 +18,26 @@
  
  use syntax::parse;
  use syntax::parse::lexer;
-use syntax::codemap::{BytePos, Span};
  
  use html::escape::Escape;
  
  use t = syntax::parse::token;
  
  /// Highlights some source code, returning the HTML output.
-pub fn highlight(src: &str, class: Option<&str>) -> StrBuf {
+pub fn highlight(src: &str, class: Option<&str>, id: Option<&str>) -> String {
      debug!("highlighting: ================\n{}\n==============", src);
      let sess = parse::new_parse_sess();
      let fm = parse::string_to_filemap(&sess,
-                                      src.to_strbuf(),
-                                      "<stdin>".to_strbuf());
+                                      src.to_string(),
+                                      "<stdin>".to_string());
  
      let mut out = io::MemWriter::new();
      doit(&sess,
-         lexer::new_string_reader(&sess.span_diagnostic, fm),
+         lexer::StringReader::new(&sess.span_diagnostic, fm),
           class,
+         id,
           &mut out).unwrap();
-    str::from_utf8_lossy(out.unwrap().as_slice()).to_strbuf()
+    str::from_utf8_lossy(out.unwrap().as_slice()).to_string()
  }
  
  /// Exhausts the `lexer` writing the output into `out`.
@@ -47,43 +47,41 @@ pub fn highlight(src: &str, class: Option<&str>) -> StrBuf {
  /// it's used. All source code emission is done as slices from the source map,
  /// not from the tokens themselves, in order to stay true to the original
  /// source.
-fn doit(sess: &parse::ParseSess, mut lexer: lexer::StringReader, class: Option<&str>,
+fn doit(sess: &parse::ParseSess, mut lexer: lexer::StringReader,
+        class: Option<&str>, id: Option<&str>,
          out: &mut Writer) -> io::IoResult<()> {
      use syntax::parse::lexer::Reader;
  
-    try!(write!(out, "<pre class='rust {}'>\n", class.unwrap_or("")));
-    let mut last = BytePos(0);
+    try!(write!(out, "<pre "));
+    match id {
+        Some(id) => try!(write!(out, "id='{}' ", id)),
+        None => {}
+    }
+    try!(write!(out, "class='rust {}'>\n", class.unwrap_or("")));
      let mut is_attribute = false;
      let mut is_macro = false;
      let mut is_macro_nonterminal = false;
      loop {
          let next = lexer.next_token();
-        let test = if next.tok == t::EOF {lexer.pos} else {next.sp.lo};
-
-        // The lexer consumes all whitespace and non-doc-comments when iterating
-        // between tokens. If this token isn't directly adjacent to our last
-        // token, then we need to emit the whitespace/comment.
-        //
-        // If the gap has any '/' characters then we consider the whole thing a
-        // comment. This will classify some whitespace as a comment, but that
-        // doesn't matter too much for syntax highlighting purposes.
-        if test > last {
-            let snip = sess.span_diagnostic.cm.span_to_snippet(Span {
-                lo: last,
-                hi: test,
-                expn_info: None,
-            }).unwrap();
-            if snip.as_slice().contains("/") {
-                try!(write!(out, "<span class='comment'>{}</span>",
-                              Escape(snip.as_slice())));
-            } else {
-                try!(write!(out, "{}", Escape(snip.as_slice())));
-            }
-        }
-        last = next.sp.hi;
+
+        let snip = |sp| sess.span_diagnostic.cm.span_to_snippet(sp).unwrap();
+
          if next.tok == t::EOF { break }
  
          let klass = match next.tok {
+            t::WS => {
+                try!(write!(out, "{}", Escape(snip(next.sp).as_slice())));
+                continue
+            },
+            t::COMMENT => {
+                try!(write!(out, "<span class='comment'>{}</span>",
+                            Escape(snip(next.sp).as_slice())));
+                continue
+            },
+            t::SHEBANG(s) => {
+                try!(write!(out, "{}", Escape(s.as_str())));
+                continue
+            },
              // If this '&' token is directly adjacent to another token, assume
              // that it's the address-of operator instead of the and-operator.
              // This allows us to give all pointers their own class (`Box` and
@@ -103,7 +101,7 @@ fn doit(sess: &parse::ParseSess, mut lexer: lexer::StringReader, class: Option<&
              // miscellaneous, no highlighting
              t::DOT | t::DOTDOT | t::DOTDOTDOT | t::COMMA | t::SEMI |
                  t::COLON | t::MOD_SEP | t::LARROW | t::LPAREN |
-                t::RPAREN | t::LBRACKET | t::LBRACE | t::RBRACE => "",
+                t::RPAREN | t::LBRACKET | t::LBRACE | t::RBRACE | t::QUESTION => "",
              t::DOLLAR => {
                  if t::is_ident(&lexer.peek().tok) {
                      is_macro_nonterminal = true;
@@ -119,7 +117,7 @@ fn doit(sess: &parse::ParseSess, mut lexer: lexer::StringReader, class: Option<&
              // span when we see the ']'.
              t::POUND => {
                  is_attribute = true;
-                try!(write!(out, r"<span class='attribute'>\#"));
+                try!(write!(out, r"<span class='attribute'>#"));
                  continue
              }
              t::RBRACKET => {
@@ -133,11 +131,11 @@ fn doit(sess: &parse::ParseSess, mut lexer: lexer::StringReader, class: Option<&
              }
  
              // text literals
-            t::LIT_CHAR(..) | t::LIT_STR(..) | t::LIT_STR_RAW(..) => "string",
+            t::LIT_BYTE(..) | t::LIT_BINARY(..) | t::LIT_BINARY_RAW(..) |
+                t::LIT_CHAR(..) | t::LIT_STR(..) | t::LIT_STR_RAW(..) => "string",
  
              // number literals
-            t::LIT_INT(..) | t::LIT_UINT(..) | t::LIT_INT_UNSUFFIXED(..) |
-                t::LIT_FLOAT(..) | t::LIT_FLOAT_UNSUFFIXED(..) => "number",
+            t::LIT_INTEGER(..) | t::LIT_FLOAT(..) => "number",
  
              // keywords are also included in the identifier set
              t::IDENT(ident, _is_mod_sep) => {