Update pulldown-cmark dependency

This commit is contained in:
Guillaume Gomez 2020-02-13 18:39:40 +01:00
parent 2e6eaceede
commit d8589de1f0
3 changed files with 114 additions and 100 deletions

View File

@ -1564,7 +1564,7 @@ dependencies = [
"rand_xoshiro", "rand_xoshiro",
"sized-chunks", "sized-chunks",
"typenum", "typenum",
"version_check 0.9.1", "version_check",
] ]
[[package]] [[package]]
@ -2014,9 +2014,9 @@ dependencies = [
[[package]] [[package]]
name = "memchr" name = "memchr"
version = "2.2.0" version = "2.3.2"
source = "registry+https://github.com/rust-lang/crates.io-index" source = "registry+https://github.com/rust-lang/crates.io-index"
checksum = "2efc7bc57c883d4a4d6e3246905283d8dae951bb3bd32f49d6ef297f546e1c39" checksum = "53445de381a1f436797497c61d851644d0e8e88e6140f22872ad33a704933978"
[[package]] [[package]]
name = "memmap" name = "memmap"
@ -2602,17 +2602,6 @@ dependencies = [
"url 2.1.0", "url 2.1.0",
] ]
[[package]]
name = "pulldown-cmark"
version = "0.5.3"
source = "registry+https://github.com/rust-lang/crates.io-index"
checksum = "77043da1282374688ee212dc44b3f37ff929431de9c9adc3053bd3cee5630357"
dependencies = [
"bitflags",
"memchr",
"unicase",
]
[[package]] [[package]]
name = "pulldown-cmark" name = "pulldown-cmark"
version = "0.6.1" version = "0.6.1"
@ -2625,6 +2614,17 @@ dependencies = [
"unicase", "unicase",
] ]
[[package]]
name = "pulldown-cmark"
version = "0.7.0"
source = "registry+https://github.com/rust-lang/crates.io-index"
checksum = "2c2d7fd131800e0d63df52aff46201acaab70b431a4a1ec6f0343fe8e64f35a4"
dependencies = [
"bitflags",
"memchr",
"unicase",
]
[[package]] [[package]]
name = "punycode" name = "punycode"
version = "0.4.0" version = "0.4.0"
@ -4158,7 +4158,7 @@ version = "0.0.0"
dependencies = [ dependencies = [
"itertools 0.8.0", "itertools 0.8.0",
"minifier", "minifier",
"pulldown-cmark 0.5.3", "pulldown-cmark 0.7.0",
"rustc-rayon", "rustc-rayon",
"serde", "serde",
"serde_json", "serde_json",
@ -5158,11 +5158,11 @@ checksum = "535c204ee4d8434478593480b8f86ab45ec9aae0e83c568ca81abf0fd0e88f86"
[[package]] [[package]]
name = "unicase" name = "unicase"
version = "2.5.1" version = "2.6.0"
source = "registry+https://github.com/rust-lang/crates.io-index" source = "registry+https://github.com/rust-lang/crates.io-index"
checksum = "2e2e6bd1e59e56598518beb94fd6db628ded570326f0a98c679a304bd9f00150" checksum = "50f37be617794602aabbeee0be4f259dc1778fabe05e2d67ee8f79326d5cb4f6"
dependencies = [ dependencies = [
"version_check 0.1.5", "version_check",
] ]
[[package]] [[package]]
@ -5332,12 +5332,6 @@ dependencies = [
"failure", "failure",
] ]
[[package]]
name = "version_check"
version = "0.1.5"
source = "registry+https://github.com/rust-lang/crates.io-index"
checksum = "914b1a6776c4c929a602fafd8bc742e06365d4bcbe48c30f9cca5824f70dc9dd"
[[package]] [[package]]
name = "version_check" name = "version_check"
version = "0.9.1" version = "0.9.1"

View File

@ -9,7 +9,7 @@ name = "rustdoc"
path = "lib.rs" path = "lib.rs"
[dependencies] [dependencies]
pulldown-cmark = { version = "0.5.3", default-features = false } pulldown-cmark = { version = "0.7", default-features = false }
minifier = "0.0.33" minifier = "0.0.33"
rayon = { version = "0.3.0", package = "rustc-rayon" } rayon = { version = "0.3.0", package = "rustc-rayon" }
serde = { version = "1.0", features = ["derive"] } serde = { version = "1.0", features = ["derive"] }

View File

@ -33,7 +33,7 @@ use crate::html::highlight;
use crate::html::toc::TocBuilder; use crate::html::toc::TocBuilder;
use crate::test; use crate::test;
use pulldown_cmark::{html, CowStr, Event, Options, Parser, Tag}; use pulldown_cmark::{html, CodeBlockKind, CowStr, Event, Options, Parser, Tag};
#[cfg(test)] #[cfg(test)]
mod tests; mod tests;
@ -189,10 +189,15 @@ impl<'a, I: Iterator<Item = Event<'a>>> Iterator for CodeBlocks<'_, 'a, I> {
let compile_fail; let compile_fail;
let ignore; let ignore;
let edition; let edition;
if let Some(Event::Start(Tag::CodeBlock(lang))) = event { if let Some(Event::Start(Tag::CodeBlock(kind))) = event {
let parse_result = LangString::parse(&lang, self.check_error_codes, false); let parse_result = match kind {
CodeBlockKind::Fenced(ref lang) => {
LangString::parse(&lang, self.check_error_codes, false)
}
CodeBlockKind::Indented => LangString::all_false(),
};
if !parse_result.rust { if !parse_result.rust {
return Some(Event::Start(Tag::CodeBlock(lang))); return Some(Event::Start(Tag::CodeBlock(kind)));
} }
compile_fail = parse_result.compile_fail; compile_fail = parse_result.compile_fail;
ignore = parse_result.ignore; ignore = parse_result.ignore;
@ -370,11 +375,11 @@ impl<'a, 'b, 'ids, I: Iterator<Item = Event<'a>>> Iterator for HeadingLinks<'a,
} }
let event = self.inner.next(); let event = self.inner.next();
if let Some(Event::Start(Tag::Header(level))) = event { if let Some(Event::Start(Tag::Heading(level))) = event {
let mut id = String::new(); let mut id = String::new();
for event in &mut self.inner { for event in &mut self.inner {
match &event { match &event {
Event::End(Tag::Header(..)) => break, Event::End(Tag::Heading(..)) => break,
Event::Text(text) | Event::Code(text) => { Event::Text(text) | Event::Code(text) => {
id.extend(text.chars().filter_map(slugify)); id.extend(text.chars().filter_map(slugify));
} }
@ -391,10 +396,10 @@ impl<'a, 'b, 'ids, I: Iterator<Item = Event<'a>>> Iterator for HeadingLinks<'a,
let mut html_header = String::new(); let mut html_header = String::new();
html::push_html(&mut html_header, self.buf.iter().cloned()); html::push_html(&mut html_header, self.buf.iter().cloned());
let sec = builder.push(level as u32, html_header, id.clone()); let sec = builder.push(level as u32, html_header, id.clone());
self.buf.push_front(Event::InlineHtml(format!("{} ", sec).into())); self.buf.push_front(Event::Html(format!("{} ", sec).into()));
} }
self.buf.push_back(Event::InlineHtml(format!("</a></h{}>", level).into())); self.buf.push_back(Event::Html(format!("</a></h{}>", level).into()));
let start_tags = format!( let start_tags = format!(
"<h{level} id=\"{id}\" class=\"section-header\">\ "<h{level} id=\"{id}\" class=\"section-header\">\
@ -402,7 +407,7 @@ impl<'a, 'b, 'ids, I: Iterator<Item = Event<'a>>> Iterator for HeadingLinks<'a,
id = id, id = id,
level = level level = level
); );
return Some(Event::InlineHtml(start_tags.into())); return Some(Event::Html(start_tags.into()));
} }
event event
} }
@ -556,40 +561,44 @@ pub fn find_testable_code<T: test::Tester>(
error_codes: ErrorCodes, error_codes: ErrorCodes,
enable_per_target_ignores: bool, enable_per_target_ignores: bool,
) { ) {
let mut parser = Parser::new(doc); let mut parser = Parser::new(doc).into_offset_iter();
let mut prev_offset = 0; let mut prev_offset = 0;
let mut nb_lines = 0; let mut nb_lines = 0;
let mut register_header = None; let mut register_header = None;
while let Some(event) = parser.next() { while let Some((event, offset)) = parser.next() {
match event { match event {
Event::Start(Tag::CodeBlock(s)) => { Event::Start(Tag::CodeBlock(kind)) => {
let offset = parser.get_offset(); let block_info = match kind {
CodeBlockKind::Fenced(ref lang) => {
let block_info = if s.is_empty() { if lang.is_empty() {
LangString::all_false() LangString::all_false()
} else { } else {
LangString::parse(&*s, error_codes, enable_per_target_ignores) LangString::parse(lang, error_codes, enable_per_target_ignores)
}
}
CodeBlockKind::Indented => LangString::all_false(),
}; };
if !block_info.rust { if !block_info.rust {
continue; continue;
} }
let mut test_s = String::new(); let mut test_s = String::new();
while let Some(Event::Text(s)) = parser.next() { while let Some((Event::Text(s), _)) = parser.next() {
test_s.push_str(&s); test_s.push_str(&s);
} }
let text = test_s let text = test_s
.lines() .lines()
.map(|l| map_line(l).for_code()) .map(|l| map_line(l).for_code())
.collect::<Vec<Cow<'_, str>>>() .collect::<Vec<Cow<'_, str>>>()
.join("\n"); .join("\n");
nb_lines += doc[prev_offset..offset].lines().count();
let line = tests.get_line() + nb_lines; nb_lines += doc[prev_offset..offset.start].lines().count();
let line = tests.get_line() + nb_lines + 1;
tests.add_test(text, block_info, line); tests.add_test(text, block_info, line);
prev_offset = offset; prev_offset = offset.start;
} }
Event::Start(Tag::Header(level)) => { Event::Start(Tag::Heading(level)) => {
register_header = Some(level as u32); register_header = Some(level as u32);
} }
Event::Text(ref s) if register_header.is_some() => { Event::Text(ref s) if register_header.is_some() => {
@ -783,7 +792,7 @@ impl MarkdownHtml<'_> {
// Treat inline HTML as plain text. // Treat inline HTML as plain text.
let p = p.map(|event| match event { let p = p.map(|event| match event {
Event::Html(text) | Event::InlineHtml(text) => Event::Text(text), Event::Html(text) => Event::Text(text),
_ => event, _ => event,
}); });
@ -842,10 +851,10 @@ pub fn plain_summary_line(md: &str) -> String {
let next_event = next_event.unwrap(); let next_event = next_event.unwrap();
let (ret, is_in) = match next_event { let (ret, is_in) = match next_event {
Event::Start(Tag::Paragraph) => (None, 1), Event::Start(Tag::Paragraph) => (None, 1),
Event::Start(Tag::Header(_)) => (None, 1), Event::Start(Tag::Heading(_)) => (None, 1),
Event::Code(code) => (Some(format!("`{}`", code)), 0), Event::Code(code) => (Some(format!("`{}`", code)), 0),
Event::Text(ref s) if self.is_in > 0 => (Some(s.as_ref().to_owned()), 0), Event::Text(ref s) if self.is_in > 0 => (Some(s.as_ref().to_owned()), 0),
Event::End(Tag::Paragraph) | Event::End(Tag::Header(_)) => (None, -1), Event::End(Tag::Paragraph) | Event::End(Tag::Heading(_)) => (None, -1),
_ => (None, 0), _ => (None, 0),
}; };
if is_in > 0 || (is_in < 0 && self.is_in > 0) { if is_in > 0 || (is_in < 0 && self.is_in > 0) {
@ -940,68 +949,79 @@ crate fn rust_code_blocks(md: &str) -> Vec<RustCodeBlock> {
return code_blocks; return code_blocks;
} }
let mut p = Parser::new_ext(md, opts()); let mut p = Parser::new_ext(md, opts()).into_offset_iter();
let mut code_block_start = 0;
let mut code_start = 0;
let mut is_fenced = false;
let mut previous_offset = 0;
let mut in_rust_code_block = false;
while let Some(event) = p.next() {
let offset = p.get_offset();
while let Some((event, offset)) = p.next() {
match event { match event {
Event::Start(Tag::CodeBlock(syntax)) => { Event::Start(Tag::CodeBlock(syntax)) => {
let lang_string = if syntax.is_empty() { let (syntax, code_start, code_end, range, is_fenced) = match syntax {
LangString::all_false() CodeBlockKind::Fenced(syntax) => {
} else { let syntax = syntax.as_ref();
LangString::parse(&*syntax, ErrorCodes::Yes, false) let lang_string = if syntax.is_empty() {
}; LangString::all_false()
} else {
if lang_string.rust { LangString::parse(&*syntax, ErrorCodes::Yes, false)
in_rust_code_block = true; };
if !lang_string.rust {
code_start = offset; continue;
code_block_start = match md[previous_offset..offset].find("```") {
Some(fence_idx) => {
is_fenced = true;
previous_offset + fence_idx
} }
None => { let syntax = if syntax.is_empty() { None } else { Some(syntax.to_owned()) };
is_fenced = false; let (code_start, mut code_end) = match p.next() {
offset Some((Event::Text(_), offset)) => (offset.start, offset.end),
Some((_, sub_offset)) => {
let code = Range { start: sub_offset.start, end: sub_offset.start };
code_blocks.push(RustCodeBlock {
is_fenced: true,
range: offset,
code,
syntax,
});
continue;
}
None => {
let code = Range { start: offset.end, end: offset.end };
code_blocks.push(RustCodeBlock {
is_fenced: true,
range: offset,
code,
syntax,
});
continue;
}
};
while let Some((Event::Text(_), offset)) = p.next() {
code_end = offset.end;
} }
}; (syntax, code_start, code_end, offset, true)
} }
} CodeBlockKind::Indented => {
Event::End(Tag::CodeBlock(syntax)) if in_rust_code_block => { // The ending of the offset goes too far sometime so we reduce it by one in
in_rust_code_block = false; // these cases.
if offset.end > offset.start
let code_block_end = if is_fenced { && md.get(offset.end..=offset.end) == Some(&"\n")
let fence_str = &md[previous_offset..offset].chars().rev().collect::<String>(); {
fence_str (
.find("```") None,
.map(|fence_idx| offset - fence_idx) offset.start,
.unwrap_or_else(|| offset) offset.end,
} else if md.as_bytes().get(offset).map(|b| *b == b'\n').unwrap_or_default() { Range { start: offset.start, end: offset.end - 1 },
offset - 1 false,
} else { )
offset } else {
(None, offset.start, offset.end, offset, false)
}
}
}; };
let code_end = if is_fenced { previous_offset } else { code_block_end };
code_blocks.push(RustCodeBlock { code_blocks.push(RustCodeBlock {
is_fenced, is_fenced,
range: Range { start: code_block_start, end: code_block_end }, range,
code: Range { start: code_start, end: code_end }, code: Range { start: code_start, end: code_end },
syntax: if !syntax.is_empty() { Some(syntax.into_string()) } else { None }, syntax,
}); });
} }
_ => (), _ => (),
} }
previous_offset = offset;
} }
code_blocks code_blocks