zola/components/rendering/src/markdown.rs

252 lines
10 KiB
Rust
Raw Normal View History

2018-10-31 07:18:57 +00:00
use std::borrow::Cow::{Borrowed, Owned};
2017-03-07 12:34:31 +00:00
use self::cmark::{Event, Options, Parser, Tag};
2017-03-07 12:34:31 +00:00
use pulldown_cmark as cmark;
2017-04-06 07:07:18 +00:00
use slug::slugify;
2017-03-07 12:34:31 +00:00
use syntect::easy::HighlightLines;
2018-10-31 07:18:57 +00:00
use syntect::html::{
start_highlighted_html_snippet, styled_line_to_highlighted_html, IncludeBackground,
};
2017-03-27 14:17:33 +00:00
2018-10-31 07:18:57 +00:00
use config::highlighting::{get_highlighter, SYNTAX_SET, THEME_SET};
2017-07-01 07:47:41 +00:00
use errors::Result;
use link_checker::check_url;
2018-10-31 07:18:57 +00:00
use utils::site::resolve_internal_link;
2018-05-06 20:58:39 +00:00
use context::RenderContext;
2018-10-31 07:18:57 +00:00
use table_of_contents::{make_table_of_contents, Header, TempHeader};
2018-05-06 20:58:39 +00:00
/// HTML emitted in place of an HTML event containing `<!-- more -->`.
/// `markdown_to_html` also searches the rendered output for this exact string
/// to compute `Rendered::summary_len`.
const CONTINUE_READING: &str = "<p><a name=\"continue-reading\"></a></p>\n";
2018-08-24 21:37:39 +00:00
#[derive(Debug)]
pub struct Rendered {
pub body: String,
pub summary_len: Option<usize>,
2018-09-30 19:15:09 +00:00
pub toc: Vec<Header>,
}
2018-05-06 20:58:39 +00:00
/// Returns an anchor id derived from `name` that is not yet present in `anchors`.
///
/// We might have cases where the slug is already present in our list of anchors,
/// for example an article could have several titles named Example.
/// We add a counter after the slug if the slug is already present, which
/// means we will have `example`, `example-1`, `example-2` etc.
///
/// `level` is the last suffix already known to be taken; pass `0` to try the
/// bare slug first. For any other value the bare slug is skipped and the
/// search starts at `name-(level + 1)`.
fn find_anchor(anchors: &[String], name: String, level: u8) -> String {
    if level == 0 && !anchors.contains(&name) {
        return name;
    }

    // Count in a wider type than `level`: with more than 255 duplicates of the
    // same slug a `u8` counter overflows (panic in debug builds, wrap-around
    // in release builds). The loop always terminates because `anchors` is
    // finite, so some suffix within the next `anchors.len() + 1` is free.
    let mut suffix = usize::from(level) + 1;
    loop {
        let candidate = format!("{}-{}", name, suffix);
        if !anchors.contains(&candidate) {
            return candidate;
        }
        suffix += 1;
    }
}
2017-03-07 12:34:31 +00:00
/// Returns `true` if `link` looks like a link to a colocated asset.
///
/// Colocated asset links refer to files in the same directory as the page,
/// so the link should be a filename only: anything containing a `/`
/// (`http://`, `ftp://`, `../` etc) or starting with `mailto:` is rejected.
///
/// Note that any other slash-free string passes this check, including a bare
/// fragment such as `#anchor`.
fn is_colocated_asset_link(link: &str) -> bool {
    !link.contains('/') // http://, ftp://, ../ etc
        && !link.starts_with("mailto:")
}
pub fn markdown_to_html(content: &str, context: &RenderContext) -> Result<Rendered> {
2018-05-06 20:58:39 +00:00
// the rendered html
2018-05-07 19:03:51 +00:00
let mut html = String::with_capacity(content.len());
2017-03-27 14:17:33 +00:00
// Set while parsing
let mut error = None;
2018-05-06 20:58:39 +00:00
let mut background = IncludeBackground::Yes;
2018-10-09 12:33:43 +00:00
let mut highlighter: Option<(HighlightLines, bool)> = None;
2017-04-06 07:07:18 +00:00
// If we get text in header, we need to insert the id and a anchor
let mut in_header = false;
// pulldown_cmark can send several text events for a title if there are markdown
// specific characters like `!` in them. We only want to insert the anchor the first time
2017-09-27 14:09:13 +00:00
let mut header_created = false;
2017-06-16 04:00:48 +00:00
let mut anchors: Vec<String> = vec![];
let mut headers = vec![];
// Defaults to a 0 level so not a real header
// It should be an Option ideally but not worth the hassle to update
let mut temp_header = TempHeader::default();
let mut opts = Options::empty();
let mut has_summary = false;
opts.insert(Options::ENABLE_TABLES);
opts.insert(Options::ENABLE_FOOTNOTES);
2017-03-27 14:17:33 +00:00
{
let parser = Parser::new_ext(content, opts).map(|event| {
match event {
2018-05-06 20:58:39 +00:00
Event::Text(text) => {
// Header first
if in_header {
if header_created {
temp_header.add_text(&text);
return Event::Html(Borrowed(""));
2018-05-06 20:58:39 +00:00
}
// += as we might have some <code> or other things already there
temp_header.add_text(&text);
2018-05-06 20:58:39 +00:00
header_created = true;
return Event::Html(Borrowed(""));
2017-09-27 14:09:13 +00:00
}
2018-05-06 20:58:39 +00:00
// if we are in the middle of a code block
2018-10-09 12:33:43 +00:00
if let Some((ref mut highlighter, in_extra)) = highlighter {
let highlighted = if in_extra {
if let Some(ref extra) = context.config.extra_syntax_set {
highlighter.highlight(&text, &extra)
} else {
unreachable!("Got a highlighter from extra syntaxes but no extra?");
}
} else {
highlighter.highlight(&text, &SYNTAX_SET)
};
//let highlighted = &highlighter.highlight(&text, ss);
let html = styled_line_to_highlighted_html(&highlighted, background);
2018-05-06 20:58:39 +00:00
return Event::Html(Owned(html));
}
2018-05-06 20:58:39 +00:00
// Business as usual
Event::Text(text)
2018-07-31 13:17:31 +00:00
}
2018-05-06 20:58:39 +00:00
Event::Start(Tag::CodeBlock(ref info)) => {
if !context.config.highlight_code {
return Event::Html(Borrowed("<pre><code>"));
2017-03-27 14:17:33 +00:00
}
2018-05-07 16:38:04 +00:00
2018-05-06 20:58:39 +00:00
let theme = &THEME_SET.themes[&context.config.highlight_theme];
2018-10-09 12:33:43 +00:00
highlighter = Some(get_highlighter(info, &context.config));
// This selects the background color the same way that start_coloured_html_snippet does
2018-10-31 07:18:57 +00:00
let color =
theme.settings.background.unwrap_or(::syntect::highlighting::Color::WHITE);
2018-10-09 12:33:43 +00:00
background = IncludeBackground::IfDifferent(color);
let snippet = start_highlighted_html_snippet(theme);
Event::Html(Owned(snippet.0))
2018-07-31 13:17:31 +00:00
}
2018-05-06 20:58:39 +00:00
Event::End(Tag::CodeBlock(_)) => {
if !context.config.highlight_code {
return Event::Html(Borrowed("</code></pre>\n"));
2017-03-27 14:17:33 +00:00
}
2018-05-06 20:58:39 +00:00
// reset highlight and close the code block
highlighter = None;
Event::Html(Borrowed("</pre>"))
2018-07-31 13:17:31 +00:00
}
Event::Start(Tag::Image(src, title)) => {
if is_colocated_asset_link(&src) {
2018-10-31 07:18:57 +00:00
return Event::Start(Tag::Image(
Owned(format!("{}{}", context.current_page_permalink, src)),
title,
));
}
2018-05-18 12:51:44 +00:00
Event::Start(Tag::Image(src, title))
2018-07-31 13:17:31 +00:00
}
2018-05-07 19:03:51 +00:00
Event::Start(Tag::Link(link, title)) => {
// A few situations here:
// - it could be a relative link (starting with `./`)
// - it could be a link to a co-located asset
// - it could be a normal link
2018-06-25 17:13:21 +00:00
// - any of those can be in a header or not: if it's in a header
// we need to append to a string
2018-05-07 19:03:51 +00:00
let fixed_link = if link.starts_with("./") {
match resolve_internal_link(&link, context.permalinks) {
Ok(url) => url,
2018-05-06 20:58:39 +00:00
Err(_) => {
error = Some(format!("Relative link {} not found.", link).into());
return Event::Html(Borrowed(""));
2017-03-27 14:17:33 +00:00
}
2018-05-07 19:03:51 +00:00
}
} else if is_colocated_asset_link(&link) {
format!("{}{}", context.current_page_permalink, link)
2018-09-30 19:15:09 +00:00
} else if context.config.check_external_links
&& !link.starts_with('#')
2018-10-31 07:18:57 +00:00
&& !link.starts_with("mailto:")
{
2018-09-30 19:15:09 +00:00
let res = check_url(&link);
if res.is_valid() {
link.to_string()
2018-09-30 19:15:09 +00:00
} else {
error = Some(
2018-10-31 07:18:57 +00:00
format!("Link {} is not valid: {}", link, res.message()).into(),
2018-09-30 19:15:09 +00:00
);
String::new()
}
2018-09-30 19:15:09 +00:00
} else {
link.to_string()
2018-05-07 19:03:51 +00:00
};
if in_header {
let html = if title.is_empty() {
format!("<a href=\"{}\">", fixed_link)
} else {
format!("<a href=\"{}\" title=\"{}\">", fixed_link, title)
2018-05-06 20:58:39 +00:00
};
temp_header.add_html(&html);
return Event::Html(Borrowed(""));
2017-03-27 14:17:33 +00:00
}
2018-05-07 19:03:51 +00:00
Event::Start(Tag::Link(Owned(fixed_link), title))
2018-07-31 13:17:31 +00:00
}
2018-05-06 20:58:39 +00:00
Event::End(Tag::Link(_, _)) => {
if in_header {
temp_header.add_html("</a>");
return Event::Html(Borrowed(""));
2018-05-06 20:58:39 +00:00
}
event
2018-07-31 13:17:31 +00:00
}
2018-05-06 20:58:39 +00:00
Event::Start(Tag::Code) => {
if in_header {
temp_header.add_html("<code>");
return Event::Html(Borrowed(""));
2018-05-06 20:58:39 +00:00
}
event
2018-07-31 13:17:31 +00:00
}
2018-05-06 20:58:39 +00:00
Event::End(Tag::Code) => {
if in_header {
temp_header.add_html("</code>");
return Event::Html(Borrowed(""));
2018-05-06 20:58:39 +00:00
}
event
2018-07-31 13:17:31 +00:00
}
2018-05-06 20:58:39 +00:00
Event::Start(Tag::Header(num)) => {
in_header = true;
temp_header = TempHeader::new(num);
Event::Html(Borrowed(""))
2018-07-31 13:17:31 +00:00
}
2018-05-06 20:58:39 +00:00
Event::End(Tag::Header(_)) => {
// End of a header, reset all the things and return the header string
let id = find_anchor(&anchors, slugify(&temp_header.title), 0);
anchors.push(id.clone());
temp_header.permalink = format!("{}#{}", context.current_page_permalink, id);
temp_header.id = id;
2018-05-06 20:58:39 +00:00
in_header = false;
header_created = false;
let val = temp_header.to_string(context.tera, context.insert_anchor);
headers.push(temp_header.clone());
temp_header = TempHeader::default();
Event::Html(Owned(val))
2018-07-31 13:17:31 +00:00
}
Event::Html(ref markup) if markup.contains("<!-- more -->") => {
has_summary = true;
Event::Html(Borrowed(CONTINUE_READING))
}
2018-05-06 20:58:39 +00:00
_ => event,
2017-05-01 07:04:41 +00:00
}
2018-05-06 20:58:39 +00:00
});
2017-03-07 12:34:31 +00:00
2017-03-27 14:17:33 +00:00
cmark::html::push_html(&mut html, parser);
2017-03-07 12:34:31 +00:00
}
if let Some(e) = error {
2018-09-30 19:15:09 +00:00
return Err(e);
} else {
Ok(Rendered {
summary_len: if has_summary { html.find(CONTINUE_READING) } else { None },
body: html,
2018-09-30 19:15:09 +00:00
toc: make_table_of_contents(&headers),
})
2017-03-27 14:17:33 +00:00
}
2017-03-07 12:34:31 +00:00
}