lemmy/crates/utils/src/utils/markdown.rs

use markdown_it::MarkdownIt;
use once_cell::sync::Lazy;

mod spoiler_rule;

/// Shared markdown parser instance, constructed lazily the first time it is dereferenced.
///
/// The parser is set up with the `cmark` and `extra` plugin sets from `markdown_it`,
/// plus the rule provided by the local `spoiler_rule` module.
static MARKDOWN_PARSER: Lazy<MarkdownIt> = Lazy::new(|| {
  use markdown_it::plugins::{cmark, extra};

  let mut md = MarkdownIt::new();

  // Registration order is kept as: cmark, extra, then the custom spoiler rule.
  cmark::add(&mut md);
  extra::add(&mut md);
  spoiler_rule::add(&mut md);

  md
});

/// Escapes the HTML-significant characters `&`, `<`, `"` and `'` in `text`.
///
/// Meant for API parameters, to prevent XSS attacks. Taken from
/// <https://github.com/OWASP/CheatSheetSeries/blob/master/cheatsheets/Cross_Site_Scripting_Prevention_Cheat_Sheet.md#output-encoding-for-html-contexts>
///
/// `>` is deliberately left in place because it is interpreted as a markdown quote.
pub fn sanitize_html(text: &str) -> String {
  // The output is at least as long as the input; escaped characters only make it grow.
  let mut escaped = String::with_capacity(text.len());

  for ch in text.chars() {
    match ch {
      '&' => escaped.push_str("&amp;"),
      '<' => escaped.push_str("&lt;"),
      '"' => escaped.push_str("&quot;"),
      '\'' => escaped.push_str("&#x27;"),
      other => escaped.push(other),
    }
  }

  escaped
}

/// Renders markdown `text` to an HTML string, escaping special characters.
///
/// Parsing is done with the shared `MARKDOWN_PARSER`, so every plugin registered there
/// applies to the output.
pub fn markdown_to_html(text: &str) -> String {
  let document = MARKDOWN_PARSER.parse(text);
  document.xrender()
}

#[cfg(test)]
mod tests {
  // Lints relaxed for test code only.
  #![allow(clippy::unwrap_used)]
  #![allow(clippy::indexing_slicing)]

  use super::*;
  use pretty_assertions::assert_eq;

  /// Table-driven check of `markdown_to_html`: each case is
  /// `(label, markdown input, expected HTML output)`.
  #[test]
  fn test_basic_markdown() {
    let cases = [
      (
        "headings",
        "# h1\n## h2\n### h3\n#### h4\n##### h5\n###### h6",
        "<h1>h1</h1>\n<h2>h2</h2>\n<h3>h3</h3>\n<h4>h4</h4>\n<h5>h5</h5>\n<h6>h6</h6>\n",
      ),
      (
        "line breaks",
        "First\rSecond",
        "<p>First\nSecond</p>\n",
      ),
      (
        "emphasis",
        "__bold__ **bold** *italic* ***bold+italic***",
        "<p><strong>bold</strong> <strong>bold</strong> <em>italic</em> <em><strong>bold+italic</strong></em></p>\n",
      ),
      (
        "blockquotes",
        "> #### Hello\n > \n > - Hola\n > - 안영 \n>> Goodbye\n",
        "<blockquote>\n<h4>Hello</h4>\n<ul>\n<li>Hola</li>\n<li>안영</li>\n</ul>\n<blockquote>\n<p>Goodbye</p>\n</blockquote>\n</blockquote>\n",
      ),
      (
        "lists (ordered, unordered)",
        "1. pen\n2. apple\n3. apple pen\n- pen\n- pineapple\n- pineapple pen",
        "<ol>\n<li>pen</li>\n<li>apple</li>\n<li>apple pen</li>\n</ol>\n<ul>\n<li>pen</li>\n<li>pineapple</li>\n<li>pineapple pen</li>\n</ul>\n",
      ),
      (
        "code and code blocks",
        "this is my amazing `code snippet` and my amazing ```code block```",
        "<p>this is my amazing <code>code snippet</code> and my amazing <code>code block</code></p>\n",
      ),
      (
        "links",
        "[Lemmy](https://join-lemmy.org/ \"Join Lemmy!\")",
        "<p><a href=\"https://join-lemmy.org/\" title=\"Join Lemmy!\">Lemmy</a></p>\n",
      ),
      (
        "images",
        "![My linked image](https://image.com \"image alt text\")",
        "<p><img src=\"https://image.com\" alt=\"My linked image\" title=\"image alt text\" /></p>\n",
      ),
      // Ensure any custom plugins are added to 'MARKDOWN_PARSER' implementation.
      (
        "basic spoiler",
        "::: spoiler click to see more\nhow spicy!\n:::\n",
        "<details><summary>click to see more</summary><p>how spicy!\n</p></details>\n",
      ),
      // NOTE(review): the expected output contains typographic quotes around `xss`,
      // presumably produced by a rule in the `extra` plugin set - confirm.
      (
        "escape html special chars",
        "<script>alert('xss');</script> hello &\"",
        "<p>&lt;script&gt;alert(‘xss’);&lt;/script&gt; hello &amp;&quot;</p>\n",
      ),
    ];

    for &(msg, input, expected) in &cases {
      let rendered = markdown_to_html(input);

      assert_eq!(
        rendered, expected,
        "Testing {}, with original input '{}'",
        msg, input
      );
    }
  }

  /// `sanitize_html` escapes `&`, `<`, `"` and `'`, and leaves `>` untouched.
  #[test]
  fn test_sanitize_html() {
    let raw = "<script>alert('xss');</script> hello &\"'";
    let expected = "&lt;script>alert(&#x27;xss&#x27;);&lt;/script> hello &amp;&quot;&#x27;";

    let sanitized = sanitize_html(raw);

    assert_eq!(expected, sanitized);
  }
}
-												Fixes #1884 - Support Spoiler Tags (#3018)

* Fixes #1884 - Switches markdown libraries and creates a custom rule to manage spoiler blocks

* Add tests to cover invalid spoiler input

* Consolidate tests, add comments

* Make immutable, static instance of markdown parser

---------

Co-authored-by: Nutomic <me@nutomic.com>
											
										
										
											2023-06-14 11:15:59 +00:00
+								use markdown_it::MarkdownIt;
 								use once_cell::sync::Lazy;
 								mod spoiler_rule;
 								static MARKDOWN_PARSER: Lazy<MarkdownIt> = Lazy::new(|| {
 								  let mut parser = MarkdownIt::new();
 								  markdown_it::plugins::cmark::add(&mut parser);
 								  markdown_it::plugins::extra::add(&mut parser);
 								  spoiler_rule::add(&mut parser);
 								  parser
 								});
-												Only sanitize strings when generating RSS feeds and emails (fixes #4003) (#4024)

* Only sanitize strings when generating RSS feeds and emails (fixes #4003)

* clippy

* fix test
											
										
										
											2023-10-11 14:48:19 +00:00
+								/// Replace special HTML characters in API parameters to prevent XSS attacks.
 								///
 								/// Taken from https://github.com/OWASP/CheatSheetSeries/blob/master/cheatsheets/Cross_Site_Scripting_Prevention_Cheat_Sheet.md#output-encoding-for-html-contexts
 								///
 								/// `>` is left in place because it is interpreted as markdown quote.
 								pub fn sanitize_html(text: &str) -> String {
 								  text
 								    .replace('&', "&amp;")
 								    .replace('<', "&lt;")
 								    .replace('\"', "&quot;")
 								    .replace('\'', "&#x27;")
 								}
 								/// Converts text from markdown to HTML, while escaping special characters.
-												Organize utils into separate files. Fixes #2295 (#2736)

* Organize utils into separate files. Fixes #2295

* Moving tests.

* Fix test.

* Fix test 2
											
										
										
											2023-02-16 04:05:14 +00:00
+								pub fn markdown_to_html(text: &str) -> String {
-												Fixes #1884 - Support Spoiler Tags (#3018)

* Fixes #1884 - Switches markdown libraries and creates a custom rule to manage spoiler blocks

* Add tests to cover invalid spoiler input

* Consolidate tests, add comments

* Make immutable, static instance of markdown parser

---------

Co-authored-by: Nutomic <me@nutomic.com>
											
										
										
											2023-06-14 11:15:59 +00:00
+								  MARKDOWN_PARSER.parse(text).xrender()
 								}
 								#[cfg(test)]
 								mod tests {
-												Cache & Optimize Woodpecker CI (#3450)

* Try using drone cache plugin

* Try another path

* Include volume

* Fix formatting

* Include fmt

* Exclude cargo dir from prettier

* Don't override cargo

* Just do check

* Add cache key

* Use different cache plugin

* Add clippy

* Try minio

* Add quotes

* Try adding secrets

* Try again

* Again

* Use correct secret formation

* Add back clippy

* Use secret for the root bucket name

* Try drone cache instead

* Add region

* Add path-style option

* Include cargo clippy

* Include everything again

* Fix formatting

* Don't run clippy twice

* Add `allow` statements for tests to pass

* Adjust endpoint to be a secret

* Fix prettier

* Merge & fix tests

* Try to restart the woodpecker test

* Change the ENV var name

---------

Co-authored-by: Dessalines <dessalines@users.noreply.github.com>
											
										
										
											2023-07-17 15:04:14 +00:00
+								  #![allow(clippy::unwrap_used)]
 								  #![allow(clippy::indexing_slicing)]
-												Only sanitize strings when generating RSS feeds and emails (fixes #4003) (#4024)

* Only sanitize strings when generating RSS feeds and emails (fixes #4003)

* clippy

* fix test
											
										
										
											2023-10-11 14:48:19 +00:00
+								  use super::*;
-												Use `pretty_assertions` for assertions (#4347)

* Use `pretty_assertions` for assertions

* fixed ordering of `use`s

* ci

---------

Co-authored-by: Felix Ableitner <me@nutomic.com>
											
										
										
											2024-01-04 09:47:18 +00:00
+								  use pretty_assertions::assert_eq;
-												Fixes #1884 - Support Spoiler Tags (#3018)

* Fixes #1884 - Switches markdown libraries and creates a custom rule to manage spoiler blocks

* Add tests to cover invalid spoiler input

* Consolidate tests, add comments

* Make immutable, static instance of markdown parser

---------

Co-authored-by: Nutomic <me@nutomic.com>
											
										
										
											2023-06-14 11:15:59 +00:00
 								  #[test]
 								  fn test_basic_markdown() {
 								    let tests: Vec<_> = vec![
 								      (
 								        "headings",
 								        "# h1\n## h2\n### h3\n#### h4\n##### h5\n###### h6",
 								        "<h1>h1</h1>\n<h2>h2</h2>\n<h3>h3</h3>\n<h4>h4</h4>\n<h5>h5</h5>\n<h6>h6</h6>\n"
 								      ),
 								      (
 								        "line breaks",
 								        "First\rSecond",
 								        "<p>First\nSecond</p>\n"),
 								      (
 								        "emphasis",
 								        "__bold__ **bold** *italic* ***bold+italic***",
 								        "<p><strong>bold</strong> <strong>bold</strong> <em>italic</em> <em><strong>bold+italic</strong></em></p>\n"
 								      ),
 								      (
 								        "blockquotes",
 								        "> #### Hello\n > \n > - Hola\n > - 안영 \n>> Goodbye\n",
 								        "<blockquote>\n<h4>Hello</h4>\n<ul>\n<li>Hola</li>\n<li>안영</li>\n</ul>\n<blockquote>\n<p>Goodbye</p>\n</blockquote>\n</blockquote>\n"
 								      ),
 								      (
 								        "lists (ordered, unordered)",
 								        "1. pen\n2. apple\n3. apple pen\n- pen\n- pineapple\n- pineapple pen",
 								        "<ol>\n<li>pen</li>\n<li>apple</li>\n<li>apple pen</li>\n</ol>\n<ul>\n<li>pen</li>\n<li>pineapple</li>\n<li>pineapple pen</li>\n</ul>\n"
 								      ),
 								      (
 								        "code and code blocks",
 								        "this is my amazing `code snippet` and my amazing ```code block```",
 								        "<p>this is my amazing <code>code snippet</code> and my amazing <code>code block</code></p>\n"
 								      ),
 								      (
 								        "links",
 								        "[Lemmy](https://join-lemmy.org/ \"Join Lemmy!\")",
 								        "<p><a href=\"https://join-lemmy.org/\" title=\"Join Lemmy!\">Lemmy</a></p>\n"
 								      ),
 								      (
 								        "images",
 								        "![My linked image](https://image.com \"image alt text\")",
 								        "<p><img src=\"https://image.com\" alt=\"My linked image\" title=\"image alt text\" /></p>\n"
 								      ),
 								      // Ensure any custom plugins are added to 'MARKDOWN_PARSER' implementation.
 								      (
 								        "basic spoiler",
 								        "::: spoiler click to see more\nhow spicy!\n:::\n",
 								        "<details><summary>click to see more</summary><p>how spicy!\n</p></details>\n"
 								      ),
-												Only sanitize strings when generating RSS feeds and emails (fixes #4003) (#4024)

* Only sanitize strings when generating RSS feeds and emails (fixes #4003)

* clippy

* fix test
											
										
										
											2023-10-11 14:48:19 +00:00
+								      (
 								          "escape html special chars",
 								          "<script>alert('xss');</script> hello &\"",
 								          "<p>&lt;script&gt;alert(‘xss’);&lt;/script&gt; hello &amp;&quot;</p>\n"
 								          )
-												Fixes #1884 - Support Spoiler Tags (#3018)

* Fixes #1884 - Switches markdown libraries and creates a custom rule to manage spoiler blocks

* Add tests to cover invalid spoiler input

* Consolidate tests, add comments

* Make immutable, static instance of markdown parser

---------

Co-authored-by: Nutomic <me@nutomic.com>
											
										
										
											2023-06-14 11:15:59 +00:00
+								    ];
 								    tests.iter().for_each(|&(msg, input, expected)| {
 								      let result = markdown_to_html(input);
 								      assert_eq!(
 								        result, expected,
 								        "Testing {}, with original input '{}'",
 								        msg, input
 								      );
 								    });
 								  }
-												Only sanitize strings when generating RSS feeds and emails (fixes #4003) (#4024)

* Only sanitize strings when generating RSS feeds and emails (fixes #4003)

* clippy

* fix test
											
										
										
											2023-10-11 14:48:19 +00:00
 								  #[test]
 								  fn test_sanitize_html() {
 								    let sanitized = sanitize_html("<script>alert('xss');</script> hello &\"'");
 								    let expected = "&lt;script>alert(&#x27;xss&#x27;);&lt;/script> hello &amp;&quot;&#x27;";
 								    assert_eq!(expected, sanitized)
 								  }
-												Organize utils into separate files. Fixes #2295 (#2736)

* Organize utils into separate files. Fixes #2295

* Moving tests.

* Fix test.

* Fix test 2
											
										
										
											2023-02-16 04:05:14 +00:00
+								}