#[cfg(feature = "scraper")]
pub mod test {
use html2md::{parse_html, rewrite_html};
use pretty_assertions::assert_eq;
#[test]
fn test_dumb() {
let md = parse_html("<p>CARTHAPHILUS</p>", false);
assert_eq!(md, "CARTHAPHILUS");
let md = rewrite_html("<p>CARTHAPHILUS</p>", false);
assert_eq!(md, "CARTHAPHILUS")
}
#[test]
fn test_space() {
let s = r#"<p><a href="http://ya.ru">APOSIMZ</a></p>\n"#;
let md = parse_html(s, false);
assert_eq!(md, "[APOSIMZ](http://ya.ru)\n\\\\n");
let md = rewrite_html(s, false);
assert_eq!(md, "[APOSIMZ](http://ya.ru)\n\\n");
}
#[test]
fn test_anchor() {
let md = parse_html(r#"<p><a href="http://ya.ru">APOSIMZ</a></p>"#, false);
assert_eq!(md, "[APOSIMZ](http://ya.ru)");
let md = rewrite_html(r#"<p><a href="http://ya.ru">APOSIMZ</a></p>"#, false);
assert_eq!(md, "[APOSIMZ](http://ya.ru)");
}
#[test]
fn test_anchor2() {
let s =
r#"<p><a href="http://ya.ru">APOSIMZ</a><a href="http://yandex.ru">SIDONIA</a></p>"#;
let md = parse_html(s, false);
assert_eq!(md, "[APOSIMZ](http://ya.ru)[SIDONIA](http://yandex.ru)");
let md = rewrite_html(s, false);
assert_eq!(md, "[APOSIMZ](http://ya.ru)[SIDONIA](http://yandex.ru)");
}
#[test]
fn test_anchor3() {
let s = r#"<p><a href="http://ya.ru">APOSIMZ</a><p/><a href="http://yandex.ru">SIDONIA</a></p>"#;
let m = "[APOSIMZ](http://ya.ru)\n[SIDONIA](http://yandex.ru)";
let md = parse_html(s, false);
assert_eq!(md, m);
let md = rewrite_html(s, false);
assert_eq!(md, m)
}
#[test]
fn test_anchor4() {
let s = r#"<p><a href="/my%20uri">link</a></p>"#;
let m = "\
[link](</my uri>)";
let md = parse_html(s, false);
assert_eq!(md, m);
let md = rewrite_html(s, false);
assert_eq!(md, m);
}
#[test]
fn test_image() {
let md = parse_html(
r#"<p><a href="https://gitter.im/MARC-FS/Lobby?utm_source=badge&utm_medium=badge&utm_campaign=pr-badge&utm_content=badge"><img src="https://img.shields.io/gitter/room/MARC-FS/MARC-FS.svg" alt="Gitter"></a><br>"#,
false,
);
assert_eq!(md, "[](https://gitter.im/MARC-FS/Lobby?utm_source=badge&utm_medium=badge&utm_campaign=pr-badge&utm_content=badge)")
}
#[test]
fn test_escaping() {
let s = r#"<p>*god*'s in his **heaven** - all is right with the __world__</p>"#;
let m = "\\*god\\*\'s in his \\*\\*heaven\\*\\* - all is right with the \\_\\_world\\_\\_";
let md = parse_html(s, false);
assert_eq!(md, m);
let md = rewrite_html(s, false);
assert_eq!(md, m);
}
#[test]
fn test_escaping_mid_hyphens() {
let md = parse_html(r#"<h1>This is a header with-hyphen!</h1>"#, false);
assert_eq!(md, "# This is a header with-hyphen!")
}
#[test]
fn test_escaping_start_hyphens() {
let md = parse_html(
r#"<h1>- This is a header with starting hyphen!</h1>"#,
false,
);
assert_eq!(md, "# - This is a header with starting hyphen!")
}
#[test]
fn test_escaping_start_sharp() {
let md = parse_html("<html># nothing to worry about</html>", false);
assert_eq!(md, "\\# nothing to worry about")
}
#[test]
fn test_escaping_start_hyphens_space() {
let md = parse_html(
r#"<h1> - This is a header with starting hyphen!</h1>"#,
false,
);
assert_eq!(md, "# - This is a header with starting hyphen!")
}
#[test]
fn test_escaping_html_tags() {
let md = parse_html(
r#"xxxxxxx xx xxxxxxxxxxx: <iframe src="xxxxxx_xx_xxxxxxxxxxx/embed/" allowfullscreen="" height="725" width="450"></iframe>"#,
false,
);
assert_eq!(
md,
r#"xxxxxxx xx xxxxxxxxxxx: \<iframe src="xxxxxx\_xx\_xxxxxxxxxxx/embed/" allowfullscreen="" height="725" width="450"\>\</iframe\>"#
)
}
#[test]
fn test_headers() {
let md = parse_html(
r#"<h1 id="marc-fs">MARC-FS</h1><p><a href="http://Mail.ru">Mail.ru</a> Cloud filesystem written for FUSE</p><h2 id="synopsis">Synopsis</h2>"#,
false,
);
assert_eq!(
md,
"# MARC-FS\n[Mail.ru](http://Mail.ru) Cloud filesystem written for FUSE\n## Synopsis"
)
}
#[test]
fn test_escaping_start_equal() {
let md = parse_html(r#"<p>This is NOT a header!<br/>===========</p>"#, false);
assert_eq!(md, "This is NOT a header!\n\\===========")
}
#[test]
fn test_escaping_start_equal_space() {
let md = parse_html(r#"<p>This is NOT a header!<br/> ===========</p>"#, false);
assert_eq!(md, "This is NOT a header!\n\\===========")
}
#[test]
fn test_escaping_start_hyphen() {
let md = parse_html(r#"<p>This is NOT a header!<br/>-------</p>"#, false);
assert_eq!(md, "This is NOT a header!\n\\-------")
}
#[test]
fn test_escaping_start_hyphen_space() {
let md = parse_html(r#"<p>This is NOT a header!<br/> -------</p>"#, false);
assert_eq!(md, "This is NOT a header!\n\\-------")
}
#[test]
fn test_escaping_sup_tags() {
let md = parse_html(
r#"<p>This is NOT a header!<br/><sup>something</sup> -------</p>"#,
false,
);
assert_eq!(md, "This is NOT a header!\nsomething -------")
}
#[test]
fn test_html_entity_decoding() {
let html = r#"<p>Tom & Jerry</p>"#;
let md = rewrite_html(html, false);
assert_eq!(md, "Tom & Jerry");
let html = r#"<p>1 < 2 > 0</p>"#;
let md = rewrite_html(html, false);
assert_eq!(md, "1 \\< 2 \\> 0");
let html = r#"<p>He said "hello"</p>"#;
let md = rewrite_html(html, false);
assert_eq!(md, r#"He said "hello""#);
let html = r#"<p>It's fine</p>"#;
let md = rewrite_html(html, false);
assert_eq!(md, "It's fine");
let html = r#"<p>non breaking</p>"#;
let md = rewrite_html(html, false);
assert_eq!(md, "nonbreaking");
}
}