decruft 0.1.2

Extract clean, readable content from web pages
Documentation
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
<!-- {"url": "https://store.example.com/news/app/123456/view/987654321"} -->
<!--
  Fixture: a store news page whose article text is NOT present as rendered
  markup. The only copies of the content are the <title>, the Description
  meta tag, and the JSON embedded in the data-partnereventstore attribute
  of #application_config below.
  NOTE(review): the JSON comment on the first line is presumably fixture
  metadata (source URL) consumed by a test harness; keep it first and
  unchanged. TODO confirm against the harness.
-->
<html>
<head>
<title>Example Game - Patch 1.2.3 is now LIVE! - Example Store News</title>
<meta property="article:published_time" content="2025-01-15T12:00:00Z">
<meta name="Description" content="Patch 1.2.3 is now live! Available on all platforms!">
</head>
<body>
<!--
  #application_config carries two data attributes, each holding a JSON array
  with its double quotes escaped as &quot; entities:

  data-partnereventstore: one event object with gid, event_name, appid and a
    nested announcement_body (gid, headline, posttime, body).
    * posttime 1736942400 is a Unix timestamp equal to 2025-01-15T12:00:00Z,
      the same instant as the article:published_time meta tag above.
    * body is BBCode-style markup, not HTML: a [p] paragraph containing a
      [url="..."] link, followed by a [previewyoutube="<id>;full"] tag.
      Inside the JSON string, forward slashes are escaped as \/ and
      paragraph breaks are literal \n\n escape sequences.

  data-groupvanityinfo: one object with success, group_name and vanity_url.
-->
<div id="application_config"
	data-partnereventstore="[{&quot;gid&quot;:&quot;987654321&quot;,&quot;event_name&quot;:&quot;Patch 1.2.3 is now LIVE!&quot;,&quot;appid&quot;:123456,&quot;announcement_body&quot;:{&quot;gid&quot;:&quot;987654322&quot;,&quot;headline&quot;:&quot;Patch 1.2.3 is now LIVE!&quot;,&quot;posttime&quot;:1736942400,&quot;body&quot;:&quot;[p]Patch 1.2.3 is now live! This is build 500, network compatible. Available on all platforms! You can read the [url=\&quot;https:\/\/docs.example.com\/patch-123\&quot;]full patch notes here[\/url].\n\nOr, watch the video patch notes below:\n\n[\/p][previewyoutube=\&quot;dQw4w9WgXcQ;full\&quot;][\/previewyoutube]&quot;}}]"
	data-groupvanityinfo="[{&quot;success&quot;:1,&quot;group_name&quot;:&quot;Example Game&quot;,&quot;vanity_url&quot;:&quot;examplegame&quot;}]"
></div>
<!--
  Intentionally empty element: no article markup exists in the static HTML.
  NOTE(review): presumably the mount point a client-side script would render
  into on the real page; no script is included in this fixture.
-->
<div id="application_root"></div>
</body>
</html>