1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
use serde::{Deserialize, Serialize};
mod utils;
use utils::{regex_for_domain, regex_for_prefix, regex_for_robots};
/// A rule attached to a lens that can be rendered as a regular-expression
/// string via `LensRule::to_regex`.
#[derive(Clone, Debug, Deserialize, Serialize)]
pub enum LensRule {
/// Limits how far below a URL prefix a match may extend. The `String` is
/// the URL prefix and the `u8` is the maximum number of additional path
/// segments allowed after that prefix.
LimitURLDepth(String, u8),
/// A rule string that is converted into a regex by `regex_for_robots`.
/// NOTE(review): presumably a robots.txt-style pattern describing URLs to
/// skip — confirm against the `utils` module.
SkipURL(String),
}
impl LensRule {
    /// Renders this rule as a regular-expression string.
    ///
    /// * `SkipURL` delegates to `regex_for_robots` and returns its result.
    /// * `LimitURLDepth` strips every trailing `/` from the prefix and builds
    ///   an anchored pattern that matches the prefix, an optional `/`, and
    ///   then between zero and `max_depth` further non-empty path segments.
    ///
    /// NOTE(review): the prefix is interpolated verbatim, so any regex
    /// metacharacters it contains (e.g. `.`) are interpreted as regex syntax —
    /// confirm this is intended.
    ///
    /// # Panics
    ///
    /// Panics with "Invalid SkipURL regex" when `regex_for_robots` does not
    /// yield a pattern for a `SkipURL` rule.
    pub fn to_regex(&self) -> String {
        match self {
            Self::SkipURL(rule_str) => {
                regex_for_robots(rule_str).expect("Invalid SkipURL regex")
            }
            Self::LimitURLDepth(prefix, max_depth) => {
                // Drop trailing slashes so the pattern's own `/?` is the only
                // place a slash directly after the prefix can be matched.
                let trimmed = prefix.trim_end_matches('/');
                format!("^{}/?(/[^/]+/?){{0, {}}}$", trimmed, max_depth)
            }
        }
    }
}
/// Serializable configuration describing a single lens.
///
/// The `#[serde(default ...)]` attributes below only take effect while
/// deserializing. The derived `Default` implementation instead produces an
/// empty `author` and `is_enabled == false`.
#[derive(Clone, Debug, Default, Deserialize, Serialize)]
pub struct LensConfig {
/// Author of the lens; falls back to `"Unknown"` when the field is absent
/// from the deserialized input.
#[serde(default = "LensConfig::default_author")]
pub author: String,
/// Name of the lens.
pub name: String,
/// Optional description of the lens.
pub description: Option<String>,
/// Domains covered by the lens; each entry is turned into a regex with
/// `regex_for_domain` in `into_regexes`.
pub domains: Vec<String>,
/// URL prefixes covered by the lens; each entry is turned into a regex with
/// `regex_for_prefix` in `into_regexes`.
pub urls: Vec<String>,
/// Version string of the lens.
pub version: String,
/// Whether the lens is enabled; `true` when the field is absent from the
/// deserialized input.
#[serde(default = "LensConfig::default_is_enabled")]
pub is_enabled: bool,
/// Additional rules; empty when the field is absent from the deserialized
/// input. Each rule contributes one regex via `LensRule::to_regex`.
#[serde(default)]
pub rules: Vec<LensRule>,
/// Empty when the field is absent from the deserialized input.
/// NOTE(review): not read anywhere in this part of the file — presumably
/// the keyword that activates the lens; confirm against callers.
#[serde(default)]
pub trigger: String,
}
impl LensConfig {
    /// Serde fallback for `author` when the field is missing from the input.
    fn default_author() -> String {
        String::from("Unknown")
    }

    /// Serde fallback for `is_enabled` when the field is missing from the input.
    fn default_is_enabled() -> bool {
        true
    }

    /// Builds the list of regex strings described by this configuration.
    ///
    /// The result contains, in order: one pattern per entry in `domains`
    /// (via `regex_for_domain`), one per entry in `urls` (via
    /// `regex_for_prefix`), and one per entry in `rules` (via
    /// `LensRule::to_regex`).
    ///
    /// # Panics
    ///
    /// Panics if converting any rule panics (see `LensRule::to_regex`).
    pub fn into_regexes(&self) -> Vec<String> {
        let domain_patterns = self.domains.iter().map(|domain| regex_for_domain(domain));
        let prefix_patterns = self.urls.iter().map(|prefix| regex_for_prefix(prefix));
        let rule_patterns = self.rules.iter().map(|rule| rule.to_regex());

        // Chaining keeps the domains -> urls -> rules ordering of the output.
        domain_patterns
            .chain(prefix_patterns)
            .chain(rule_patterns)
            .collect()
    }
}