1use std::collections::HashSet;
2use std::net::SocketAddr;
3use std::time::Duration;
4
5use chrono::Utc;
6use native_tls::TlsConnector;
7use once_cell::sync::Lazy;
8use regex::Regex;
9use reqwest::{Client, Url};
10use tokio::net::TcpStream;
11use tracing::{debug, instrument};
12
13use super::types::{CertificateInfo, DnsResolution, DomainExpiration, StatusResponse};
14use crate::caa::{self, CaaPolicy};
15use crate::dns::{DnsResolver, RecordData, RecordType};
16use crate::error::{Result, SeerError};
17use crate::lookup::SmartLookup;
18use crate::validation::{describe_reserved_ip, normalize_domain};
19
/// Time limit used for each network operation unless the caller overrides it.
const DEFAULT_TIMEOUT: Duration = Duration::from_secs(10);

/// Maximum number of HTTP redirects followed before the request is abandoned.
const MAX_REDIRECTS: usize = 5;
24
25static TITLE_REGEX: Lazy<Regex> = Lazy::new(|| {
27 Regex::new(r"(?i)<title[^>]*>([^<]+)</title>").expect("Invalid regex for HTML title extraction")
28});
29
30#[derive(Debug, Clone)]
32pub struct StatusClient {
33 timeout: Duration,
34 dns_resolver: DnsResolver,
36 smart_lookup: SmartLookup,
38}
39
40impl Default for StatusClient {
41 fn default() -> Self {
42 Self::new()
43 }
44}
45
46impl StatusClient {
47 pub fn new() -> Self {
49 Self {
50 timeout: DEFAULT_TIMEOUT,
51 dns_resolver: DnsResolver::new(),
52 smart_lookup: SmartLookup::new(),
53 }
54 }
55
56 pub fn with_timeout(mut self, timeout: Duration) -> Self {
58 self.timeout = timeout;
59 self
60 }
61
62 #[instrument(skip(self), fields(domain = %domain))]
64 pub async fn check(&self, domain: &str) -> Result<StatusResponse> {
65 let domain = normalize_domain(domain)?;
67 debug!("Checking status for domain: {}", domain);
68
69 let mut response = StatusResponse::new(domain.clone());
70
71 let (http_result, cert_result, expiry_result, dns_result, caa_policy) = tokio::join!(
76 self.fetch_http_info(&domain),
77 self.fetch_certificate_info(&domain),
78 self.fetch_domain_expiration(&domain),
79 self.fetch_dns_resolution(&domain),
80 caa::lookup_caa(&self.dns_resolver, &domain),
81 );
82
83 match http_result {
85 Ok((status, status_text, title)) => {
86 response.http_status = Some(status);
87 response.http_status_text = Some(status_text);
88 response.title = title;
89 }
90 Err(e) => response.errors.push(super::types::StatusError {
91 check: "http".to_string(),
92 message: e.to_string(),
93 }),
94 }
95
96 let mut caa_policy: CaaPolicy = caa_policy;
99 match cert_result {
100 Ok(cert_info) => {
101 caa_policy.issuer_match =
102 Some(caa::classify_issuer(&cert_info.issuer, &caa_policy));
103 response.certificate = Some(cert_info);
104 }
105 Err(e) => response.errors.push(super::types::StatusError {
106 check: "ssl".to_string(),
107 message: e.to_string(),
108 }),
109 }
110 response.caa = Some(caa_policy);
111
112 match expiry_result {
114 Ok(expiry_info) => response.domain_expiration = expiry_info,
115 Err(e) => response.errors.push(super::types::StatusError {
116 check: "expiration".to_string(),
117 message: e.to_string(),
118 }),
119 }
120
121 match dns_result {
123 Ok(dns_info) => response.dns_resolution = Some(dns_info),
124 Err(e) => response.errors.push(super::types::StatusError {
125 check: "dns".to_string(),
126 message: e.to_string(),
127 }),
128 }
129
130 Ok(response)
131 }
132
133 async fn fetch_http_info(&self, domain: &str) -> Result<(u16, String, Option<String>)> {
152 let mut url = Url::parse(&format!("https://{}", domain))
153 .map_err(|e| SeerError::HttpError(format!("invalid URL: {}", e)))?;
154 let mut visited = HashSet::new();
155
156 for _ in 0..=MAX_REDIRECTS {
157 let validated_addrs = validate_url_target(&url).await?;
158
159 if !visited.insert(url.clone()) {
160 return Err(SeerError::HttpError("redirect loop detected".to_string()));
161 }
162
163 let host = url
167 .host_str()
168 .ok_or_else(|| SeerError::HttpError("missing URL host".to_string()))?;
169 let client = Client::builder()
170 .redirect(reqwest::redirect::Policy::none())
171 .user_agent(concat!("Seer/", env!("CARGO_PKG_VERSION")))
172 .resolve_to_addrs(host, &validated_addrs)
173 .build()
174 .map_err(|e| SeerError::HttpError(format!("failed to build HTTP client: {}", e)))?;
175
176 let response = client
177 .get(url.clone())
178 .timeout(self.timeout)
179 .send()
180 .await
181 .map_err(|e| SeerError::HttpError(e.to_string()))?;
182
183 if response.status().is_redirection() {
184 let location = response.headers().get(reqwest::header::LOCATION);
185 let location = location.and_then(|v| v.to_str().ok()).ok_or_else(|| {
186 SeerError::HttpError("redirect missing location header".to_string())
187 })?;
188 let next_url = url
189 .join(location)
190 .or_else(|_| Url::parse(location))
191 .map_err(|e| SeerError::HttpError(format!("invalid redirect URL: {}", e)))?;
192 url = next_url;
193 continue;
194 }
195
196 let status = response.status();
197 let status_code = status.as_u16();
198 let status_text = status.canonical_reason().unwrap_or("Unknown").to_string();
199
200 let title = if status.is_success() {
202 let content_type = response
203 .headers()
204 .get("content-type")
205 .and_then(|v| v.to_str().ok())
206 .unwrap_or("");
207
208 if content_type.contains("text/html") {
209 const MAX_TITLE_BODY: usize = 64 * 1024;
214 use futures::StreamExt;
215 let mut buf: Vec<u8> = Vec::with_capacity(8 * 1024);
216 let mut stream = response.bytes_stream();
217 while let Some(chunk) = stream.next().await {
218 let chunk = chunk
219 .map_err(|e| SeerError::HttpError(format!("body chunk: {}", e)))?;
220 let remaining = MAX_TITLE_BODY.saturating_sub(buf.len());
221 if remaining == 0 {
222 break;
223 }
224 let take = remaining.min(chunk.len());
225 buf.extend_from_slice(&chunk[..take]);
226 if buf.len() >= MAX_TITLE_BODY {
227 break;
228 }
229 }
230 let body = String::from_utf8_lossy(&buf);
231 extract_title(&body)
232 } else {
233 None
234 }
235 } else {
236 None
237 };
238
239 return Ok((status_code, status_text, title));
240 }
241
242 Err(SeerError::HttpError("too many redirects".to_string()))
243 }
244
245 async fn fetch_certificate_info(&self, domain: &str) -> Result<CertificateInfo> {
252 let socket_addrs = crate::net::resolve_public_host(domain, 443)
257 .await
258 .map_err(|e| SeerError::CertificateError(e.to_string()))?;
259
260 let connector = TlsConnector::builder()
261 .danger_accept_invalid_certs(true) .build()
263 .map_err(|e| SeerError::CertificateError(e.to_string()))?;
264
265 let connector = tokio_native_tls::TlsConnector::from(connector);
266
267 let stream =
270 tokio::time::timeout(self.timeout, TcpStream::connect(socket_addrs.as_slice()))
271 .await
272 .map_err(|_| SeerError::Timeout(format!("connection to {} timed out", domain)))?
273 .map_err(|e| SeerError::CertificateError(e.to_string()))?;
274
275 let tls_stream = tokio::time::timeout(self.timeout, connector.connect(domain, stream))
277 .await
278 .map_err(|_| SeerError::Timeout(format!("TLS handshake with {} timed out", domain)))?
279 .map_err(|e| SeerError::CertificateError(e.to_string()))?;
280
281 let cert = tls_stream
283 .get_ref()
284 .peer_certificate()
285 .map_err(|e| SeerError::CertificateError(e.to_string()))?
286 .ok_or_else(|| SeerError::CertificateError("no certificate found".to_string()))?;
287
288 let der = cert
290 .to_der()
291 .map_err(|e| SeerError::CertificateError(e.to_string()))?;
292
293 parse_certificate_der(&der, domain)
294 }
295
296 async fn fetch_domain_expiration(&self, domain: &str) -> Result<Option<DomainExpiration>> {
298 match self.smart_lookup.lookup(domain).await {
299 Ok(result) => {
300 let (expiration_date, registrar) = result.expiration_info();
301
302 if let Some(exp_date) = expiration_date {
303 let days_until_expiry = (exp_date - Utc::now()).num_days();
304 Ok(Some(DomainExpiration {
305 expiration_date: exp_date,
306 days_until_expiry,
307 registrar,
308 }))
309 } else {
310 Ok(None)
311 }
312 }
313 Err(_) => Ok(None), }
315 }
316
317 async fn fetch_dns_resolution(&self, domain: &str) -> Result<DnsResolution> {
319 let resolver = &self.dns_resolver;
320
321 let (a_result, aaaa_result, cname_result, ns_result) = tokio::join!(
323 resolver.resolve(domain, RecordType::A, None),
324 resolver.resolve(domain, RecordType::AAAA, None),
325 resolver.resolve(domain, RecordType::CNAME, None),
326 resolver.resolve(domain, RecordType::NS, None)
327 );
328
329 let a_records: Vec<String> = a_result
331 .unwrap_or_default()
332 .into_iter()
333 .filter_map(|r| {
334 if let RecordData::A { address } = r.data {
335 Some(address)
336 } else {
337 None
338 }
339 })
340 .collect();
341
342 let aaaa_records: Vec<String> = aaaa_result
344 .unwrap_or_default()
345 .into_iter()
346 .filter_map(|r| {
347 if let RecordData::AAAA { address } = r.data {
348 Some(address)
349 } else {
350 None
351 }
352 })
353 .collect();
354
355 let cname_target: Option<String> =
357 cname_result.unwrap_or_default().into_iter().find_map(|r| {
358 if let RecordData::CNAME { target } = r.data {
359 Some(target.trim_end_matches('.').to_string())
360 } else {
361 None
362 }
363 });
364
365 let nameservers: Vec<String> = ns_result
367 .unwrap_or_default()
368 .into_iter()
369 .filter_map(|r| {
370 if let RecordData::NS { nameserver } = r.data {
371 Some(nameserver.trim_end_matches('.').to_string())
372 } else {
373 None
374 }
375 })
376 .collect();
377
378 let resolves = !a_records.is_empty() || !aaaa_records.is_empty() || cname_target.is_some();
380
381 Ok(DnsResolution {
382 a_records,
383 aaaa_records,
384 cname_target,
385 nameservers,
386 resolves,
387 })
388 }
389}
390
391fn extract_title(html: &str) -> Option<String> {
395 TITLE_REGEX
396 .captures(html)
397 .and_then(|caps| caps.get(1))
398 .map(|m| m.as_str().trim().to_string())
399 .filter(|s| !s.is_empty())
400}
401
402async fn validate_url_target(url: &Url) -> Result<Vec<SocketAddr>> {
408 let scheme = url.scheme();
409 if scheme != "https" && scheme != "http" {
410 return Err(SeerError::HttpError(format!(
411 "unsupported URL scheme: {}",
412 scheme
413 )));
414 }
415
416 if !url.username().is_empty() || url.password().is_some() {
417 return Err(SeerError::HttpError(
418 "URL credentials are not allowed".to_string(),
419 ));
420 }
421
422 let host = url
423 .host_str()
424 .ok_or_else(|| SeerError::HttpError("missing URL host".to_string()))?;
425 let port = url.port_or_known_default().unwrap_or(443);
426
427 if port != 80 && port != 443 {
429 return Err(SeerError::HttpError(format!(
430 "non-standard port {} is not allowed in redirects",
431 port
432 )));
433 }
434
435 if let Ok(ip) = host.parse::<std::net::IpAddr>() {
436 if let Some(reason) = describe_reserved_ip(&ip) {
437 return Err(SeerError::HttpError(format!(
438 "cannot connect to {}: {} — {}",
439 host, ip, reason
440 )));
441 }
442 return Ok(vec![SocketAddr::new(ip, port)]);
443 }
444
445 let addr = format!("{}:{}", host, port);
446 let socket_addrs: Vec<_> = tokio::net::lookup_host(&addr)
447 .await
448 .map_err(|e| SeerError::HttpError(format!("DNS lookup failed: {}", e)))?
449 .collect();
450
451 if socket_addrs.is_empty() {
452 return Err(SeerError::HttpError(format!(
453 "DNS lookup returned no addresses for {}",
454 host
455 )));
456 }
457
458 for socket_addr in &socket_addrs {
459 if let Some(reason) = describe_reserved_ip(&socket_addr.ip()) {
460 return Err(SeerError::HttpError(format!(
461 "cannot connect to {}: {} — {}",
462 host,
463 socket_addr.ip(),
464 reason
465 )));
466 }
467 }
468
469 Ok(socket_addrs)
470}
471
472fn parse_certificate_der(der: &[u8], domain: &str) -> Result<CertificateInfo> {
474 use x509_parser::prelude::*;
475
476 let (_, cert) = X509Certificate::from_der(der)
477 .map_err(|e| SeerError::CertificateError(format!("failed to parse certificate: {}", e)))?;
478
479 let issuer = format_issuer_name(cert.issuer()).unwrap_or_else(|| "Unknown Issuer".to_string());
484
485 let subject =
487 extract_name_from_x509(cert.subject()).unwrap_or_else(|| "Unknown Subject".to_string());
488
489 let valid_from = asn1_time_to_chrono(cert.validity().not_before)?;
491 let valid_until = asn1_time_to_chrono(cert.validity().not_after)?;
492
493 let now = Utc::now();
494 let days_until_expiry = (valid_until - now).num_days();
495 let is_valid = now >= valid_from && now <= valid_until;
496
497 let hostname_verified = cert_matches_hostname(&cert, domain);
502
503 Ok(CertificateInfo {
504 issuer,
505 subject,
506 valid_from,
507 valid_until,
508 days_until_expiry,
509 is_valid,
510 hostname_verified,
511 })
512}
513
/// Reports whether `host` matches the certificate name `pattern`.
///
/// The comparison ignores ASCII case. A pattern of the form `*.suffix` matches
/// a host made of exactly one non-empty label followed by `.suffix`: the
/// wildcard never spans several labels, never matches the bare suffix, and
/// never matches an empty label. Any other pattern must equal the host.
fn hostname_matches_pattern(host: &str, pattern: &str) -> bool {
    let Some(suffix) = pattern.strip_prefix("*.") else {
        return host.eq_ignore_ascii_case(pattern);
    };

    // Split off the leftmost label; the remainder must equal the suffix exactly,
    // which is what keeps the wildcard from covering more than one label.
    match host.split_once('.') {
        Some((label, parent)) => {
            !label.is_empty() && !parent.is_empty() && parent.eq_ignore_ascii_case(suffix)
        }
        None => false,
    }
}
533
534fn cert_matches_hostname(cert: &x509_parser::certificate::X509Certificate<'_>, host: &str) -> bool {
540 use x509_parser::prelude::*;
541
542 if let Ok(Some(san_ext)) = cert.tbs_certificate.subject_alternative_name() {
544 for name in &san_ext.value.general_names {
545 if let GeneralName::DNSName(n) = name {
546 if hostname_matches_pattern(host, n) {
547 return true;
548 }
549 }
550 }
551 }
552
553 for cn in cert.subject().iter_common_name() {
555 if let Ok(s) = cn.as_str() {
556 if hostname_matches_pattern(host, s) {
557 return true;
558 }
559 }
560 }
561
562 false
563}
564
565fn format_issuer_name(name: &x509_parser::prelude::X509Name) -> Option<String> {
569 use x509_parser::oid_registry;
570 let cn = extract_oid_value(name, &oid_registry::OID_X509_COMMON_NAME);
571 let org = extract_oid_value(name, &oid_registry::OID_X509_ORGANIZATION_NAME);
572 match (org, cn) {
573 (Some(o), Some(c)) if o != c => Some(format!("{} ({})", o, c)),
574 (Some(o), _) => Some(o),
575 (None, Some(c)) => Some(c),
576 (None, None) => None,
577 }
578}
579
580fn extract_oid_value(
582 name: &x509_parser::prelude::X509Name,
583 oid: &x509_parser::der_parser::oid::Oid<'static>,
584) -> Option<String> {
585 for rdn in name.iter() {
586 for attr in rdn.iter() {
587 if attr.attr_type() == oid {
588 if let Some(s) = extract_attr_string(attr.attr_value()) {
589 return Some(s);
590 }
591 }
592 }
593 }
594 None
595}
596
597fn extract_name_from_x509(name: &x509_parser::prelude::X509Name) -> Option<String> {
599 use x509_parser::prelude::*;
600
601 for rdn in name.iter() {
603 for attr in rdn.iter() {
604 if attr.attr_type() == &oid_registry::OID_X509_COMMON_NAME {
605 if let Some(s) = extract_attr_string(attr.attr_value()) {
606 return Some(s);
607 }
608 }
609 }
610 }
611
612 for rdn in name.iter() {
614 for attr in rdn.iter() {
615 if attr.attr_type() == &oid_registry::OID_X509_ORGANIZATION_NAME {
616 if let Some(s) = extract_attr_string(attr.attr_value()) {
617 return Some(s);
618 }
619 }
620 }
621 }
622
623 None
624}
625
626fn extract_attr_string(value: &x509_parser::der_parser::asn1_rs::Any) -> Option<String> {
628 if let Ok(s) = value.as_str() {
630 return Some(s.to_string());
631 }
632
633 if let Ok(utf8) = value.as_utf8string() {
635 return Some(utf8.string().to_string());
636 }
637
638 if let Ok(s) = std::str::from_utf8(value.data) {
640 return Some(s.to_string());
641 }
642
643 None
644}
645
646fn asn1_time_to_chrono(time: x509_parser::time::ASN1Time) -> Result<chrono::DateTime<Utc>> {
648 let timestamp = time.timestamp();
649 chrono::DateTime::from_timestamp(timestamp, 0)
650 .ok_or_else(|| SeerError::CertificateError("invalid certificate timestamp".to_string()))
651}
652
#[cfg(test)]
mod tests {
    use super::*;

    /// Checks every `(host, pattern, expected)` triple against
    /// `hostname_matches_pattern`, naming the failing pair in the message.
    fn assert_cases(cases: &[(&str, &str, bool)]) {
        for &(host, pattern, expected) in cases {
            assert_eq!(
                hostname_matches_pattern(host, pattern),
                expected,
                "host={host:?} pattern={pattern:?}"
            );
        }
    }

    #[test]
    fn hostname_matches_pattern_exact() {
        assert_cases(&[
            ("example.com", "example.com", true),
            ("EXAMPLE.COM", "example.com", true),
            ("example.com", "EXAMPLE.COM", true),
            ("evil.com", "example.com", false),
            ("example.com", "evil.com", false),
        ]);
    }

    #[test]
    fn hostname_matches_pattern_wildcard() {
        assert_cases(&[
            ("a.example.com", "*.example.com", true),
            ("A.EXAMPLE.COM", "*.example.com", true),
            // The wildcard does not match the bare parent domain.
            ("example.com", "*.example.com", false),
            // The wildcard covers a single label only.
            ("a.b.example.com", "*.example.com", false),
            ("b.other.com", "*.example.com", false),
        ]);
    }

    #[test]
    fn hostname_matches_pattern_wildcard_requires_dot() {
        // A host without any dot has no parent domain to compare.
        assert_cases(&[("localhost", "*.example.com", false)]);
    }
}