use crate::agent::{AgentBase, YaydlAgent};
use crate::definitions::SiteDefinition;
use crate::VIDEO;
use anyhow::Result;
use regex::Regex;
use scraper::{Html, Selector};
use std::env;
use url::Url;
const INVIDIOUS_INSTANCE: &str = "https://invidious.nerdvpn.de";
fn get_invidious_instance() -> String {
let invidious_env = env::var("YAYDL_INVIDIOUS_INSTANCE");
if invidious_env.is_ok() {
invidious_env.unwrap_or(INVIDIOUS_INSTANCE.to_string())
} else {
INVIDIOUS_INSTANCE.to_string()
}
}
fn get_video_info(video: &mut VIDEO, url: &str) -> Result<Html> {
if video.info.is_empty() {
let id_regex = Regex::new(r"(?:v=|\.be/|shorts/)(.*?)(&.*)*$").unwrap();
let id = id_regex.captures(url).unwrap().get(1).unwrap().as_str();
let invidious_url = format!("{}/watch?v={}", get_invidious_instance(), id);
let local_url = invidious_url.to_owned();
let url_p = Url::parse(&local_url)?;
let agent = YaydlAgent::init(url_p);
let body = agent
.get(&local_url)
.call()
.expect("Could not go to the url")
.body_mut()
.read_to_string()
.expect("Could not read the site source");
video.info.push_str(&body);
}
let d = Html::parse_document(&video.info);
Ok(d)
}
struct YouTubeHandler;
impl SiteDefinition for YouTubeHandler {
fn can_handle_url<'a>(
&'a self,
_video: &mut VIDEO,
url: &'a str,
_webdriver_port: u16,
) -> Result<bool> {
Ok(Regex::new(r"invidious\.|(?:www\.)?youtu(?:be\.com|\.be)/")
.unwrap()
.is_match(url))
}
fn is_playlist<'a>(&'a self, _url: &'a str, _webdriver_port: u16) -> Result<bool> {
Ok(false)
}
fn find_video_title<'a>(
&'a self,
video: &'a mut VIDEO,
url: &'a str,
_webdriver_port: u16,
) -> Result<String> {
let video_info = get_video_info(video, url)?;
let title_selector = Selector::parse(r#"meta[property="og:title"]"#).unwrap();
let title_elem = video_info.select(&title_selector).next().unwrap();
let title_contents = title_elem.value().attr("content").unwrap();
Ok(title_contents.to_string())
}
fn find_video_direct_url<'a>(
&'a self,
video: &'a mut VIDEO,
url: &'a str,
_webdriver_port: u16,
_onlyaudio: bool,
) -> Result<String> {
let video_info = get_video_info(video, url)?;
let mut url_to_choose = "".to_string();
let quality_selector = Selector::parse(r#"source"#).unwrap();
let quality_iter = video_info.select(&quality_selector);
let mut last_vq: String = String::new();
for source in quality_iter {
let this_tag = source;
let this_vq = this_tag.value().attr("label").unwrap_or("");
let is_same_or_better_video = this_vq != last_vq && last_vq != "medium";
if is_same_or_better_video {
let this_mimetype = this_tag.value().attr("type").unwrap();
let mut mime_split = this_mimetype.split(";");
video.mime = mime_split.next().unwrap().to_string();
let relative_url = this_tag.value().attr("src").unwrap();
url_to_choose = relative_url.to_string();
last_vq = String::from(this_vq);
}
}
if url_to_choose.is_empty() {
Err(anyhow::Error::msg(
"Could not find a working video - aborting.".to_string(),
))
} else {
let url_p = Url::parse(&url_to_choose)?;
let agent = YaydlAgent::init(url_p);
let resp = agent.get(&url_to_choose).call()?;
let has_redirect = resp.headers().get("Location");
if has_redirect.is_some() {
url_to_choose = has_redirect.unwrap().to_str()?.to_string();
}
Ok(url_to_choose)
}
}
fn does_video_exist<'a>(
&'a self,
video: &'a mut VIDEO,
url: &'a str,
_webdriver_port: u16,
) -> Result<bool> {
let _video_info = get_video_info(video, url);
Ok(!video.info.is_empty())
}
fn display_name<'a>(&'a self) -> String {
"Invidious".to_string()
}
fn find_video_file_extension<'a>(
&'a self,
video: &'a mut VIDEO,
_url: &'a str,
_webdriver_port: u16,
_onlyaudio: bool,
) -> Result<String> {
let mut ext = "mp4";
if video.mime.contains("/webm") {
ext = "webm";
} else if video.mime.contains("audio/mp4") {
ext = "m4a";
}
Ok(ext.to_string())
}
fn web_driver_required<'a>(&'a self) -> bool {
false
}
}
inventory::submit! {
&YouTubeHandler as &dyn SiteDefinition
}