use std::borrow::Cow;
use bstr::ByteSlice;
use quick_error::quick_error;
use crate::Scheme;
quick_error! {
#[derive(Debug)]
#[allow(missing_docs)]
pub enum Error {
Utf8(err: std::str::Utf8Error) {
display("Could not decode URL as UTF8")
from()
source(err)
}
Url(err: String) {
display("the URL could not be parsed: {}", err)
}
UnsupportedProtocol(protocol: String) {
display("Protocol '{}' is not supported", protocol)
}
EmptyPath {
display("Paths cannot be empty")
}
RelativeUrl(url: String) {
display("Relative URLs are not permitted: '{}'", url)
}
}
}
fn str_to_protocol(s: &str) -> Result<Scheme, Error> {
Ok(match s {
"ssh" => Scheme::Ssh,
"file" => Scheme::File,
"git" => Scheme::Git,
"http" => Scheme::Http,
"https" => Scheme::Https,
"rad" => Scheme::Radicle,
_ => return Err(Error::UnsupportedProtocol(s.into())),
})
}
fn guess_protocol(url: &[u8]) -> &str {
match url.find_byte(b':') {
Some(colon_pos) => {
if url[..colon_pos].find_byte(b'.').is_some() {
"ssh"
} else {
"file"
}
}
None => "file",
}
}
fn sanitize_for_protocol<'a>(protocol: &str, url: &'a str) -> Cow<'a, str> {
match protocol {
"ssh" => url.replacen(':', "/", 1).into(),
_ => url.into(),
}
}
fn has_no_explicit_protocol(url: &[u8]) -> bool {
url.find(b"://").is_none()
}
fn possibly_strip_file_protocol(url: &[u8]) -> &[u8] {
if url.starts_with(b"file://") {
&url[b"file://".len()..]
} else {
url
}
}
fn to_owned_url(url: url::Url) -> Result<crate::Url, Error> {
Ok(crate::Url {
scheme: str_to_protocol(url.scheme())?,
user: if url.username().is_empty() {
None
} else {
Some(url.username().into())
},
host: url.host_str().map(Into::into),
port: url.port(),
path: url.path().into(),
})
}
pub fn parse(bytes: &[u8]) -> Result<crate::Url, Error> {
let guessed_protocol = guess_protocol(bytes);
if possibly_strip_file_protocol(bytes) != bytes || (has_no_explicit_protocol(bytes) && guessed_protocol == "file") {
return Ok(crate::Url {
scheme: Scheme::File,
path: possibly_strip_file_protocol(bytes).into(),
..Default::default()
});
}
let url_str = std::str::from_utf8(bytes)?;
let mut url = match url::Url::parse(url_str) {
Ok(url) => url,
Err(::url::ParseError::RelativeUrlWithoutBase) => {
url::Url::parse(&format!(
"{}://{}",
guessed_protocol,
sanitize_for_protocol(guessed_protocol, url_str)
))
.map_err(|err| Error::Url(err.to_string()))?
}
Err(err) => return Err(Error::Url(err.to_string())),
};
if url.scheme().find('.').is_some() {
url = url::Url::parse(&format!("ssh://{}", sanitize_for_protocol("ssh", url_str)))
.map_err(|err| Error::Url(err.to_string()))?;
}
if url.scheme() != "rad" && url.path().is_empty() {
return Err(Error::EmptyPath);
}
if url.cannot_be_a_base() {
return Err(Error::RelativeUrl(url.into()));
}
to_owned_url(url)
}