// Loose subset interpretation of the URL standard // Not using full Url crate here for no_std compatibility // // Caveats: // No support for query string parsing // No support for paths with ';' parameters // URLs must convert to UTF8 // Only IP address and DNS hostname host fields are supported use super::IpAddr; use alloc::borrow::ToOwned; use alloc::string::String; use alloc::vec::Vec; use core::fmt; use core::str::FromStr; fn is_alphanum(c: u8) -> bool { matches!(c, b'A'..=b'Z' | b'a'..=b'z' | b'0'..=b'9' ) } fn is_mark(c: u8) -> bool { matches!( c, b'-' | b'_' | b'.' | b'!' | b'~' | b'*' | b'\'' | b'(' | b')' ) } fn is_unreserved(c: u8) -> bool { is_alphanum(c) || is_mark(c) } fn must_encode_userinfo(c: u8) -> bool { !(is_unreserved(c) || matches!(c, b'%' | b':' | b';' | b'&' | b'=' | b'+' | b'$' | b',')) } fn must_encode_path(c: u8) -> bool { !(is_unreserved(c) || matches!( c, b'%' | b'/' | b':' | b'@' | b'&' | b'=' | b'+' | b'$' | b',' )) } fn is_valid_host>(host: H) -> bool { if host.as_ref().is_empty() { return false; } if IpAddr::from_str(host.as_ref()).is_err() { for ch in host.as_ref().chars() { if !matches!(ch, 'A'..='Z' | 'a'..='z' | '0'..='9' | '-' | '.' ) { return false; } } } true } fn is_valid_scheme>(host: H) -> bool { let mut chars = host.as_ref().chars(); if let Some(ch) = chars.next() { if !matches!(ch, 'A'..='Z' | 'a'..='z') { return false; } } else { return false; } for ch in chars { if !matches!(ch, 'A'..='Z' | 'a'..='z' | '0'..='9' | '-' | '+' | '.' ) { return false; } } true } fn hex_decode(h: u8) -> Result { match h { b'0'..=b'9' => Ok(h - b'0'), b'A'..=b'F' => Ok(h - b'A' + 10), b'a'..=b'f' => Ok(h - b'a' + 10), _ => Err("Unexpected character in percent encoding".to_owned()), } } fn hex_encode(c: u8) -> (char, char) { let c0 = c >> 4; let c1 = c & 15; ( if c0 < 10 { char::from_u32((b'0' + c0) as u32).unwrap() } else { char::from_u32((b'A' + c0 - 10) as u32).unwrap() }, if c1 < 10 { char::from_u32((b'0' + c1) as u32).unwrap() } else { char::from_u32((b'A' + c1 - 10) as u32).unwrap() }, ) } fn url_decode>(s: S) -> Result { let url = s.as_ref().to_owned(); if !url.is_ascii() { return Err("URL is not in ASCII encoding".to_owned()); } let url_bytes = url.as_bytes(); let mut dec_bytes: Vec = Vec::with_capacity(url_bytes.len()); let mut i = 0; let end = url_bytes.len(); while i < end { let mut b = url_bytes[i]; i += 1; if b == b'%' { if (i + 1) >= end { return Err("Invalid URL encoding".to_owned()); } b = hex_decode(url_bytes[i])? << 4 | hex_decode(url_bytes[i + 1])?; i += 2; } dec_bytes.push(b); } String::from_utf8(dec_bytes).map_err(|e| format!("Decoded URL is not valid UTF-8: {}", e)) } fn url_encode>(s: S, must_encode: impl Fn(u8) -> bool) -> String { let bytes = s.as_ref().as_bytes(); let mut out = String::new(); for b in bytes { if must_encode(*b) { let (c0, c1) = hex_encode(*b); out.push('%'); out.push(c0); out.push(c1); } else { out.push(char::from_u32(*b as u32).unwrap()) } } out } fn convert_port(port_str: N) -> Result where N: AsRef, { port_str .as_ref() .parse::() .map_err(|e| format!("Invalid port: {}", e)) } /////////////////////////////////////////////////////////////////////////////// #[derive(Debug, Clone, PartialEq, Eq, Hash, PartialOrd, Ord)] pub struct SplitUrlPath { pub path: String, pub fragment: Option, pub query: Option, } impl SplitUrlPath { pub fn new(path: P, fragment: Option, query: Option) -> Self where P: AsRef, F: AsRef, Q: AsRef, { Self { path: path.as_ref().to_owned(), fragment: fragment.map(|f| f.as_ref().to_owned()), query: query.map(|f| f.as_ref().to_owned()), } } } impl FromStr for SplitUrlPath { type Err = String; fn from_str(s: &str) -> Result { Ok(if let Some((p, q)) = s.split_once('?') { if let Some((p, f)) = p.split_once('#') { SplitUrlPath::new(url_decode(p)?, Some(url_decode(f)?), Some(q)) } else { SplitUrlPath::new(url_decode(p)?, Option::::None, Some(q)) } } else if let Some((p, f)) = s.split_once('#') { SplitUrlPath::new(url_decode(p)?, Some(url_decode(f)?), Option::::None) } else { SplitUrlPath::new( url_decode(s)?, Option::::None, Option::::None, ) }) } } impl fmt::Display for SplitUrlPath { fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result { if let Some(fragment) = &self.fragment { if let Some(query) = &self.query { write!( f, "{}#{}?{}", url_encode(&self.path, must_encode_path), url_encode(fragment, must_encode_path), query ) } else { write!(f, "{}#{}", self.path, fragment) } } else if let Some(query) = &self.query { write!(f, "{}?{}", url_encode(&self.path, must_encode_path), query) } else { write!(f, "{}", url_encode(&self.path, must_encode_path)) } } } /////////////////////////////////////////////////////////////////////////////// #[derive(Debug, Clone, PartialEq, Eq, Hash, PartialOrd, Ord)] pub struct SplitUrl { pub scheme: String, pub userinfo: Option, pub host: String, pub port: Option, pub path: Option, } impl SplitUrl { pub fn new( scheme: S, userinfo: Option, host: H, port: Option, path: Option, ) -> Self where S: AsRef, H: AsRef, { Self { scheme: scheme.as_ref().to_owned(), userinfo, host: host.as_ref().to_owned(), port, path, } } } impl FromStr for SplitUrl { type Err = String; fn from_str(s: &str) -> Result { if let Some((scheme, mut rest)) = s.split_once("://") { if !is_valid_scheme(scheme) { return Err("Invalid scheme specified".to_owned()); } let userinfo = { if let Some((userinfo_str, after)) = rest.split_once('@') { rest = after; Some(url_decode(userinfo_str)?) } else { None } }; if let Some((host, rest)) = rest.rsplit_once(':') { if !is_valid_host(host) { return Err("Invalid host specified".to_owned()); } if let Some((portstr, path)) = rest.split_once('/') { let port = convert_port(portstr)?; let path = SplitUrlPath::from_str(path)?; Ok(SplitUrl::new( scheme, userinfo, host, Some(port), Some(path), )) } else { let port = convert_port(rest)?; Ok(SplitUrl::new(scheme, userinfo, host, Some(port), None)) } } else if let Some((host, path)) = rest.split_once('/') { if !is_valid_host(host) { return Err("Invalid host specified".to_owned()); } let path = SplitUrlPath::from_str(path)?; Ok(SplitUrl::new(scheme, userinfo, host, None, Some(path))) } else { if !is_valid_host(rest) { return Err("Invalid host specified".to_owned()); } Ok(SplitUrl::new(scheme, userinfo, rest, None, None)) } } else { Err("No scheme specified".to_owned()) } } } impl fmt::Display for SplitUrl { fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result { let hostname = { if let Some(userinfo) = &self.userinfo { let userinfo = url_encode(userinfo, must_encode_userinfo); if let Some(port) = self.port { format!("{}@{}:{}", userinfo, self.host, port) } else { format!("{}@{}", userinfo, self.host) } } else { self.host.clone() } }; if let Some(path) = &self.path { write!(f, "{}://{}/{}", self.scheme, hostname, path) } else { write!(f, "{}://{}", self.scheme, hostname) } } }