tirocinio-canali-steffo-acrate/acrate-nodeinfo/src/lib.rs

329 lines
10 KiB
Rust
Raw Normal View History

2024-11-09 12:14:11 +00:00
//! Serde-based [RFC 6415] `host-meta` parser.
//!
//! [RFC 6415]: https://datatracker.ietf.org/doc/html/rfc6415
2024-11-09 10:01:26 +00:00
use reqwest::header::HeaderValue;
use serde::Deserialize;
2024-11-09 10:01:26 +00:00
2024-11-09 12:14:11 +00:00
/// A [host-meta document].
///
/// [host-meta document]: https://datatracker.ietf.org/doc/html/rfc6415
#[derive(Debug, Clone, Deserialize)]
2024-11-09 12:14:11 +00:00
pub struct HostMetaDocument {
/// The resource this document refers to.
#[serde(alias = "Subject")]
2024-11-09 12:14:11 +00:00
pub subject: Option<String>,
/// Links established between the [`Self::subject`] and other resources.
#[serde(alias = "Links")]
2024-11-09 12:14:11 +00:00
pub links: Vec<HostMetaLink>,
2024-11-09 10:01:26 +00:00
}
2024-11-09 12:14:11 +00:00
/// A [host-meta Link Element], which puts the subject resource in relation with another.
///
/// [host-meta Link Element]: https://datatracker.ietf.org/doc/html/rfc6415#section-3.1.1
#[derive(Debug, Clone, Deserialize)]
2024-11-09 12:14:11 +00:00
pub struct HostMetaLink {
/// The kind of relation established by the subject with the attached resource.
2024-11-09 10:01:26 +00:00
pub rel: String,
2024-11-09 12:14:11 +00:00
/// The resource put in relation with the subject resource.
2024-11-09 10:01:26 +00:00
pub href: String,
}
2024-11-09 12:14:11 +00:00
impl HostMetaDocument {
/// Get an [host-meta document] in the [JRD format].
///
/// This follows redirects until the redirect chain is 10 hops; see [`reqwest::redirect`] for more info.
///
/// [JRD format]: https://datatracker.ietf.org/doc/html/rfc6415#appendix-A
/// [host-meta document]: https://datatracker.ietf.org/doc/html/rfc6415
pub async fn get_jrd(client: &reqwest::Client, url: reqwest::Url) -> Result<Self, HostMetaGetJRDError> {
use HostMetaGetJRDError::*;
log::debug!("Getting host-meta JRD document at: {url}");
log::trace!("Building request...");
let request = {
log::trace!("Creating new request...");
let mut request = reqwest::Request::new(reqwest::Method::GET, url);
2024-11-09 10:01:26 +00:00
2024-11-09 12:14:11 +00:00
log::trace!("Setting request headers...");
let headers = request.headers_mut();
2024-11-09 10:01:26 +00:00
2024-11-09 12:14:11 +00:00
log::trace!("Setting `Accept: application/json`...");
let _ = headers.insert(reqwest::header::ACCEPT, "application/json".parse().unwrap());
request
};
log::trace!("Sending request...");
let response = client.execute(request)
2024-11-09 10:01:26 +00:00
.await
.map_err(Request)?;
log::trace!("Checking `Content-Type` of the response...");
let content_type = response
2024-11-09 10:01:26 +00:00
.headers()
.get(reqwest::header::CONTENT_TYPE)
.ok_or(ContentTypeMissing)?;
log::trace!("Extracting MIME type from the `Content-Type` header...");
let mime_type = extract_mime_from_content_type(content_type)
2024-11-09 10:01:26 +00:00
.ok_or(ContentTypeInvalid)?;
log::trace!("Ensuring MIME type of `{mime_type}` is acceptable for JRD parsing...");
if mime_type != "application/json" {
return Err(ContentTypeInvalid)
}
2024-11-09 12:14:11 +00:00
log::trace!("Attempting to parse response as JSON...");
2024-11-09 10:01:26 +00:00
let data = response.json::<Self>()
.await
.map_err(Parse)?;
Ok(data)
}
2024-11-09 12:14:11 +00:00
/// Get an [host-meta document] in the [XRD format].
///
/// This follows redirects until the redirect chain is 10 hops; see [`reqwest::redirect`] for more info.
///
/// [XRD format]: https://datatracker.ietf.org/doc/html/rfc6415#section-3.1
/// [host-meta document]: https://datatracker.ietf.org/doc/html/rfc6415
pub async fn get_xrd(client: &reqwest::Client, url: reqwest::Url) -> Result<Self, HostMetaGetXRDError> {
use HostMetaGetXRDError::*;
log::debug!("Getting host-meta XRD document at: {url}");
log::trace!("Building request...");
let request = {
log::trace!("Creating new request...");
let mut request = reqwest::Request::new(reqwest::Method::GET, url);
log::trace!("Setting request headers...");
let headers = request.headers_mut();
log::trace!("Setting `Accept: application/xrd+xml`...");
let _ = headers.insert(reqwest::header::ACCEPT, "application/xrd+xml".parse().unwrap());
request
};
log::trace!("Sending request...");
let response = client.execute(request)
.await
.map_err(Request)?;
log::trace!("Checking `Content-Type` of the response...");
let content_type = response
2024-11-09 12:14:11 +00:00
.headers()
.get(reqwest::header::CONTENT_TYPE)
.ok_or(ContentTypeMissing)?;
log::trace!("Extracting MIME type from the `Content-Type` header...");
let mime_type = extract_mime_from_content_type(content_type)
2024-11-09 12:14:11 +00:00
.ok_or(ContentTypeInvalid)?;
2024-11-09 10:01:26 +00:00
log::trace!("Ensuring MIME type of `{mime_type}` is acceptable for JRD parsing...");
if mime_type != "application/xrd+xml" {
return Err(ContentTypeInvalid)
}
2024-11-09 12:14:11 +00:00
log::trace!("Attempting to parse response as text...");
let data = response.text()
.await
.map_err(Decode)?;
2024-11-09 10:01:26 +00:00
2024-11-09 12:14:11 +00:00
log::trace!("Parsing response as XML...");
let data = quick_xml::de::from_str::<Self>(&data)
.map_err(Parse)?;
2024-11-09 10:01:26 +00:00
2024-11-09 12:14:11 +00:00
Ok(data)
}
/// Attempt to discover the [host-meta document] at the given URL in various ways.
///
/// In order, this method attempts:
/// 1. [HTTPS] [XRD](Self::get_xrd)
/// 2. [HTTPS] [JRD](Self::get_jrd)
/// 3. [HTTP] [XRD](Self::get_xrd)
/// 4. [HTTP] [JRD](Self::get_jrd)
///
/// This follows redirects until the redirect chain is 10 hops; see [`reqwest::redirect`] for more info.
///
/// [host-meta document]: https://datatracker.ietf.org/doc/html/rfc6415
/// [HTTPS]: https://datatracker.ietf.org/doc/html/rfc2818
/// [HTTP]: https://datatracker.ietf.org/doc/html/rfc2616
/// [JRD]: https://datatracker.ietf.org/doc/html/rfc6415#appendix-A
pub async fn discover(client: &reqwest::Client, mut url: reqwest::Url) -> Result<Self, HostMetaDiscoverError> {
use HostMetaDiscoverError::*;
2024-11-09 10:01:26 +00:00
2024-11-09 12:14:11 +00:00
log::debug!("Discovering host-meta document at base: {url}");
2024-11-09 10:01:26 +00:00
log::trace!("Unsetting URL query...");
url.set_query(None);
log::trace!("Unsetting URL fragment...");
url.set_fragment(None);
log::trace!("Setting URL scheme to HTTPS...");
url.set_scheme("https")
.map_err(UrlManipulation)?;
2024-11-09 12:14:11 +00:00
log::trace!("Attempting to retrieve XRD host-meta via HTTPS...");
let https_xrd = match Self::get_xrd(client, url.clone()).await {
Ok(data) => {
log::trace!("HTTPS XRD retrieval was successful, returning...");
return Ok(data)
}
Err(err) => {
log::trace!("HTTPS XRD retrieval failed.");
err
}
};
2024-11-09 10:01:26 +00:00
2024-11-09 12:14:11 +00:00
log::trace!("Attempting to retrieve JRD host-meta via HTTPS...");
let https_jrd = match Self::get_jrd(client, url.clone()).await {
2024-11-09 10:01:26 +00:00
Ok(data) => {
2024-11-09 12:14:11 +00:00
log::trace!("HTTPS JRD retrieval was successful, returning...");
2024-11-09 10:01:26 +00:00
return Ok(data)
}
Err(err) => {
2024-11-09 12:14:11 +00:00
log::trace!("HTTPS JRD retrieval failed.");
2024-11-09 10:01:26 +00:00
err
}
};
log::trace!("Setting URL scheme to HTTP...");
url.set_scheme("http")
.map_err(UrlManipulation)?;
2024-11-09 12:14:11 +00:00
log::trace!("Attempting to retrieve XRD host-meta via HTTP...");
let http_xrd = match Self::get_xrd(client, url.clone()).await {
Ok(data) => {
log::trace!("HTTP XRD retrieval was successful, returning...");
return Ok(data)
}
Err(err) => {
log::trace!("HTTP XRD retrieval failed.");
err
}
};
2024-11-09 10:01:26 +00:00
2024-11-09 12:14:11 +00:00
log::trace!("Attempting to retrieve JRD host-meta via HTTP...");
let http_jrd = match Self::get_jrd(client, url.clone()).await {
2024-11-09 10:01:26 +00:00
Ok(data) => {
2024-11-09 12:14:11 +00:00
log::trace!("HTTP JRD retrieval was successful, returning...");
2024-11-09 10:01:26 +00:00
return Ok(data)
}
Err(err) => {
2024-11-09 12:14:11 +00:00
log::trace!("HTTP JRD retrieval failed.");
2024-11-09 10:01:26 +00:00
err
}
};
Err(
2024-11-09 12:14:11 +00:00
HostMetaDiscoverError::Fetch(
HostMetaDiscoveryAttemptsErrors {
https_xrd,
https_jrd,
http_xrd,
http_jrd,
2024-11-09 10:01:26 +00:00
}
)
)
}
2024-11-09 12:14:11 +00:00
const WELLKNOWN_NODEINFO_PATH: &str = "/.well-known/nodeinfo";
pub async fn discover_nodeinfo(client: &reqwest::Client, mut base: reqwest::Url) -> Result<Self, HostMetaDiscoverError> {
base.set_path(Self::WELLKNOWN_NODEINFO_PATH);
Self::discover(client, base)
.await
}
const WELLKNOWN_HOSTMETA_PATH: &str = "/.well-known/host-meta";
pub async fn discover_hostmeta(client: &reqwest::Client, mut base: reqwest::Url) -> Result<Self, HostMetaDiscoverError> {
base.set_path(Self::WELLKNOWN_HOSTMETA_PATH);
Self::discover(client, base)
.await
}
2024-11-09 10:01:26 +00:00
}
#[derive(Debug)]
2024-11-09 12:14:11 +00:00
pub enum HostMetaDiscoverError {
2024-11-09 10:01:26 +00:00
/// Manipulation of the URL scheme of the given base failed.
///
/// See [reqwest::Url::set_scheme] for possible causes.
UrlManipulation(()),
2024-11-09 12:14:11 +00:00
/// All attempts of fetching the host-meta document failed.
Fetch(HostMetaDiscoveryAttemptsErrors),
2024-11-09 08:41:08 +00:00
}
#[derive(Debug)]
2024-11-09 12:14:11 +00:00
pub struct HostMetaDiscoveryAttemptsErrors {
/// The error that occoured when trying to fetch the host-meta document in [XRD format] via [HTTPS].
///
/// [HTTPS]: https://datatracker.ietf.org/doc/html/rfc2818
/// [XRD format]: https://datatracker.ietf.org/doc/html/rfc6415#section-3.1
pub https_xrd: HostMetaGetXRDError,
/// The error that occoured when trying to fetch the host-meta document in [JRD format] via [HTTPS].
///
/// [HTTPS]: https://datatracker.ietf.org/doc/html/rfc2818
/// [JRD format]: https://datatracker.ietf.org/doc/html/rfc6415#appendix-A
pub https_jrd: HostMetaGetJRDError,
2024-11-09 08:41:08 +00:00
2024-11-09 12:14:11 +00:00
/// The error that occoured when trying to fetch the host-meta document in [XRD format] via [HTTP].
///
/// [HTTP]: https://datatracker.ietf.org/doc/html/rfc2616
/// [XRD format]: https://datatracker.ietf.org/doc/html/rfc6415#section-3.1
pub http_xrd: HostMetaGetXRDError,
2024-11-09 08:41:08 +00:00
2024-11-09 12:14:11 +00:00
/// The error that occoured when trying to fetch the host-meta document in [JRD format] via [HTTP].
///
/// [HTTP]: https://datatracker.ietf.org/doc/html/rfc2616
/// [JRD format]: https://datatracker.ietf.org/doc/html/rfc6415#appendix-A
pub http_jrd: HostMetaGetJRDError,
2024-11-09 08:41:08 +00:00
}
2024-11-09 12:14:11 +00:00
#[derive(Debug)]
2024-11-09 12:14:11 +00:00
pub enum HostMetaGetXRDError {
/// The HTTP request failed.
Request(reqwest::Error),
/// The `Content-Type` header of the response is missing.
ContentTypeMissing,
/// The `Content-Type` header of the response is invalid.
ContentTypeInvalid,
/// The document failed to be read as text.
Decode(reqwest::Error),
/// The document failed to be parsed as XML by [`quick_xml`].
Parse(quick_xml::DeError),
}
#[derive(Debug)]
2024-11-09 12:14:11 +00:00
pub enum HostMetaGetJRDError {
/// The HTTP request failed.
Request(reqwest::Error),
/// The `Content-Type` header of the response is missing.
ContentTypeMissing,
/// The `Content-Type` header of the response is invalid.
ContentTypeInvalid,
/// The document failed to be parsed as JSON by [`reqwest`].
Parse(reqwest::Error),
}
/// Extract the MIME type from the value of the `Content-Type` header.
fn extract_mime_from_content_type(value: &HeaderValue) -> Option<String> {
let value = value.to_str().ok()?;
match value.split_once("; ") {
None => Some(value.to_string()),
Some((mime, _)) => Some(mime.to_string()),
}
}