2021-11-16 17:03:09 +00:00
|
|
|
use crate::fetcher::post_or_comment::PostOrComment;
|
2023-03-21 15:03:05 +00:00
|
|
|
use activitypub_federation::config::{Data, UrlVerifier};
|
2022-10-28 13:38:22 +00:00
|
|
|
use async_trait::async_trait;
|
2023-07-05 15:08:02 +00:00
|
|
|
use futures::future::join3;
|
2022-11-28 14:29:33 +00:00
|
|
|
use lemmy_api_common::context::LemmyContext;
|
2022-10-27 09:24:07 +00:00
|
|
|
use lemmy_db_schema::{
|
2023-03-21 15:03:05 +00:00
|
|
|
source::{
|
|
|
|
activity::{Activity, ActivityInsertForm},
|
|
|
|
instance::Instance,
|
|
|
|
local_site::LocalSite,
|
|
|
|
},
|
|
|
|
traits::Crud,
|
2022-10-27 09:24:07 +00:00
|
|
|
utils::DbPool,
|
2022-06-22 20:24:54 +00:00
|
|
|
};
|
2023-07-10 14:50:07 +00:00
|
|
|
use lemmy_utils::error::{LemmyError, LemmyErrorType, LemmyResult};
|
2023-07-05 15:08:02 +00:00
|
|
|
use moka::future::Cache;
|
2022-11-09 10:05:00 +00:00
|
|
|
use once_cell::sync::Lazy;
|
2023-03-21 15:03:05 +00:00
|
|
|
use serde::Serialize;
|
2023-07-05 15:08:02 +00:00
|
|
|
use std::{sync::Arc, time::Duration};
|
2022-11-26 20:47:13 +00:00
|
|
|
use url::Url;
|
2021-11-16 17:03:09 +00:00
|
|
|
|
2020-10-12 14:10:09 +00:00
|
|
|
pub mod activities;
|
2021-10-29 10:32:42 +00:00
|
|
|
pub(crate) mod activity_lists;
|
2022-11-28 14:29:33 +00:00
|
|
|
pub mod api;
|
2021-10-27 16:03:07 +00:00
|
|
|
pub(crate) mod collections;
|
2020-04-10 11:37:35 +00:00
|
|
|
pub mod fetcher;
|
2021-07-17 16:20:44 +00:00
|
|
|
pub mod http;
|
2021-11-15 22:54:25 +00:00
|
|
|
pub(crate) mod mentions;
|
2020-10-12 14:10:09 +00:00
|
|
|
pub mod objects;
|
2021-10-29 10:32:42 +00:00
|
|
|
pub mod protocol;
|
2020-04-24 14:04:36 +00:00
|
|
|
|
2023-03-21 15:03:05 +00:00
|
|
|
/// NOTE(review): presumably an upper bound on the number of HTTP fetches performed while handling
/// a single federation request -- confirm against the code that consumes this constant.
pub const FEDERATION_HTTP_FETCH_LIMIT: u32 = 50;
|
2023-07-05 15:08:02 +00:00
|
|
|
/// How long the blocklist/allowlist and slur filter data stays cached.
///
/// Every incoming and outgoing federation action reads these values several times, which would
/// mean a huge number of database reads if each one hit the db directly. Caching them for a short
/// time already makes a huge difference while still letting changes take effect quickly.
const BLOCKLIST_CACHE_DURATION: Duration = Duration::from_secs(60);
|
2022-11-21 16:44:34 +00:00
|
|
|
|
2022-06-02 14:33:41 +00:00
|
|
|
static CONTEXT: Lazy<Vec<serde_json::Value>> = Lazy::new(|| {
|
|
|
|
serde_json::from_str(include_str!("../assets/lemmy/context.json")).expect("parse context")
|
|
|
|
});
|
|
|
|
|
2022-10-28 13:38:22 +00:00
|
|
|
#[derive(Clone)]
|
2023-03-21 15:03:05 +00:00
|
|
|
pub struct VerifyUrlData(pub DbPool);
|
2022-10-28 13:38:22 +00:00
|
|
|
|
|
|
|
#[async_trait]
|
|
|
|
impl UrlVerifier for VerifyUrlData {
|
|
|
|
async fn verify(&self, url: &Url) -> Result<(), &'static str> {
|
2023-07-05 15:08:02 +00:00
|
|
|
let local_site_data = local_site_data_cached(&self.0)
|
2022-10-28 13:38:22 +00:00
|
|
|
.await
|
|
|
|
.expect("read local site data");
|
2023-03-21 15:03:05 +00:00
|
|
|
check_apub_id_valid(url, &local_site_data)?;
|
|
|
|
Ok(())
|
2022-10-28 13:38:22 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2020-10-19 14:29:35 +00:00
|
|
|
/// Checks if the ID is allowed for sending or receiving.
|
|
|
|
///
|
|
|
|
/// In particular, it checks for:
|
|
|
|
/// - federation being enabled (if its disabled, only local URLs are allowed)
|
|
|
|
/// - the correct scheme (either http or https)
|
|
|
|
/// - URL being in the allowlist (if it is active)
|
|
|
|
/// - URL not being in the blocklist (if it is active)
|
2023-03-21 15:03:05 +00:00
|
|
|
#[tracing::instrument(skip(local_site_data))]
|
|
|
|
fn check_apub_id_valid(apub_id: &Url, local_site_data: &LocalSiteData) -> Result<(), &'static str> {
|
2022-06-02 14:33:41 +00:00
|
|
|
let domain = apub_id.domain().expect("apud id has domain").to_string();
|
2020-08-18 13:12:03 +00:00
|
|
|
|
2022-10-27 09:24:07 +00:00
|
|
|
if !local_site_data
|
|
|
|
.local_site
|
|
|
|
.as_ref()
|
|
|
|
.map(|l| l.federation_enabled)
|
|
|
|
.unwrap_or(true)
|
|
|
|
{
|
2022-06-02 14:33:41 +00:00
|
|
|
return Err("Federation disabled");
|
2020-10-22 16:12:43 +00:00
|
|
|
}
|
|
|
|
|
2023-04-21 21:41:03 +00:00
|
|
|
if local_site_data
|
|
|
|
.blocked_instances
|
|
|
|
.iter()
|
|
|
|
.any(|i| domain.eq(&i.domain))
|
|
|
|
{
|
|
|
|
return Err("Domain is blocked");
|
2021-04-21 13:36:07 +00:00
|
|
|
}
|
2021-03-01 17:24:11 +00:00
|
|
|
|
2023-04-21 21:41:03 +00:00
|
|
|
// Only check this if there are instances in the allowlist
|
|
|
|
if !local_site_data.allowed_instances.is_empty()
|
|
|
|
&& !local_site_data
|
|
|
|
.allowed_instances
|
|
|
|
.iter()
|
|
|
|
.any(|i| domain.eq(&i.domain))
|
|
|
|
{
|
|
|
|
return Err("Domain is not in allowlist");
|
2022-06-02 14:33:41 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
Ok(())
|
|
|
|
}
|
|
|
|
|
2022-10-27 09:24:07 +00:00
|
|
|
#[derive(Clone)]
|
|
|
|
pub(crate) struct LocalSiteData {
|
|
|
|
local_site: Option<LocalSite>,
|
2023-04-21 21:41:03 +00:00
|
|
|
allowed_instances: Vec<Instance>,
|
|
|
|
blocked_instances: Vec<Instance>,
|
2022-10-27 09:24:07 +00:00
|
|
|
}
|
|
|
|
|
2023-07-05 15:08:02 +00:00
|
|
|
pub(crate) async fn local_site_data_cached(pool: &DbPool) -> LemmyResult<Arc<LocalSiteData>> {
|
|
|
|
static CACHE: Lazy<Cache<(), Arc<LocalSiteData>>> = Lazy::new(|| {
|
|
|
|
Cache::builder()
|
|
|
|
.max_capacity(1)
|
|
|
|
.time_to_live(BLOCKLIST_CACHE_DURATION)
|
|
|
|
.build()
|
|
|
|
});
|
|
|
|
Ok(
|
|
|
|
CACHE
|
|
|
|
.try_get_with((), async {
|
|
|
|
let (local_site, allowed_instances, blocked_instances) = join3(
|
|
|
|
LocalSite::read(pool),
|
|
|
|
Instance::allowlist(pool),
|
|
|
|
Instance::blocklist(pool),
|
|
|
|
)
|
|
|
|
.await;
|
|
|
|
|
|
|
|
Ok::<_, diesel::result::Error>(Arc::new(LocalSiteData {
|
|
|
|
// LocalSite may be missing
|
|
|
|
local_site: local_site.ok(),
|
|
|
|
allowed_instances: allowed_instances?,
|
|
|
|
blocked_instances: blocked_instances?,
|
|
|
|
}))
|
|
|
|
})
|
|
|
|
.await?,
|
|
|
|
)
|
2022-10-27 09:24:07 +00:00
|
|
|
}
|
|
|
|
|
2023-07-05 15:08:02 +00:00
|
|
|
pub(crate) async fn check_apub_id_valid_with_strictness(
|
2022-06-02 14:33:41 +00:00
|
|
|
apub_id: &Url,
|
|
|
|
is_strict: bool,
|
2023-07-05 15:08:02 +00:00
|
|
|
context: &LemmyContext,
|
2022-06-02 14:33:41 +00:00
|
|
|
) -> Result<(), LemmyError> {
|
|
|
|
let domain = apub_id.domain().expect("apud id has domain").to_string();
|
2023-07-05 15:08:02 +00:00
|
|
|
let local_instance = context
|
|
|
|
.settings()
|
2022-06-02 14:33:41 +00:00
|
|
|
.get_hostname_without_port()
|
|
|
|
.expect("local hostname is valid");
|
|
|
|
if domain == local_instance {
|
|
|
|
return Ok(());
|
|
|
|
}
|
2023-07-05 15:08:02 +00:00
|
|
|
|
|
|
|
let local_site_data = local_site_data_cached(context.pool()).await?;
|
2023-07-10 14:50:07 +00:00
|
|
|
check_apub_id_valid(apub_id, &local_site_data).map_err(|err| match err {
|
|
|
|
"Federation disabled" => LemmyErrorType::FederationDisabled,
|
|
|
|
"Domain is blocked" => LemmyErrorType::DomainBlocked,
|
|
|
|
"Domain is not in allowlist" => LemmyErrorType::DomainNotInAllowList,
|
|
|
|
_ => panic!("Could not handle apub error!"),
|
|
|
|
})?;
|
2022-06-02 14:33:41 +00:00
|
|
|
|
2023-04-21 21:41:03 +00:00
|
|
|
// Only check allowlist if this is a community, and there are instances in the allowlist
|
|
|
|
if is_strict && !local_site_data.allowed_instances.is_empty() {
|
|
|
|
// need to allow this explicitly because apub receive might contain objects from our local
|
|
|
|
// instance.
|
|
|
|
let mut allowed_and_local = local_site_data
|
|
|
|
.allowed_instances
|
|
|
|
.iter()
|
|
|
|
.map(|i| i.domain.clone())
|
|
|
|
.collect::<Vec<String>>();
|
2023-07-05 15:08:02 +00:00
|
|
|
let local_instance = context
|
|
|
|
.settings()
|
2023-04-21 21:41:03 +00:00
|
|
|
.get_hostname_without_port()
|
|
|
|
.expect("local hostname is valid");
|
|
|
|
allowed_and_local.push(local_instance);
|
|
|
|
|
|
|
|
let domain = apub_id.domain().expect("apud id has domain").to_string();
|
|
|
|
if !allowed_and_local.contains(&domain) {
|
2023-07-10 14:50:07 +00:00
|
|
|
return Err(LemmyErrorType::FederationDisabledByStrictAllowList)?;
|
2020-08-13 20:26:49 +00:00
|
|
|
}
|
2020-04-17 17:34:18 +00:00
|
|
|
}
|
2021-04-21 13:36:07 +00:00
|
|
|
Ok(())
|
2020-04-17 17:34:18 +00:00
|
|
|
}
|
2020-04-24 19:55:54 +00:00
|
|
|
|
2023-03-21 15:03:05 +00:00
|
|
|
/// Store a sent or received activity in the database.
|
|
|
|
///
|
|
|
|
/// Stored activities are served over the HTTP endpoint `GET /activities/{type_}/{id}`. This also
|
|
|
|
/// ensures that the same activity cannot be received more than once.
|
|
|
|
#[tracing::instrument(skip(data, activity))]
|
|
|
|
async fn insert_activity<T>(
|
2020-10-23 12:29:56 +00:00
|
|
|
ap_id: &Url,
|
2023-03-21 15:03:05 +00:00
|
|
|
activity: &T,
|
2020-07-10 18:15:41 +00:00
|
|
|
local: bool,
|
2020-11-06 13:06:47 +00:00
|
|
|
sensitive: bool,
|
2023-03-21 15:03:05 +00:00
|
|
|
data: &Data<LemmyContext>,
|
|
|
|
) -> Result<(), LemmyError>
|
|
|
|
where
|
|
|
|
T: Serialize,
|
|
|
|
{
|
2022-11-19 04:33:54 +00:00
|
|
|
let ap_id = ap_id.clone().into();
|
2023-03-21 15:03:05 +00:00
|
|
|
let form = ActivityInsertForm {
|
|
|
|
ap_id,
|
|
|
|
data: serde_json::to_value(activity)?,
|
|
|
|
local: Some(local),
|
|
|
|
sensitive: Some(sensitive),
|
|
|
|
updated: None,
|
|
|
|
};
|
|
|
|
Activity::create(data.pool(), &form).await?;
|
|
|
|
Ok(())
|
2022-06-02 14:33:41 +00:00
|
|
|
}
|
2022-11-28 14:29:33 +00:00
|
|
|
|
2023-03-21 15:03:05 +00:00
|
|
|
#[async_trait::async_trait]
|
|
|
|
pub trait SendActivity: Sync {
|
2023-07-10 10:27:49 +00:00
|
|
|
type Response: Sync + Send + Clone;
|
2022-11-28 14:29:33 +00:00
|
|
|
|
|
|
|
async fn send_activity(
|
|
|
|
_request: &Self,
|
|
|
|
_response: &Self::Response,
|
2023-03-21 15:03:05 +00:00
|
|
|
_context: &Data<LemmyContext>,
|
2022-11-28 14:29:33 +00:00
|
|
|
) -> Result<(), LemmyError> {
|
|
|
|
Ok(())
|
|
|
|
}
|
|
|
|
}
|