use crate::apub::*; use crate::db::community::{Community, CommunityForm}; use crate::db::post::{Post, PostForm}; use crate::db::user::{UserForm, User_}; use crate::db::Crud; use crate::routes::nodeinfo::{NodeInfo, NodeInfoWellKnown}; use crate::settings::Settings; use activitystreams::collection::{OrderedCollection, UnorderedCollection}; use activitystreams::object::Page; use activitystreams::BaseBox; use diesel::result::Error::NotFound; use diesel::PgConnection; use failure::Error; use isahc::prelude::*; use log::warn; use serde::Deserialize; use std::time::Duration; use url::Url; fn fetch_node_info(domain: &str) -> Result { let well_known_uri = Url::parse(&format!( "{}://{}/.well-known/nodeinfo", get_apub_protocol_string(), domain ))?; let well_known = fetch_remote_object::(&well_known_uri)?; Ok(fetch_remote_object::(&well_known.links.href)?) } fn fetch_communities_from_instance( community_list: &Url, conn: &PgConnection, ) -> Result, Error> { fetch_remote_object::(community_list)? .collection_props .get_many_items_base_boxes() .unwrap() .map(|b| -> Result { let group = b.to_owned().to_concrete::()?; Ok(CommunityForm::from_group(&group, conn)?) }) .map( |cf: Result| -> Result { let cf2 = cf?; let existing = Community::read_from_actor_id(conn, &cf2.actor_id); match existing { Err(NotFound {}) => Ok(Community::create(conn, &cf2)?), Ok(c) => Ok(Community::update(conn, c.id, &cf2)?), Err(e) => Err(Error::from(e)), } }, ) .collect() } // TODO: add an optional param last_updated and only fetch if its too old pub fn fetch_remote_object(url: &Url) -> Result where Response: for<'de> Deserialize<'de>, { if Settings::get().federation.tls_enabled && url.scheme() != "https" { return Err(format_err!("Activitypub uri is insecure: {}", url)); } // TODO: this function should return a future let timeout = Duration::from_secs(60); let text = Request::get(url.as_str()) .header("Accept", APUB_JSON_CONTENT_TYPE) .connect_timeout(timeout) .timeout(timeout) .body(())? .send()? .text()?; let res: Response = serde_json::from_str(&text)?; Ok(res) } fn fetch_remote_community_posts( instance: &str, community: &Community, conn: &PgConnection, ) -> Result, Error> { let endpoint = Url::parse(&format!( "http://{}/federation/c/{}", instance, community.name ))?; let group = fetch_remote_object::(&endpoint)?; let outbox_uri = Url::parse(&group.extension.get_outbox().to_string())?; // TODO: outbox url etc should be stored in local db let outbox = fetch_remote_object::(&outbox_uri)?; let items = outbox.collection_props.get_many_items_base_boxes(); Ok( items .unwrap() .map(|obox: &BaseBox| -> Result { let page = obox.clone().to_concrete::()?; PostForm::from_page(&page, conn) }) .map(|pf: Result| -> Result { let mut pf2 = pf?; pf2.community_id = community.id; let existing = Post::read_from_apub_id(conn, &pf2.ap_id); match existing { Err(NotFound {}) => Ok(Post::create(conn, &pf2)?), Ok(p) => Ok(Post::update(conn, p.id, &pf2)?), Err(e) => Err(Error::from(e)), } }) .collect::, Error>>()?, ) } pub fn fetch_remote_user(apub_id: &Url, conn: &PgConnection) -> Result { let person = fetch_remote_object::(apub_id)?; let uf = UserForm::from_person(&person)?; let existing = User_::read_from_apub_id(conn, &uf.actor_id); Ok(match existing { Err(NotFound {}) => User_::create(conn, &uf)?, Ok(u) => User_::update(conn, u.id, &uf)?, Err(e) => return Err(Error::from(e)), }) } // TODO: in the future, this should only be done when an instance is followed for the first time // after that, we should rely in the inbox, and fetch on demand when needed pub fn fetch_all(conn: &PgConnection) -> Result<(), Error> { for instance in &get_following_instances() { let node_info = fetch_node_info(instance)?; if let Some(community_list) = node_info.metadata.community_list_url { let communities = fetch_communities_from_instance(&community_list, conn)?; for c in communities { fetch_remote_community_posts(instance, &c, conn)?; } } else { warn!( "{} is not a Lemmy instance, federation is not supported", instance ); } } Ok(()) }