imag/libimagentrylink/src/external.rs

417 lines
14 KiB
Rust
Raw Normal View History

//
// imag - the personal information management suite for the commandline
// Copyright (C) 2015, 2016 Matthias Beyer <mail@beyermatthias.de> and contributors
//
// This library is free software; you can redistribute it and/or
// modify it under the terms of the GNU Lesser General Public
// License as published by the Free Software Foundation; version
// 2.1 of the License.
//
// This library is distributed in the hope that it will be useful,
// but WITHOUT ANY WARRANTY; without even the implied warranty of
// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
// Lesser General Public License for more details.
//
// You should have received a copy of the GNU Lesser General Public
// License along with this library; if not, write to the Free Software
// Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
//
2016-04-08 21:35:04 +00:00
/// External linking is a complex implementation to be able to serve a clean and easy-to-use
/// interface.
///
/// Internally, there are no such things as "external links" (plural). Each Entry in the store can
/// only have _one_ external link.
///
/// This library therefore does the following: It allows you to have several external links with
/// one entry, which are internally one file in the store for each link, linked with "internal
/// linking".
///
/// This helps us greatly with deduplication of URLs.
///
2016-04-09 13:49:50 +00:00
use std::ops::DerefMut;
use std::collections::BTreeMap;
use std::fmt::Debug;
use libimagstore::store::Entry;
2016-04-08 21:35:04 +00:00
use libimagstore::store::FileLockEntry;
use libimagstore::store::Store;
use libimagstore::storeid::StoreId;
2016-04-09 13:49:50 +00:00
use libimagstore::storeid::IntoStoreId;
use libimagstore::toml_ext::TomlValueExt;
2016-08-03 09:10:56 +00:00
use libimagutil::debug_result::*;
2016-02-03 14:47:14 +00:00
2016-04-08 21:35:04 +00:00
use error::LinkError as LE;
use error::LinkErrorKind as LEK;
2016-08-03 09:10:56 +00:00
use error::MapErrInto;
2016-02-03 14:47:14 +00:00
use result::Result;
2016-04-08 21:35:04 +00:00
use internal::InternalLinker;
2016-04-09 13:49:50 +00:00
use module_path::ModuleEntryPath;
2016-02-03 14:47:14 +00:00
use self::iter::*;
2016-02-03 18:59:22 +00:00
use toml::Value;
2016-02-23 10:50:42 +00:00
use url::Url;
use crypto::sha1::Sha1;
use crypto::digest::Digest;
2016-02-03 18:59:22 +00:00
/// "Link" Type, just an abstraction over `FileLockEntry` to have some convenience internally.
pub struct Link<'a> {
2016-04-08 21:35:04 +00:00
link: FileLockEntry<'a>
}
2016-04-08 21:35:04 +00:00
impl<'a> Link<'a> {
2016-04-08 21:35:04 +00:00
pub fn new(fle: FileLockEntry<'a>) -> Link<'a> {
Link { link: fle }
}
/// Get a link Url object from a `FileLockEntry`, ignore errors.
2016-04-08 21:35:04 +00:00
fn get_link_uri_from_filelockentry(file: &FileLockEntry<'a>) -> Option<Url> {
2016-04-21 11:19:37 +00:00
file.get_header()
.read("imag.content.url")
2016-04-08 21:35:04 +00:00
.ok()
2016-06-11 04:53:46 +00:00
.and_then(|opt| match opt {
2016-09-05 16:51:35 +00:00
Some(Value::String(s)) => {
debug!("Found url, parsing: {:?}", s);
Url::parse(&s[..]).ok()
},
2016-06-11 04:53:46 +00:00
_ => None
2016-04-08 21:35:04 +00:00
})
}
2016-04-08 21:35:04 +00:00
pub fn get_url(&self) -> Result<Option<Url>> {
let opt = self.link
.get_header()
.read("imag.content.url");
2016-04-08 21:35:04 +00:00
match opt {
Ok(Some(Value::String(s))) => {
Url::parse(&s[..])
.map(Some)
2016-04-08 21:35:04 +00:00
.map_err(|e| LE::new(LEK::EntryHeaderReadError, Some(Box::new(e))))
},
Ok(None) => Ok(None),
_ => Err(LE::new(LEK::EntryHeaderReadError, None))
}
}
}
2016-04-08 21:35:04 +00:00
pub trait ExternalLinker : InternalLinker {
2016-04-08 21:35:04 +00:00
/// Get the external links from the implementor object
fn get_external_links<'a>(&self, store: &'a Store) -> Result<UrlIter<'a>>;
2016-04-08 21:35:04 +00:00
/// Set the external links for the implementor object
2016-04-09 13:49:50 +00:00
fn set_external_links(&mut self, store: &Store, links: Vec<Url>) -> Result<()>;
2016-04-08 21:35:04 +00:00
/// Add an external link to the implementor object
fn add_external_link(&mut self, store: &Store, link: Url) -> Result<()>;
2016-02-03 18:59:22 +00:00
2016-04-08 21:35:04 +00:00
/// Remove an external link from the implementor object
2016-04-10 16:43:02 +00:00
fn remove_external_link(&mut self, store: &Store, link: Url) -> Result<()>;
2016-02-03 18:59:22 +00:00
2016-02-03 14:47:14 +00:00
}
2016-10-15 12:41:20 +00:00
pub mod iter {
2016-10-15 13:20:17 +00:00
//! Iterator helpers for external linking stuff
//!
//! Also contains helpers to filter iterators for external/internal links
//!
2016-10-15 13:33:44 +00:00
//!
//! # Warning
//!
//! This module uses `internal::Link` as link type, so we operate on _store ids_ here.
//!
//! Not to be confused with `external::Link`, which is a real `FileLockEntry` under the hood.
//!
2016-10-15 13:20:17 +00:00
2016-10-15 12:41:20 +00:00
use libimagutil::debug_result::*;
use libimagstore::store::Store;
use internal::Link;
use internal::iter::LinkIter;
use error::LinkErrorKind as LEK;
use error::MapErrInto;
use result::Result;
use url::Url;
/// Helper for building `OnlyExternalIter` and `NoExternalIter`
///
/// The boolean value defines, how to interpret the `is_external_link_storeid()` return value
/// (here as "pred"):
///
/// pred | bool | xor | take?
/// ---- | ---- | --- | ----
/// 0 | 0 | 0 | 1
/// 0 | 1 | 1 | 0
2016-12-05 16:17:26 +00:00
/// 1 | 0 | 1 | 0
2016-10-15 12:41:20 +00:00
/// 1 | 1 | 0 | 1
///
/// If `bool` says "take if return value is false", we take the element if the `pred` returns
/// false... and so on.
///
/// As we can see, the operator between these two operants is `!(a ^ b)`.
pub struct ExternalFilterIter(LinkIter, bool);
2016-10-15 12:41:20 +00:00
impl Iterator for ExternalFilterIter {
type Item = Link;
fn next(&mut self) -> Option<Self::Item> {
use super::is_external_link_storeid;
while let Some(elem) = self.0.next() {
if !(self.1 ^ is_external_link_storeid(&elem)) {
return Some(elem);
}
}
None
}
}
/// Helper trait, implemented on `LinkIter`, to select or deselect all external links
///
/// Passing `true` yields only links that are external links, passing `false` yields only links
/// that are not.
///
/// # See also
///
/// Also see `OnlyExternalIter` and `NoExternalIter` and the helper traits/functions
/// `OnlyInternalLinks`/`only_internal_links()` and `OnlyExternalLinks`/`only_external_links()`.
pub trait SelectExternal {
    fn select_external_links(self, b: bool) -> ExternalFilterIter;
}

impl SelectExternal for LinkIter {

    /// Wrap this iterator in an `ExternalFilterIter` configured with `b`.
    fn select_external_links(self, b: bool) -> ExternalFilterIter {
        ExternalFilterIter(self, b)
    }

}
2016-10-15 12:41:20 +00:00
/// Iterator over only those links of a `LinkIter` which are external links.
///
/// This is an `ExternalFilterIter` with its flag fixed to `true`.
pub struct OnlyExternalIter(ExternalFilterIter);

impl OnlyExternalIter {

    /// Build the iterator from a `LinkIter`.
    pub fn new(li: LinkIter) -> OnlyExternalIter {
        OnlyExternalIter(ExternalFilterIter(li, true))
    }

    /// Turn this iterator into a `UrlIter`, which uses `store` to look up the URL behind each
    /// yielded link.
    pub fn urls<'a>(self, store: &'a Store) -> UrlIter<'a> {
        UrlIter(self, store)
    }

}

impl Iterator for OnlyExternalIter {
    type Item = Link;

    /// Forward to the wrapped `ExternalFilterIter`.
    fn next(&mut self) -> Option<Self::Item> {
        self.0.next()
    }
}
/// Iterator over only those links of a `LinkIter` which are _not_ external links.
///
/// This is an `ExternalFilterIter` with its flag fixed to `false`.
pub struct NoExternalIter(ExternalFilterIter);

impl NoExternalIter {

    /// Build the iterator from a `LinkIter`.
    pub fn new(li: LinkIter) -> NoExternalIter {
        NoExternalIter(ExternalFilterIter(li, false))
    }

}

impl Iterator for NoExternalIter {
    type Item = Link;

    /// Forward to the wrapped `ExternalFilterIter`.
    fn next(&mut self) -> Option<Self::Item> {
        self.0.next()
    }
}
/// Extension trait to reduce an iterator of links to the external links only.
pub trait OnlyExternalLinks : Sized {

    /// Keep only the external links.
    fn only_external_links(self) -> OnlyExternalIter ;

    /// Alias for `only_external_links()`.
    fn no_internal_links(self) -> OnlyExternalIter {
        self.only_external_links()
    }

}

impl OnlyExternalLinks for LinkIter {

    /// Wrap this `LinkIter` in an `OnlyExternalIter`.
    fn only_external_links(self) -> OnlyExternalIter {
        OnlyExternalIter::new(self)
    }

}
/// Extension trait to reduce an iterator of links to the non-external (internal) links only.
pub trait OnlyInternalLinks : Sized {

    /// Keep only the links which are not external links.
    fn only_internal_links(self) -> NoExternalIter;

    /// Alias for `only_internal_links()`.
    fn no_external_links(self) -> NoExternalIter {
        self.only_internal_links()
    }

}

impl OnlyInternalLinks for LinkIter {

    /// Wrap this `LinkIter` in a `NoExternalIter`.
    fn only_internal_links(self) -> NoExternalIter {
        NoExternalIter::new(self)
    }

}
/// Iterator which resolves the links of an `OnlyExternalIter` to URLs.
///
/// For each link, the corresponding entry is retrieved from the store and the URL is read from
/// that entry. Each step can fail, so the items are `Result<Url>`.
pub struct UrlIter<'a>(OnlyExternalIter, &'a Store);

impl<'a> Iterator for UrlIter<'a> {
    type Item = Result<Url>;

    /// Resolve the next link.
    ///
    /// A failing `Store::retrieve()` is reported as `StoreReadError`; a failure to get the URL out
    /// of the retrieved entry is passed through as returned by `get_external_link_from_file()`.
    fn next(&mut self) -> Option<Self::Item> {
        use super::get_external_link_from_file;

        let id = match self.0.next() {
            Some(id) => id,
            None     => return None,
        };

        debug!("Retrieving entry for id: '{:?}'", id);
        let url = self.1
            .retrieve(id.clone())
            .map_err_into(LEK::StoreReadError)
            .map_dbg_err(|_| format!("Retrieving entry for id: '{:?}' failed", id))
            .and_then(|f| {
                debug!("Store::retrieve({:?}) succeeded", id);
                debug!("getting external link from file now");
                get_external_link_from_file(&f)
                    .map_dbg_err(|e| format!("URL -> Err = {:?}", e))
            });

        Some(url)
    }
}
}
2016-04-09 13:15:13 +00:00
/// Check whether the local part of the StoreId starts with `links/external`
pub fn is_external_link_storeid<A: AsRef<StoreId> + Debug>(id: A) -> bool {
    debug!("Checking whether this is a 'links/external/': '{:?}'", id);

    let store_id: &StoreId = id.as_ref();
    store_id.local().starts_with("links/external")
}
/// Get the URL which is stored in the header of `entry`.
///
/// Any failure (header not readable, no value, value not a string, string not a valid URL) is
/// reported as a `StoreReadError` without a cause, because the helper used here discards the
/// underlying error.
fn get_external_link_from_file(entry: &FileLockEntry) -> Result<Url> {
    Link::get_link_uri_from_filelockentry(entry) // TODO: Do not hide error by using this function
        // Build the error lazily, so nothing is constructed on the success path.
        .ok_or_else(|| LE::new(LEK::StoreReadError, None))
}
/// Implement `ExternalLinker` for `Entry`, hiding the fact that there is no such thing as an external
2016-04-08 21:35:04 +00:00
/// link in an entry, but internal links to other entries which serve as external links, as one
/// entry in the store can only have one external link.
impl ExternalLinker for Entry {
2016-02-07 03:40:43 +00:00
2016-04-08 21:35:04 +00:00
/// Get the external links from the implementor object
fn get_external_links<'a>(&self, store: &'a Store) -> Result<UrlIter<'a>> {
2016-04-08 21:35:04 +00:00
// Iterate through all internal links and filter for FileLockEntries which live in
// /link/external/<SHA> -> load these files and get the external link from their headers,
// put them into the return vector.
2016-04-09 13:15:13 +00:00
self.get_internal_links()
.map_err(|e| LE::new(LEK::StoreReadError, Some(Box::new(e))))
.map(|iter| {
debug!("Getting external links");
iter.only_external_links().urls(store)
2016-04-09 13:15:13 +00:00
})
2016-02-07 03:40:43 +00:00
}
2016-04-08 21:35:04 +00:00
/// Set the external links for the implementor object
2016-04-09 13:49:50 +00:00
fn set_external_links(&mut self, store: &Store, links: Vec<Url>) -> Result<()> {
2016-04-08 21:35:04 +00:00
// Take all the links, generate a SHA sum out of each one, filter out the already existing
// store entries and store the other URIs in the header of one FileLockEntry each, in
// the path /link/external/<SHA of the URL>
2016-04-09 13:49:50 +00:00
debug!("Iterating {} links = {:?}", links.len(), links);
2016-04-09 13:49:50 +00:00
for link in links { // for all links
let hash = {
let mut s = Sha1::new();
2016-05-12 14:40:06 +00:00
s.input_str(&link.as_str()[..]);
s.result_str()
};
let file_id = try!(
ModuleEntryPath::new(format!("external/{}", hash)).into_storeid()
.map_err_into(LEK::StoreWriteError)
.map_dbg_err(|_| {
format!("Failed to build StoreId for this hash '{:?}'", hash)
})
);
2016-04-09 13:49:50 +00:00
debug!("Link = '{:?}'", link);
debug!("Hash = '{:?}'", hash);
debug!("StoreId = '{:?}'", file_id);
2016-04-16 13:34:32 +00:00
// retrieve the file from the store, which implicitely creates the entry if it does not
// exist
2016-08-03 09:10:56 +00:00
let mut file = try!(store
.retrieve(file_id.clone())
.map_err_into(LEK::StoreWriteError)
.map_dbg_err(|_| {
format!("Failed to create or retrieve an file for this link '{:?}'", link)
}));
2016-04-16 13:34:32 +00:00
debug!("Generating header content!");
{
let mut hdr = file.deref_mut().get_header_mut();
let mut table = match hdr.read("imag.content") {
Ok(Some(Value::Table(table))) => table,
Ok(Some(_)) => {
warn!("There is a value at 'imag.content' which is not a table.");
warn!("Going to override this value");
BTreeMap::new()
},
Ok(None) => BTreeMap::new(),
Err(e) => return Err(LE::new(LEK::StoreWriteError, Some(Box::new(e)))),
};
2016-05-12 14:40:06 +00:00
let v = Value::String(link.into_string());
2016-04-16 13:34:32 +00:00
debug!("setting URL = '{:?}", v);
table.insert(String::from("url"), v);
if let Err(e) = hdr.set("imag.content", Value::Table(table)) {
return Err(LE::new(LEK::StoreWriteError, Some(Box::new(e))));
} else {
debug!("Setting URL worked");
2016-04-09 13:49:50 +00:00
}
2016-04-16 13:34:32 +00:00
}
2016-04-09 13:49:50 +00:00
// then add an internal link to the new file or return an error if this fails
if let Err(e) = self.add_internal_link(file.deref_mut()) {
debug!("Error adding internal link");
2016-04-09 13:49:50 +00:00
return Err(LE::new(LEK::StoreWriteError, Some(Box::new(e))));
}
}
debug!("Ready iterating");
2016-04-09 13:49:50 +00:00
Ok(())
2016-02-07 03:40:43 +00:00
}
2016-02-15 12:22:10 +00:00
2016-04-08 21:35:04 +00:00
/// Add an external link to the implementor object
fn add_external_link(&mut self, store: &Store, link: Url) -> Result<()> {
2016-04-08 21:35:04 +00:00
// get external links, add this one, save them
debug!("Getting links");
self.get_external_links(store)
.and_then(|links| {
// TODO: Do not ignore errors here
let mut links = links.filter_map(Result::ok).collect::<Vec<_>>();
debug!("Adding link = '{:?}' to links = {:?}", link, links);
links.push(link);
debug!("Setting {} links = {:?}", links.len(), links);
self.set_external_links(store, links)
})
}
2016-04-08 21:35:04 +00:00
/// Remove an external link from the implementor object
2016-04-10 16:43:02 +00:00
fn remove_external_link(&mut self, store: &Store, link: Url) -> Result<()> {
2016-04-08 21:35:04 +00:00
// get external links, remove this one, save them
2016-04-10 16:43:02 +00:00
self.get_external_links(store)
2016-04-16 20:04:08 +00:00
.and_then(|links| {
debug!("Removing link = '{:?}'", link);
let links = links
.filter_map(Result::ok)
2016-05-12 14:40:06 +00:00
.filter(|l| l.as_str() != link.as_str())
.collect::<Vec<_>>();
2016-04-10 16:43:02 +00:00
self.set_external_links(store, links)
})
}
}
2016-04-08 21:35:04 +00:00