use actix_form_data::{Field, Form, Value}; use actix_web::{ guard, http::header::{CacheControl, CacheDirective, LastModified, ACCEPT_RANGES}, web, App, HttpResponse, HttpResponseBuilder, HttpServer, }; use awc::Client; use futures_util::{stream::once, Stream}; use once_cell::sync::Lazy; use std::{ collections::HashSet, future::ready, path::PathBuf, pin::Pin, task::{Context, Poll}, time::SystemTime, }; use structopt::StructOpt; use tokio::{io::AsyncReadExt, sync::Semaphore}; use tracing::{debug, error, info, instrument, Span}; use tracing_actix_web::TracingLogger; use tracing_awc::Propagate; use tracing_futures::Instrument; use uuid::Uuid; mod concurrent_processor; mod config; mod either; mod error; mod exiftool; mod ffmpeg; mod file; mod init_tracing; mod magick; mod middleware; mod migrate; mod process; mod processor; mod range; mod upload_manager; mod validate; use self::{ concurrent_processor::CancelSafeProcessor, config::{Config, Format}, either::Either, error::{Error, UploadError}, file::CrateError, init_tracing::init_tracing, middleware::{Deadline, Internal}, upload_manager::{Details, UploadManager, UploadManagerSession}, validate::{image_webp, video_mp4}, }; const MEGABYTES: usize = 1024 * 1024; const MINUTES: u32 = 60; const HOURS: u32 = 60 * MINUTES; const DAYS: u32 = 24 * HOURS; static TMP_DIR: Lazy = Lazy::new(|| { let tmp_nonce = Uuid::new_v4(); let mut path = std::env::temp_dir(); path.push(format!("pict-rs-{}", tmp_nonce)); path }); static CONFIG: Lazy = Lazy::new(Config::from_args); static PROCESS_SEMAPHORE: Lazy = Lazy::new(|| Semaphore::new(num_cpus::get().saturating_sub(1).max(1))); // try moving a file #[instrument(name = "Moving file")] async fn safe_move_file(from: PathBuf, to: PathBuf) -> Result<(), Error> { if let Some(path) = to.parent() { debug!("Creating directory {:?}", path); tokio::fs::create_dir_all(path).await?; } debug!("Checking if {:?} already exists", to); if let Err(e) = tokio::fs::metadata(&to).await { if e.kind() != std::io::ErrorKind::NotFound { return Err(e.into()); } } else { return Err(UploadError::FileExists.into()); } debug!("Moving {:?} to {:?}", from, to); tokio::fs::copy(&from, to).await?; tokio::fs::remove_file(from).await?; Ok(()) } async fn safe_create_parent

(path: P) -> Result<(), Error> where P: AsRef, { if let Some(path) = path.as_ref().parent() { debug!("Creating directory {:?}", path); tokio::fs::create_dir_all(path).await?; } Ok(()) } // Try writing to a file #[instrument(name = "Saving file", skip(bytes))] async fn safe_save_file(path: PathBuf, bytes: web::Bytes) -> Result<(), Error> { if let Some(path) = path.parent() { // create the directory for the file debug!("Creating directory {:?}", path); tokio::fs::create_dir_all(path).await?; } // Only write the file if it doesn't already exist debug!("Checking if {:?} already exists", path); if let Err(e) = tokio::fs::metadata(&path).await { if e.kind() != std::io::ErrorKind::NotFound { return Err(e.into()); } } else { return Ok(()); } // Open the file for writing debug!("Creating {:?}", path); let mut file = crate::file::File::create(&path).await?; // try writing debug!("Writing to {:?}", path); if let Err(e) = file.write_from_bytes(bytes).await { error!("Error writing {:?}, {}", path, e); // remove file if writing failed before completion tokio::fs::remove_file(path).await?; return Err(e.into()); } debug!("{:?} written", path); Ok(()) } pub(crate) fn tmp_file() -> PathBuf { let s: String = Uuid::new_v4().to_string(); let name = format!("{}.tmp", s); let mut path = TMP_DIR.clone(); path.push(&name); path } fn to_ext(mime: mime::Mime) -> Result<&'static str, Error> { if mime == mime::IMAGE_PNG { Ok(".png") } else if mime == mime::IMAGE_JPEG { Ok(".jpg") } else if mime == video_mp4() { Ok(".mp4") } else if mime == image_webp() { Ok(".webp") } else { Err(UploadError::UnsupportedFormat.into()) } } /// Handle responding to succesful uploads #[instrument(name = "Uploaded files", skip(value, manager))] async fn upload( value: Value, manager: web::Data, ) -> Result { let images = value .map() .and_then(|mut m| m.remove("images")) .and_then(|images| images.array()) .ok_or(UploadError::NoFiles)?; let mut files = Vec::new(); let images = images .into_iter() .filter_map(|i| i.file()) .collect::>(); for image in &images { if let Some(alias) = image.result.alias() { info!("Uploaded {} as {:?}", image.filename, alias); let delete_token = image.result.delete_token().await?; let name = manager.from_alias(alias.to_owned()).await?; let path = manager.path_from_filename(name.clone()).await?; let details = manager.variant_details(path.clone(), name.clone()).await?; let details = if let Some(details) = details { debug!("details exist"); details } else { debug!("generating new details from {:?}", path); let new_details = Details::from_path(path.clone()).await?; debug!("storing details for {:?} {}", path, name); manager .store_variant_details(path, name, &new_details) .await?; debug!("stored"); new_details }; files.push(serde_json::json!({ "file": alias, "delete_token": delete_token, "details": details, })); } } for image in images { image.result.succeed(); } Ok(HttpResponse::Created().json(&serde_json::json!({ "msg": "ok", "files": files }))) } #[derive(Debug, serde::Deserialize)] struct UrlQuery { url: String, } pin_project_lite::pin_project! { struct Limit { #[pin] inner: S, count: u64, limit: u64, } } impl Limit { fn new(inner: S, limit: u64) -> Self { Limit { inner, count: 0, limit, } } } #[derive(Debug, thiserror::Error)] #[error("Resonse body larger than size limit")] struct LimitError; impl Stream for Limit where S: Stream>, E: From, { type Item = Result; fn poll_next(mut self: Pin<&mut Self>, cx: &mut Context<'_>) -> Poll> { let this = self.as_mut().project(); let limit = this.limit; let count = this.count; let inner = this.inner; inner.poll_next(cx).map(|opt| { opt.map(|res| match res { Ok(bytes) => { *count += bytes.len() as u64; if *count > *limit { return Err(LimitError.into()); } Ok(bytes) } Err(e) => Err(e), }) }) } } /// download an image from a URL #[instrument(name = "Downloading file", skip(client, manager))] async fn download( client: web::Data, manager: web::Data, query: web::Query, ) -> Result { let res = client.get(&query.url).propagate().send().await?; if !res.status().is_success() { return Err(UploadError::Download(res.status()).into()); } let mut stream = Limit::new( CrateError::new(res), (CONFIG.max_file_size() * MEGABYTES) as u64, ); // SAFETY: stream is shadowed, so original cannot not be moved let stream = unsafe { Pin::new_unchecked(&mut stream) }; let permit = PROCESS_SEMAPHORE.acquire().await?; let session = manager.session().upload(stream).await?; let alias = session.alias().unwrap().to_owned(); drop(permit); let delete_token = session.delete_token().await?; let name = manager.from_alias(alias.to_owned()).await?; let path = manager.path_from_filename(name.clone()).await?; let details = manager.variant_details(path.clone(), name.clone()).await?; let details = if let Some(details) = details { details } else { let new_details = Details::from_path(path.clone()).await?; manager .store_variant_details(path, name, &new_details) .await?; new_details }; session.succeed(); Ok(HttpResponse::Created().json(&serde_json::json!({ "msg": "ok", "files": [{ "file": alias, "delete_token": delete_token, "details": details, }] }))) } /// Delete aliases and files #[instrument(name = "Deleting file", skip(manager))] async fn delete( manager: web::Data, path_entries: web::Path<(String, String)>, ) -> Result { let (alias, token) = path_entries.into_inner(); manager.delete(token, alias).await?; Ok(HttpResponse::NoContent().finish()) } type ProcessQuery = Vec<(String, String)>; async fn prepare_process( query: web::Query, ext: &str, manager: &UploadManager, filters: &Option>, ) -> Result<(Format, String, PathBuf, Vec), Error> { let (alias, operations) = query .into_inner() .into_iter() .fold((String::new(), Vec::new()), |(s, mut acc), (k, v)| { if k == "src" { (v, acc) } else { acc.push((k, v)); (s, acc) } }); if alias.is_empty() { return Err(UploadError::MissingFilename.into()); } let name = manager.from_alias(alias).await?; let operations = if let Some(filters) = filters.as_ref() { operations .into_iter() .filter(|(k, _)| filters.contains(&k.to_lowercase())) .collect() } else { operations }; let format = ext .parse::() .map_err(|_| UploadError::UnsupportedFormat)?; let processed_name = format!("{}.{}", name, ext); let (thumbnail_path, thumbnail_args) = self::processor::build_chain(&operations, processed_name)?; Ok((format, name, thumbnail_path, thumbnail_args)) } #[instrument(name = "Fetching derived details", skip(manager, filters))] async fn process_details( query: web::Query, ext: web::Path, manager: web::Data, filters: web::Data>>, ) -> Result { let (_, name, thumbnail_path, _) = prepare_process(query, ext.as_str(), &manager, &filters).await?; let real_path = manager .variant_path(&thumbnail_path, &name) .await? .ok_or(UploadError::MissingAlias)?; let details = manager.variant_details(real_path, name).await?; let details = details.ok_or(UploadError::NoFiles)?; Ok(HttpResponse::Ok().json(&details)) } /// Process files #[instrument(name = "Serving processed image", skip(manager, filters))] async fn process( range: Option, query: web::Query, ext: web::Path, manager: web::Data, filters: web::Data>>, ) -> Result { let (format, name, thumbnail_path, thumbnail_args) = prepare_process(query, ext.as_str(), &manager, &filters).await?; let real_path_opt = manager.variant_path(&thumbnail_path, &name).await?; // If the thumbnail doesn't exist, we need to create it let real_path_opt = if let Some(real_path) = real_path_opt { if let Err(e) = tokio::fs::metadata(&real_path) .instrument(tracing::info_span!("Get thumbnail metadata")) .await { if e.kind() != std::io::ErrorKind::NotFound { error!("Error looking up processed image, {}", e); return Err(e.into()); } None } else { Some(real_path) } } else { None }; if let Some(real_path) = real_path_opt { let details_opt = manager .variant_details(real_path.clone(), name.clone()) .await?; let details = if let Some(details) = details_opt { details } else { let details = Details::from_path(real_path.clone()).await?; manager .store_variant_details(real_path.clone(), name, &details) .await?; details }; return ranged_file_resp(real_path, range, details).await; } let original_path = manager.still_path_from_filename(name.clone()).await?; let thumbnail_path2 = thumbnail_path.clone(); let process_fut = async { let thumbnail_path = thumbnail_path2; let permit = PROCESS_SEMAPHORE.acquire().await?; let file = crate::file::File::open(original_path.clone()).await?; let mut processed_reader = crate::magick::process_image_file_read(file, thumbnail_args, format)?; let mut vec = Vec::new(); processed_reader.read_to_end(&mut vec).await?; let bytes = web::Bytes::from(vec); drop(permit); let details = Details::from_bytes(bytes.clone()).await?; let save_span = tracing::info_span!( parent: None, "Saving variant information", path = tracing::field::debug(&thumbnail_path), name = tracing::field::display(&name), ); save_span.follows_from(Span::current()); let details2 = details.clone(); let bytes2 = bytes.clone(); actix_rt::spawn( async move { let real_path = match manager.next_directory() { Ok(real_path) => real_path.join(&name), Err(e) => { tracing::warn!("Failed to generate directory path: {}", e); return; } }; if let Err(e) = safe_save_file(real_path.clone(), bytes2).await { tracing::warn!("Error saving thumbnail: {}", e); return; } if let Err(e) = manager .store_variant_details(real_path.clone(), name.clone(), &details2) .await { tracing::warn!("Error saving variant details: {}", e); return; } if let Err(e) = manager .store_variant(Some(&thumbnail_path), &real_path, &name) .await { tracing::warn!("Error saving variant info: {}", e); } } .instrument(save_span), ); Ok((details, bytes)) as Result<(Details, web::Bytes), Error> }; let (details, bytes) = CancelSafeProcessor::new(thumbnail_path.clone(), process_fut).await?; match range { Some(range_header) => { if !range_header.is_bytes() { return Err(UploadError::Range.into()); } if range_header.is_empty() { Err(UploadError::Range.into()) } else if range_header.len() == 1 { let range = range_header.ranges().next().unwrap(); let content_range = range.to_content_range(bytes.len() as u64); let stream = range.chop_bytes(bytes); let mut builder = HttpResponse::PartialContent(); builder.insert_header(content_range); Ok(srv_response( builder, stream, details.content_type(), 7 * DAYS, details.system_time(), )) } else { Err(UploadError::Range.into()) } } None => Ok(srv_response( HttpResponse::Ok(), once(ready(Ok(bytes) as Result<_, Error>)), details.content_type(), 7 * DAYS, details.system_time(), )), } } /// Fetch file details #[instrument(name = "Fetching details", skip(manager))] async fn details( alias: web::Path, manager: web::Data, ) -> Result { let name = manager.from_alias(alias.into_inner()).await?; let path = manager.path_from_filename(name.clone()).await?; let details = manager.variant_details(path.clone(), name.clone()).await?; let details = if let Some(details) = details { details } else { let new_details = Details::from_path(path.clone()).await?; manager .store_variant_details(path.clone(), name, &new_details) .await?; new_details }; Ok(HttpResponse::Ok().json(&details)) } /// Serve files #[instrument(name = "Serving file", skip(manager))] async fn serve( range: Option, alias: web::Path, manager: web::Data, ) -> Result { let name = manager.from_alias(alias.into_inner()).await?; let path = manager.path_from_filename(name.clone()).await?; let details = manager.variant_details(path.clone(), name.clone()).await?; let details = if let Some(details) = details { details } else { let details = Details::from_path(path.clone()).await?; manager .store_variant_details(path.clone(), name, &details) .await?; details }; ranged_file_resp(path, range, details).await } async fn ranged_file_resp( path: PathBuf, range: Option, details: Details, ) -> Result { let (builder, stream) = match range { //Range header exists - return as ranged Some(range_header) => { if !range_header.is_bytes() { return Err(UploadError::Range.into()); } if range_header.is_empty() { return Err(UploadError::Range.into()); } else if range_header.len() == 1 { let file = crate::file::File::open(path).await?; let meta = file.metadata().await?; let range = range_header.ranges().next().unwrap(); let mut builder = HttpResponse::PartialContent(); builder.insert_header(range.to_content_range(meta.len())); (builder, Either::left(range.chop_file(file).await?)) } else { return Err(UploadError::Range.into()); } } //No Range header in the request - return the entire document None => { let file = crate::file::File::open(path).await?; let stream = file.read_to_stream(None, None).await?; (HttpResponse::Ok(), Either::right(stream)) } }; Ok(srv_response( builder, stream, details.content_type(), 7 * DAYS, details.system_time(), )) } // A helper method to produce responses with proper cache headers fn srv_response( mut builder: HttpResponseBuilder, stream: S, ext: mime::Mime, expires: u32, modified: SystemTime, ) -> HttpResponse where S: Stream> + 'static, E: std::error::Error + 'static, actix_web::Error: From, { builder .insert_header(LastModified(modified.into())) .insert_header(CacheControl(vec![ CacheDirective::Public, CacheDirective::MaxAge(expires), CacheDirective::Extension("immutable".to_owned(), None), ])) .insert_header((ACCEPT_RANGES, "bytes")) .content_type(ext.to_string()) // TODO: remove pin when actix-web drops Unpin requirement .streaming(Box::pin(stream)) } #[derive(Debug, serde::Deserialize)] #[serde(untagged)] enum FileOrAlias { File { file: String }, Alias { alias: String }, } #[instrument(name = "Purging file", skip(upload_manager))] async fn purge( query: web::Query, upload_manager: web::Data, ) -> Result { let aliases = match query.into_inner() { FileOrAlias::File { file } => upload_manager.aliases_by_filename(file).await?, FileOrAlias::Alias { alias } => upload_manager.aliases_by_alias(alias).await?, }; for alias in aliases.iter() { upload_manager .delete_without_token(alias.to_owned()) .await?; } Ok(HttpResponse::Ok().json(&serde_json::json!({ "msg": "ok", "aliases": aliases }))) } #[instrument(name = "Fetching aliases", skip(upload_manager))] async fn aliases( query: web::Query, upload_manager: web::Data, ) -> Result { let aliases = match query.into_inner() { FileOrAlias::File { file } => upload_manager.aliases_by_filename(file).await?, FileOrAlias::Alias { alias } => upload_manager.aliases_by_alias(alias).await?, }; Ok(HttpResponse::Ok().json(&serde_json::json!({ "msg": "ok", "aliases": aliases, }))) } #[derive(Debug, serde::Deserialize)] struct ByAlias { alias: String, } #[instrument(name = "Fetching filename", skip(upload_manager))] async fn filename_by_alias( query: web::Query, upload_manager: web::Data, ) -> Result { let filename = upload_manager.from_alias(query.into_inner().alias).await?; Ok(HttpResponse::Ok().json(&serde_json::json!({ "msg": "ok", "filename": filename, }))) } #[actix_rt::main] async fn main() -> anyhow::Result<()> { let manager = UploadManager::new(CONFIG.data_dir(), CONFIG.format()).await?; init_tracing("pict-rs", CONFIG.opentelemetry_url())?; // Create a new Multipart Form validator // // This form is expecting a single array field, 'images' with at most 10 files in it let manager2 = manager.clone(); let form = Form::new() .max_files(10) .max_file_size(CONFIG.max_file_size() * MEGABYTES) .transform_error(|e| Error::from(e).into()) .field( "images", Field::array(Field::file(move |filename, _, stream| { let manager = manager2.clone(); let span = tracing::info_span!("file-upload", ?filename); async move { let permit = PROCESS_SEMAPHORE.acquire().await?; let res = manager.session().upload(stream).await; drop(permit); res } .instrument(span) })), ); // Create a new Multipart Form validator for internal imports // // This form is expecting a single array field, 'images' with at most 10 files in it let validate_imports = CONFIG.validate_imports(); let manager2 = manager.clone(); let import_form = Form::new() .max_files(10) .max_file_size(CONFIG.max_file_size() * MEGABYTES) .transform_error(|e| Error::from(e).into()) .field( "images", Field::array(Field::file(move |filename, content_type, stream| { let manager = manager2.clone(); let span = tracing::info_span!("file-import", ?filename); async move { let permit = PROCESS_SEMAPHORE.acquire().await?; let res = manager .session() .import(filename, content_type, validate_imports, stream) .await; drop(permit); res } .instrument(span) })), ); HttpServer::new(move || { let client = Client::builder() .header("User-Agent", "pict-rs v0.3.0-main") .finish(); App::new() .wrap(TracingLogger::default()) .wrap(Deadline) .app_data(web::Data::new(manager.clone())) .app_data(web::Data::new(client)) .app_data(web::Data::new(CONFIG.allowed_filters())) .service( web::scope("/image") .service( web::resource("") .guard(guard::Post()) .wrap(form.clone()) .route(web::post().to(upload)), ) .service(web::resource("/download").route(web::get().to(download))) .service( web::resource("/delete/{delete_token}/{filename}") .route(web::delete().to(delete)) .route(web::get().to(delete)), ) .service(web::resource("/original/{filename}").route(web::get().to(serve))) .service(web::resource("/process.{ext}").route(web::get().to(process))) .service( web::scope("/details") .service( web::resource("/original/{filename}").route(web::get().to(details)), ) .service( web::resource("/process.{ext}") .route(web::get().to(process_details)), ), ), ) .service( web::scope("/internal") .wrap(Internal(CONFIG.api_key().map(|s| s.to_owned()))) .service( web::resource("/import") .wrap(import_form.clone()) .route(web::post().to(upload)), ) .service(web::resource("/purge").route(web::post().to(purge))) .service(web::resource("/aliases").route(web::get().to(aliases))) .service(web::resource("/filename").route(web::get().to(filename_by_alias))), ) }) .bind(CONFIG.bind_address())? .run() .await?; if tokio::fs::metadata(&*TMP_DIR).await.is_ok() { tokio::fs::remove_dir_all(&*TMP_DIR).await?; } Ok(()) }