From edb063f288a496e79496b02c854af90d394280be Mon Sep 17 00:00:00 2001 From: Dessalines Date: Tue, 21 Jan 2025 04:01:00 -0500 Subject: [PATCH] Upgrading html2text. (#5336) --- Cargo.lock | 73 ++++++++++++++++++++++++--------- Cargo.toml | 6 +-- crates/apub/Cargo.toml | 4 +- crates/apub/src/objects/post.rs | 4 +- crates/utils/Cargo.toml | 2 +- crates/utils/src/email.rs | 2 +- 6 files changed, 63 insertions(+), 28 deletions(-) diff --git a/Cargo.lock b/Cargo.lock index b3106adc0..c9b05b77b 100644 --- a/Cargo.lock +++ b/Cargo.lock @@ -832,9 +832,9 @@ dependencies = [ [[package]] name = "clap" -version = "4.5.26" +version = "4.5.27" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "a8eb5e908ef3a6efbe1ed62520fb7287959888c88485abe072543190ecc66783" +checksum = "769b0145982b4b48713e01ec42d61614425f27b7058bda7180a3a41f30104796" dependencies = [ "clap_builder", "clap_derive", @@ -842,9 +842,9 @@ dependencies = [ [[package]] name = "clap_builder" -version = "4.5.26" +version = "4.5.27" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "96b01801b5fc6a0a232407abc821660c9c6d25a1cafc0d4f85f29fb8d9afc121" +checksum = "1b26884eb4b57140e4d2d93652abfa49498b938b3c9179f9fc487b0acc3edad7" dependencies = [ "anstream", "anstyle", @@ -1371,7 +1371,7 @@ dependencies = [ "diff", "regex", "same-file", - "unicode-width", + "unicode-width 0.1.13", ] [[package]] @@ -1930,15 +1930,16 @@ dependencies = [ [[package]] name = "html2text" -version = "0.12.6" +version = "0.13.6" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "042a9677c258ac2952dd026bb0cd21972f00f644a5a38f5a215cb22cdaf6834e" +checksum = "1bf7722c2ffdd62628b6e13065b6ab6cf154a236bd476c6e89af1352d745b83e" dependencies = [ - "html5ever 0.27.0", - "markup5ever 0.12.1", + "html5ever 0.29.0", + "markup5ever 0.14.0", + "nom", "tendril", - "thiserror 1.0.69", - "unicode-width", + "thiserror 2.0.11", + "unicode-width 0.2.0", ] [[package]] @@ -1969,6 +1970,20 @@ dependencies = [ "syn 2.0.96", ] +[[package]] +name = "html5ever" +version = "0.29.0" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "2e15626aaf9c351bc696217cbe29cb9b5e86c43f8a46b5e2f5c6c5cf7cb904ce" +dependencies = [ + "log", + "mac", + "markup5ever 0.14.0", + "proc-macro2", + "quote", + "syn 2.0.96", +] + [[package]] name = "http" version = "0.2.12" @@ -2957,7 +2972,7 @@ source = "registry+https://github.com/rust-lang/crates.io-index" checksum = "fc2f4eb4bc735547cfed7c0a4922cbd04a4655978c09b54f1f7b228750664c34" dependencies = [ "cfg-if", - "windows-targets 0.48.5", + "windows-targets 0.52.6", ] [[package]] @@ -3155,6 +3170,20 @@ dependencies = [ "tendril", ] +[[package]] +name = "markup5ever" +version = "0.14.0" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "82c88c6129bd24319e62a0359cb6b958fa7e8be6e19bb1663bc396b90883aca5" +dependencies = [ + "log", + "phf 0.11.3", + "phf_codegen 0.11.3", + "string_cache", + "string_cache_codegen", + "tendril", +] + [[package]] name = "markup5ever_rcdom" version = "0.2.0" @@ -4443,9 +4472,9 @@ dependencies = [ [[package]] name = "semver" -version = "1.0.24" +version = "1.0.25" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "3cb6eb87a131f756572d7fb904f6e7b68633f09cca868c5df1c4b8d1a694bbba" +checksum = "f79dfe2d285b0488816f30e700a7438c5a73d816b5b7d3ac72fbc48b0d185e03" [[package]] name = "serde" @@ -4469,9 +4498,9 @@ dependencies = [ [[package]] name = "serde_json" -version = "1.0.135" +version = "1.0.137" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "2b0d7ba2887406110130a978386c4e1befb98c674b4fba677954e4db976630d9" +checksum = "930cfb6e6abf99298aaad7d29abbef7a9999a9a8806a40088f55f0dcec03146b" dependencies = [ "indexmap 2.7.0", "itoa", @@ -5466,6 +5495,12 @@ version = "0.1.13" source = "registry+https://github.com/rust-lang/crates.io-index" checksum = "0336d538f7abc86d282a4189614dfaa90810dfc2c6f6427eaf88e16311dd225d" +[[package]] +name = "unicode-width" +version = "0.2.0" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "1fc81956842c57dac11422a97c3b8195a1ff727f06e85c84ed2e8aa277c9a0fd" + [[package]] name = "unicode-xid" version = "0.2.6" @@ -5528,9 +5563,9 @@ checksum = "06abde3611657adf66d383f00b093d7faecc7fa57071cce2578660c9f1010821" [[package]] name = "uuid" -version = "1.12.0" +version = "1.12.1" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "744018581f9a3454a9e15beb8a33b017183f1e7c0cd170232a2d1453b23a51c4" +checksum = "b3758f5e68192bb96cc8f9b7e2c2cfdabb435499a28499a42f8f984092adad4b" dependencies = [ "getrandom", "serde", @@ -5766,7 +5801,7 @@ version = "0.1.9" source = "registry+https://github.com/rust-lang/crates.io-index" checksum = "cf221c93e13a30d793f7645a0e7762c55d169dbb0a49671918a2319d289b10bb" dependencies = [ - "windows-sys 0.48.0", + "windows-sys 0.59.0", ] [[package]] diff --git a/Cargo.toml b/Cargo.toml index 3c83037a5..ad88bd610 100644 --- a/Cargo.toml +++ b/Cargo.toml @@ -128,9 +128,9 @@ chrono = { version = "0.4.39", features = [ "now", "serde", ], default-features = false } -serde_json = { version = "1.0.135", features = ["preserve_order"] } +serde_json = { version = "1.0.137", features = ["preserve_order"] } base64 = "0.22.1" -uuid = { version = "1.12.0", features = ["serde"] } +uuid = { version = "1.12.1", features = ["serde"] } async-trait = "0.1.85" captcha = "0.0.9" anyhow = { version = "1.0.95", features = ["backtrace"] } @@ -158,7 +158,7 @@ urlencoding = "2.1.3" enum-map = "2.7" moka = { version = "0.12.10", features = ["future"] } i-love-jesus = { version = "0.1.0" } -clap = { version = "4.5.26", features = ["derive", "env"] } +clap = { version = "4.5.27", features = ["derive", "env"] } pretty_assertions = "1.4.1" derive-new = "0.7.0" diesel-bind-if-some = "0.1.0" diff --git a/crates/apub/Cargo.toml b/crates/apub/Cargo.toml index bd6fe3d28..75d16ff0f 100644 --- a/crates/apub/Cargo.toml +++ b/crates/apub/Cargo.toml @@ -42,10 +42,10 @@ reqwest = { workspace = true } moka.workspace = true serde_with.workspace = true html2md = "0.2.15" -html2text = "0.12.6" +html2text = "0.13.6" stringreader = "0.1.1" enum_delegate = "0.2.0" -semver = "1.0.24" +semver = "1.0.25" [dev-dependencies] serial_test = { workspace = true } diff --git a/crates/apub/src/objects/post.rs b/crates/apub/src/objects/post.rs index 73e940a3c..64effbe6a 100644 --- a/crates/apub/src/objects/post.rs +++ b/crates/apub/src/objects/post.rs @@ -21,7 +21,7 @@ use activitypub_federation::{ }; use anyhow::anyhow; use chrono::{DateTime, Utc}; -use html2text::{from_read_with_decorator, render::text_renderer::TrivialDecorator}; +use html2text::{from_read_with_decorator, render::TrivialDecorator}; use lemmy_api_common::{ context::LemmyContext, request::generate_post_link_metadata, @@ -198,7 +198,7 @@ impl Object for ApubPost { .map(StringReader::new) .map(|c| from_read_with_decorator(c, MAX_TITLE_LENGTH, TrivialDecorator::new())) .and_then(|c| { - c.lines().next().map(|s| { + c.unwrap_or_default().lines().next().map(|s| { s.replace(&format!("@{}", community.name), "") .trim() .to_string() diff --git a/crates/utils/Cargo.toml b/crates/utils/Cargo.toml index e6af866d5..72e2e7f52 100644 --- a/crates/utils/Cargo.toml +++ b/crates/utils/Cargo.toml @@ -72,7 +72,7 @@ uuid = { workspace = true, optional = true, features = ["v4"] } rosetta-i18n = { workspace = true, optional = true } tokio = { workspace = true, optional = true } urlencoding = { workspace = true, optional = true } -html2text = { version = "0.12.6", optional = true } +html2text = { version = "0.13.6", optional = true } deser-hjson = { version = "2.2.4", optional = true } smart-default = { version = "0.7.1", optional = true } lettre = { version = "0.11.11", default-features = false, features = [ diff --git a/crates/utils/src/email.rs b/crates/utils/src/email.rs index 46abb47ea..aa06ba1b9 100644 --- a/crates/utils/src/email.rs +++ b/crates/utils/src/email.rs @@ -43,7 +43,7 @@ pub async fn send_email( }; // use usize::MAX as the line wrap length, since lettre handles the wrapping for us - let plain_text = html2text::from_read(html.as_bytes(), usize::MAX); + let plain_text = html2text::from_read(html.as_bytes(), usize::MAX)?; let smtp_from_address = &email_config.smtp_from_address;